This file is indexed.

/usr/lib/python2.7/dist-packages/cogent/db/ensembl/species.py is in python-cogent 1.9-9.

This file is owned by root:root, with mode 0o644.

The actual contents of the file can be viewed below.

  1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
from cogent.util.table import Table
from cogent.db.ensembl.util import CaseInsensitiveString

__author__ = "Gavin Huttley"
__copyright__ = "Copyright 2007-2016, The Cogent Project"
__credits__ = ["Gavin Huttley", "Jason Merkin"]
__license__ = "GPL"
__version__ = "1.9"
__maintainer__ = "Gavin Huttley"
__email__ = "Gavin.Huttley@anu.edu.au"
__status__ = "alpha"

_species_common_map = [['Acyrthosiphon pisum', 'A.pisum'],
                       ['Aedes aegypti', 'A.aegypti'],
                       ['Anolis carolinensis', 'Anole lizard'],
                       ['Anopheles gambiae', 'A.gambiae'],
                       ['Apis mellifera', 'Honeybee'],
                       ['Arabidopsis lyrata', 'A.lyrata'],
                       ['Arabidopsis thaliana', 'A.thaliana'],
                       ['Aspergillus clavatus', 'A.clavatus'],
                       ['Aspergillus flavus', 'A.flavus'],
                       ['Aspergillus fumigatus', 'A.fumigatus'],
                       ['Aspergillus fumigatusa1163', 'A.fumigatusa1163'],
                       ['Aspergillus nidulans', 'A.nidulans'],
                       ['Aspergillus niger', 'A.niger'],
                       ['Aspergillus oryzae', 'A.oryzae'],
                       ['Aspergillus terreus', 'A.terreus'],
                       ['Bacillus collection', 'Bacillus'],
                       ['Borrelia collection', 'Borrelia'],
                       ['Bos taurus', 'Cow'],
                       ['Brachypodium distachyon', 'B.distachyon'],
                       ['Buchnera collection', 'Buchnera'],
                       ['Caenorhabditis brenneri', 'C.brenneri'],
                       ['Caenorhabditis briggsae', 'C.briggsae'],
                       ['Caenorhabditis elegans', 'C.elegans'],
                       ['Caenorhabditis japonica', 'C.japonica'],
                       ['Caenorhabditis remanei', 'C.remanei'],
                       ['Callithrix jacchus', 'Marmoset'],
                       ['Canis familiaris', 'Dog'],
                       ['Cavia porcellus', 'Guinea Pig'],
                       ['Choloepus hoffmanni', 'Sloth'],
                       ['Ciona intestinalis', 'C.intestinalis'],
                       ['Ciona savignyi', 'C.savignyi'],
                       ['Culex quinquefasciatus', 'C.quinquefasciatus'],
                       ['Danio rerio', 'Zebrafish'],
                       ['Dasypus novemcinctus', 'Armadillo'],
                       ['Dictyostelium discoideum', 'D.discoideum'],
                       ['Dipodomys ordii', 'Kangaroo rat'],
                       ['Drosophila ananassae', 'D.ananassae'],
                       ['Drosophila erecta', 'D.erecta'],
                       ['Drosophila grimshawi', 'D.grimshawi'],
                       ['Drosophila melanogaster', 'D.melanogaster'],
                       ['Drosophila mojavensis', 'D.mojavensis'],
                       ['Drosophila persimilis', 'D.persimilis'],
                       ['Drosophila pseudoobscura', 'D.pseudoobscura'],
                       ['Drosophila sechellia', 'D.sechellia'],
                       ['Drosophila simulans', 'D.simulans'],
                       ['Drosophila virilis', 'D.virilis'],
                       ['Drosophila willistoni', 'D.willistoni'],
                       ['Drosophila yakuba', 'D.yakuba'],
                       ['Echinops telfairi', 'Tenrec'],
                       ['Equus caballus', 'Horse'],
                       ['Erinaceus europaeus', 'Hedgehog'],
                       ['Escherichia shigella', 'E.shigella'],
                       ['Felis catus', 'Cat'],
                       ['Gallus gallus', 'Chicken'],
                       ['Gasterosteus aculeatus', 'Stickleback'],
                       ['Gorilla gorilla', 'Gorilla'],
                       ['Homo sapiens', 'Human'],
                       ['Ictidomys tridecemlineatus', 'Squirrel'],
                       ['Ixodes scapularis', 'I.scapularis'],
                       ['Loxodonta africana', 'Elephant'],
                       ['Macaca mulatta', 'Macaque'],
                       ['Macropus eugenii', 'Wallaby'],
                       ['Microcebus murinus', 'Mouse lemur'],
                       ['Monodelphis domestica', 'Opossum'],
                       ['Mus musculus', 'Mouse'],
                       ['Mycobacterium collection', 'Mycobacterium'],
                       ['Myotis lucifugus', 'Microbat'],
                       ['Neisseria collection', 'Neisseria'],
                       ['Nematostella vectensis', 'N.vectensis'],
                       ['Neosartorya fischeri', 'N.fischeri'],
                       ['Neurospora crassa', 'N.crassa'],
                       ['Ochotona princeps', 'Pika'],
                       ['Ornithorhynchus anatinus', 'Platypus'],
                       ['Oryctolagus cuniculus', 'Rabbit'],
                       ['Oryza indica', 'O.indica'],
                       ['Oryza sativa', 'O.sativa'],
                       ['Oryzias latipes', 'Medaka'],
                       ['Otolemur garnettii', 'Bushbaby'],
                       ['Pan troglodytes', 'Chimp'],
                       ['Pediculus humanus', 'P.humanus'],
                       ['Petromyzon marinus', 'Lamprey'],
                       ['Phaeodactylum tricornutum', 'P.tricornutum'],
                       ['Physcomitrella patens', 'P.patens'],
                       ['Phytophthora infestans', 'P.infestans'],
                       ['Phytophthora ramorum', 'P.ramorum'],
                       ['Phytophthora sojae', 'P.sojae'],
                       ['Plasmodium berghei', 'P.berghei'],
                       ['Plasmodium chabaudi', 'P.chabaudi'],
                       ['Plasmodium falciparum', 'P.falciparum'],
                       ['Plasmodium knowlesi', 'P.knowlesi'],
                       ['Plasmodium vivax', 'P.vivax'],
                       ['Pongo abelii', 'Orangutan'],
                       ['Populus trichocarpa', 'P.trichocarpa'],
                       ['Pristionchus pacificus', 'P.pacificus'],
                       ['Procavia capensis', 'Rock hyrax'],
                       ['Pteropus vampyrus', 'Flying fox'],
                       ['Puccinia graministritici', 'P.graministritici'],
                       ['Pyrococcus collection', 'Pyrococcus'],
                       ['Rattus norvegicus', 'Rat'],
                       ['Saccharomyces cerevisiae', 'S.cerevisiae'],
                       ['Schistosoma mansoni', 'S.mansoni'],
                       ['Schizosaccharomyces pombe', 'S.pombe'],
                       ['Sorex araneus', 'Shrew'],
                       ['Sorghum bicolor', 'S.bicolor'],
                       ['Staphylococcus collection', 'Staphylococcus'],
                       ['Streptococcus collection', 'Streptococcus'],
                       ['Strongylocentrotus purpuratus', 'S.purpuratus'],
                       ['Sus scrofa', 'Pig'],
                       ['Taeniopygia guttata', 'Zebra finch'],
                       ['Takifugu rubripes', 'Fugu'],
                       ['Tarsius syrichta', 'Tarsier'],
                       ['Tetraodon nigroviridis', 'Tetraodon'],
                       ['Thalassiosira pseudonana', 'T.pseudonana'],
                       ['Trichoplax adhaerens', 'T.adhaerens'],
                       ['Tupaia belangeri', 'Tree Shrew'],
                       ['Tursiops truncatus', 'Bottlenose dolphin'],
                       ['Vicugna pacos', 'Alpaca'],
                       ['Vitis vinifera', 'V.vinifera'],
                       ['Wolbachia collection', 'Wolbachia'],
                       ['Xenopus tropicalis', 'Xenopus'],
                       ['Zea mays', 'Z.mays']]

class SpeciesNameMap(dict):
    """mapping between common names and latin names"""
    def __init__(self, species_common = _species_common_map):
        """provides latin name:common name mappings"""
        self._species_common = {}
        self._common_species = {}
        self._species_ensembl = {}
        self._ensembl_species = {}
        for species_name, common_name in species_common:
            self.amendSpecies(CaseInsensitiveString(species_name),
                              CaseInsensitiveString(common_name))
    
    def __str__(self):
        rows = []
        for common in self._common_species:
            species = self._common_species[common]
            ensembl = self._species_ensembl[species]
            rows += [[common, species, ensembl]]
        return str(Table(['Common Name', 'Species Name', 'Ensembl Db Prefix'],
                    rows=rows, space=2).sorted())
    
    def __repr__(self):
        return 'Available species: %s' % ("'"+\
                "'; '".join(self._common_species.keys())+"'")
    
    def getCommonName(self, name, level='raise'):
        """returns the common name for the given name (which can be either a
        species name or the ensembl version)"""
        name = CaseInsensitiveString(name)
        if name in self._ensembl_species:
            name = self._ensembl_species[name]
        
        if name in self._species_common:
            common_name = self._species_common[name]
        elif name in self._common_species:
            common_name = name
        else:
            common_name = None
        
        if common_name is None:
            msg = "Unknown species name: %s" % name
            if level == 'raise':
                raise RuntimeError(msg)
            elif level == 'warn':
                print "WARN: %s" % msg
        
        return str(common_name)
    
    def getSpeciesName(self, name, level='ignore'):
        """returns the species name for the given common name"""
        name = CaseInsensitiveString(name)
        if name in self._species_common:
            return str(name)
        species_name = None
        level = level.lower().strip()
        name = name
        for data in [self._common_species, self._ensembl_species]:
            if name in data:
                species_name = data[name]
        if species_name is None:
            msg = "Unknown common name: %s" % name
            if level == 'raise':
                raise RuntimeError(msg)
            elif level == 'warn':
                print "WARN: %s" % msg
        return str(species_name)
    
    def getSpeciesNames(self):
        """returns the list of species names"""
        names = self._species_common.keys()
        names.sort()
        return [str(n) for n in names]
    
    def getEnsemblDbPrefix(self, name):
        """returns a string of the species name in the format used by
        ensembl"""
        name = CaseInsensitiveString(name)
        if name in self._common_species:
            name = self._common_species[name]
        try:
            species_name = self.getSpeciesName(name, level='raise')
        except RuntimeError:
            if name not in self._species_common:
                raise RuntimeError("Unknown name %s" % name)
            species_name = name
        
        return str(species_name.lower().replace(" ","_"))
    
    def getComparaName(self, name):
        """returns string matching a compara instance attribute name for a
        species"""
        name = self.getCommonName(name)
        if '.' in name:
            name = name.replace('.', '')
        else:
            name = name.title()
        
        name = name.split()
        return ''.join(name)
    
    def _purge_species(self, species_name):
        """removes a species record"""
        species_name = CaseInsensitiveString(species_name)
        if not species_name in self._species_common:
            return
        common_name = self._species_common.pop(species_name)
        ensembl_name= self._species_ensembl.pop(species_name)
        self._ensembl_species.pop(ensembl_name)
        self._common_species.pop(common_name)
    
    def amendSpecies(self, species_name, common_name):
        """add a new species, and common name"""
        species_name = CaseInsensitiveString(species_name)
        common_name = CaseInsensitiveString(common_name)
        assert "_" not in species_name,\
                        "'_' in species_name, not a Latin name?"
        self._purge_species(species_name) # remove if existing
        self._species_common[species_name] = common_name
        self._common_species[common_name] = species_name
        ensembl_name = species_name.lower().replace(" ","_")
        self._species_ensembl[species_name] = ensembl_name
        self._ensembl_species[ensembl_name] = species_name
        return

Species = SpeciesNameMap()