{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T18:16:49Z","timestamp":1778350609053,"version":"3.51.4"},"reference-count":60,"publisher":"Springer Science and Business Media LLC","issue":"1","content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/1471-2105-4-41","type":"journal-article","created":{"date-parts":[[2003,10,21]],"date-time":"2003-10-21T02:27:22Z","timestamp":1066703242000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3725,"title":["The COG database: an updated version includes eukaryotes"],"prefix":"10.1186","volume":"4","author":[{"given":"Roman L","family":"Tatusov","sequence":"first","affiliation":[]},{"given":"Natalie D","family":"Fedorova","sequence":"additional","affiliation":[]},{"given":"John D","family":"Jackson","sequence":"additional","affiliation":[]},{"given":"Aviva R","family":"Jacobs","sequence":"additional","affiliation":[]},{"given":"Boris","family":"Kiryutin","sequence":"additional","affiliation":[]},{"given":"Eugene V","family":"Koonin","sequence":"additional","affiliation":[]},{"given":"Dmitri M","family":"Krylov","sequence":"additional","affiliation":[]},{"given":"Raja","family":"Mazumder","sequence":"additional","affiliation":[]},{"given":"Sergei L","family":"Mekhedov","sequence":"additional","affiliation":[]},{"given":"Anastasia N","family":"Nikolskaya","sequence":"additional","affiliation":[]},{"given":"B Sridhar","family":"Rao","sequence":"additional","affiliation":[]},{"given":"Sergei","family":"Smirnov","sequence":"additional","affiliation":[]},{"given":"Alexander V","family":"Sverdlov","sequence":"additional","affiliation":[]},{"given":"Sona","family":"Vasudevan","sequence":"additional","affiliation":[]},{"given":"Yuri I","family":"Wolf","sequence":"additional","affiliation":[]},{"given":"Jodie J","family":"Yin","sequence":"additional","affiliation":[]},{"given":"Darren A","family":"Natale","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2003,9,11]]},"reference":[{"key":"91_CR1","doi-asserted-by":"publisher","first-page":"99","DOI":"10.2307\/2412448","volume":"19","author":"WM Fitch","year":"1970","unstructured":"Fitch WM: Distinguishing homologous from analogous proteins.\n                           Systematic Zoology 1970, 19: 99\u2013106.","journal-title":"Systematic Zoology"},{"key":"91_CR2","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1016\/S0168-9525(00)02005-9","volume":"16","author":"WM Fitch","year":"2000","unstructured":"Fitch WM: Homology a personal view on some of the problems.\n                           Trends Genet 2000, 16: 227\u2013231. 10.1016\/S0168-9525(00)02005-9","journal-title":"Trends Genet"},{"key":"91_CR3","doi-asserted-by":"publisher","first-page":"609","DOI":"10.1126\/science.278.5338.609","volume":"278","author":"S Henikoff","year":"1997","unstructured":"Henikoff S, Greene EA, Pietrokovski S, Bork P, Attwood TK, Hood L: Gene families: the taxonomy of protein paralogs and chimeras.\n                           Science 1997, 278: 609\u2013614. 10.1126\/science.278.5338.609","journal-title":"Science"},{"key":"91_CR4","doi-asserted-by":"publisher","first-page":"619","DOI":"10.1016\/S0168-9525(02)02793-2","volume":"18","author":"EL Sonnhammer","year":"2002","unstructured":"Sonnhammer EL, Koonin EV: Orthology, paralogy and proposed classification for paralog subtypes.\n                           Trends Genet 2002, 18: 619\u2013620. 10.1016\/S0168-9525(02)02793-2","journal-title":"Trends Genet"},{"key":"91_CR5","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1006\/jmbi.2000.3550","volume":"297","author":"CA Wilson","year":"2000","unstructured":"Wilson CA, Kreychman J, Gerstein M: Assessing annotation transfer for genomics: quantifying the relations between protein sequence, structure and function through traditional and probabilistic scores.\n                           J Mol Biol 2000, 297: 233\u2013249. 10.1006\/jmbi.2000.3550","journal-title":"J Mol Biol"},{"key":"91_CR6","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1093\/nar\/29.2.545","volume":"29","author":"T Sicheritz-Ponten","year":"2001","unstructured":"Sicheritz-Ponten T, Andersson SG: A phylogenomic approach to microbial evolution.\n                           Nucleic Acids Res 2001, 29: 545\u2013552. 10.1093\/nar\/29.2.545","journal-title":"Nucleic Acids Res"},{"key":"91_CR7","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1186\/1471-2105-3-14","volume":"3","author":"CM Zmasek","year":"2002","unstructured":"Zmasek CM, Eddy SR: RIO: Analyzing proteomes by automated phylogenomics using resampled inference of orthologs.\n                           BMC Bioinformatics 2002, 3: 14. 10.1186\/1471-2105-3-14","journal-title":"BMC Bioinformatics"},{"key":"91_CR8","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1093\/bioinformatics\/18.1.92","volume":"18","author":"CE Storm","year":"2002","unstructured":"Storm CE, Sonnhammer EL: Automated ortholog inference from phylogenetic trees and calculation of orthology reliability.\n                           Bioinformatics 2002, 18: 92\u201399. 10.1093\/bioinformatics\/18.1.92","journal-title":"Bioinformatics"},{"key":"91_CR9","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1126\/science.278.5338.631","volume":"278","author":"RL Tatusov","year":"1997","unstructured":"Tatusov RL, Koonin EV, Lipman DJ: A genomic perspective on protein families.\n                           Science 1997, 278: 631\u2013637. 10.1126\/science.278.5338.631","journal-title":"Science"},{"key":"91_CR10","doi-asserted-by":"publisher","first-page":"5849","DOI":"10.1073\/pnas.95.11.5849","volume":"95","author":"MA Huynen","year":"1998","unstructured":"Huynen MA, Bork P: Measuring genome evolution.\n                           Proc Natl Acad Sci U S A 1998, 95: 5849\u20135856. 10.1073\/pnas.95.11.5849","journal-title":"Proc Natl Acad Sci U S A"},{"key":"91_CR11","doi-asserted-by":"publisher","first-page":"5334","DOI":"10.1073\/pnas.97.10.5334","volume":"97","author":"MG Montague","year":"2000","unstructured":"Montague MG, Hutchison CA 3rd: Gene content phylogeny of herpesviruses.\n                           Proc Natl Acad Sci U S A 2000, 97: 5334\u20135339. 10.1073\/pnas.97.10.5334","journal-title":"Proc Natl Acad Sci U S A"},{"key":"91_CR12","doi-asserted-by":"publisher","first-page":"555","DOI":"10.1101\/gr.GR-1660R","volume":"11","author":"IK Jordan","year":"2001","unstructured":"Jordan IK, Makarova KS, Spouge JL, Wolf YI, Koonin EV: Lineage-specific gene expansions in bacterial and archaeal genomes.\n                           Genome Res 2001, 11: 555\u2013565. 10.1101\/gr.GR-1660R","journal-title":"Genome Res"},{"key":"91_CR13","doi-asserted-by":"publisher","first-page":"1041","DOI":"10.1006\/jmbi.2000.5197","volume":"314","author":"M Remm","year":"2001","unstructured":"Remm M, Storm CE, Sonnhammer EL: Automatic clustering of orthologs and in-paralogs from pairwise species comparisons.\n                           J Mol Biol 2001, 314: 1041\u20131052. 10.1006\/jmbi.2000.5197","journal-title":"J Mol Biol"},{"key":"91_CR14","doi-asserted-by":"publisher","first-page":"1048","DOI":"10.1101\/gr.174302","volume":"12","author":"O Lespinet","year":"2002","unstructured":"Lespinet O, Wolf YI, Koonin EV, Aravind L: The role of lineage-specific gene family expansion in the evolution of eukaryotes.\n                           Genome Res 2002, 12: 1048\u20131059. 10.1101\/gr.174302","journal-title":"Genome Res"},{"key":"91_CR15","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1093\/nar\/29.1.22","volume":"29","author":"RL Tatusov","year":"2001","unstructured":"Tatusov RL, Natale DA, Garkavtsev IV, Tatusova TA, Shankavaram UT, Rao BS, Kiryutin B, Galperin MY, Fedorova ND, Koonin EV: The COG database: new developments in phylogenetic classification of proteins from complete genomes.\n                           Nucleic Acids Res 2001, 29: 22\u201328. 10.1093\/nar\/29.1.22","journal-title":"Nucleic Acids Res"},{"key":"91_CR16","doi-asserted-by":"publisher","first-page":"4644","DOI":"10.1073\/pnas.032671499","volume":"99","author":"AI Slesarev","year":"2002","unstructured":"Slesarev AI, Mezhevaya KV, Makarova KS, Polushin NN, Shcherbinina OV, Shakhova VV, Belova GI, Aravind L, Natale DA, Rogozin IB, Tatusov RL, Wolf YI, Stetter KO, Malykh AG, Koonin EV, Kozyavkin SA: The complete genome of hyperthermophile Methanopyrus kandleri AV19 and monophyly of archaeal methanogens.\n                           Proc Natl Acad Sci U S A 2002, 99: 4644\u20134649. 10.1073\/pnas.032671499","journal-title":"Proc Natl Acad Sci U S A"},{"key":"91_CR17","first-page":"RESEARCH0009","volume":"5","author":"DA Natale","year":"2001","unstructured":"Natale DA, Shankavaram UT, Galperin MY, Wolf YI, Aravind L, Koonin EV: Genome annotation using clusters of orthologous groups of proteins (COGs) \u2013 towards understanding the first genome of a Crenarchaeon.\n                           Genome Biology 2001, 5: RESEARCH0009.","journal-title":"Genome Biology"},{"key":"91_CR18","doi-asserted-by":"publisher","first-page":"4823","DOI":"10.1128\/JB.183.16.4823-4838.2001","volume":"183","author":"J Nolling","year":"2001","unstructured":"Nolling J, Breton G, Omelchenko MV, Makarova KS, Zeng Q, Gibson R, Lee HM, Dubois J, Qiu D, Hitti J, Wolf YI, Tatusov RL, Sabathe F, Doucette-Stamm L, Soucaille P, Daly MJ, Bennett GN, Koonin EV, Smith DR: Genome sequence and comparative analysis of the solvent-producing bacterium Clostridium acetobutylicum.\n                           J Bacteriol 2001, 183: 4823\u20134838. 10.1128\/JB.183.16.4823-4838.2001","journal-title":"J Bacteriol"},{"key":"91_CR19","doi-asserted-by":"publisher","first-page":"852","DOI":"10.1038\/35101614","volume":"413","author":"M McClelland","year":"2001","unstructured":"McClelland M, Sanderson KE, Spieth J, Clifton SW, Latreille P, Courtney L, Porwollik S, Ali J, Dante M, Du F, Hou S, Layman D, Leonard S, Nguyen C, Scott K, Holmes A, Grewal N, Mulvaney E, Ryan E, Sun H, Florea L, Miller W, Stoneking T, Nhan M, Waterston R, Wilson RK: Complete genome sequence of Salmonella enterica serovar Typhimurium LT2.\n                           Nature 2001, 413: 852\u2013856. 10.1038\/35101614","journal-title":"Nature"},{"key":"91_CR20","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1128\/MMBR.65.1.44-79.2001","volume":"65","author":"KS Makarova","year":"2001","unstructured":"Makarova KS, Aravind L, Wolf YI, Tatusov RL, Minton KW, Koonin EV, Daly MJ: Genome of the extremely radiation-resistant bacterium Deinococcus radiodurans viewed from the perspective of comparative genomics.\n                           Microbiol Mol Biol Rev 2001, 65: 44\u201379. 10.1128\/MMBR.65.1.44-79.2001","journal-title":"Microbiol Mol Biol Rev"},{"key":"91_CR21","doi-asserted-by":"publisher","first-page":"RESEARCH0053","DOI":"10.1186\/gb-2001-2-12-research0053","volume":"2","author":"IK Jordan","year":"2001","unstructured":"Jordan IK, Kondrashov FA, Rogozin IB, Tatusov RL, Wolf YI, Koonin EV: Constant relative rate of protein evolution and detection of functional diversification among bacterial, archaeal and eukaryotic proteins.\n                           Genome Biol 2001, 2: RESEARCH0053. 10.1186\/gb-2001-2-12-research0053","journal-title":"Genome Biol"},{"key":"91_CR22","doi-asserted-by":"publisher","first-page":"7940","DOI":"10.1073\/pnas.141236298","volume":"98","author":"I Yanai","year":"2001","unstructured":"Yanai I, Derti A, DeLisi C: Genes linked by fusion events are generally of the same functional category: A systematic analysis of 30 microbial genomes.\n                           Proc Natl Acad Sci U S A 2001, 98: 7940\u20137945. 10.1073\/pnas.141236298","journal-title":"Proc Natl Acad Sci U S A"},{"key":"91_CR23","doi-asserted-by":"publisher","first-page":"981","DOI":"10.1101\/gr.GR1653R","volume":"11","author":"O Lecompte","year":"2001","unstructured":"Lecompte O, Ripp R, Puzos-Barbe V, Duprat S, Heilig R, Dietrich J, Thierry JC, Poch O: Genome evolution at the genus level: comparison of three complete genomes of hyperthermophilic archaea.\n                           Genome Res 2001, 11: 981\u2013993. 10.1101\/gr.GR1653R","journal-title":"Genome Res"},{"key":"91_CR24","doi-asserted-by":"publisher","first-page":"709","DOI":"10.1146\/annurev.micro.55.1.709","volume":"55","author":"EV Koonin","year":"2001","unstructured":"Koonin EV, Makarova KS, Aravind L: Horizontal gene transfer in prokaryotes: quantification and classification.\n                           Annu Rev Microbiol 2001, 55: 709\u2013742. 10.1146\/annurev.micro.55.1.709","journal-title":"Annu Rev Microbiol"},{"key":"91_CR25","doi-asserted-by":"publisher","first-page":"962","DOI":"10.1101\/gr.87702. Article published online before print in May 2002","volume":"12","author":"IK Jordan","year":"2002","unstructured":"Jordan IK, Rogozin IB, Wolf YI, Koonin EV: Essential genes are more evolutionarily conserved than are nonessential genes in bacteria.\n                           Genome Res 2002, 12: 962\u2013968. 10.1101\/gr.87702. Article published online before print in May 2002","journal-title":"Genome Res"},{"key":"91_CR26","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1038\/nrg931","volume":"3","author":"JJ Wernegreen","year":"2002","unstructured":"Wernegreen JJ: Genome evolution in bacterial endosymbionts of insects.\n                           Nat Rev Genet 2002, 3: 850\u2013861. 10.1038\/nrg931","journal-title":"Nat Rev Genet"},{"key":"91_CR27","first-page":"401","volume":"2","author":"S Casjens","year":"2000","unstructured":"Casjens S: Borrelia genomes in the year 2000.\n                           J Mol Microbiol Biotechnol 2000, 2: 401\u2013410.","journal-title":"J Mol Microbiol Biotechnol"},{"key":"91_CR28","doi-asserted-by":"publisher","first-page":"619","DOI":"10.1046\/j.1365-2958.1997.4821861.x","volume":"25","author":"EV Koonin","year":"1997","unstructured":"Koonin EV, Mushegian AR, Galperin MY, Walker DR: Comparison of archaeal and bacterial genomes: computer analysis of protein sequences predicts novel functions and suggests a chimeric origin for the archaea.\n                           Mol Microbiol 1997, 25: 619\u2013637. 10.1046\/j.1365-2958.1997.4821861.x","journal-title":"Mol Microbiol"},{"key":"91_CR29","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1101\/gr.176501","volume":"12","author":"B Snel","year":"2002","unstructured":"Snel B, Bork P, Huynen MA: Genomes in flux: the evolution of archaeal and proteobacterial gene content.\n                           Genome Res 2002, 12: 17\u201325. 10.1101\/gr.176501","journal-title":"Genome Res"},{"key":"91_CR30","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1186\/1471-2148-1-8","volume":"1","author":"YI Wolf","year":"2001","unstructured":"Wolf YI, Rogozin IB, Grishin NV, Tatusov RL, Koonin EV: Genome trees constructed using five different approaches suggest new major bacterial clades.\n                           BMC Evol Biol 2001, 1: 8. 10.1186\/1471-2148-1-8","journal-title":"BMC Evol Biol"},{"key":"91_CR31","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1186\/1471-2148-3-2","volume":"3","author":"BG Mirkin","year":"2003","unstructured":"Mirkin BG, Fenner TI, Galperin MY, Koonin EV: Algorithms for computing parsimonious evolutionary scenarios for genome evolution, the last universal common ancestor and dominance of horizontal gene transfer in the evolution of prokaryotes.\n                           BMC Evol Biol 2003, 3: 2. 10.1186\/1471-2148-3-2","journal-title":"BMC Evol Biol"},{"key":"91_CR32","doi-asserted-by":"publisher","first-page":"860","DOI":"10.1038\/35057062","volume":"409","author":"ES Lander","year":"2001","unstructured":"Lander ES, Linton LM, Birren B, Nusbaum C, Zody MC, Baldwin J, Devon K, Dewar K, Doyle M, FitzHugh W, Funke R, Gage D, Harris K, Heaford A, Howland J, Kann L, Lehoczky J, LeVine R, McEwan P, McKernan K, Meldrim J, Mesirov JP, Miranda C, Morris W, Naylor J, Raymond C, Rosetti M, Santos R, Sheridan A, Sougnez C, Stange-Thomann N, Stojanovic N, Subramanian A, Wyman D, Rogers J, Sulston J, Ainscough R, Beck S, Bentley D, Burton J, Clee C, Carter N, Coulson A, Deadman R, Deloukas P, Dunham A, Dunham I, Durbin R, French L, Grafham D, Gregory S, Hubbard T, Humphray S, Hunt A, Jones M, Lloyd C, McMurray A, Matthews L, Mercer S, Milne S, Mullikin JC, Mungall A, Plumb R, Ross M, Shownkeen R, Sims S, Waterston RH, Wilson RK, Hillier LW, McPherson JD, Marra MA, Mardis ER, Fulton LA, Chinwalla AT, Pepin KH, Gish WR, Chissoe SL, Wendl MC, Delehaunty KD, Miner TL, Delehaunty A, Kramer JB, Cook LL, Fulton RS, Johnson DL, Minx PJ, Clifton SW, Hawkins T, Branscomb E, Predki P, Richardson P, Wenning S, Slezak T, Doggett N, Cheng JF, Olsen A, Lucas S, Elkin C, Uberbacher E, Frazier M, et al.: Initial sequencing and analysis of the human genome.\n                           Nature 2001, 409: 860\u2013921. 10.1038\/35057062","journal-title":"Nature"},{"key":"91_CR33","doi-asserted-by":"publisher","first-page":"2185","DOI":"10.1126\/science.287.5461.2185","volume":"287","author":"MD Adams","year":"2000","unstructured":"Adams MD, Celniker SE, Holt RA, Evans CA, Gocayne JD, Amanatides PG, Scherer SE, Li PW, Hoskins RA, Galle RF, et al.: The genome sequence of Drosophila melanogaster.\n                           Science 2000, 287: 2185\u20132195. 10.1126\/science.287.5461.2185","journal-title":"Science"},{"key":"91_CR34","doi-asserted-by":"publisher","first-page":"2012","DOI":"10.1126\/science.282.5396.2012","volume":"282","author":"Consortium TCeS","year":"1998","unstructured":"Consortium TCeS: Genome sequence of the nematode C. elegans: a platform for investigating biology.\n                           Science 1998, 282: 2012\u20132018. 10.1126\/science.282.5396.2012","journal-title":"Science"},{"key":"91_CR35","doi-asserted-by":"publisher","first-page":"796","DOI":"10.1038\/35048692","volume":"408","author":"Initiative","year":"2000","unstructured":"Initiative: TAG Analysis of the genome sequence of the flowering plant Arabidopsis thaliana.\n                           Nature 2000, 408: 796\u2013815. 10.1038\/35048692","journal-title":"Nature"},{"key":"91_CR36","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1126\/science.274.5287.546","volume":"274","author":"A Goffeau","year":"1996","unstructured":"Goffeau A, Barrell BG, Bussey H, Davis RW, Dujon B, Feldmann H, Galibert F, Hoheisel JD, Jacq C, Johnston M, Louis EJ, Mewes HW, Murakami Y, Philippsen P, Tettelin H, Oliver SG: Life with 6000 genes.\n                           Science 1996, 274: 563\u2013567. 10.1126\/science.274.5287.546","journal-title":"Science"},{"key":"91_CR37","doi-asserted-by":"publisher","first-page":"871","DOI":"10.1038\/nature724","volume":"415","author":"V Wood","year":"2002","unstructured":"Wood V, Gwilliam R, Rajandream MA, Lyne M, Lyne R, Stewart A, Sgouros J, Peat N, Hayles J, Baker S, Basham D, Bowman S, Brooks K, Brown D, Brown S, Chillingworth T, Churcher C, Collins M, Connor R, Cronin A, Davis P, Feltwell T, Fraser A, Gentles S, Goble A, Hamlin N, Harris D, Hidalgo J, Hodgson G, Holroyd S, Hornsby T, Howarth S, Huckle EJ, Hunt S, Jagels K, James K, Jones L, Jones M, Leather S, McDonald S, McLean J, Mooney P, Moule S, Mungall K, Murphy L, Niblett D, Odell C, Oliver K, O'Neil S, Pearson D, Quail MA, Rabbinowitsch E, Rutherford K, Rutter S, Saunders D, Seeger K, Sharp S, Skelton J, Simmonds M, Squares R, Squares S, Stevens K, Taylor K, Taylor RG, Tivey A, Walsh S, Warren T, Whitehead S, Woodward J, Volckaert G, Aert R, Robben J, Grymonprez B, Weltjens I, Vanstreels E, Rieger M, Schafer M, Muller-Auer S, Gabel C, Fuchs M, Dusterhoft A, Fritzc C, Holzer E, Moestl D, Hilbert H, Borzym K, Langer I, Beck A, Lehrach H, Reinhardt R, Pohl TM, Eger P, Zimmermann W, Wedler H, Wambutt R, Purnelle B, Goffeau A, Cadieu E, Dreano S, Gloux S, et al.: The genome sequence of Schizosaccharomyces pombe.\n                           Nature 2002, 415: 871\u2013880. 10.1038\/nature724","journal-title":"Nature"},{"key":"91_CR38","doi-asserted-by":"publisher","first-page":"450","DOI":"10.1038\/35106579","volume":"414","author":"MD Katinka","year":"2001","unstructured":"Katinka MD, Duprat S, Cornillot E, Metenier G, Thomarat F, Prensier G, Barbe V, Peyretaillade E, Brottier P, Wincker P, Delbac F, El Alaoui H, Peyret P, Saurin W, Gouy M, Weissenbach J, Vivares CP: Genome sequence and gene compaction of the eukaryote parasite Encephalitozoon cuniculi.\n                           Nature 2001, 414: 450\u2013453. 10.1038\/35106579","journal-title":"Nature"},{"key":"91_CR39","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1016\/S0092-8674(00)80867-3","volume":"101","author":"EV Koonin","year":"2000","unstructured":"Koonin EV, Aravind L, Kondrashov AS: The impact of comparative genomics on our understanding of evolution.\n                           Cell 2000, 101: 573\u2013576.","journal-title":"Cell"},{"key":"91_CR40","doi-asserted-by":"publisher","first-page":"383","DOI":"10.1093\/nar\/gkg087","volume":"31","author":"A Marchler-Bauer","year":"2003","unstructured":"Marchler-Bauer A, Anderson JB, DeWeese-Scott C, Fedorova ND, Geer LY, He S, Hurwitz DI, Jackson JD, Jacobs AR, Lanczycki CJ, Liebert CA, Liu C, Madej T, Marchler GH, Mazumder R, Nikolskaya AN, Panchenko AR, Rao BS, Shoemaker BA, Simonyan V, Song JS, Thiessen PA, Vasudevan S, Wang Y, Yamashita RA, Yin JJ, Bryant SH: CDD: a curated Entrez database of conserved domain alignments.\n                           Nucleic Acids Res 2003, 31: 383\u2013387. 10.1093\/nar\/gkg087","journal-title":"Nucleic Acids Res"},{"key":"91_CR41","doi-asserted-by":"crossref","first-page":"608","DOI":"10.1101\/gr.9.7.608","volume":"9","author":"KS Makarova","year":"1999","unstructured":"Makarova KS, Aravind L, Galperin MY, Grishin NV, Tatusov RL, Wolf YI, Koonin EV: Comparative genomics of the Archaea (Euryarchaeota): evolution of conserved protein families, the stable core, and the variable shell.\n                           Genome Res 1999, 9: 608\u2013628.","journal-title":"Genome Res"},{"key":"91_CR42","doi-asserted-by":"publisher","first-page":"838","DOI":"10.1038\/nrg929","volume":"3","author":"SB Hedges","year":"2002","unstructured":"Hedges SB: The origin and evolution of model organisms.\n                           Nat Rev Genet 2002, 3: 838\u2013849. 10.1038\/nrg929","journal-title":"Nat Rev Genet"},{"key":"91_CR43","doi-asserted-by":"publisher","first-page":"1146","DOI":"10.1093\/embo-reports\/kvf248","volume":"3","author":"A Pesce","year":"2002","unstructured":"Pesce A, Bolognesi M, Bocedi A, Ascenzi P, Dewilde S, Moens L, Hankeln T, Burmester T: Neuroglobin and cytoglobin. Fresh blood for the vertebrate globin family.\n                           EMBO Rep 2002, 3: 1146\u20131151. 10.1093\/embo-reports\/kvf248","journal-title":"EMBO Rep"},{"key":"91_CR44","doi-asserted-by":"publisher","first-page":"1665","DOI":"10.1093\/nar\/25.9.1665","volume":"25","author":"AF Neuwald","year":"1997","unstructured":"Neuwald AF, Liu JS, Lipman DJ, Lawrence CE: Extracting protein alignment models from the sequence database.\n                           Nucleic Acids Res 1997, 25: 1665\u20131677. 10.1093\/nar\/25.9.1665","journal-title":"Nucleic Acids Res"},{"key":"91_CR45","doi-asserted-by":"publisher","first-page":"31581","DOI":"10.1074\/jbc.M004141200","volume":"275","author":"PR Gardner","year":"2000","unstructured":"Gardner PR, Gardner AM, Martin LA, Dou Y, Li T, Olson JS, Zhu H, Riggs AF: Nitric-oxide dioxygenase activity and function of flavohemoglobins. sensitivity to nitric oxide and carbon monoxide inhibition.\n                           J Biol Chem 2000, 275: 31581\u201331587. 10.1074\/jbc.M004141200","journal-title":"J Biol Chem"},{"key":"91_CR46","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1016\/S0065-3233(00)54010-8","volume":"54","author":"MJ Huynen","year":"2000","unstructured":"Huynen MJ, Snel B: Gene and context: integrative approaches to genome analysis.\n                           Adv Prot Chem 2000, 54: 345\u2013379.","journal-title":"Adv Prot Chem"},{"key":"91_CR47","doi-asserted-by":"publisher","first-page":"366","DOI":"10.1016\/S0959-440X(00)00098-1","volume":"10","author":"M Huynen","year":"2000","unstructured":"Huynen M, Snel B, Lathe W, Bork P: Exploitation of gene context.\n                           Curr Opin Struct Biol 2000, 10: 366\u2013370. 10.1016\/S0959-440X(00)00098-1","journal-title":"Curr Opin Struct Biol"},{"key":"91_CR48","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1101\/gr.GR-1619R","volume":"11","author":"YI Wolf","year":"2001","unstructured":"Wolf YI, Rogozin IB, Kondrashov AS, Koonin EV: Genome alignment, evolution of prokaryotic genome organization and prediction of gene function using genomic context.\n                           Genome Res 2001, 11: 356\u2013372. 10.1101\/gr.GR-1619R","journal-title":"Genome Res"},{"key":"91_CR49","doi-asserted-by":"publisher","first-page":"991","DOI":"10.1016\/S0092-8674(00)80284-6","volume":"89","author":"GJ Olsen","year":"1997","unstructured":"Olsen GJ, Woese CR: Archaeal genomics: an overview.\n                           Cell 1997, 89: 991\u2013994.","journal-title":"Cell"},{"key":"91_CR50","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1016\/S0968-0004(98)01334-6","volume":"24","author":"HH Winkler","year":"1999","unstructured":"Winkler HH, Neuhaus HE: Non-mitochondrial ATP transport.\n                           Trends Biochem Sci 1999, 24: 64\u201368. 10.1016\/S0968-0004(98)01334-6","journal-title":"Trends Biochem Sci"},{"key":"91_CR51","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1016\/S0168-9525(99)01704-7","volume":"15","author":"YI Wolf","year":"1999","unstructured":"Wolf YI, Aravind L, Koonin EV: Rickettsiae and Chlamydiae: evidence of horizontal gene transfer and gene exchange.\n                           Trends Genet 1999, 15: 173\u2013175. 10.1016\/S0168-9525(99)01704-7","journal-title":"Trends Genet"},{"key":"91_CR52","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1038\/35097083","volume":"413","author":"J Parkhill","year":"2001","unstructured":"Parkhill J, Wren BW, Thomson NR, Titball RW, Holden MT, Prentice MB, Sebaihia M, James KD, Churcher C, Mungall KL, Baker S, Basham D, Bentley SD, Brooks K, Cerdeno-Tarraga AM, Chillingworth T, Cronin A, Davies RM, Davis P, Dougan G, Feltwell T, Hamlin N, Holroyd S, Jagels K, Karlyshev AV, Leather S, Moule S, Oyston PC, Quail M, Rutherford K, Simmonds M, Skelton J, Stevens K, Whitehead S, Barrell BG: Genome sequence of Yersinia pestis, the causative agent of plague.\n                           Nature 2001, 413: 523\u2013527. 10.1038\/35097083","journal-title":"Nature"},{"key":"91_CR53","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1038\/nature01262","volume":"420","author":"RH Waterston","year":"2002","unstructured":"Waterston RH, Lindblad-Toh K, Birney E, Rogers J, Abril JF, Agarwal P, Agarwala R, Ainscough R, Alexandersson M, An P, Antonarakis SE, Attwood J, Baertsch R, Bailey J, Barlow K, Beck S, Berry E, Birren B, Bloom T, Bork P, Botcherby M, Bray N, Brent MR, Brown DG, Brown SD, Bult C, Burton J, Butler J, Campbell RD, Carninci P, Cawley S, Chiaromonte F, Chinwalla AT, Church DM, Clamp M, Clee C, Collins FS, Cook LL, Copley RR, Coulson A, Couronne O, Cuff J, Curwen V, Cutts T, Daly M, David R, Davies J, Delehaunty KD, Deri J, Dermitzakis ET, Dewey C, Dickens NJ, Diekhans M, Dodge S, Dubchak I, Dunn DM, Eddy SR, Elnitski L, Emes RD, Eswara P, Eyras E, Felsenfeld A, Fewell GA, Flicek P, Foley K, Frankel WN, Fulton LA, Fulton RS, Furey TS, Gage D, Gibbs RA, Glusman G, Gnerre S, Goldman N, Goodstadt L, Grafham D, Graves TA, Green ED, Gregory S, Guigo R, Guyer M, Hardison RC, Haussler D, Hayashizaki Y, Hillier LW, Hinrichs A, Hlavina W, Holzer T, Hsu F, Hua A, Hubbard T, Hunt A, Jackson I, Jaffe DB, Johnson LS, Jones M, Jones TA, Joy A, Kamal M, Karlsson EK, et al.: Initial sequencing and comparative analysis of the mouse genome.\n                           Nature 2002, 420: 520\u2013562. 10.1038\/nature01262","journal-title":"Nature"},{"key":"91_CR54","doi-asserted-by":"publisher","first-page":"1301","DOI":"10.1126\/science.1072104","volume":"297","author":"S Aparicio","year":"2002","unstructured":"Aparicio S, Chapman J, Stupka E, Putnam N, Chia JM, Dehal P, Christoffels A, Rash S, Hoon S, Smit A, Gelpke MD, Roach J, Oh T, Ho IY, Wong M, Detter C, Verhoef F, Predki P, Tay A, Lucas S, Richardson P, Smith SF, Clark MS, Edwards YJ, Doggett N, Zharkikh A, Tavtigian SV, Pruss D, Barnstead M, Evans C, Baden H, Powell J, Glusman G, Rowen L, Hood L, Tan YH, Elgar G, Hawkins T, Venkatesh B, Rokhsar D, Brenner S: Whole-genome shotgun assembly and analysis of the genome of Fugu rubripes.\n                           Science 2002, 297: 1301\u20131310. 10.1126\/science.1072104","journal-title":"Science"},{"key":"91_CR55","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1126\/science.1076181","volume":"298","author":"RA Holt","year":"2002","unstructured":"Holt RA, Subramanian GM, Halpern A, Sutton GG, Charlab R, Nusskern DR, Wincker P, Clark AG, Ribeiro JM, Wides R, Salzberg SL, Loftus B, Yandell M, Majoros WH, Rusch DB, Lai Z, Kraft CL, Abril JF, Anthouard V, Arensburger P, Atkinson PW, Baden H, de Berardinis V, Baldwin D, Benes V, Biedler J, Blass C, Bolanos R, Boscus D, Barnstead M, Cai S, Center A, Chatuverdi K, Christophides GK, Chrystal MA, Clamp M, Cravchik A, Curwen V, Dana A, Delcher A, Dew I, Evans CA, Flanigan M, Grundschober-Freimoser A, Friedli L, Gu Z, Guan P, Guigo R, Hillenmeyer ME, Hladun SL, Hogan JR, Hong YS, Hoover J, Jaillon O, Ke Z, Kodira C, Kokoza E, Koutsos A, Letunic I, Levitsky A, Liang Y, Lin JJ, Lobo NF, Lopez JR, Malek JA, McIntosh TC, Meister S, Miller J, Mobarry C, Mongin E, Murphy SD, O'Brochta DA, Pfannkoch C, Qi R, Regier MA, Remington K, Shao H, Sharakhova MV, Sitter CD, Shetty J, Smith TJ, Strong R, Sun J, Thomasova D, Ton LQ, Topalis P, Tu Z, Unger MF, Walenz B, Wang A, Wang J, Wang M, Wang X, Woodford KJ, Wortman JR, Wu M, Yao A, Zdobnov EM, Zhang H, Zhao Q, et al.: The genome sequence of the malaria mosquito Anopheles gambiae.\n                           Science 2002, 298: 129\u2013149. 10.1126\/science.1076181","journal-title":"Science"},{"key":"91_CR56","doi-asserted-by":"publisher","first-page":"2157","DOI":"10.1126\/science.1080049","volume":"298","author":"P Dehal","year":"2002","unstructured":"Dehal P, Satou Y, Campbell RK, Chapman J, Degnan B, De Tomaso A, Davidson B, Di Gregorio A, Gelpke M, Goodstein DM, Harafuji N, Hastings KE, Ho I, Hotta K, Huang W, Kawashima T, Lemaire P, Martinez D, Meinertzhagen IA, Necula S, Nonaka M, Putnam N, Rash S, Saiga H, Satake M, Terry A, Yamada L, Wang HG, Awazu S, Azumi K, Boore J, Branno M, Chin-Bow S, DeSantis R, Doyle S, Francino P, Keys DN, Haga S, Hayashi H, Hino K, Imai KS, Inaba K, Kano S, Kobayashi K, Kobayashi M, Lee BI, Makabe KW, Manohar C, Matassi G, Medina M, Mochizuki Y, Mount S, Morishita T, Miura S, Nakayama A, Nishizaka S, Nomoto H, Ohta F, Oishi K, Rigoutsos I, Sano M, Sasaki A, Sasakura Y, Shoguchi E, Shin-i T, Spagnuolo A, Stainier D, Suzuki MM, Tassy O, Takatori N, Tokuoka M, Yagi K, Yoshizaki F, Wada S, Zhang C, Hyatt PD, Larimer F, Detter C, Doggett N, Glavina T, Hawkins T, Richardson P, Lucas S, Kohara Y, Levine M, Satoh N, Rokhsar DS: The draft genome of Ciona intestinalis: insights into chordate and vertebrate origins.\n                           Science 2002, 298: 2157\u20132167. 10.1126\/science.1080049","journal-title":"Science"},{"key":"91_CR57","doi-asserted-by":"publisher","first-page":"498","DOI":"10.1038\/nature01097","volume":"419","author":"MJ Gardner","year":"2002","unstructured":"Gardner MJ, Hall N, Fung E, White O, Berriman M, Hyman RW, Carlton JM, Pain A, Nelson KE, Bowman S, Paulsen IT, James K, Eisen JA, Rutherford K, Salzberg SL, Craig A, Kyes S, Chan MS, Nene V, Shallom SJ, Suh B, Peterson J, Angiuoli S, Pertea M, Allen J, Selengut J, Haft D, Mather MW, Vaidya AB, Martin DM, Fairlamb AH, Fraunholz MJ, Roos DS, Ralph SA, McFadden GI, Cummings LM, Subramanian GM, Mungall C, Venter JC, Carucci DJ, Hoffman SL, Newbold C, Davis RW, Fraser CM, Barrell B: Genome sequence of the human malaria parasite Plasmodium falciparum.\n                           Nature 2002, 419: 498\u2013511. 10.1038\/nature01097","journal-title":"Nature"},{"key":"91_CR58","doi-asserted-by":"publisher","first-page":"3389","DOI":"10.1093\/nar\/25.17.3389","volume":"25","author":"SF Altschul","year":"1997","unstructured":"Altschul SF, Madden TL, Schaffer AA, Zhang J, Zhang Z, Miller W, Lipman DJ: Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.\n                           Nucleic Acids Res 1997, 25: 3389\u20133402. 10.1093\/nar\/25.17.3389","journal-title":"Nucleic Acids Res"},{"key":"91_CR59","doi-asserted-by":"publisher","first-page":"554","DOI":"10.1016\/S0076-6879(96)66035-2","volume":"266","author":"JC Wootton","year":"1996","unstructured":"Wootton JC, Federhen S: Analysis of compositionally biased regions in sequence databases.\n                           Methods Enzymol 1996, 266: 554\u2013571.","journal-title":"Methods Enzymol"},{"key":"91_CR60","doi-asserted-by":"publisher","first-page":"5857","DOI":"10.1073\/pnas.95.11.5857","volume":"95","author":"J Schultz","year":"1998","unstructured":"Schultz J, Milpetz F, Bork P, Ponting CP: SMART, a simple modular architecture research tool: identification of signaling domains.\n                           Proc Natl Acad Sci U S A 1998, 95: 5857\u20135864. 10.1073\/pnas.95.11.5857","journal-title":"Proc Natl Acad Sci U S A"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-4-41.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,13]],"date-time":"2024-09-13T11:57:21Z","timestamp":1726228641000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-4-41"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003,9,11]]},"references-count":60,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2003,12]]}},"alternative-id":["91"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-4-41","relation":{"has-review":[{"id-type":"doi","id":"10.3410\/f.1015729.198003","asserted-by":"object"}]},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2003,9,11]]},"assertion":[{"value":"20 May 2003","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 September 2003","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 September 2003","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"41"}}