{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T23:35:41Z","timestamp":1768001741773,"version":"3.49.0"},"reference-count":99,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2003,7,1]],"date-time":"2003-07-01T00:00:00Z","timestamp":1057017600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Nat Rev Genet"],"published-print":{"date-parts":[[2003,7]]},"DOI":"10.1038\/nrg1113","type":"journal-article","created":{"date-parts":[[2003,7,1]],"date-time":"2003-07-01T15:06:25Z","timestamp":1057071985000},"page":"508-519","source":"Crossref","is-referenced-by-count":90,"title":["Classification schemes for protein structure and function"],"prefix":"10.1038","volume":"4","author":[{"given":"Christos A.","family":"Ouzounis","sequence":"first","affiliation":[]},{"given":"Richard M. R.","family":"Coulson","sequence":"additional","affiliation":[]},{"given":"Anton J.","family":"Enright","sequence":"additional","affiliation":[]},{"given":"Victor","family":"Kunin","sequence":"additional","affiliation":[]},{"given":"Jos\u00e9 B.","family":"Pereira-Leal","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"BFnrg1113_CR1","first-page":"167","volume-title":"Philosophy of Biology","author":"M Ridley","year":"1989","unstructured":"Ridley, M. in Philosophy of Biology (ed. Ruse, M.) 167\u2013179 (Macmillan Publishing Co., New York, 1989)."},{"key":"BFnrg1113_CR2","volume-title":"A Short History of Biology","author":"I Asimov","year":"1964","unstructured":"Asimov, I. A Short History of Biology (Thomas Nelson & Sons Ltd., London, 1964)."},{"key":"BFnrg1113_CR3","doi-asserted-by":"crossref","first-page":"823","DOI":"10.1038\/35015694","volume":"405","author":"D Eisenberg","year":"2000","unstructured":"Eisenberg, D., Marcotte, E. M., Xenarios, I. & Yeates, T. O. Protein function in the post-genomic era. Nature 405, 823\u2013826 (2000).","journal-title":"Nature"},{"key":"BFnrg1113_CR4","doi-asserted-by":"crossref","first-page":"884","DOI":"10.1002\/(SICI)1521-1878(199811)20:11<884::AID-BIES3>3.0.CO;2-H","volume":"20","author":"MB Swindells","year":"1998","unstructured":"Swindells, M. B., Orengo, C. A., Jones, D. T., Hutchinson, E. G. & Thornton, J. M. Contemporary approaches to protein structure classification. Bioessays 20, 884\u2013891 (1998).","journal-title":"Bioessays"},{"key":"BFnrg1113_CR5","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1016\/S0079-6107(00)00013-4","volume":"73","author":"A Heger","year":"2000","unstructured":"Heger, A. & Holm, L. Towards a covering set of protein family profiles. Prog. Biophys. Mol. Biol. 73, 321\u2013337 (2000). A comprehensive analysis of strategies and resources for protein-sequence clustering and protein-family identification.","journal-title":"Prog. Biophys. Mol. Biol."},{"key":"BFnrg1113_CR6","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1016\/S1367-5931(02)00003-0","volume":"7","author":"J Liu","year":"2003","unstructured":"Liu, J. & Rost, B. Domains, motifs and clusters in the protein universe. Curr. Opin. Chem. Biol. 7, 5\u201311 (2003). An overview of present methods for protein-sequence clustering.","journal-title":"Curr. Opin. Chem. Biol."},{"key":"BFnrg1113_CR7","first-page":"536","volume":"247","author":"AG Murzin","year":"1995","unstructured":"Murzin, A. G., Brenner, S. E., Hubbart, T. & Chothia, C. SCOP: a structural classification of proteins database for the investigation of sequences and structures. J. Mol. Biol. 247, 536\u2013540 (1995).","journal-title":"J. Mol. Biol."},{"key":"BFnrg1113_CR8","doi-asserted-by":"crossref","first-page":"264","DOI":"10.1093\/nar\/30.1.264","volume":"30","author":"L Lo Conte","year":"2002","unstructured":"Lo Conte, L., Brenner, S. E., Hubbard, T. J., Chothia, C. & Murzin, A. G. SCOP database in 2002: refinements accommodate structural genomics. Nucl. Acids Res. 30, 264\u2013267 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR9","doi-asserted-by":"crossref","first-page":"1093","DOI":"10.1016\/S0969-2126(97)00260-8","volume":"5","author":"CA Orengo","year":"1997","unstructured":"Orengo, C. A. et al. CATH- a hierarchic classification of protein domain structures. Structure 5, 1093\u20131108 (1997).","journal-title":"Structure"},{"key":"BFnrg1113_CR10","doi-asserted-by":"crossref","first-page":"452","DOI":"10.1093\/nar\/gkg062","volume":"31","author":"FM Pearl","year":"2003","unstructured":"Pearl, F. M. et al. The CATH database: an extended protein family resource for structural and functional genomics. Nucl. Acids Res. 31, 452\u2013455 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR11","doi-asserted-by":"crossref","first-page":"1691","DOI":"10.1002\/pro.5560011217","volume":"1","author":"L Holm","year":"1992","unstructured":"Holm, L., Ouzounis, C., Sander, C., Tuparev, G. & Vriend, G. A database of protein structure families with common folding motifs. Protein Sci. 1, 1691\u20131698 (1992).","journal-title":"Protein Sci."},{"key":"BFnrg1113_CR12","doi-asserted-by":"crossref","first-page":"316","DOI":"10.1093\/nar\/26.1.316","volume":"26","author":"L Holm","year":"1998","unstructured":"Holm, L. & Sander, C. Touring protein fold space with Dali\/FSSP. Nucl. Acids Res. 26, 316\u2013319 (1998).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR13","doi-asserted-by":"crossref","first-page":"617","DOI":"10.1016\/S0076-6879(96)66038-8","volume":"266","author":"CA Orengo","year":"1996","unstructured":"Orengo, C. A. & Taylor, W. R. SSAP: sequential structure alignment program for protein structure comparison. Methods Enzymol. 266, 617\u2013635 (1996).","journal-title":"Methods Enzymol."},{"key":"BFnrg1113_CR14","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1006\/jmbi.1993.1489","volume":"233","author":"L Holm","year":"1993","unstructured":"Holm, L. & Sander, C. Protein structure comparison by alignment of distance matrices. J. Mol. Biol. 233, 123\u2013138 (1993).","journal-title":"J. Mol. Biol."},{"key":"BFnrg1113_CR15","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1016\/S0968-0004(00)89105-7","volume":"20","author":"L Holm","year":"1995","unstructured":"Holm, L. & Sander, C. Dali: a network tool for protein structure comparison. Trends Biochem. Sci. 20, 478\u2013480 (1995).","journal-title":"Trends Biochem. Sci."},{"key":"BFnrg1113_CR16","doi-asserted-by":"crossref","first-page":"595","DOI":"10.1126\/science.273.5275.595","volume":"273","author":"L Holm","year":"1996","unstructured":"Holm, L. & Sander, C. Mapping the protein universe. Science 273, 595\u2013602 (1996).","journal-title":"Science"},{"key":"BFnrg1113_CR17","doi-asserted-by":"crossref","first-page":"369","DOI":"10.1016\/S0959-440X(97)80054-1","volume":"7","author":"SE Brenner","year":"1997","unstructured":"Brenner, S. E., Chothia, C. & Hubbard, T. J. Population statistics of protein structures: lessons from structural classifications. Curr. Opin. Struct. Biol. 7, 369\u2013376 (1997).","journal-title":"Curr. Opin. Struct. Biol."},{"key":"BFnrg1113_CR18","doi-asserted-by":"crossref","first-page":"243","DOI":"10.1146\/annurev.genom.3.022502.103227","volume":"3","author":"SK Burley","year":"2002","unstructured":"Burley, S. K. & Bonanno, J. B. Structuring the universe of proteins. Ann. Rev. Genomics Hum. Genet. 3, 243\u2013262 (2002).","journal-title":"Ann. Rev. Genomics Hum. Genet."},{"key":"BFnrg1113_CR19","doi-asserted-by":"crossref","first-page":"2577","DOI":"10.1002\/bip.360221211","volume":"22","author":"W Kabsch","year":"1983","unstructured":"Kabsch, W. & Sander, C. Dictionary of protein secondary structure: pattern recognition of hydrogen-bonded and geometrical features. Biopolymers 22, 2577\u20132637 (1983).","journal-title":"Biopolymers"},{"key":"BFnrg1113_CR20","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1002\/prot.340090107","volume":"9","author":"C Sander","year":"1991","unstructured":"Sander, C. & Schneider, R. Database of homology-derived protein structures and the structural meaning of sequence alignment. Proteins 9, 56\u201368 (1991).","journal-title":"Proteins"},{"key":"BFnrg1113_CR21","doi-asserted-by":"crossref","first-page":"313","DOI":"10.1093\/nar\/26.1.313","volume":"26","author":"C Dodge","year":"1998","unstructured":"Dodge, C., Schneider, R. & Sander, C. The HSSP database of protein structure-sequence alignments and family profiles. Nucl. Acids Res. 26, 313\u2013315 (1998).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR22","doi-asserted-by":"crossref","first-page":"405","DOI":"10.1002\/(SICI)1097-0134(199707)28:3<405::AID-PROT10>3.0.CO;2-L","volume":"28","author":"EL Sonnhammer","year":"1997","unstructured":"Sonnhammer, E. L., Eddy, S. R. & Durbin, R. Pfam: a comprehensive database of protein domain families based on seed alignments. Proteins 28, 405\u2013420 (1997).","journal-title":"Proteins"},{"key":"BFnrg1113_CR23","doi-asserted-by":"crossref","first-page":"276","DOI":"10.1093\/nar\/30.1.276","volume":"30","author":"A Bateman","year":"2002","unstructured":"Bateman, A. et al. The Pfam protein families database. Nucl. Acids Res. 30, 276\u2013280 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR24","first-page":"3590","volume":"22","author":"TK Attwood","year":"1994","unstructured":"Attwood, T. K., Beck, M. E., Bleasby, A. J. & Parry-Smith, D. J. PRINTS \u2014 a database of protein motif fingerprints. Nucl. Acids Res. 22, 3590\u20133596 (1994).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR25","doi-asserted-by":"crossref","first-page":"400","DOI":"10.1093\/nar\/gkg030","volume":"31","author":"TK Attwood","year":"2003","unstructured":"Attwood, T. K. et al. PRINTS and its automatic supplement, prePRINTS. Nucl. Acids Res. 31, 400\u2013402 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR26","doi-asserted-by":"crossref","first-page":"5857","DOI":"10.1073\/pnas.95.11.5857","volume":"95","author":"J Schultz","year":"1998","unstructured":"Schultz, J., Milpets, F., Bork, P. & Ponting, C. P. SMART, a simple modular architecture research tool: identification of signaling domains. Proc. Natl Acad. Sci. USA 95, 5857\u20135864 (1998).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"BFnrg1113_CR27","doi-asserted-by":"crossref","first-page":"242","DOI":"10.1093\/nar\/30.1.242","volume":"30","author":"I Letunic","year":"2002","unstructured":"Letunic, I. et al. Recent improvements to the SMART domain-based sequence annotation resource. Nucl. Acids Res. 30, 242\u2013244 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR28","doi-asserted-by":"crossref","first-page":"2241","DOI":"10.1093\/nar\/19.suppl.2241","volume":"19","author":"A Bairoch","year":"1991","unstructured":"Bairoch, A. PROSITE: a dictionary of sites and patterns in proteins. Nucl. Acids Res. 19, 2241\u20132245 (1991).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR29","doi-asserted-by":"crossref","first-page":"235","DOI":"10.1093\/nar\/30.1.235","volume":"30","author":"L Falquet","year":"2002","unstructured":"Falquet, L. et al. The PROSITE database, its status in 2002. Nucl. Acids Res. 30, 235\u2013238 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR30","doi-asserted-by":"crossref","first-page":"41","DOI":"10.1093\/nar\/29.1.41","volume":"29","author":"DH Haft","year":"2001","unstructured":"Haft, D. H. et al. TIGRFAMs: a protein family resource for the functional identification of proteins. Nucl. Acids Res. 29, 41\u201343 (2001).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR31","doi-asserted-by":"crossref","first-page":"371","DOI":"10.1093\/nar\/gkg128","volume":"31","author":"DH Haft","year":"2003","unstructured":"Haft, D. H., Selengut, J. D. & White, O. The TIGRFAMs database of protein families. Nucl. Acids Res. 31, 371\u2013373 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR32","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1093\/nar\/26.1.323","volume":"26","author":"F Corpet","year":"1998","unstructured":"Corpet, F., Gouzy, J. & Kahn, D. The ProDom database of protein domain families. Nucl. Acids Res. 26, 323\u2013326 (1998).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR33","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1093\/nar\/28.1.267","volume":"28","author":"F Corpet","year":"2000","unstructured":"Corpet, F., Servant, F., Gouzy, J. & Kahn, D. ProDom and ProDom-CG: tools for protein domain analysis and whole genome comparisons. Nucl. Acids Res. 28, 267\u2013269 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR34","doi-asserted-by":"crossref","first-page":"6565","DOI":"10.1093\/nar\/19.23.6565","volume":"19","author":"S Henikoff","year":"1991","unstructured":"Henikoff, S. & Henikoff, J. G. Automated assembly of protein blocks for database searching. Nucl. Acids Res. 19, 6565\u201365672 (1991).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR35","doi-asserted-by":"crossref","first-page":"471","DOI":"10.1093\/bioinformatics\/15.6.471","volume":"15","author":"S Henikoff","year":"1999","unstructured":"Henikoff, S., Henikoff, J. G. & Pietrokovski, S. Blocks+: a non-redundant database of protein alignment blocks derived from multiple compilations. Bioinformatics 15, 471\u2013479 (1999).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR36","doi-asserted-by":"crossref","first-page":"5865","DOI":"10.1073\/pnas.95.11.5865","volume":"95","author":"CG Nevill-Maning","year":"1998","unstructured":"Nevill-Maning, C. G., Wu, T. D. & Brutlag, D. L. Highly specific protein sequence motifs for genome analysis. Proc. Natl Acad. Sci. USA 95, 5865\u20135871 (1998).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"BFnrg1113_CR37","doi-asserted-by":"crossref","first-page":"202","DOI":"10.1093\/nar\/29.1.202","volume":"29","author":"JY Huang","year":"2001","unstructured":"Huang, J. Y. & Brutlag, D. L. The EMOTIF database. Nucl. Acids Res. 29, 202\u2013204 (2001).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR38","doi-asserted-by":"crossref","first-page":"3901","DOI":"10.1093\/nar\/gkf464","volume":"30","author":"I Rigoutsos","year":"2002","unstructured":"Rigoutsos, I., Huynh, T., Floratos, A., Parida, L. & Platt, D. Dictionary-driven protein annotation. Nucl. Acids Res. 30, 3901\u20133916 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR39","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1093\/nar\/30.1.299","volume":"30","author":"A Krause","year":"2002","unstructured":"Krause, A., Haas, S. A., Coward, E. & Vingron, M. SYSTERS, GeneNet, SpliceNest: exploring sequence space from genome to protein. Nucl. Acids Res. 30, 299\u2013300 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR40","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1093\/nar\/29.1.33","volume":"29","author":"EV Kriventseva","year":"2001","unstructured":"Kriventseva, E. V., Fleischmann, W., Zdobnov, E. M. & Apweiler, R. CluSTr: a database of clusters of SWISS-PROT+TrEMBL proteins. Nucl. Acids Res. 29, 33\u201336 (2001).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR41","doi-asserted-by":"crossref","first-page":"388","DOI":"10.1093\/nar\/gkg035","volume":"31","author":"EV Kriventseva","year":"2003","unstructured":"Kriventseva, E. V., Servant, F. & Apweiler, R. Improvements to CluSTr: the database of SWISS-PROT+TrEMBL protein clusters. Nucl. Acids Res. 31, 388\u2013389 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR42","doi-asserted-by":"crossref","first-page":"631","DOI":"10.1126\/science.278.5338.631","volume":"278","author":"RL Tatusov","year":"1997","unstructured":"Tatusov, R. L., Koonin, E. V. & Lipman, D. J. A genomic perspective on protein families. Science 278, 631\u2013637 (1997).","journal-title":"Science"},{"key":"BFnrg1113_CR43","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1093\/nar\/gkg033","volume":"31","author":"DL Wheeler","year":"2003","unstructured":"Wheeler, D. L. et al. Database resources of the National Center for Biotechnology Information. Nucl. Acids Res. 31, 28\u201333 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR44","doi-asserted-by":"crossref","first-page":"360","DOI":"10.1002\/(SICI)1097-0134(19991115)37:3<360::AID-PROT5>3.0.CO;2-Z","volume":"37","author":"G Yona","year":"1999","unstructured":"Yona, G., Linial, N. & Linial, M. ProtoMap: automatic classification of protein sequences, a hierarchy of protein families, and local maps of the protein space. Proteins 37, 360\u2013378 (1999).","journal-title":"Proteins"},{"key":"BFnrg1113_CR45","doi-asserted-by":"crossref","first-page":"49","DOI":"10.1093\/nar\/28.1.49","volume":"28","author":"G Yona","year":"2000","unstructured":"Yona, G., Linial, N. & Linial, M. ProtoMap: automatic classification of protein sequences and hierarchy of protein families. Nucl. Acids Res. 28, 49\u201355 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR46","doi-asserted-by":"crossref","first-page":"249","DOI":"10.1093\/bioinformatics\/17.3.249","volume":"17","author":"KA Silverstein","year":"2001","unstructured":"Silverstein, K. A., Shoop, E., Johnson, J. E. & Retzel, E. F. MetaFam: a unified classification of protein families. I. Overview and statistics. Bioinformatics 17, 249\u2013261 (2001).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR47","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1093\/bioinformatics\/17.3.262","volume":"17","author":"E Shoop","year":"2001","unstructured":"Shoop, E., Silverstein, K. A., Johnson, J. E. & Retzel, E. F. MetaFam: a unified classification of protein families. II. Schema and query capabilities. Bioinformatics 17, 262\u2013271 (2001).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR48","doi-asserted-by":"crossref","unstructured":"Enright, A. J., Kunin, V. & Ouzounis, C. A. Protein families and TRIBEs in genome sequence space. Nucl. Acids Res. (in the press).","DOI":"10.1093\/nar\/gkg495"},{"key":"BFnrg1113_CR49","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1093\/nar\/gkg046","volume":"31","author":"NJ Mulder","year":"2003","unstructured":"Mulder, N. J. et al. The InterPro database, 2003 brings increased coverage and new features. Nucl. Acids Res. 31, 315\u2013318 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR50","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1093\/bioinformatics\/14.1.55","volume":"14","author":"I Rigoutsos","year":"1998","unstructured":"Rigoutsos, I. & Floratos, A. Combinatorial pattern discovery in biological sequences: the TEIRESIAS algorithm. Bioinformatics 14, 55\u201367 (1998).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR51","doi-asserted-by":"crossref","first-page":"1575","DOI":"10.1093\/nar\/30.7.1575","volume":"30","author":"AJ Enright","year":"2002","unstructured":"Enright, A. J., van Dongen, S. & Ouzounis, C. A. An efficient algorithm for large-scale detection of protein families. Nucl. Acids Res. 30, 1575\u20131584 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR52","doi-asserted-by":"crossref","first-page":"3626","DOI":"10.1093\/nar\/22.17.3626","volume":"22","author":"A Bairoch","year":"1993","unstructured":"Bairoch, A. The ENZYME data bank. Nucl. Acids Res. 22, 3626\u20133627 (1993).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR53","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1093\/nar\/28.1.304","volume":"28","author":"A Bairoch","year":"2000","unstructured":"Bairoch, A. The ENZYME database in 2000. Nucl. Acids Res. 28, 304\u2013305 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR54","doi-asserted-by":"crossref","first-page":"46","DOI":"10.1093\/nar\/24.1.46","volume":"24","author":"JI Garrels","year":"1996","unstructured":"Garrels, J. I. YPD \u2014 a database for the proteins of Saccharomyces cerevisiae. Nucl. Acids Res. 24, 46\u201349 (1996).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR55","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1093\/nar\/27.1.69","volume":"27","author":"PE Hodges","year":"1999","unstructured":"Hodges, P. E., McKee, A. H., Davis, B. P., Payne, W. E. & Garrels, J. I. The Yeast Proteome Database (YPD): a model for the organization and presentation of genome-wide functional data. Nucl. Acids Res. 27, 69\u201373 (1999).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR56","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1093\/nar\/26.1.73","volume":"26","author":"JM Cherry","year":"1998","unstructured":"Cherry, J. M. et al. SGD: Saccharomyces Genome Database. Nucl. Acids Res. 26, 73\u201379 (1998).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR57","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1093\/nar\/30.1.69","volume":"30","author":"SS Dwight","year":"2002","unstructured":"Dwight, S. S. et al. Saccharomyces Genome Database (SGD) provides secondary gene annotation using the Gene Ontology (GO). Nucl. Acids Res. 30, 69\u201372 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR58","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1093\/nar\/27.1.44","volume":"27","author":"HW Mewes","year":"1999","unstructured":"Mewes, H. W. et al. MIPS: a database for genomes and protein sequences. Nucl. Acids Res. 27, 44\u201348 (1999).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR59","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1093\/nar\/30.1.31","volume":"30","author":"HW Mewes","year":"2002","unstructured":"Mewes, H. W. et al. MIPS: a database for genomes and protein sequences. Nucl. Acids Res. 30, 31\u201334 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR60","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1093\/nar\/28.1.123","volume":"28","author":"R Overbeek","year":"2000","unstructured":"Overbeek, R. et al. WIT: integrated system for high-throughput genome sequence analysis and metabolic reconstruction. Nucl. Acids Res. 28, 123\u2013125 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR61","doi-asserted-by":"crossref","first-page":"3442","DOI":"10.1093\/nar\/28.18.3442","volume":"28","author":"B Snel","year":"2000","unstructured":"Snel, B., Lehmann, G., Bork, P. & Huynen, M. A. STRING: a web-server to retrieve and display the repeatedly occurring neighbourhood of a gene. Nucl. Acids Res. 28, 3442\u20133444 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR62","doi-asserted-by":"crossref","first-page":"258","DOI":"10.1093\/nar\/gkg034","volume":"31","author":"C von Mering","year":"2003","unstructured":"von Mering, C. et al. STRING: a database of predicted functional associations between proteins. Nucl. Acids Res. 31, 258\u2013261 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR63","doi-asserted-by":"crossref","first-page":"751","DOI":"10.1126\/science.285.5428.751","volume":"285","author":"EM Marcotte","year":"1999","unstructured":"Marcotte, E. M. et al. Detecting protein function and protein\u2013protein interactions from genome sequences. Science 285, 751\u2013753 (1999).","journal-title":"Science"},{"key":"BFnrg1113_CR64","doi-asserted-by":"crossref","first-page":"4285","DOI":"10.1073\/pnas.96.8.4285","volume":"96","author":"M Pellegrini","year":"1999","unstructured":"Pellegrini, M., Marcotte, E. M., Thompson, M. J., Eisenberg, D. & Yeates, T. O. Assigning protein functions by comparative genome analysis: protein phylogenetic profiles. Proc. Natl Acad. Sci. USA 96, 4285\u20134288 (1999). This paper introduces the concept of phylogenetic profiles, and the idea that similar phylogenetic profiles indicate functional association between genes.","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"BFnrg1113_CR65","doi-asserted-by":"crossref","first-page":"0031","DOI":"10.1186\/gb-2001-2-9-research0034","volume":"2","author":"AJ Enright","year":"2001","unstructured":"Enright, A. J. & Ouzounis, C. A. Functional associations of proteins in entire genomes via exhaustive detection of gene fusion. Genome Biol. 2, 0031\u20130037 (2001).","journal-title":"Genome Biol."},{"key":"BFnrg1113_CR66","doi-asserted-by":"crossref","first-page":"86","DOI":"10.1038\/47056","volume":"402","author":"AJ Enright","year":"1999","unstructured":"Enright, A. J., Iliopoulos, I., Kyrpides, N. C. & Ouzounis, C. A. Protein interaction maps for complete genomes based on gene fusion events. Nature 402, 86\u201390 (1999).","journal-title":"Nature"},{"key":"BFnrg1113_CR67","doi-asserted-by":"crossref","first-page":"7940","DOI":"10.1073\/pnas.141236298","volume":"98","author":"I Yanai","year":"2001","unstructured":"Yanai, I., Derti, A. & DeLici, C. Genes linked by fusion events are generally of the same functional category: a systematic analysis of 30 microbial genomes. Proc. Natl Acad. Sci. USA 98, 7940\u20137945 (2001). This paper is a 'proof of principle' that gene-fusion events can be used to infer functional associations, as proposed in references 63 and 65.","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"BFnrg1113_CR68","doi-asserted-by":"crossref","first-page":"306","DOI":"10.1093\/nar\/30.1.306","volume":"30","author":"JC Mellor","year":"2002","unstructured":"Mellor, J. C., Yanai, I., Clodfelter, K. H., Mintseris, J. & DeLisi, C. Predictome: a database of putative functional links between proteins. Nucl. Acids Res. 30, 306\u2013309 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR69","doi-asserted-by":"crossref","first-page":"862","DOI":"10.1128\/MMBR.57.4.862-952.1993","volume":"57","author":"M Riley","year":"1993","unstructured":"Riley, M. Functions of the gene products of Escherichia coli. Microbiol. Rev. 57, 862\u2013952 (1993). The original comprehensive functional-classification scheme, developed for the gene products of the E. coli genome.","journal-title":"Microbiol. Rev."},{"key":"BFnrg1113_CR70","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1089\/mcg.2000.5.205","volume":"5","author":"MH Serres","year":"2000","unstructured":"Serres, M. H. & Riley, M. MultiFun, a multifunctional classification scheme for Escherichia coli K-12 gene products. Microb. Comp. Genomics 5, 205\u2013222 (2000).","journal-title":"Microb. Comp. Genomics"},{"key":"BFnrg1113_CR71","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1093\/bioinformatics\/15.5.391","volume":"15","author":"MA Andrade","year":"1999","unstructured":"Andrade, M. A. et al. Automated genome sequence analysis and annotation. Bioinformatics 15, 391\u2013412 (1999).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR72","doi-asserted-by":"crossref","first-page":"542","DOI":"10.1093\/bioinformatics\/14.6.542","volume":"14","author":"J Tamames","year":"1998","unstructured":"Tamames, J., Ouzounis, C., Casari, G., Sander, C. & Valencia, A. EUCLID: automatic classification of proteins in functional classes by their database annotations. Bioinformatics 14, 542\u2013543 (1998).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR73","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"MA Ashburner","year":"2000","unstructured":"Ashburner, M. A. et al. Gene ontology: tool for the unification of biology. Nature Genet. 25, 25\u201329 (2000). This paper describes the development of a dynamic controlled vocabulary for the functional annotation of eukaryotic gene products.","journal-title":"Nature Genet."},{"key":"BFnrg1113_CR74","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1093\/nar\/24.1.32","volume":"24","author":"PD Karp","year":"1996","unstructured":"Karp, P. D., Riley, M., Paley, S. M. & Pellegrini-Toole, A. EcoCyc: an encyclopedia of Escherichia coli genes and metabolism. Nucl. Acids Res. 24, 32\u201339 (1996).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR75","first-page":"116","volume":"4","author":"PD Karp","year":"1996","unstructured":"Karp, P. D., Ouzounis, C. & Paley, S. HinCyc: a knowledge base of the complete genome and metabolic pathways of H. influenzae. Proc. Int. Conf. Intell. Syst. Mol. Biol. 4, 116\u2013124 (1996).","journal-title":"Proc. Int. Conf. Intell. Syst. Mol. Biol."},{"key":"BFnrg1113_CR76","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1093\/nar\/30.1.59","volume":"30","author":"PD Karp","year":"2002","unstructured":"Karp, P. D., Riley, M., Paley, S. M. & Pellegrini-Toole, A. The MetaCyc database. Nucl. Acids Res. 30, 59\u201361 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR77","doi-asserted-by":"crossref","first-page":"42","DOI":"10.1093\/nar\/30.1.42","volume":"30","author":"M Kanehisa","year":"2002","unstructured":"Kanehisa, M., Goto, S., Kawashima, S. & Nakaya, A. The KEGG databases at GenomeNet. Nucl. Acids Res. 30, 42\u201346 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR78","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1093\/nar\/27.1.29","volume":"27","author":"H Ogata","year":"1999","unstructured":"Ogata, H. et al. KEGG: Kyoto Encyclopedia of Genes and Genomes. Nucl. Acids Res. 27, 29\u201334 (1999).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR79","doi-asserted-by":"crossref","first-page":"289","DOI":"10.1093\/nar\/28.1.289","volume":"28","author":"I Xenarios","year":"2000","unstructured":"Xenarios, I. et al. DIP: the database of interacting proteins. Nucl. Acids Res. 28, 289\u2013291 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR80","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1093\/nar\/30.1.303","volume":"30","author":"I Xenarios","year":"2002","unstructured":"Xenarios, I. et al. DIP, the Database of Interacting Protiens: a research tool for studying cellular networks of protein interactions. Nucl. Acids Res. 30, 303\u2013305 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR81","doi-asserted-by":"crossref","first-page":"80","DOI":"10.1093\/nar\/30.1.80","volume":"30","author":"G Habeler","year":"2002","unstructured":"Habeler, G. et al. YPL.db: the Yeast Protein Localization database. Nucl. Acids Res. 30, 80\u201383 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR82","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1093\/nar\/28.1.81","volume":"28","author":"A Kumar","year":"2000","unstructured":"Kumar, A. et al. TRIPLES: a database of gene function in Saccharomyces cerevisiae. Nucl. Acids Res. 28, 81\u201384 (2000).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR83","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1093\/nar\/30.1.73","volume":"30","author":"A Kumar","year":"2002","unstructured":"Kumar, A. et al. The TRIPLES database: a community resource for yeast molecular biology. Nucl. Acids Res. 30, 73\u201375 (2002).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR84","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1016\/S0014-5793(01)03293-8","volume":"513","author":"A Zanzoni","year":"2002","unstructured":"Zanzoni, A. et al. MINT: a Molecular INTeraction database. FEBS Lett. 513, 135\u2013140 (2002).","journal-title":"FEBS Lett."},{"key":"BFnrg1113_CR85","doi-asserted-by":"crossref","first-page":"242","DOI":"10.1093\/nar\/29.1.242","volume":"29","author":"GD Bader","year":"2001","unstructured":"Bader, G. D. et al. BIND \u2014 the Biomolecular Interaction Network Database. Nucl. Acids Res. 29, 242\u2013245 (2001).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR86","doi-asserted-by":"crossref","first-page":"248","DOI":"10.1093\/nar\/gkg056","volume":"31","author":"GD Bader","year":"2003","unstructured":"Bader, G. D., Betel, D. & Hogue, C. W. BIND: the Biomolecular Interaction Network Database. Nucl. Acids Res. 31, 248\u2013250 (2003).","journal-title":"Nucl. Acids Res."},{"key":"BFnrg1113_CR87","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1038\/35051615","volume":"409","author":"JC Rain","year":"2001","unstructured":"Rain, J. C. et al. The protein\u2013protein interaction map of Helicobacter pylori. Nature 409, 211\u2013215 (2001). The only genome-wide protein-interaction map, so far, to be constructed for a prokaryote.","journal-title":"Nature"},{"key":"BFnrg1113_CR88","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1038\/415141a","volume":"415","author":"AC Gavin","year":"2002","unstructured":"Gavin, A. C. et al. Functional organization of the yeast proteome by systematic analysis of protein complexes. Nature 415, 141\u2013147 (2002). This paper describes the identification of yeast-protein complexes using large-scale tandem-affinity purification coupled to mass spectrometry.","journal-title":"Nature"},{"key":"BFnrg1113_CR89","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1186\/1471-2105-4-2","volume":"4","author":"GD Bader","year":"2003","unstructured":"Bader, G. D. & Hogue, C. W. An automated method for finding molecular complexes in large protein interaction networks. BMC Bioinformatics 4, 2 (2003).","journal-title":"BMC Bioinformatics"},{"key":"BFnrg1113_CR90","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1007\/s101420000005","volume":"1","author":"SC Rison","year":"2000","unstructured":"Rison, S. C., Hodgman, T. C. & Thornton, J. M. Comparison of functional annotation schemes for genomes. Funct. Integr. Genomics 1, 56\u201369 (2000). An in-depth analysis and comparison of present functional classification schemes.","journal-title":"Funct. Integr. Genomics"},{"key":"BFnrg1113_CR91","doi-asserted-by":"crossref","first-page":"717","DOI":"10.1093\/bioinformatics\/btg077","volume":"19","author":"I Iliopoulos","year":"2003","unstructured":"Iliopoulos, I. et al. Evaluation of annotation strategies using an entire genome sequence. Bioinformatics 19, 717\u2013726 (2003).","journal-title":"Bioinformatics"},{"key":"BFnrg1113_CR92","doi-asserted-by":"crossref","first-page":"218","DOI":"10.1038\/nature01256","volume":"420","author":"EV Koonin","year":"2002","unstructured":"Koonin, E. V., Wolf, Y. I. & Karev, G. P. The structure of the protein universe and genome evolution. Nature 420, 218\u2013223 (2002).","journal-title":"Nature"},{"key":"BFnrg1113_CR93","doi-asserted-by":"crossref","first-page":"399","DOI":"10.1038\/nature750","volume":"417","author":"C von Mering","year":"2002","unstructured":"von Mering, C. et al. Comparative assessment of large-scale data sets of protein\u2013protein interactions. Nature 417, 399\u2013403 (2002).","journal-title":"Nature"},{"key":"BFnrg1113_CR94","doi-asserted-by":"crossref","first-page":"349","DOI":"10.1074\/mcp.M100037-MCP200","volume":"1","author":"CM Deane","year":"2002","unstructured":"Deane, C. M., Salwinski, L., Xenarios, I. & Eisenberg, D. Protein interactions: two methods for assessment of the reliability of high throughput observations. Mol. Cell Proteomics 1, 349\u2013356 (2002).","journal-title":"Mol. Cell Proteomics"},{"key":"BFnrg1113_CR95","doi-asserted-by":"crossref","first-page":"510","DOI":"10.1126\/science.214.4520.510","volume":"214","author":"E Mayr","year":"1981","unstructured":"Mayr, E. Biological classification: toward a synthesis of opposing methodologies. Science 214, 510\u2013516 (1981).","journal-title":"Science"},{"key":"BFnrg1113_CR96","first-page":"21","volume":"28","author":"TK Jenssen","year":"2001","unstructured":"Jenssen, T. K., Laegreid, A., Komorowski, J. & Hovig, E. A literature network of human genes for high-throughput analysis of gene expression. Nature Genet. 28, 21\u201328 (2001). An automated analysis of the biomedical literature that identifies large-scale functional associations between thousands of human genes.","journal-title":"Nature Genet."},{"key":"BFnrg1113_CR97","doi-asserted-by":"crossref","first-page":"754","DOI":"10.1126\/science.282.5389.754","volume":"282","author":"RS Stephens","year":"1998","unstructured":"Stephens, R. S. et al. Genome sequence of an obligate intracellular pathogen of humans: Chlamydia trachomatis. Science 282, 754\u2013759 (1998).","journal-title":"Science"},{"key":"BFnrg1113_CR98","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1002\/1097-0061(20000630)17:2<95::AID-YEA16>3.0.CO;2-H","volume":"17","author":"M Fromont-Racine","year":"2000","unstructured":"Fromont-Racine, M. et al. Genome-wide protein interaction screens reveal functional networks involving Sm-like proteins. Yeast 17, 95\u2013110 (2000). This paper describes the first large-scale use of two-hybrid arrays to identify protein interactions in yeast.","journal-title":"Yeast"},{"key":"BFnrg1113_CR99","doi-asserted-by":"crossref","first-page":"623","DOI":"10.1038\/35001009","volume":"403","author":"P Uetz","year":"2000","unstructured":"Uetz, P. et al. A comprehensive analysis of protein\u2013protein interactions in Saccharomyces cerevisiae. Nature 403, 623\u2013627 (2000).","journal-title":"Nature"}],"container-title":["Nature Reviews Genetics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/www.nature.com\/articles\/nrg1113.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/www.nature.com\/articles\/nrg1113","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/www.nature.com\/articles\/nrg1113.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,19]],"date-time":"2023-05-19T03:55:45Z","timestamp":1684468545000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/nrg1113"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003,7]]},"references-count":99,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2003,7]]}},"alternative-id":["BFnrg1113"],"URL":"https:\/\/doi.org\/10.1038\/nrg1113","relation":{},"ISSN":["1471-0056","1471-0064"],"issn-type":[{"value":"1471-0056","type":"print"},{"value":"1471-0064","type":"electronic"}],"subject":[],"published":{"date-parts":[[2003,7]]}}}