{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,4]],"date-time":"2026-03-04T23:37:45Z","timestamp":1772667465609,"version":"3.50.1"},"reference-count":32,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,10,13]],"date-time":"2012-10-13T00:00:00Z","timestamp":1350086400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2012,12]]},"DOI":"10.1186\/1471-2105-13-264","type":"journal-article","created":{"date-parts":[[2012,10,13]],"date-time":"2012-10-13T04:38:10Z","timestamp":1350103090000},"source":"Crossref","is-referenced-by-count":21,"title":["Sifting through genomes with iterative-sequence clustering produces a large, phylogenetically diverse protein-family resource"],"prefix":"10.1186","volume":"13","author":[{"given":"Thomas J","family":"Sharpton","sequence":"first","affiliation":[]},{"given":"Guillaume","family":"Jospin","sequence":"additional","affiliation":[]},{"given":"Dongying","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Morgan GI","family":"Langille","sequence":"additional","affiliation":[]},{"given":"Katherine S","family":"Pollard","sequence":"additional","affiliation":[]},{"given":"Jonathan A","family":"Eisen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,10,13]]},"reference":[{"issue":"21","key":"5411_CR1","doi-asserted-by":"publisher","first-page":"6688","DOI":"10.1093\/nar\/gkn668","volume":"36","author":"EV Koonin","year":"2008","unstructured":"Koonin EV, Wolf YI: Genomics of bacteria and archaea: the emerging dynamic view of the prokaryotic world. Nucleic Acids Res 2008, 36(21):6688\u20136719. 10.1093\/nar\/gkn668","journal-title":"Nucleic Acids Res"},{"issue":"6819","key":"5411_CR2","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/35054089","volume":"409","author":"NT Perna","year":"2001","unstructured":"Perna NT, et al.: Genome sequence of enterohaemorrhagic Escherichia coli O157:H7. Nature 2001, 409(6819):529\u2013533. 10.1038\/35054089","journal-title":"Nature"},{"issue":"39","key":"5411_CR3","doi-asserted-by":"publisher","first-page":"13950","DOI":"10.1073\/pnas.0506758102","volume":"102","author":"H Tettelin","year":"2005","unstructured":"Tettelin H, et al.: Genome analysis of multiple pathogenic isolates of Streptococcus agalactiae: implications for the microbial \u201cpan-genome\u201d. Proc Natl Acad Sci USA 2005, 102(39):13950\u201313955. 10.1073\/pnas.0506758102","journal-title":"Proc Natl Acad Sci USA"},{"issue":"20","key":"5411_CR4","doi-asserted-by":"publisher","first-page":"6881","DOI":"10.1128\/JB.00619-08","volume":"190","author":"DA Rasko","year":"2008","unstructured":"Rasko DA, et al.: The pangenome structure of Escherichia coli: comparative genomic analysis of E. coli commensal and pathogenic isolates. J Bacteriol 2008, 190(20):6881\u20136893. 10.1128\/JB.00619-08","journal-title":"J Bacteriol"},{"issue":"7276","key":"5411_CR5","doi-asserted-by":"publisher","first-page":"1056","DOI":"10.1038\/nature08656","volume":"462","author":"D Wu","year":"2009","unstructured":"Wu D, et al.: A phylogeny-driven genomic encyclopaedia of Bacteria and Archaea. Nature 2009, 462(7276):1056\u20131060. 10.1038\/nature08656","journal-title":"Nature"},{"issue":"3","key":"5411_CR6","doi-asserted-by":"publisher","first-page":"e16","DOI":"10.1371\/journal.pbio.0050016","volume":"5","author":"S Yooseph","year":"2007","unstructured":"Yooseph S, et al.: The Sorcerer II Global Ocean Sampling expedition: expanding the universe of protein families. PLoS Biol 2007, 5(3):e16. 10.1371\/journal.pbio.0050016","journal-title":"PLoS Biol"},{"issue":"5338","key":"5411_CR7","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1126\/science.278.5338.631","volume":"278","author":"RL Tatusov","year":"1997","unstructured":"Tatusov RL, Koonin EV, Lipman DJ: A genomic perspective on protein families. Science 1997, 278(5338):631\u2013637. 10.1126\/science.278.5338.631","journal-title":"Science"},{"issue":"Database issue","key":"5411_CR8","first-page":"D190-5","volume":"36","author":"TU Consortium","year":"2008","unstructured":"Consortium TU: The universal protein resource (UniProt). Nucleic Acids Res 2008, 36(Database issue):D190\u20135.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"5411_CR9","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1093\/nar\/28.1.27","volume":"28","author":"M Kanehisa","year":"2000","unstructured":"Kanehisa M, Goto S: KEGG: kyoto encyclopedia of genes and genomes. Nucleic Acids Res 2000, 28(1):27\u201330. 10.1093\/nar\/28.1.27","journal-title":"Nucleic Acids Res"},{"issue":"Database issue","key":"5411_CR10","doi-asserted-by":"publisher","first-page":"D471","DOI":"10.1093\/nar\/gkn661","volume":"37","author":"T Lima","year":"2009","unstructured":"Lima T, et al.: HAMAP: a database of completely sequenced microbial proteome sets and manually curated microbial protein families in UniProtKB\/Swiss-Prot. Nucleic Acids Res 2009, 37(Database issue):D471-D478.","journal-title":"Nucleic Acids Res"},{"issue":"20","key":"5411_CR11","doi-asserted-by":"publisher","first-page":"6643","DOI":"10.1093\/nar\/gkp698","volume":"37","author":"F Meyer","year":"2009","unstructured":"Meyer F, Overbeek R, Rodriguez A: FIGfams: yet another set of protein families. Nucleic Acids Res 2009, 37(20):6643\u20136654. 10.1093\/nar\/gkp698","journal-title":"Nucleic Acids Res"},{"issue":"Database issue","key":"5411_CR12","doi-asserted-by":"publisher","first-page":"D290","DOI":"10.1093\/nar\/gkr1065","volume":"40","author":"M Punta","year":"2012","unstructured":"Punta M, et al.: The Pfam protein families database. Nucleic Acids Res 2012, 40(Database issue):D290-D301.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"5411_CR13","doi-asserted-by":"publisher","first-page":"371","DOI":"10.1093\/nar\/gkg128","volume":"31","author":"DH Haft","year":"2003","unstructured":"Haft DH, Selengut JD, White O: The TIGRFAMs database of protein families. Nucleic Acids Res 2003, 31(1):371\u2013373. 10.1093\/nar\/gkg128","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"5411_CR14","doi-asserted-by":"publisher","first-page":"334","DOI":"10.1093\/nar\/gkg115","volume":"31","author":"PD Thomas","year":"2003","unstructured":"Thomas PD, et al.: PANTHER: a browsable database of gene products organized by biological function, using curated protein family and subfamily classification. Nucleic Acids Res 2003, 31(1):334\u2013341. 10.1093\/nar\/gkg115","journal-title":"Nucleic Acids Res"},{"issue":"9","key":"5411_CR15","doi-asserted-by":"publisher","first-page":"R83","DOI":"10.1186\/gb-2006-7-9-r83","volume":"7","author":"N Krishnamurthy","year":"2006","unstructured":"Krishnamurthy N, et al.: PhyloFacts: an online structural phylogenomic encyclopedia for protein functional and structural classification. Genome Biol 2006, 7(9):R83. 10.1186\/gb-2006-7-9-r83","journal-title":"Genome Biol"},{"issue":"Database issue","key":"5411_CR16","doi-asserted-by":"publisher","first-page":"D216","DOI":"10.1093\/nar\/gkn734","volume":"37","author":"W Klimke","year":"2009","unstructured":"Klimke W, et al.: The National Center for Biotechnology Information\u2019s Protein Clusters Database. Nucleic Acids Res 2009, 37(Database issue):D216-D223.","journal-title":"Nucleic Acids Res"},{"issue":"Database issue","key":"5411_CR17","doi-asserted-by":"publisher","first-page":"D284","DOI":"10.1093\/nar\/gkr1060","volume":"40","author":"S Powell","year":"2012","unstructured":"Powell S, et al.: eggNOG v3.0: orthologous groups covering 1133 organisms at 41 different taxonomic ranges. Nucleic Acids Res 2012, 40(Database issue):D284-D289.","journal-title":"Nucleic Acids Res"},{"issue":"3","key":"5411_CR18","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1093\/bib\/bbl004","volume":"7","author":"I Friedberg","year":"2006","unstructured":"Friedberg I: Automated protein function prediction\u2013the genomic challenge. Brief Bioinform 2006, 7(3):225\u2013242. 10.1093\/bib\/bbl004","journal-title":"Brief Bioinform"},{"issue":"10","key":"5411_CR19","doi-asserted-by":"publisher","first-page":"1722","DOI":"10.1101\/gr.087551.108","volume":"19","author":"TJ Sharpton","year":"2009","unstructured":"Sharpton TJ, et al.: Comparative genomic analyses of the human fungal pathogens Coccidioides and their relatives. Genome Res 2009, 19(10):1722\u20131731. 10.1101\/gr.087551.108","journal-title":"Genome Res"},{"issue":"3","key":"5411_CR20","doi-asserted-by":"publisher","first-page":"e9773","DOI":"10.1371\/journal.pone.0009773","volume":"5","author":"WP Inskeep","year":"2010","unstructured":"Inskeep WP, et al.: Metagenomes from high-temperature chemotrophic systems reveal geochemical controls on microbial community structure and function. PLoS One 2010, 5(3):e9773. 10.1371\/journal.pone.0009773","journal-title":"PLoS One"},{"issue":"7","key":"5411_CR21","doi-asserted-by":"publisher","first-page":"1575","DOI":"10.1093\/nar\/30.7.1575","volume":"30","author":"AJ Enright","year":"2002","unstructured":"Enright AJ, Van Dongen S, Ouzounis CA: An efficient algorithm for large-scale detection of protein families. Nucleic Acids Res 2002, 30(7):1575\u20131584. 10.1093\/nar\/30.7.1575","journal-title":"Nucleic Acids Res"},{"key":"5411_CR22","first-page":"RRN1198","volume":"2","author":"K Liu","year":"2010","unstructured":"Liu K, Linder CR, Warnow T: Multiple sequence alignment: a major challenge to large-scale phylogenetics. PLoS Curr 2010, 2: RRN1198.","journal-title":"PLoS Curr"},{"key":"5411_CR23","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1007\/978-1-60761-977-2_3","volume":"694","author":"J McDowall","year":"2011","unstructured":"McDowall J, Hunter S: InterPro protein classification. Methods Mol Biol 2011, 694: 37\u201347. 10.1007\/978-1-60761-977-2_3","journal-title":"Methods Mol Biol"},{"issue":"4","key":"5411_CR24","doi-asserted-by":"publisher","first-page":"132","DOI":"10.1016\/S0168-9525(99)01706-0","volume":"15","author":"SE Brenner","year":"1999","unstructured":"Brenner SE: Errors in genome annotation. Trends Genet 1999, 15(4):132\u2013133. 10.1016\/S0168-9525(99)01706-0","journal-title":"Trends Genet"},{"key":"5411_CR25","first-page":"D546","volume":"39","author":"S Sun","year":"2011","unstructured":"Sun S, et al.: Community cyberinfrastructure for Advanced Microbial Ecology Research and Analysis: the CAMERA resource. Database issue 2011, 39: D546-D551.","journal-title":"Database issue"},{"issue":"3","key":"5411_CR26","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"SF Altschul","year":"1990","unstructured":"Altschul SF, et al.: Basic local alignment search tool. J Mol Biol 1990, 215(3):403\u2013410.","journal-title":"J Mol Biol"},{"issue":"5","key":"5411_CR27","doi-asserted-by":"publisher","first-page":"1792","DOI":"10.1093\/nar\/gkh340","volume":"32","author":"RC Edgar","year":"2004","unstructured":"Edgar RC: MUSCLE: multiple sequence alignment with high accuracy and high throughput. Nucleic Acids Res 2004, 32(5):1792\u20131797. 10.1093\/nar\/gkh340","journal-title":"Nucleic Acids Res"},{"issue":"3","key":"5411_CR28","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1093\/sysbio\/syq010","volume":"59","author":"S Guindon","year":"2010","unstructured":"Guindon S, et al.: New algorithms and methods to estimate maximum-likelihood phylogenies: assessing the performance of PhyML 3.0. Syst Biol 2010, 59(3):307\u2013321. 10.1093\/sysbio\/syq010","journal-title":"Syst Biol"},{"issue":"10","key":"5411_CR29","doi-asserted-by":"publisher","first-page":"e1002195","DOI":"10.1371\/journal.pcbi.1002195","volume":"7","author":"SR Eddy","year":"2011","unstructured":"Eddy SR: Accelerated Profile HMM Searches. PLoS Comput Biol 2011, 7(10):e1002195. 10.1371\/journal.pcbi.1002195","journal-title":"PLoS Comput Biol"},{"issue":"3","key":"5411_CR30","doi-asserted-by":"publisher","first-page":"e9490","DOI":"10.1371\/journal.pone.0009490","volume":"5","author":"MN Price","year":"2010","unstructured":"Price MN, Dehal PS, Arkin AP: FastTree 2\u2013approximately maximum-likelihood trees for large alignments. PLoS One 2010, 5(3):e9490. 10.1371\/journal.pone.0009490","journal-title":"PLoS One"},{"issue":"Database issue","key":"5411_CR31","doi-asserted-by":"publisher","first-page":"D115","DOI":"10.1093\/nar\/gkr1044","volume":"40","author":"VM Markowitz","year":"2012","unstructured":"Markowitz VM, et al.: IMG: the Integrated Microbial Genomes database and comparative analysis system. Nucleic Acids Res 2012, 40(Database issue):D115-D122.","journal-title":"Nucleic Acids Res"},{"key":"5411_CR32","first-page":"1695","volume":"Complex Systems","author":"G Csardi","year":"2006","unstructured":"Csardi G, Nepusz T: The igraph software package for complex network research. InterJournal 2006, Complex Systems: 1695.","journal-title":"InterJournal"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-13-264.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-13-264\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-13-264.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,1,23]],"date-time":"2019-01-23T06:04:06Z","timestamp":1548223446000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-13-264"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,10,13]]},"references-count":32,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,12]]}},"alternative-id":["5411"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-13-264","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,10,13]]},"article-number":"264"}}