{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,31]],"date-time":"2026-01-31T05:14:41Z","timestamp":1769836481924,"version":"3.49.0"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2009,10,2]],"date-time":"2009-10-02T00:00:00Z","timestamp":1254441600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2009,12]]},"DOI":"10.1186\/1471-2105-10-316","type":"journal-article","created":{"date-parts":[[2009,10,7]],"date-time":"2009-10-07T10:13:47Z","timestamp":1254910427000},"source":"Crossref","is-referenced-by-count":81,"title":["Unsupervised statistical clustering of environmental shotgun sequences"],"prefix":"10.1186","volume":"10","author":[{"given":"Andrey","family":"Kislyuk","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Srijak","family":"Bhatnagar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jonathan","family":"Dushoff","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Joshua S","family":"Weitz","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2009,10,2]]},"reference":[{"issue":"6978","key":"3046_CR1","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1038\/nature02340","volume":"428","author":"GW Tyson","year":"2004","unstructured":"Tyson GW, Chapman J, Hugenholtz P, Allen EE, Ram RJ, Richardson PM, Solovyev VV, Rubin EM, Rokhsar DS, Banfield JF: Community structure and metabolism through reconstruction of microbial genomes from the environment. Nature 2004, 428(6978):37\u201343. 10.1038\/nature02340","journal-title":"Nature"},{"issue":"5721","key":"3046_CR2","doi-asserted-by":"publisher","first-page":"554","DOI":"10.1126\/science.1107851","volume":"308","author":"SG Tringe","year":"2005","unstructured":"Tringe SG, von Mering C, Kobayashi A, Salamov AA, Chen K, Chang HW, Podar M, Short JM, Mathur EJ, Detter JC, Bork P, Hugenholtz P, Rubin EM: Comparative Metagenomics of Microbial Communities. Science 2005, 308(5721):554\u2013557. 10.1126\/science.1107851","journal-title":"Science"},{"issue":"3","key":"3046_CR3","doi-asserted-by":"publisher","first-page":"e77","DOI":"10.1371\/journal.pbio.0050077","volume":"5","author":"DB Rusch","year":"2007","unstructured":"Rusch DB, Halpern AL, Sutton G, Heidelberg KB, Williamson S, Yooseph S, Wu D, Eisen JA, Hoffman JM, Remington K, Beeson K, Tran B, Smith H, Baden-Tillson H, Stewart C, Thorpe J, Freeman J, Andrews-Pfannkoch C, Venter JE, Li K, Kravitz S, Heidelberg JF, Utterback T, Rogers YH, Falc\u00f3n LI, Souza V, Bonilla-Rosso G, Eguiarte LE, Karl DM, Sathyendranath S, Platt T, Bermingham E, Gallardo V, Tamayo-Castillo G, Ferrari MR, Strausberg RL, Nealson K, Friedman R, Frazier M, Venter CJ: The Sorcerer II Global Ocean Sampling Expedition: Northwest Atlantic through Eastern Tropical Pacific. PLoS Biology 2007, 5(3):e77. 10.1371\/journal.pbio.0050077","journal-title":"PLoS Biology"},{"issue":"7169","key":"3046_CR4","doi-asserted-by":"publisher","first-page":"560","DOI":"10.1038\/nature06269","volume":"450","author":"F Warnecke","year":"2007","unstructured":"Warnecke F, Luginb\u00fchl P, Ivanova N, Ghassemian M, Richardson TH, Stege JT, Cayouette M, Mchardy AC, Djordjevic G, Aboushadi N, Sorek R, Tringe SG, Podar M, Martin HG, Kunin V, Dalevi D, Madejska J, Kirton E, Platt D, Szeto E, Salamov A, Barry K, Mikhailova N, Kyrpides NC, Matson EG, Ottesen EA, Zhang X, Hern\u00e1ndez M, Murillo C, Acosta LG, Rigoutsos I, Tamayo G, Green BD, Chang C, Rubin EM, Mathur EJ, Robertson DE, Hugenholtz P, Leadbetter JR: Metagenomic and functional analysis of hindgut microbiota of a wood-feeding higher termite. Nature 2007, 450(7169):560\u2013565. 10.1038\/nature06269","journal-title":"Nature"},{"issue":"5778","key":"3046_CR5","doi-asserted-by":"publisher","first-page":"1355","DOI":"10.1126\/science.1124234","volume":"312","author":"SR Gill","year":"2006","unstructured":"Gill SR, Pop M, Deboy RT, Eckburg PB, Turnbaugh PJ, Samuel BS, Gordon JI, Relman DA, Fraser-Liggett CM, Nelson KE: Metagenomic Analysis of the Human Distal Gut Microbiome. Science 2006, 312(5778):1355\u20131359. 10.1126\/science.1124234","journal-title":"Science"},{"issue":"5802","key":"3046_CR6","doi-asserted-by":"publisher","first-page":"1113","DOI":"10.1126\/science.1131412","volume":"314","author":"JP Noonan","year":"2006","unstructured":"Noonan JP, Coop G, Kudaravalli S, Smith D, Krause J, Alessi J, Chen F, Platt D, P\u00e4\u00e4bo S, Pritchard JK, Rubin EM: Sequencing and analysis of Neanderthal genomic DNA. Science 2006, 314(5802):1113\u20131118. 10.1126\/science.1131412","journal-title":"Science"},{"issue":"5","key":"3046_CR7","doi-asserted-by":"publisher","first-page":"1233","DOI":"10.1111\/j.1462-2920.2007.01247.x","volume":"9","author":"F Not","year":"2007","unstructured":"Not F, Gausling R, Azam F, Heidelberg JF, Worden AZ: Vertical distribution of picoeukaryotic diversity in the Sargasso Sea. Environmental Microbiology 2007, 9(5):1233\u20131252. 10.1111\/j.1462-2920.2007.01247.x","journal-title":"Environmental Microbiology"},{"key":"3046_CR8","series-title":"PLoS Biol","volume-title":"The marine viromes of four oceanic regions","author":"FE Angly","year":"2006","unstructured":"Angly FE, Felts B, Breitbart M, Salamon P, Edwards RA, Carlson C, Chan AM, Haynes M, Kelley S, Liu H, Mahaffy JM, Mueller JE, Nulton J, Olson R, Parsons R, Rayhawk S, Suttle CA, Rohwer F: The marine viromes of four oceanic regions. PLoS Biol 2006., 4(11): 10.1371\/journal.pbio.0040368"},{"issue":"11","key":"3046_CR9","doi-asserted-by":"publisher","first-page":"e1000255","DOI":"10.1371\/journal.pgen.1000255","volume":"4","author":"SM Huse","year":"2008","unstructured":"Huse SM, Dethlefsen L, Huber JA, Welch DM, Relman DA, Sogin ML: Exploring Microbial Diversity and Taxonomy Using SSU rRNA Hypervariable Tag Sequencing. PLoS Genet 2008, 4(11):e1000255. 10.1371\/journal.pgen.1000255","journal-title":"PLoS Genet"},{"issue":"32","key":"3046_CR10","doi-asserted-by":"publisher","first-page":"12115","DOI":"10.1073\/pnas.0605127103","volume":"103","author":"ML Sogin","year":"2006","unstructured":"Sogin ML, Morrison HG, Huber JA, Welch DM, Huse SM, Neal PR, Arrieta JM, Herndl GJ: Microbial diversity in the deep sea and the underexplored \" rare biosphere\". Proceedings of the National Academy of Sciences 2006, 103(32):12115\u201312120. 10.1073\/pnas.0605127103","journal-title":"Proceedings of the National Academy of Sciences"},{"issue":"4","key":"3046_CR11","doi-asserted-by":"publisher","first-page":"669","DOI":"10.1128\/MMBR.68.4.669-685.2004","volume":"68","author":"J Handelsman","year":"2004","unstructured":"Handelsman J: Metagenomics: application of genomics to uncultured microorganisms. Microbiol Mol Biol Rev 2004, 68(4):669\u2013685. 10.1128\/MMBR.68.4.669-685.2004","journal-title":"Microbiol Mol Biol Rev"},{"key":"3046_CR12","doi-asserted-by":"crossref","unstructured":"Yooseph S, Sutton G, Rusch DB, Halpern AL, Williamson SJ, Remington K, Eisen JA, Heidelberg KB, Manning G, Li W, Jaroszewski L, Cieplak P, Miller CS, Li H, Mashiyama STT, Joachimiak MP, van Belle C, Chandonia JM, Soergel DA, Zhai Y, Natarajan K, Lee S, Raphael BJ, Bafna V, Friedman R, Brenner SE, Godzik A, Eisenberg D, Dixon JE, Taylor SS, Strausberg RL, Frazier M, Venter JC: The Sorcerer II Global Ocean Sampling Expedition: Expanding the Universe of Protein Families. PLoS Biol 2007., 5(3): 10.1371\/journal.pbio.0050016","DOI":"10.1371\/journal.pbio.0050016"},{"issue":"7187","key":"3046_CR13","doi-asserted-by":"publisher","first-page":"629","DOI":"10.1038\/nature06810","volume":"452","author":"EA Dinsdale","year":"2008","unstructured":"Dinsdale EA, Edwards RA, Hall D, Angly F, Breitbart M, Brulc JM, Furlan M, Desnues C, Haynes M, Li L, McDaniel L, Moran MAA, Nelson KE, Nilsson C, Olson R, Paul J, Brito BRR, Ruan Y, Swan BK, Stevens R, Valentine DL, Thurber RVV, Wegley L, White BA, Rohwer F: Functional metagenomic profiling of nine biomes. Nature 2008, 452(7187):629\u2013632. 10.1038\/nature06810","journal-title":"Nature"},{"issue":"6839","key":"3046_CR14","doi-asserted-by":"publisher","first-page":"786","DOI":"10.1038\/35081051","volume":"411","author":"O B\u00e9j\u00e0","year":"2001","unstructured":"B\u00e9j\u00e0 O, Spudich EN, Spudich JL, Leclerc M, DeLong EF: Proteorhodopsin phototrophy in the ocean. Nature 2001, 411(6839):786\u2013789. 10.1038\/35081051","journal-title":"Nature"},{"issue":"3","key":"3046_CR15","doi-asserted-by":"crossref","first-page":"695","DOI":"10.1128\/AEM.59.3.695-700.1993","volume":"59","author":"G Muyzer","year":"1993","unstructured":"Muyzer G, de Waal EC, Uitterlinden AG: Profiling of complex microbial populations by denaturing gradient gel electrophoresis analysis of polymerase chain reaction-amplified genes coding for 16S rRNA. Appl Environ Microbiol 1993, 59(3):695\u2013700.","journal-title":"Appl Environ Microbiol"},{"issue":"7057","key":"3046_CR16","doi-asserted-by":"crossref","first-page":"376","DOI":"10.1038\/nature03959","volume":"437","author":"M Margulies","year":"2005","unstructured":"Margulies M, Egholm M, Altman WE, Attiya S, Bader JS, Bemben LA, Berka J, Braverman MS, Chen YJ, Chen Z, Dewell SB, Du L, Fierro JM, Gomes XV, Godwin BC, He W, Helgesen S, Ho CH, Irzyk GP, Jando SC, Alenquer MLI, Jarvie TP, Jirage KB, Kim JB, Knight JR, Lanza JR, Leamon JH, Lefkowitz SM, Lei M, Li J, Lohman KL, Lu H, Makhijani VB, Mcdade KE, Mckenna MP, Myers EW, Nickerson E, Nobile JR, Plant R, Puc BP, Ronan MT, Roth GT, Sarkis GJ, Simons JF, Simpson JW, Srinivasan M, Tartaro KR, Tomasz A, Vogt KA, Volkmer GA, Wang SH, Wang Y, Weiner MP, Yu P, Begley RF, Rothberg JM: Genome sequencing in microfabricated high-density picolitre reactors. Nature 2005, 437(7057):376\u2013380.","journal-title":"Nature"},{"issue":"6","key":"3046_CR17","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1016\/j.gde.2006.10.009","volume":"16","author":"DR Bentley","year":"2006","unstructured":"Bentley DR: Whole-genome re-sequencing. Current Opinion in Genetics & Development 2006, 16(6):545\u2013552. 10.1016\/j.gde.2006.10.009","journal-title":"Current Opinion in Genetics & Development"},{"issue":"5741","key":"3046_CR18","doi-asserted-by":"publisher","first-page":"1728","DOI":"10.1126\/science.1117389","volume":"309","author":"J Shendure","year":"2005","unstructured":"Shendure J, Porreca GJ, Reppas NB, Lin X, Mccutcheon JP, Rosenbaum AM, Wang MD, Zhang K, Mitra RD, Church GM: Accurate Multiplex Polony Sequencing of an Evolved Bacterial Genome. Science 2005, 309(5741):1728\u20131732. 10.1126\/science.1117389","journal-title":"Science"},{"issue":"20","key":"3046_CR19","doi-asserted-by":"publisher","first-page":"6955","DOI":"10.1073\/pnas.82.20.6955","volume":"82","author":"DJ Lane","year":"1985","unstructured":"Lane DJ, Pace B, Olsen GJ, Stahl DA, Sogin ML, Pace NR: Rapid determination of 16S ribosomal RNA sequences for phylogenetic analyses. Proceedings of the National Academy of Sciences 1985, 82(20):6955\u20136959. 10.1073\/pnas.82.20.6955","journal-title":"Proceedings of the National Academy of Sciences"},{"issue":"16","key":"3046_CR20","doi-asserted-by":"publisher","first-page":"10234","DOI":"10.1073\/pnas.162359199","volume":"99","author":"BB Ward","year":"2002","unstructured":"Ward BB: How many species of prokaryotes are there? Proc Natl Acad Sci USA 2002, 99(16):10234\u201310236. 10.1073\/pnas.162359199","journal-title":"Proc Natl Acad Sci USA"},{"issue":"3","key":"3046_CR21","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1101\/gr.5969107","volume":"17","author":"DH Huson","year":"2007","unstructured":"Huson DH, Auch AF, Qi J, Schuster SC: MEGAN analysis of metagenomic data. Genome Res 2007, 17(3):377\u2013386. 10.1101\/gr.5969107","journal-title":"Genome Res"},{"issue":"7","key":"3046_CR22","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1016\/S0168-9525(00)89076-9","volume":"11","author":"S Kariin","year":"1995","unstructured":"Kariin S, Burge C: Dinucleotide relative abundance extremes: a genomic signature. Trends in Genetics 1995, 11(7):283\u2013290. 10.1016\/S0168-9525(00)89076-9","journal-title":"Trends in Genetics"},{"issue":"10","key":"3046_CR23","doi-asserted-by":"publisher","first-page":"1391","DOI":"10.1093\/oxfordjournals.molbev.a026048","volume":"16","author":"PJ Deschavanne","year":"1999","unstructured":"Deschavanne PJ, Giron A, Vilain J, Fagot G, Fertil B: Genomic signature: characterization and classification of species assessed by chaos game representation of sequences. Mol Biol Evol 1999, 16(10):1391\u20131399.","journal-title":"Mol Biol Evol"},{"key":"3046_CR24","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1038\/nmeth976","volume":"4","author":"AC Mchardy","year":"2006","unstructured":"Mchardy AC, Mart\u00edn HG, Tsirigos A, Hugenholtz P, Rigoutsos I: Accurate phylogenetic classification of variable-length DNA fragments. Nature Methods 2006, 4: 63\u201372. 10.1038\/nmeth976","journal-title":"Nature Methods"},{"key":"3046_CR25","volume-title":"Research in Computational Molecular Biology, 12th Annual International Conference, RECOMB 2008, Singapore, March 30 - April 2, 2008. Proceedings, Lecture Notes in Computer Science","author":"S Chatterji","year":"2008","unstructured":"Chatterji S, Yamazaki I, Bai Z, Eisen J: CompostBin: A DNA composition-based algorithm for binning environmental shotgun reads. In Research in Computational Molecular Biology, 12th Annual International Conference, RECOMB 2008, Singapore, March 30 - April 2, 2008. Proceedings, Lecture Notes in Computer Science. Volume 4955. Springer; 2008."},{"issue":"4","key":"3046_CR26","doi-asserted-by":"publisher","first-page":"693","DOI":"10.1101\/gr.634603","volume":"13","author":"T Abe","year":"2003","unstructured":"Abe T, Kanaya S, Kinouchi M, Ichiba Y, Kozuki T, Ikemura T: Informatics for unveiling hidden genome signatures. Genome research 2003, 13(4):693\u2013702. 10.1101\/gr.634603","journal-title":"Genome research"},{"key":"3046_CR27","doi-asserted-by":"publisher","first-page":"513701","DOI":"10.1155\/2008\/513701","volume":"2008","author":"CK Chan","year":"2008","unstructured":"Chan CK, Hsu AL, Tang SL, Halgamuge SK: Using growing self-organising maps to improve the binning process in environmental whole-genome shotgun sequencing. Journal of biomedicine & biotechnology 2008, 2008: 513701.","journal-title":"Journal of biomedicine & biotechnology"},{"key":"3046_CR28","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1186\/1471-2105-9-215","volume":"9","author":"CKK Chan","year":"2008","unstructured":"Chan CKK, Hsu AL, Halgamuge SK, Tang SL: Binning sequences using very sparse labels within a metagenome. BMC Bioinformatics 2008, 9: 215. 10.1186\/1471-2105-9-215","journal-title":"BMC Bioinformatics"},{"issue":"9","key":"3046_CR29","doi-asserted-by":"publisher","first-page":"938","DOI":"10.1111\/j.1462-2920.2004.00624.x","volume":"6","author":"H Teeling","year":"2004","unstructured":"Teeling H, Meyerdierks A, Bauer M, Amann R, Gl\u00f6ckner FO: Application of tetranucleotide frequencies for the assignment of genomic fragments. Environ Microbiol 2004, 6(9):938\u2013947. 10.1111\/j.1462-2920.2004.00624.x","journal-title":"Environ Microbiol"},{"key":"3046_CR30","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1186\/1471-2105-5-163","volume":"5","author":"H Teeling","year":"2004","unstructured":"Teeling H, Waldmann J, Lombardot T, Bauer M, Gl\u00f6ckner FO: TETRA: a web-service and a stand-alone program for the analysis and comparison of tetranucleotide usage patterns in DNA sequences. BMC Bioinformatics 2004, 5: 163. 10.1186\/1471-2105-5-163","journal-title":"BMC Bioinformatics"},{"issue":"7114","key":"3046_CR31","doi-asserted-by":"publisher","first-page":"950","DOI":"10.1038\/nature05192","volume":"443","author":"T Woyke","year":"2006","unstructured":"Woyke T, Teeling H, Ivanova NN, Huntemann M, Richter M, Gloeckner FO, Boffelli D, Anderson IJ, Barry KW, Shapiro HJ, Szeto E, Kyrpides NC, Mussmann M, Amann R, Bergin C, Ruehland C, Rubin EM, Dubilier N: Symbiosis insights through metagenomic analysis of a microbial consortium. Nature 2006, 443(7114):950\u2013955. 10.1038\/nature05192","journal-title":"Nature"},{"key":"3046_CR32","unstructured":"A Genomic Encyclopedia of Bacteria and Archaea (GEBA)[ http:\/\/www.jgi.doe.gov\/programs\/GEBA\/index.html ]"},{"key":"3046_CR33","unstructured":"LikelyBin webpage[ http:\/\/ecotheory.biology.gatech.edu\/likelybin ]"},{"issue":"6","key":"3046_CR34","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1038\/nmeth1043","volume":"4","author":"K Mavromatis","year":"2007","unstructured":"Mavromatis K, Ivanova N, Barry K, Shapiro H, Goltsman E, McHardy AC, Rigoutsos I, Salamov A, Korzeniewski F, Land M, Lapidus A, Grigoriev I, Richardson P, Hugenholtz P, Kyrpides NC: Use of simulated data sets to evaluate the fidelity of metagenomic processing methods. Nature methods 2007, 4(6):495\u2013500. 10.1038\/nmeth1043","journal-title":"Nature methods"},{"key":"3046_CR35","volume-title":"Likelihood, Bayesian and MCMC Methods in Quantitative Genetics","author":"D Sorensen","year":"2007","unstructured":"Sorensen D, Gianola D: Likelihood, Bayesian and MCMC Methods in Quantitative Genetics. Springer; 2007."},{"issue":"16","key":"3046_CR36","doi-asserted-by":"publisher","first-page":"9184","DOI":"10.1073\/pnas.96.16.9184","volume":"96","author":"A Campbell","year":"1999","unstructured":"Campbell A, Mr\u00e1zek J, Karlin S: Genome signature comparisons among prokaryote, plasmid, and mitochondrial DNA. Proceedings of the National Academy of Sciences of the United States of America 1999, 96(16):9184\u20139189. 10.1073\/pnas.96.16.9184","journal-title":"Proceedings of the National Academy of Sciences of the United States of America"},{"key":"3046_CR37","unstructured":"FAMeS: Fidelity of Analysis of Metagenomic Samples[ http:\/\/fames.jgi-psf.org\/ ]"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-10-316.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-10-316\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-10-316.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,22]],"date-time":"2020-05-22T21:12:51Z","timestamp":1590181971000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-10-316"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,10,2]]},"references-count":37,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2009,12]]}},"alternative-id":["3046"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-10-316","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2009,10,2]]},"article-number":"316"}}