{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,12]],"date-time":"2025-10-12T03:38:29Z","timestamp":1760240309014,"version":"3.37.3"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,9,20]],"date-time":"2017-09-20T00:00:00Z","timestamp":1505865600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"},{"start":{"date-parts":[[2017,9,20]],"date-time":"2017-09-20T00:00:00Z","timestamp":1505865600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61673324","61503314"],"award-info":[{"award-number":["61673324","61503314"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DMS-1518001","OCE-1136818"],"award-info":[{"award-number":["DMS-1518001","OCE-1136818"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01GM120624"],"award-info":[{"award-number":["R01GM120624"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004543","name":"China Scholarship Council","doi-asserted-by":"publisher","award":["201606315011"],"award-info":[{"award-number":["201606315011"]}],"id":[{"id":"10.13039\/501100004543","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003392","name":"Natural Science Foundation of Fujian Province","doi-asserted-by":"publisher","award":["2016J01316"],"award-info":[{"award-number":["2016J01316"]}],"id":[{"id":"10.13039\/501100003392","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s12859-017-1835-1","type":"journal-article","created":{"date-parts":[[2017,9,20]],"date-time":"2017-09-20T14:41:54Z","timestamp":1505918514000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":16,"title":["Improving contig binning of metagenomic data using $$ {d}_2^S $$ oligonucleotide frequency dissimilarity"],"prefix":"10.1186","volume":"18","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8766-5950","authenticated-orcid":false,"given":"Ying","family":"Wang","sequence":"first","affiliation":[]},{"given":"Kun","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Yang Young","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Fengzhu","family":"Sun","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,9,20]]},"reference":[{"key":"1835_CR1","doi-asserted-by":"publisher","first-page":"525","DOI":"10.1146\/annurev.genet.38.072902.091216","volume":"38","author":"CS Riesenfeld","year":"2004","unstructured":"Riesenfeld CS, Schloss PD, Handelsman J. Metagenomics: genomic analysis of microbial communities. Annu Rev Genet. 2004;38:525\u201352.","journal-title":"Annu Rev Genet"},{"issue":"6","key":"1835_CR2","doi-asserted-by":"publisher","first-page":"669","DOI":"10.1093\/bib\/bbs054","volume":"13","author":"SS Mande","year":"2012","unstructured":"Mande SS, Mohammed MH, Ghosh TS. Classification of metagenomic sequences: methods and challenges. Brief Bioinform. 2012;13(6):669\u201381.","journal-title":"Brief Bioinform"},{"key":"1835_CR3","doi-asserted-by":"publisher","first-page":"48","DOI":"10.1016\/j.csbj.2016.11.005","volume":"15","author":"K Sedlar","year":"2017","unstructured":"Sedlar K, Kupkova K, Provaznik I. Bioinformatics strategies for taxonomy independent binning and visualization of sequences in shotgun metagenomics. Comput Struct Biotechnol J. 2017;15:48\u201355.","journal-title":"Comput Struct Biotechnol J"},{"key":"1835_CR4","doi-asserted-by":"publisher","first-page":"1144","DOI":"10.1038\/nmeth.3103","volume":"11","author":"J Alneberg","year":"2014","unstructured":"Alneberg J, et al. Binning metagenomic contigs by coverage and composition. Nat Methods. 2014;11:1144\u20136.","journal-title":"Nat Methods"},{"issue":"6","key":"1835_CR5","doi-asserted-by":"crossref","first-page":"791","DOI":"10.1093\/bioinformatics\/btw290","volume":"33","author":"YY Lu","year":"2017","unstructured":"Lu YY, et al. COCACOLA: binning metagenomic contigs using sequence COmposition, read CoverAge, CO-alignment, and paired-end read LinkAge. Bioinformatics. 2017;33(6):791\u20138.","journal-title":"Bioinformatics"},{"issue":"3","key":"1835_CR6","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1101\/gr.5969107","volume":"17","author":"DH Huson","year":"2007","unstructured":"Huson DH, et al. MEGAN analysis of metagenomic data. Genome Res. 2007;17(3):377\u201386.","journal-title":"Genome Res"},{"issue":"3","key":"1835_CR7","doi-asserted-by":"publisher","first-page":"R46","DOI":"10.1186\/gb-2014-15-3-r46","volume":"15","author":"DE Wood","year":"2014","unstructured":"Wood DE, Salzberg SL. Kraken: ultrafast metagenomic sequence classification using exact alignments. Genome Biol. 2014;15(3):R46.","journal-title":"Genome Biol"},{"issue":"D1","key":"1835_CR8","doi-asserted-by":"publisher","first-page":"D279","DOI":"10.1093\/nar\/gkv1344","volume":"44","author":"RD Finn","year":"2016","unstructured":"Finn RD, et al. The Pfam protein families database: towards a more sustainable future. Nucleic Acids Res. 2016;44(D1):D279\u201385.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"1835_CR9","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1093\/bioinformatics\/btq619","volume":"27","author":"GL Rosen","year":"2011","unstructured":"Rosen GL, Reichenberger ER, Rosenfeld AM. NBC: the naive Bayes classification tool webserver for taxonomic classification of metagenomic reads. Bioinformatics. 2011;27(1):127\u20139.","journal-title":"Bioinformatics"},{"issue":"1","key":"1835_CR10","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1186\/1471-2105-10-316","volume":"10","author":"A Kislyuk","year":"2009","unstructured":"Kislyuk A, et al. Unsupervised statistical clustering of environmental shotgun sequences. BMC Bioinformatics. 2009;10(1):316.","journal-title":"BMC Bioinformatics"},{"issue":"1","key":"1835_CR11","doi-asserted-by":"publisher","first-page":"544","DOI":"10.1186\/1471-2105-11-544","volume":"11","author":"DR Kelley","year":"2010","unstructured":"Kelley DR, Salzberg SL. Clustering metagenomic sequences with interpolated Markov models. BMC Bioinformatics. 2010;11(1):544.","journal-title":"BMC Bioinformatics"},{"key":"1835_CR12","doi-asserted-by":"publisher","first-page":"410","DOI":"10.3389\/fmicb.2012.00410","volume":"3","author":"M Strous","year":"2012","unstructured":"Strous M, et al. The binning of metagenomic contigs for microbial physiology of mixed cultures. Front Microbiol. 2012;3:410.","journal-title":"Front Microbiol"},{"issue":"1","key":"1835_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40168-014-0066-1","volume":"3","author":"CC Laczny","year":"2015","unstructured":"Laczny CC, et al. VizBin-an application for reference-independent visualization and human-augmented binning of metagenomic data. Microbiome. 2015;3(1):1.","journal-title":"Microbiome"},{"issue":"11","key":"1835_CR14","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1093\/bioinformatics\/btr186","volume":"27","author":"HC Leung","year":"2011","unstructured":"Leung HC, et al. A robust and accurate binning algorithm for metagenomic sequences with arbitrary species abundance ratio. Bioinformatics. 2011;27(11):1489\u201395.","journal-title":"Bioinformatics"},{"issue":"3","key":"1835_CR15","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1089\/cmb.2010.0245","volume":"18","author":"Y-W Wu","year":"2011","unstructured":"Wu Y-W, Ye Y. A novel abundance-based algorithm for binning metagenomic sequences using l-tuples. J Comput Biol. 2011;18(3):523\u201334.","journal-title":"J Comput Biol"},{"key":"1835_CR16","doi-asserted-by":"publisher","DOI":"10.7717\/peerj.603","volume":"2","author":"M Imelfort","year":"2014","unstructured":"Imelfort M, et al. GroopM: an automated tool for the recovery of population genomes from related metagenomes. PeerJ. 2014;2:e603.","journal-title":"PeerJ"},{"issue":"1","key":"1835_CR17","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1186\/2049-2618-2-26","volume":"2","author":"Y-W Wu","year":"2014","unstructured":"Wu Y-W, et al. MaxBin: an automated binning method to recover individual genomes from metagenomes using an expectation-maximization algorithm. Microbiome. 2014;2(1):26.","journal-title":"Microbiome"},{"issue":"4","key":"1835_CR18","doi-asserted-by":"publisher","first-page":"605","DOI":"10.1093\/bioinformatics\/btv638","volume":"32","author":"Y-W Wu","year":"2016","unstructured":"Wu Y-W, Simmons BA, Singer SW. MaxBin 2.0: an automated binning algorithm to recover genomes from multiple metagenomic datasets. Bioinformatics. 2016;32(4):605\u20137.","journal-title":"Bioinformatics"},{"issue":"1","key":"1835_CR19","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1186\/s12859-015-0473-8","volume":"16","author":"Y Wang","year":"2015","unstructured":"Wang Y, Hu H, Li X. MBBC: an efficient approach for metagenomic binning based on clustering. BMC Bioinformatics. 2015;16(1):36.","journal-title":"BMC Bioinformatics"},{"key":"1835_CR20","doi-asserted-by":"publisher","first-page":"24175","DOI":"10.1038\/srep24175","volume":"6","author":"H-H Lin","year":"2016","unstructured":"Lin H-H, Liao Y-C. Accurate binning of metagenomic contigs via automated clustering sequences using information of genomic signatures and marker genes. Sci Rep. 2016;6:24175.","journal-title":"Sci Rep"},{"issue":"12","key":"1835_CR21","doi-asserted-by":"publisher","first-page":"3899","DOI":"10.1128\/jb.179.12.3899-3913.1997","volume":"179","author":"S Karlin","year":"1997","unstructured":"Karlin S, Mrazek J, Campbell AM. Compositional biases of bacterial genomes and evolutionary implications. J Bacteriol. 1997;179(12):3899\u2013913.","journal-title":"J Bacteriol"},{"issue":"8","key":"1835_CR22","doi-asserted-by":"publisher","first-page":"R85","DOI":"10.1186\/gb-2009-10-8-r85","volume":"10","author":"GJ Dick","year":"2009","unstructured":"Dick GJ, et al. Community-wide analysis of microbial genome sequence signatures. Genome Biol. 2009;10(8):R85.","journal-title":"Genome Biol"},{"issue":"11","key":"1835_CR23","doi-asserted-by":"publisher","first-page":"1467","DOI":"10.1089\/cmb.2010.0056","volume":"17","author":"L Wan","year":"2010","unstructured":"Wan L, et al. Alignment-free sequence comparison (II): theoretical power of comparison statistics. J Comput Biol. 2010;17(11):1467\u201390.","journal-title":"J Comput Biol"},{"issue":"1","key":"1835_CR24","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1093\/nar\/gkw1002","volume":"45","author":"NA Ahlgren","year":"2017","unstructured":"Ahlgren NA, et al. Alignment-free d2* oligonucleotide frequency dissimilarity measure improves prediction of hosts from metagenomically-derived viral sequences. Nucleic Acids Res. 2017;45(1):39\u201353.","journal-title":"Nucleic Acids Res"},{"issue":"2","key":"1835_CR25","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1089\/cmb.2012.0228","volume":"20","author":"K Song","year":"2013","unstructured":"Song K, et al. Alignment-free sequence comparison based on next-generation sequencing reads. J Comput Biol. 2013;20(2):64\u201379.","journal-title":"J Comput Biol"},{"issue":"1","key":"1835_CR26","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0084348","volume":"9","author":"Y Wang","year":"2014","unstructured":"Wang Y, et al. Comparison of metatranscriptomic samples based on k-tuple frequencies. PLoS One. 2014;9(1):e84348.","journal-title":"PLoS One"},{"key":"1835_CR27","doi-asserted-by":"publisher","first-page":"37243","DOI":"10.1038\/srep37243","volume":"6","author":"W Liao","year":"2016","unstructured":"Liao W, et al. Alignment-free transcriptomic and Metatranscriptomic comparison using sequencing signatures with variable length Markov chains. Sci Rep. 2016;6:37243.","journal-title":"Sci Rep"},{"issue":"1","key":"1835_CR28","doi-asserted-by":"publisher","first-page":"730","DOI":"10.1186\/1471-2164-13-730","volume":"13","author":"B Jiang","year":"2012","unstructured":"Jiang B, et al. Comparison of metagenomic samples using sequence signatures. BMC Genomics. 2012;13(1):730.","journal-title":"BMC Genomics"},{"issue":"2","key":"1835_CR29","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1089\/cmb.2011.0276","volume":"19","author":"Y Wang","year":"2012","unstructured":"Wang Y, et al. MetaCluster 4.0: a novel binning algorithm for NGS reads and huge number of species. J Comput Biol. 2012;19(2):241\u20139.","journal-title":"J Comput Biol"},{"issue":"18","key":"1835_CR30","doi-asserted-by":"publisher","first-page":"i356","DOI":"10.1093\/bioinformatics\/bts397","volume":"28","author":"Y Wang","year":"2012","unstructured":"Wang Y, et al. MetaCluster 5.0: a two-round binning approach for metagenomic data for low-abundance species in a noisy sample. Bioinformatics. 2012;28(18):i356\u201362.","journal-title":"Bioinformatics"},{"issue":"10","key":"1835_CR31","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0003373","volume":"3","author":"DC Richter","year":"2008","unstructured":"Richter DC, et al. MetaSim\u2014a sequencing simulator for genomics and metagenomics. PLoS One. 2008;3(10):e3373.","journal-title":"PLoS One"},{"issue":"5","key":"1835_CR32","doi-asserted-by":"publisher","first-page":"821","DOI":"10.1101\/gr.074492.107","volume":"18","author":"DR Zerbino","year":"2008","unstructured":"Zerbino DR, Birney E. Velvet: algorithms for de novo short read assembly using de Bruijn graphs. Genome Res. 2008;18(5):821\u20139.","journal-title":"Genome Res"},{"issue":"6","key":"1835_CR33","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1038\/nmeth1043","volume":"4","author":"K Mavromatis","year":"2007","unstructured":"Mavromatis K, et al. Use of simulated data sets to evaluate the fidelity of metagenomic processing methods. Nat Methods. 2007;4(6):495\u2013500.","journal-title":"Nat Methods"},{"issue":"48","key":"1835_CR34","doi-asserted-by":"publisher","first-page":"18296","DOI":"10.1073\/pnas.0608549103","volume":"103","author":"SJ Hallam","year":"2006","unstructured":"Hallam SJ, et al. Genomic analysis of the uncultivated marine crenarchaeote Cenarchaeum symbiosum. Proc Natl Acad Sci. 2006;103(48):18296\u2013301.","journal-title":"Proc Natl Acad Sci"},{"issue":"6978","key":"1835_CR35","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1038\/nature02340","volume":"428","author":"GW Tyson","year":"2004","unstructured":"Tyson GW, et al. Community structure and metabolism through reconstruction of microbial genomes from the environment. Nature. 2004;428(6978):37\u201343.","journal-title":"Nature"},{"issue":"7114","key":"1835_CR36","doi-asserted-by":"publisher","first-page":"950","DOI":"10.1038\/nature05192","volume":"443","author":"T Woyke","year":"2006","unstructured":"Woyke T, et al. Symbiosis insights through metagenomic analysis of a microbial consortium. Nature. 2006;443(7114):950\u20135.","journal-title":"Nature"},{"issue":"5721","key":"1835_CR37","doi-asserted-by":"publisher","first-page":"554","DOI":"10.1126\/science.1107851","volume":"308","author":"SG Tringe","year":"2005","unstructured":"Tringe SG, et al. Comparative metagenomics of microbial communities. Science. 2005;308(5721):554\u20137.","journal-title":"Science"},{"issue":"1","key":"1835_CR38","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1101\/gr.142315.112","volume":"23","author":"I Sharon","year":"2013","unstructured":"Sharon I, et al. Time series community genomics analysis reveals rapid shifts in bacterial species, strains, and phage during infant gut colonization. Genome Res. 2013;23(1):111\u201320.","journal-title":"Genome Res"},{"key":"1835_CR39","unstructured":"Ijaz, U, Quince C. TAXAassign v0.4. https:\/\/github.com\/umerijaz\/taxaassign 2013."},{"issue":"7","key":"1835_CR40","doi-asserted-by":"publisher","first-page":"1043","DOI":"10.1101\/gr.186072.114","volume":"25","author":"DH Parks","year":"2015","unstructured":"Parks DH, et al. CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes. Genome Res. 2015;25(7):1043\u201355.","journal-title":"Genome Res"},{"key":"1835_CR41","volume-title":"ISODATA, a novel method of data analysis and pattern classification","author":"GH Ball","year":"1965","unstructured":"Ball GH, Hall DJ. ISODATA, a novel method of data analysis and pattern classification. Menlo Park CA: Stanford research inst; 1965."},{"key":"1835_CR42","doi-asserted-by":"crossref","unstructured":"Wu Y-W, et al. MaxBin: an automated binning method to recover individual genomes from metagenomes using an expectation-maximization algorithm. 2014 13 Apr 2017; Available from: http:\/\/downloads.jbei.org\/data\/microbial_communities\/MaxBin\/MaxBin.html .","DOI":"10.1186\/2049-2618-2-26"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-017-1835-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s12859-017-1835-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-017-1835-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,26]],"date-time":"2023-08-26T04:44:48Z","timestamp":1693025088000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-017-1835-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,9,20]]},"references-count":42,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["1835"],"URL":"https:\/\/doi.org\/10.1186\/s12859-017-1835-1","relation":{},"ISSN":["1471-2105"],"issn-type":[{"type":"electronic","value":"1471-2105"}],"subject":[],"published":{"date-parts":[[2017,9,20]]},"assertion":[{"value":"3 May 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 September 2017","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 September 2017","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Not applicable.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}},{"value":"Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Publisher\u2019s Note"}}],"article-number":"425"}}