{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2022,12,29]],"date-time":"2022-12-29T01:30:12Z","timestamp":1672277412971},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"S5","content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1186\/1471-2105-16-s5-s2","type":"journal-article","created":{"date-parts":[[2015,6,18]],"date-time":"2015-06-18T09:53:13Z","timestamp":1434621193000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Exploiting topic modeling to boost metagenomic reads binning"],"prefix":"10.1186","volume":"16","author":[{"given":"Ruichang","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Zhanzhan","family":"Cheng","sequence":"additional","affiliation":[]},{"given":"Jihong","family":"Guan","sequence":"additional","affiliation":[]},{"given":"Shuigeng","family":"Zhou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,3,18]]},"reference":[{"issue":"7285","key":"6911_CR1","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1038\/nature08821","volume":"464","author":"J Qin","year":"2010","unstructured":"Qin J, Li R, Raes J, Arumugam M, Burgdorf KS, Manichanh C, Nielsen T, Pons N, Levenez F, Yamada T, et al: A human gut microbial gene catalogue established by metagenomic sequencing. Nature. 2010, 464 (7285): 59-65. 10.1038\/nature08821.","journal-title":"Nature"},{"issue":"8","key":"6911_CR2","doi-asserted-by":"publisher","first-page":"3064","DOI":"10.1371\/journal.pone.0003064","volume":"3","author":"ZA Khachatryan","year":"2008","unstructured":"Khachatryan ZA, Ktsoyan ZA, Manukyan GP, Kelly D, Ghazaryan KA, Aminov RI: Predominant role of host genetics in controlling the composition of gut microbiota. PloS One. 2008, 3 (8): 3064-10.1371\/journal.pone.0003064.","journal-title":"PloS One"},{"issue":"6","key":"6911_CR3","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1038\/nmeth1043","volume":"4","author":"K Mavromatis","year":"2007","unstructured":"Mavromatis K, Ivanova N, Barry K, Shapiro H, Goltsman E, McHardy AC, Rigoutsos I, Salamov A, Korzeniewski F, Land M, et al: Use of simulated data sets to evaluate the fidelity of metagenomics processing methods. Nature Methods. 2007, 4 (6): 495-500. 10.1038\/nmeth1043.","journal-title":"Nature Methods"},{"issue":"Suppl 1","key":"6911_CR4","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1186\/1471-2105-10-S1-S12","volume":"10","author":"DH Huson","year":"2009","unstructured":"Huson DH, Richter DC, Mitra S, Auch AF, Schuster SC: Methods for comparative metagenomics. BMC Bioinformatics. 2009, 10 (Suppl 1): 12-10.1186\/1471-2105-10-S1-S12.","journal-title":"BMC Bioinformatics"},{"issue":"1","key":"6911_CR5","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1038\/nmeth976","volume":"4","author":"AC McHardy","year":"2006","unstructured":"McHardy AC, Martin HG, Tsirigos A, Hugenholtz P, Rigoutsos I: Accurate phylogenetic classification of variable-length dna fragments. Nature Methods. 2006, 4 (1): 63-72.","journal-title":"Nature Methods"},{"issue":"1","key":"6911_CR6","doi-asserted-by":"publisher","first-page":"461","DOI":"10.1186\/1471-2164-11-461","volume":"11","author":"M Stark","year":"2010","unstructured":"Stark M, Berger S, Stamatakis A, von Mering C: Mltreemap-accurate maximum likelihood placement of environmental dna sequences into taxonomic and functional reference phylogenies. BMC Genomics. 2010, 11 (1): 461-10.1186\/1471-2164-11-461.","journal-title":"BMC Genomics"},{"key":"6911_CR7","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1186\/1471-2105-10-56","volume":"10","author":"NN Diaz","year":"2009","unstructured":"Diaz NN, Krause L, Goesmann A, Niehaus K, Nattkemper TW: Tacoa-taxonomic classification of environmental genomic fragments using a kernelized nearest neighbor approach. BMC Bioinformatics. 2009, 10: 56-10.1186\/1471-2105-10-56.","journal-title":"BMC Bioinformatics"},{"issue":"9","key":"6911_CR8","doi-asserted-by":"publisher","first-page":"673","DOI":"10.1038\/nmeth.1358","volume":"6","author":"A Brady","year":"2009","unstructured":"Brady A, Salzberg SL: Phymm and phymmbl: metagenomic phylogenetic classification with interpolated markov models. Nature Methods. 2009, 6 (9): 673-676. 10.1038\/nmeth.1358.","journal-title":"Nature Methods"},{"issue":"3","key":"6911_CR9","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1089\/cmb.2010.0245","volume":"18","author":"Y-W Wu","year":"2011","unstructured":"Wu Y-W, Ye Y: A novel abundance-based algorithm for binning metagenomic sequences using l-tuples. Journal of Computational Biology. 2011, 18 (3): 523-534. 10.1089\/cmb.2010.0245.","journal-title":"Journal of Computational Biology"},{"issue":"11","key":"6911_CR10","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1093\/bioinformatics\/btr186","volume":"27","author":"HC Leung","year":"2011","unstructured":"Leung HC, Yiu S-M, Yang B, Peng Y, Wang Y, Liu Z, Chen J, Qin J, Li R, Chin FY: A robust and accurate binning algorithm for metagenomic sequences with arbitrary species abundance ratio. Bioinformatics. 2011, 27 (11): 1489-1495. 10.1093\/bioinformatics\/btr186.","journal-title":"Bioinformatics"},{"issue":"2","key":"6911_CR11","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1089\/cmb.2011.0276","volume":"19","author":"Y Wang","year":"2012","unstructured":"Wang Y, Leung HC, Yiu S-M, Chin FY: Metacluster 4.0: a novel binning algorithm for ngs reads and huge number of species. Journal of Computational Biology. 2012, 19 (2): 241-249. 10.1089\/cmb.2011.0276.","journal-title":"Journal of Computational Biology"},{"issue":"18","key":"6911_CR12","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1093\/bioinformatics\/bts397","volume":"28","author":"Y Wang","year":"2012","unstructured":"Wang Y, Leung HC, Yiu S-M, Chin FY: Metacluster 5.0: a two-round binning approach for metagenomic data for low-abundance species in a noisy sample. Bioinformatics. 2012, 28 (18): 356-362. 10.1093\/bioinformatics\/bts397.","journal-title":"Bioinformatics"},{"issue":"Suppl 1","key":"6911_CR13","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1186\/1471-2164-15-S1-S12","volume":"15","author":"Y Wang","year":"2014","unstructured":"Wang Y, Leung HC, Yiu SM, Chin FY: Metacluster-ta: taxonomic annotation for metagenomic data based on assembly-assisted binning. BMC Genomics. 2014, 15 (Suppl 1): 12-10.1186\/1471-2164-15-S1-S12.","journal-title":"BMC Genomics"},{"issue":"1","key":"6911_CR14","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1109\/TCBB.2013.137","volume":"11","author":"R Liao","year":"2014","unstructured":"Liao R, Zhang R, Guan J, Zhou S: A new unsupervised binning approach for metagenomic sequences based on n-grams and automatic feature weighting. IEEE\/ACM Transactions on Computational Biology and Bioinformatics (TCBB). 2014, 11 (1): 42-54.","journal-title":"IEEE\/ACM Transactions on Computational Biology and Bioinformatics (TCBB)"},{"key":"6911_CR15","first-page":"993","volume":"3","author":"D Blei","year":"2003","unstructured":"Blei D, Ng A, Jordan M: Latent dirichlet allocation. Journal of Machine Learning Research. 2003, 3: 993-1022.","journal-title":"Journal of Machine Learning Research"},{"key":"6911_CR16","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1007\/978-1-4757-4305-0_3","volume-title":"Survey of text mining","author":"H Frigui","year":"2004","unstructured":"Frigui H, Nasraoui O: Simultaneous clustering and dynamic keyword weighting for text documents. Survey of text mining. 2004, 45-72."},{"key":"6911_CR17","first-page":"3","volume":"23","author":"T Aso","year":"2009","unstructured":"Aso T, Eguchi K: Predicting protein-protein relationships from literature using latent topics. Proceedings of The 20th International Conference on Genome Informatics. 2009, 23: 3-12.","journal-title":"Proceedings of The 20th International Conference on Genome Informatics"},{"key":"6911_CR18","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1186\/1471-2105-7-58","volume":"7","author":"B Zheng","year":"2006","unstructured":"Zheng B, McLean DC, Lu X: Identifying biological concepts from a protein-related corpus with a probabilistic topic model. BMC Bioinformatics. 2006, 7: 58-10.1186\/1471-2105-7-58.","journal-title":"BMC Bioinformatics"},{"key":"6911_CR19","volume-title":"Technical Report","author":"GK Gerber","year":"2007","unstructured":"Gerber GK, Dowell RD, Jaakkola TS, Gifford DK: Hierarchical dirichlet process-based models for discovery of cross-species mammalian gene expression. Technical Report. 2007"},{"issue":"4","key":"6911_CR20","doi-asserted-by":"publisher","first-page":"980","DOI":"10.1109\/TCBB.2011.113","volume":"9","author":"X Chen","year":"2012","unstructured":"Chen X, Hu X, Lim TY, Shen X, Park E, Rosen GL: Exploiting the functional and taxonomic structure of genomic data by probabilistic topic modeling. IEEE\/ACM Transactions on Computational Biology and Bioinformatics (TCBB). 2012, 9 (4): 980-991.","journal-title":"IEEE\/ACM Transactions on Computational Biology and Bioinformatics (TCBB)"},{"issue":"10","key":"6911_CR21","doi-asserted-by":"publisher","first-page":"108","DOI":"10.1186\/gb-2009-10-10-r108","volume":"10","author":"B Chor","year":"2009","unstructured":"Chor B, Horn D, Goldman N, Levy Y, Massingham T, et al: Genomic dna k-mer spectra: models and modalities. Genome Biology. 2009, 10 (10): 108-10.1186\/gb-2009-10-10-r108.","journal-title":"Genome Biology"},{"key":"6911_CR22","doi-asserted-by":"publisher","first-page":"546","DOI":"10.1186\/1471-2105-9-546","volume":"9","author":"F Zhou","year":"2008","unstructured":"Zhou F, Olman V, Xu Y: Barcodes for genomes and applications. BMC Bioinformatics. 2008, 9: 546-10.1186\/1471-2105-9-546.","journal-title":"BMC Bioinformatics"},{"issue":"Suppl 1","key":"6911_CR23","doi-asserted-by":"publisher","first-page":"5228","DOI":"10.1073\/pnas.0307752101","volume":"101","author":"TL Griffiths","year":"2004","unstructured":"Griffiths TL, Steyvers M: Finding scientific topics. Proceedings of the National academy of Sciences of the United States of America. 2004, 101 (Suppl 1): 5228-5235.","journal-title":"Proceedings of the National academy of Sciences of the United States of America"},{"issue":"10","key":"6911_CR24","doi-asserted-by":"publisher","first-page":"3373","DOI":"10.1371\/journal.pone.0003373","volume":"3","author":"DC Richter","year":"2008","unstructured":"Richter DC, Ott F, Auch AF, Schmid R, Huson DH: Metasima sequencing simulator for genomics and metagenomics. PloS One. 2008, 3 (10): 3373-10.1371\/journal.pone.0003373.","journal-title":"PloS One"},{"key":"6911_CR25","unstructured":"NCBI Acid Mine Drainage Metagenomics Dataset. [http:\/\/www.ncbi.nlm.nih.gov\/books\/NBK6860\/]"},{"issue":"6978","key":"6911_CR26","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1038\/nature02340","volume":"428","author":"GW Tyson","year":"2004","unstructured":"Tyson GW, Chapman J, Hugenholtz P, Allen EE, Ram RJ, Richardson PM, Solovyev VV, Rubin EM, Rokhsar DS, Banfield JF: Community structure and metabolism through reconstruction of microbial genomes from the environment. Nature. 2004, 428 (6978): 37-43. 10.1038\/nature02340.","journal-title":"Nature"},{"key":"6911_CR27","first-page":"16","volume-title":"Proceedings of the 5th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, ACM","author":"B Larsen","year":"1999","unstructured":"Larsen B, Aone C: Fast and effective text mining using linear-time document clustering. Proceedings of the 5th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, ACM. 1999, 16-22."}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-16-S5-S2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,9,2]],"date-time":"2021-09-02T19:19:24Z","timestamp":1630610364000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-16-S5-S2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,3,18]]},"references-count":27,"journal-issue":{"issue":"S5","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["6911"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-16-s5-s2","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,3,18]]},"assertion":[{"value":"18 March 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"S2"}}