{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T20:20:17Z","timestamp":1776111617614,"version":"3.50.1"},"reference-count":18,"publisher":"Springer Science and Business Media LLC","issue":"S13","license":[{"start":{"date-parts":[[2015,12,1]],"date-time":"2015-12-01T00:00:00Z","timestamp":1448928000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1186\/1471-2105-16-s13-s8","type":"journal-article","created":{"date-parts":[[2015,9,26]],"date-time":"2015-09-26T04:03:43Z","timestamp":1443240223000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":272,"title":["A heuristic approach to determine an appropriate number of topics in topic modeling"],"prefix":"10.1186","volume":"16","author":[{"given":"Weizhong","family":"Zhao","sequence":"first","affiliation":[]},{"given":"James J","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Roger","family":"Perkins","sequence":"additional","affiliation":[]},{"given":"Zhichao","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Weigong","family":"Ge","sequence":"additional","affiliation":[]},{"given":"Yijun","family":"Ding","sequence":"additional","affiliation":[]},{"given":"Wen","family":"Zou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,12,1]]},"reference":[{"issue":"6","key":"7159_CR1","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S Deerwester","year":"1990","unstructured":"Deerwester S, Dumais ST, Furnas GW, Landauer TK, Harshman R: Indexing by Latent Semantic Analysis. J Am Soc Inform Sci. 1990, 41 (6): 391-407. 10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9.","journal-title":"J Am Soc Inform Sci"},{"issue":"1-2","key":"7159_CR2","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1023\/A:1007617005950","volume":"42","author":"T Hofmann","year":"2001","unstructured":"Hofmann T: Unsupervised learning by probabilistic latent semantic analysis. Machine Learning. 2001, 42 (1-2): 177-196.","journal-title":"Machine Learning"},{"key":"7159_CR3","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1145\/312624.312649","volume-title":"Proceedings of the 22nd annual international ACM SIGIR conference on Research and development in information retrieval","author":"T Hofmann","year":"1999","unstructured":"Hofmann T: Probabilistic latent semantic indexing. Proceedings of the 22nd annual international ACM SIGIR conference on Research and development in information retrieval. 1999, 50-57."},{"key":"7159_CR4","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei DM, Ng AY, Jordan MI: Latent Dirichlet Allocation. Journal of Machine Learning Research. 2003, 3: 993-1022.","journal-title":"Journal of Machine Learning Research"},{"issue":"Suppl 1","key":"7159_CR5","doi-asserted-by":"publisher","first-page":"5228","DOI":"10.1073\/pnas.0307752101","volume":"101","author":"TL Griffiths","year":"2004","unstructured":"Griffiths TL, Steyvers M: Finding scientific topics. Proc Natl Acad Sci U S A. 2004, 101 (Suppl 1): 5228-5235.","journal-title":"Proc Natl Acad Sci U S A"},{"key":"7159_CR6","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1145\/860435.860460","volume-title":"Proceedings of the 26th annual international ACM SIGIR conference on Research and development in informaion retrieval","author":"DM Blei","year":"2003","unstructured":"Blei DM, Jordan MI: Modeling annotated data. Proceedings of the 26th annual international ACM SIGIR conference on Research and development in informaion retrieval. 2003, 127-134."},{"key":"7159_CR7","first-page":"1981","volume":"9","author":"EM Airoldi","year":"2008","unstructured":"Airoldi EM, Blei DM, Fienberg SE, Xing EP: Mixed Membership Stochastic Blockmodels. J Mach Learn Res. 2008, 9: 1981-2014.","journal-title":"J Mach Learn Res"},{"issue":"2","key":"7159_CR8","doi-asserted-by":"publisher","first-page":"143","DOI":"10.1109\/TCBB.2005.29","volume":"2","author":"S Rogers","year":"2005","unstructured":"Rogers S, Girolami M, Campbell C, Breitling R: The latent process decomposition of cDNA microarray data sets. IEEE\/ACM transactions on computational biology and bioinformatics. 2005, 2 (2): 143-156. 10.1109\/TCBB.2005.29.","journal-title":"IEEE\/ACM transactions on computational biology and bioinformatics"},{"issue":"13","key":"7159_CR9","doi-asserted-by":"publisher","first-page":"i61","DOI":"10.1093\/bioinformatics\/btr249","volume":"27","author":"S Shivashankar","year":"2011","unstructured":"Shivashankar S, Srivathsan S, Ravindran B, Tendulkar AV: Multi-view methods for protein structure comparison using latent dirichlet allocation. Bioinformatics. 2011, 27 (13): i61-i68. 10.1093\/bioinformatics\/btr249.","journal-title":"Bioinformatics"},{"issue":"Suppl 11","key":"7159_CR10","doi-asserted-by":"publisher","first-page":"S11","DOI":"10.1186\/1471-2105-15-S11-S11","volume":"15","author":"W Zhao","year":"2014","unstructured":"Zhao W, Zou W, Chen JJ: Topic modeling for cluster analysis of large biological and medical datasets. BMC Bioinformatics. 2014, 15 (Suppl 11): S11-10.1186\/1471-2105-15-S11-S11.","journal-title":"BMC Bioinformatics"},{"issue":"12","key":"7159_CR11","doi-asserted-by":"publisher","first-page":"i7","DOI":"10.1093\/bioinformatics\/btq220","volume":"26","author":"LP Coelho","year":"2010","unstructured":"Coelho LP, Peng T, Murphy RF: Quantifying the distribution of probes between subcellular locations using unsupervised pattern unmixing. Bioinformatics. 2010, 26 (12): i7-i12. 10.1093\/bioinformatics\/btq220.","journal-title":"Bioinformatics"},{"key":"7159_CR12","volume-title":"Paris, France: WHO Collaborting Centre for Reference and Research on Salmonella","author":"PA Grimont","year":"2007","unstructured":"Grimont PA, Weill FX: Antigenic formulae of the Salmonella serovars. Paris, France: WHO Collaborting Centre for Reference and Research on Salmonella. 2007, 9","edition":"9"},{"key":"7159_CR13","doi-asserted-by":"publisher","first-page":"343","DOI":"10.1038\/msb.2009.98","volume":"6","author":"M Kuhn","year":"2010","unstructured":"Kuhn M, Campillos M, Letunic I, Jensen LJ, Bork P: A side effect resource to capture phenotypic effects of drugs. Mol Syst Biol. 2010, 6: 343-","journal-title":"Mol Syst Biol"},{"key":"7159_CR14","volume-title":"MALLET: A Machine Learning for Language Toolkit","author":"AK McCallun","year":"2002","unstructured":"McCallun AK: MALLET: A Machine Learning for Language Toolkit. 2002, [http:\/\/http:\/\/mallet.cs.umass.edu\/]"},{"issue":"5","key":"7159_CR15","doi-asserted-by":"publisher","first-page":"1792","DOI":"10.1093\/nar\/gkh340","volume":"32","author":"RC Edgar","year":"2004","unstructured":"Edgar RC: MUSCLE: multiple sequence alignment with high accuracy and high throughput. Nucleic Acids Res. 2004, 32 (5): 1792-1797. 10.1093\/nar\/gkh340.","journal-title":"Nucleic Acids Res"},{"issue":"3","key":"7159_CR16","first-page":"379","volume":"27","author":"CE Shannon","year":"1948","unstructured":"Shannon CE: A Mathematical Theory of Communication. At&T Tech J. 1948, 27 (3): 379-423.","journal-title":"At&T Tech J"},{"key":"7159_CR17","doi-asserted-by":"publisher","first-page":"1313","DOI":"10.1145\/1242572.1242826","volume-title":"Proceedings of the 16th international conference on World Wide Web","author":"MJ Halvey","year":"2007","unstructured":"Halvey MJ, Keane MT: An Assessment of Tag Presentation Techniques. Proceedings of the 16th international conference on World Wide Web. 2007, 1313-1314."},{"issue":"3","key":"7159_CR18","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1016\/0378-3758(95)00148-4","volume":"53","author":"L Giraitis","year":"1996","unstructured":"Giraitis L, Leipus R, Surgailis D: The change-point problem for dependent observations. J Stat Plan Infer. 1996, 53 (3): 297-310. 10.1016\/0378-3758(95)00148-4.","journal-title":"J Stat Plan Infer"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-16-S13-S8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-16-S13-S8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-16-S13-S8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,9,2]],"date-time":"2021-09-02T19:39:34Z","timestamp":1630611574000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-16-S13-S8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,12]]},"references-count":18,"journal-issue":{"issue":"S13","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["7159"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-16-s13-s8","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,12]]},"assertion":[{"value":"1 December 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"S8"}}