{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,23]],"date-time":"2026-02-23T23:44:17Z","timestamp":1771890257362,"version":"3.50.1"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2017,9,7]],"date-time":"2017-09-07T00:00:00Z","timestamp":1504742400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100004608","name":"Natural Science Foundation of Jiangsu Province","doi-asserted-by":"publisher","award":["BK20170513"],"award-info":[{"award-number":["BK20170513"]}],"id":[{"id":"10.13039\/501100004608","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61402203"],"award-info":[{"award-number":["61402203"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2018,7]]},"DOI":"10.1007\/s10489-017-1055-4","type":"journal-article","created":{"date-parts":[[2017,9,7]],"date-time":"2017-09-07T11:55:18Z","timestamp":1504785318000},"page":"1802-1812","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":33,"title":["Short text clustering based on Pitman-Yor process mixture model"],"prefix":"10.1007","volume":"48","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5721-0293","authenticated-orcid":false,"given":"Jipeng","family":"Qiang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yun","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunhao","family":"Yuan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xindong","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,9,7]]},"reference":[{"key":"1055_CR1","unstructured":"Anastasiu D, Tagarelli A, Karypis G (2013) Document clustering: The next frontier. Technical report, University of Minnesota"},{"key":"1055_CR2","unstructured":"Andrews N, Fox E (2007) Recent developments in document clustering. Technical report, Computer Science, Virginia Tech"},{"key":"1055_CR3","first-page":"993","volume":"3","author":"D Blei","year":"2003","unstructured":"Blei D, Ng N, Jordan M (2003) Latent dirichlet allocation. J Mach Learn Res 3:993\u20131022","journal-title":"J Mach Learn Res"},{"key":"1055_CR4","unstructured":"Catherine F, Coke R, Zhang R, Ye X, Radev D (2016) Effects of creativity and cluster tightness on short text clustering performance. In: Proceedings of the 54th annual meeting of the association for computational linguistics. Berlin, Germany, pp 654\u2013665"},{"issue":"3","key":"1055_CR5","doi-asserted-by":"crossref","first-page":"751","DOI":"10.1007\/s10115-016-0952-x","volume":"50","author":"B El Ghali","year":"2017","unstructured":"El Ghali B, El Qadi A (2017) Context-aware query expansion method using language models and latent semantic analyses. Knowl Inf Syst 50(3):751\u201362","journal-title":"Knowl Inf Syst"},{"key":"1055_CR6","unstructured":"Ester M, Kriegel HP, Sander J, Xu X (1996) A density-based algorithm for discovering clusters in large spatial databases with noise. In: Kdd, pp 226\u2013231"},{"key":"1055_CR7","doi-asserted-by":"crossref","unstructured":"Frey B, Dueck D (2007) Clustering by passing messages between data points Science, vol 315, pp 972\u2013976","DOI":"10.1126\/science.1136800"},{"key":"1055_CR8","doi-asserted-by":"crossref","unstructured":"Griffiths T, Steyvers M (2004) Finding scientific topics. In: Proceedings of the National Academy of Sciences, pp 5228\u20135235","DOI":"10.1073\/pnas.0307752101"},{"issue":"9","key":"1055_CR9","doi-asserted-by":"crossref","first-page":"3637","DOI":"10.1109\/TSP.2006.879282","volume":"54","author":"AB Hamza","year":"2006","unstructured":"Hamza AB, Brady DJ (2006) Reconstruction of reflectance spectra using robust nonnegative matrix factorization. IEEE Trans Signal Process 54(9):3637\u201342","journal-title":"IEEE Trans Signal Process"},{"key":"1055_CR10","volume-title":"Data mining: concepts and techniques: concepts and techniques","author":"J Han","year":"2011","unstructured":"Han J, Kamber M, Pei J (2011) Data mining: concepts and techniques: concepts and techniques. Elsevier, Amsterdam"},{"key":"1055_CR11","doi-asserted-by":"crossref","unstructured":"Hofmann T (1999) Probabilistic latent semantic indexing. In: SIGIR, pp 50\u201357","DOI":"10.1145\/312624.312649"},{"key":"1055_CR12","doi-asserted-by":"crossref","unstructured":"Huang R, Yu G, Wang Z, Zhang J, Shi L (2013) Dirichlet process mixture model for document clustering with feature partition. In: IEEE Transactions on knowledge and data engineering, vol 25, pp 1748\u20131759","DOI":"10.1109\/TKDE.2012.27"},{"key":"1055_CR13","doi-asserted-by":"crossref","unstructured":"Hubert L, Arabie P (1985) Comparing partitions. In: Journal of classification, vol 2, pp 193\u2013218","DOI":"10.1007\/BF01908075"},{"key":"1055_CR14","doi-asserted-by":"crossref","unstructured":"Jain A (2010) Data clustering: 50 years beyond k-means. In: Pattern recognition letters, vol 31, pp 651\u2013666","DOI":"10.1016\/j.patrec.2009.09.011"},{"key":"1055_CR15","unstructured":"Lau L, Collier N, Baldwin T (2012) On-line trend analysis with topic models: twitter trends detection topic model online. In: COLING, pp 1519\u20131534"},{"key":"1055_CR16","unstructured":"Lee D, Seung S (2001) Algorithms for non-negative matrix factorization. In: NIPS, pp 556\u2013562"},{"key":"1055_CR17","doi-asserted-by":"crossref","unstructured":"Liang S, Yilmaz E, Kanoulas E (2016) Dynamic clustering of streaming short documents. In: SIGKDD, pp 995\u20131004","DOI":"10.1145\/2939672.2939748"},{"issue":"2","key":"1055_CR18","doi-asserted-by":"crossref","first-page":"178","DOI":"10.1007\/s10791-010-9141-9","volume":"14","author":"Y Lu","year":"2011","unstructured":"Lu Y, Mei Q, Zhai C (2011) Investigating task performance of probabilistic topic models: an empirical study of PLSA and LDA. Inf Retr 14(2):178\u2013203","journal-title":"Inf Retr"},{"issue":"1","key":"1055_CR19","doi-asserted-by":"crossref","first-page":"27","DOI":"10.1007\/s10115-016-0930-3","volume":"50","author":"A Mojahed","year":"2017","unstructured":"Mojahed A, de la Iglesia B (2017) An adaptive version of k-medoids to deal with the uncertainty in clustering heterogeneous data using an intermediary fusion approach. Knowl Inf Syst 50(1):27\u201352","journal-title":"Knowl Inf Syst"},{"key":"1055_CR20","unstructured":"Vinh NX, Epps J, Bailey J (2010) Information theoretic measures for clusterings comparison: variants, properties, normalization and correction for chance. In: Journal of machine learning research, vol 11, pp 2837\u20132854"},{"key":"1055_CR21","doi-asserted-by":"crossref","unstructured":"Nigam K, McCallum AK, Thrun S, Mitchell T (2000) Text classification from labeled and unlabeled documents using EM. In: Machine learning, vol 39, pp 103\u2013134","DOI":"10.1023\/A:1007692713085"},{"issue":"3","key":"1055_CR22","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s10115-017-1031-7","volume":"52","author":"CF Olson","year":"2017","unstructured":"Olson CF, Hunn DC, Lyons HJ (2017) Efficient Monte Carlo clustering in subspaces. Knowl Inf Syst 52(3):1\u201322","journal-title":"Knowl Inf Syst"},{"key":"1055_CR23","unstructured":"Quan X, Kit C, Ge Y, Pan SJ (2015) Short and sparse text topic modeling via self-aggregation. In: AAAI, pp 2270\u20132276"},{"key":"1055_CR24","unstructured":"Gaussian RD (2009) Mixture models. Encyclopedia of Biometrics pp 659\u2013663"},{"issue":"2","key":"1055_CR25","doi-asserted-by":"crossref","first-page":"543","DOI":"10.1007\/s10115-016-0946-8","volume":"50","author":"F Ros","year":"2017","unstructured":"Ros F, Guillaume S (2017) DIDES: A fast and effective sampling for clustering algorithm. Knowl Inf Syst 50(2):543\u201368","journal-title":"Knowl Inf Syst"},{"key":"1055_CR26","unstructured":"Rosenberg A, Hirschberg J V-measure: A conditional entropy-based external cluster evaluation measure. In: AAAI, pp 410\u2013420"},{"issue":"2","key":"1055_CR27","doi-asserted-by":"crossref","first-page":"487","DOI":"10.1007\/s10489-014-0526-0","volume":"41","author":"CY Sang","year":"2014","unstructured":"Sang CY, Sun DH (2014) Co-clustering over multiple dynamic data streams based on non-negative matrix factorization. Appl Intell 41(2):487\u2013502","journal-title":"Appl Intell"},{"key":"1055_CR28","doi-asserted-by":"crossref","unstructured":"Sato I, Nakagawa H (2010) Topic models with power-law using Pitman-Yor process. In: SIGKDD, pp 673\u2013682","DOI":"10.1145\/1835804.1835890"},{"issue":"3","key":"1055_CR29","doi-asserted-by":"crossref","first-page":"941","DOI":"10.1007\/s10115-016-0996-y","volume":"51","author":"L Sun","year":"2017","unstructured":"Sun L, Guo C, Liu C, Xiong H (2017) Fast affinity propagation clustering based on incomplete similarity matrix. Knowl Inf Syst 51(3):941\u201363","journal-title":"Knowl Inf Syst"},{"issue":"476","key":"1055_CR30","first-page":"280","volume":"101","author":"YW Teh","year":"2006","unstructured":"Teh YW, Jordan M, Beal M, Blei D (2006) Hierarchical Dirichlet process. J Am Stat Assoc 101(476):280\u2013287","journal-title":"J Am Stat Assoc"},{"key":"1055_CR31","doi-asserted-by":"crossref","unstructured":"Teh YW (2011) Dirichlet process. In: Encyclopedia of machine learning. Springer, pp 280\u2013287","DOI":"10.1007\/978-0-387-30164-8_219"},{"key":"1055_CR32","doi-asserted-by":"crossref","unstructured":"Wu X, Kumar V, Quinlan JR, Ghosh J, Yang Q, Motoda H, McLachlan GJ, Ng A, Liu B, Philip SY, Zhou ZH (2008) Top 10 algorithms in data mining. In: Knowledge and Information Systems, vol 14, pp 1\u201337","DOI":"10.1007\/s10115-007-0114-2"},{"key":"1055_CR33","doi-asserted-by":"crossref","unstructured":"Yin J, Wang J (2014) A dirichlet multinomial mixture model-based approach for short text clustering. In: SIGKDD, pp 233\u2013 242","DOI":"10.1145\/2623330.2623715"},{"key":"1055_CR34","doi-asserted-by":"crossref","unstructured":"Yin J, Wang J (2016) A text clustering algorithm using an online clustering scheme for initialization. In: SIGKDD, pp 1995\u20132004","DOI":"10.1145\/2939672.2939841"},{"key":"1055_CR35","doi-asserted-by":"crossref","unstructured":"Yu G, Huang R, Wang Z (2010) Document clustering via dirichlet process mixture model with feature selection. In: SIGKDD, pp 763\u2013772","DOI":"10.1145\/1835804.1835901"},{"key":"1055_CR36","doi-asserted-by":"crossref","unstructured":"Zhao Y, Karypis G (2004) Empirical and theoretical comparisons of selected criterion functions for document clustering. In: Machine learning, vol 55, pp 311\u2013331","DOI":"10.1023\/B:MACH.0000027785.44527.d6"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10489-017-1055-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-1055-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-1055-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,26]],"date-time":"2024-06-26T19:35:23Z","timestamp":1719430523000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10489-017-1055-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,9,7]]},"references-count":36,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2018,7]]}},"alternative-id":["1055"],"URL":"https:\/\/doi.org\/10.1007\/s10489-017-1055-4","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,9,7]]}}}