{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2023,10,9]],"date-time":"2023-10-09T10:50:14Z","timestamp":1696848614174},"reference-count":42,"publisher":"Elsevier BV","issue":"22","license":[{"start":{"date-parts":[[2010,11,1]],"date-time":"2010-11-01T00:00:00Z","timestamp":1288569600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Information Sciences"],"published-print":{"date-parts":[[2010,11]]},"DOI":"10.1016\/j.ins.2010.07.028","type":"journal-article","created":{"date-parts":[[2010,8,4]],"date-time":"2010-08-04T04:49:30Z","timestamp":1280897370000},"page":"4353-4369","source":"Crossref","is-referenced-by-count":5,"title":["Validation of overlapping clustering: A random clustering perspective"],"prefix":"10.1016","volume":"180","author":[{"given":"Junjie","family":"Wu","sequence":"first","affiliation":[]},{"given":"Hua","family":"Yuan","sequence":"additional","affiliation":[]},{"given":"Hui","family":"Xiong","sequence":"additional","affiliation":[]},{"given":"Guoqing","family":"Chen","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.ins.2010.07.028_bib1","doi-asserted-by":"crossref","unstructured":"R. Agrawal, T. Imielinski, A. Swami, Mining association rules between sets of items in large databases, in: Proceedings of the 1993 ACM SIGMOD International Conference on Management of Data, May 1993, pp. 207\u2013216.","DOI":"10.1145\/170036.170072"},{"issue":"20","key":"10.1016\/j.ins.2010.07.028_bib2","doi-asserted-by":"crossref","first-page":"3583","DOI":"10.1016\/j.ins.2009.06.012","article-title":"Performance evaluation of density-based clustering methods","volume":"179","author":"Alidguliyev","year":"2009","journal-title":"Information Sciences"},{"key":"10.1016\/j.ins.2010.07.028_bib3","unstructured":"N.O. Andrews, E.A. Fox, Recent Developments in Document Clustering, Technical Report TR-07-35, Computer Science, Virginia Tech, 2007."},{"key":"10.1016\/j.ins.2010.07.028_bib4","unstructured":"R.A. Askey, R. Roy, Beta function. , 2008 (accessed 13.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib5","doi-asserted-by":"crossref","unstructured":"F. Beil, M. Ester, X. Xu, Frequent term-based text clustering, in: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 2002, pp. 436\u2013442.","DOI":"10.1145\/775107.775110"},{"key":"10.1016\/j.ins.2010.07.028_bib6","doi-asserted-by":"crossref","unstructured":"D.R. Cutting, D.R. Karger, J.O. Pedersen, J.W. Tukey, Scatter\/gather: a cluster-based approach to browsing large document collections, in: Proceedings of the 15th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, 1992, pp. 318\u2013329.","DOI":"10.1145\/133160.133214"},{"issue":"2","key":"10.1016\/j.ins.2010.07.028_bib7","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1145\/565117.565124","article-title":"Cluster validity methods: Part I","volume":"31","author":"Halkidi","year":"2002","journal-title":"SIGMOD Record"},{"issue":"3","key":"10.1016\/j.ins.2010.07.028_bib8","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1145\/601858.601862","article-title":"Clustering validity checking methods: Part II","volume":"31","author":"Halkidi","year":"2002","journal-title":"SIGMOD Record"},{"key":"10.1016\/j.ins.2010.07.028_bib9","doi-asserted-by":"crossref","unstructured":"E.-H. Han, D. Boley, M. Gini, R. Gross, K. Hastings, G. Karypis, V. Kumar, B. Mobasher, J. Moore, Webace: a web agent for document categorization and exploration, in: Proceedings of the Second International Conference on Autonomous Agents, 1998.","DOI":"10.1145\/280765.280872"},{"key":"10.1016\/j.ins.2010.07.028_bib10","doi-asserted-by":"crossref","unstructured":"J. Han, J. Pei, Y. Yin, Mining frequent patterns without candidate generation, in: Proceedings of the 2000 ACM SIGMOD International Conference on Management of Data, 2000, pp. 1\u201312.","DOI":"10.1145\/335191.335372"},{"key":"10.1016\/j.ins.2010.07.028_bib11","series-title":"Algorithms for Clustering Data","author":"Jain","year":"1988"},{"key":"10.1016\/j.ins.2010.07.028_bib12","doi-asserted-by":"crossref","first-page":"217","DOI":"10.1016\/0020-0271(71)90051-9","article-title":"The use of hierarchical clustering in information retrieval","volume":"7","author":"Jardine","year":"1971","journal-title":"Information Storage and Retrieval"},{"key":"10.1016\/j.ins.2010.07.028_bib13","doi-asserted-by":"crossref","unstructured":"B. Larsen, C. Aone, Fast and effective text mining using linear-time document clustering, in: Proceedings of the Fifth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 1999, pp. 16\u201322.","DOI":"10.1145\/312129.312186"},{"issue":"23","key":"10.1016\/j.ins.2010.07.028_bib14","doi-asserted-by":"crossref","first-page":"4501","DOI":"10.1016\/j.ins.2008.05.014","article-title":"Clustering high dimensional data: a graph-based relaxed optimization approach","volume":"178","author":"Lee","year":"2008","journal-title":"Information Sciences"},{"key":"10.1016\/j.ins.2010.07.028_bib15","unstructured":"D. Lewis, Reuters-21578. , 2004 (accessed 29.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib16","series-title":"Introduction to Information Retrieval","author":"Manning","year":"2008"},{"key":"10.1016\/j.ins.2010.07.028_bib17","unstructured":"M. Mehlitz, C. Bauckhage, S. Albayrak, Normalizing document cluster evaluation results. , 2007 (accessed 12.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib18","doi-asserted-by":"crossref","unstructured":"M. Mehlitz, C. Bauckhage, J. Kunegis, S. Albayrak, A new evaluation measure for information retrieval systems, in: Proceedings of the 2007 IEEE International Conference on Systems, Man, and Cybernetics, 2007, pp. 1200\u20131204.","DOI":"10.1109\/ICSMC.2007.4413662"},{"key":"10.1016\/j.ins.2010.07.028_bib19","doi-asserted-by":"crossref","unstructured":"M. Meila, Comparing clusterings \u2013 an axiomatic view, in: Proceedings of the 22nd International Conference on Machine Learning, 2005, pp. 577\u2013584.","DOI":"10.1145\/1102351.1102424"},{"issue":"3","key":"10.1016\/j.ins.2010.07.028_bib20","doi-asserted-by":"crossref","first-page":"414","DOI":"10.1016\/j.ins.2009.09.019","article-title":"Towards supporting expert evaluation of clustering results using a data mining process model","volume":"180","author":"Osei-Bryson","year":"2010","journal-title":"Information Sciences"},{"issue":"3","key":"10.1016\/j.ins.2010.07.028_bib21","doi-asserted-by":"crossref","DOI":"10.1108\/eb046814","article-title":"An algorithm for suffix stripping","volume":"14","author":"Porter","year":"1980","journal-title":"Program"},{"key":"10.1016\/j.ins.2010.07.028_bib22","series-title":"Numerical Recipes in C: The Art of Scientific Computing","author":"Press","year":"1992"},{"key":"10.1016\/j.ins.2010.07.028_bib23","series-title":"Introduction To Probability Models","author":"Ross","year":"2007"},{"key":"10.1016\/j.ins.2010.07.028_bib24","unstructured":"M. Steinbach, G. Karypis, V. Kumar, A comparison of document clustering techniques, in: Workshop on Text Mining, The Sixth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 2000."},{"key":"10.1016\/j.ins.2010.07.028_bib25","series-title":"Introduction to Data Mining","author":"Tan","year":"2005"},{"issue":"4","key":"10.1016\/j.ins.2010.07.028_bib26","doi-asserted-by":"crossref","first-page":"559","DOI":"10.1016\/S0306-4573(01)00048-6","article-title":"The effectiveness of query-specific hierarchic clustering in information retrieval","volume":"38","author":"Tombros","year":"2002","journal-title":"Information Processing and Management"},{"key":"10.1016\/j.ins.2010.07.028_bib27","unstructured":"TREC, Text retrieval conference. , 2000 (accessed 16.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib28","series-title":"Information Retrieval","author":"van Rijsbergen","year":"1979"},{"issue":"18","key":"10.1016\/j.ins.2010.07.028_bib29","doi-asserted-by":"crossref","first-page":"3718","DOI":"10.1016\/j.ins.2007.02.045","article-title":"A novel document similarity measure based on earth movers distance","volume":"177","author":"Wan","year":"2007","journal-title":"Information Sciences"},{"key":"10.1016\/j.ins.2010.07.028_bib30","unstructured":"Wikipedia, Beta function \u2013 wikipedia, the free encyclopedia. , 2008 (accessed 13.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib31","unstructured":"Wikipedia, Information retrieval \u2013 wikipedia, the free encyclopedia. , 2008 (accessed 12.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib32","doi-asserted-by":"crossref","unstructured":"J. Wu, H. Xiong, J. Chen, Adapting the right measures for k-means clustering, in: Proceedings of the 15th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 2009, pp. 877\u2013886.","DOI":"10.1145\/1557019.1557115"},{"issue":"3","key":"10.1016\/j.ins.2010.07.028_bib33","doi-asserted-by":"crossref","first-page":"6050","DOI":"10.1016\/j.eswa.2008.06.093","article-title":"External validation measures for k-means clustering: a data distribution perspective","volume":"36","author":"Wu","year":"2009","journal-title":"Expert Systems with Applications"},{"issue":"10\u201312","key":"10.1016\/j.ins.2010.07.028_bib34","doi-asserted-by":"crossref","first-page":"2319","DOI":"10.1016\/j.neucom.2008.12.011","article-title":"Towards understanding hierarchical clustering: a data distribution perspective","volume":"72","author":"Wu","year":"2009","journal-title":"Neurocomputing"},{"key":"10.1016\/j.ins.2010.07.028_bib35","series-title":"Clustering and Information Retrieval","author":"Wu","year":"2003"},{"issue":"2","key":"10.1016\/j.ins.2010.07.028_bib36","doi-asserted-by":"crossref","first-page":"219","DOI":"10.1007\/s10618-006-0043-9","article-title":"Hyperclique pattern discovery","volume":"13","author":"Xiong","year":"2006","journal-title":"Data Mining and Knowledge Discovery"},{"issue":"2","key":"10.1016\/j.ins.2010.07.028_bib37","doi-asserted-by":"crossref","first-page":"318","DOI":"10.1109\/TSMCB.2008.2004559","article-title":"K-means clustering versus validation measures: a data-distribution perspective","volume":"39","author":"Xiong","year":"2009","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics: Part B"},{"key":"10.1016\/j.ins.2010.07.028_bib38","series-title":"Proceedings of the Third IEEE International Conference on Data Mining (ICDM 2003), December 19\u201322","first-page":"387","article-title":"Mining strong affinity association patterns in data sets with skewed support distribution","author":"Xiong","year":"2003"},{"key":"10.1016\/j.ins.2010.07.028_bib39","unstructured":"Yahoo!, Yahoo! home. , 2008 (accessed 29.12.08)."},{"key":"10.1016\/j.ins.2010.07.028_bib40","doi-asserted-by":"crossref","unstructured":"O. Zamir, O. Etzioni, Web document clustering: a feasibility demonstration, in: Proceedings of the 21st Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, 1998, pp. 46\u201354.","DOI":"10.1145\/290941.290956"},{"issue":"3","key":"10.1016\/j.ins.2010.07.028_bib41","doi-asserted-by":"crossref","first-page":"311","DOI":"10.1023\/B:MACH.0000027785.44527.d6","article-title":"Criterion functions for document clustering: experiments and analysis","volume":"55","author":"Zhao","year":"2004","journal-title":"Machine Learning"},{"issue":"13","key":"10.1016\/j.ins.2010.07.028_bib42","doi-asserted-by":"crossref","first-page":"2249","DOI":"10.1016\/j.ins.2009.02.019","article-title":"Exploiting noun phrases and semantic relationships for text document clustering","volume":"179","author":"Zheng","year":"2009","journal-title":"Information Sciences"}],"container-title":["Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0020025510003464?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0020025510003464?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T03:41:05Z","timestamp":1559360465000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0020025510003464"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,11]]},"references-count":42,"journal-issue":{"issue":"22","published-print":{"date-parts":[[2010,11]]}},"alternative-id":["S0020025510003464"],"URL":"http:\/\/dx.doi.org\/10.1016\/j.ins.2010.07.028","relation":{},"ISSN":["0020-0255"],"issn-type":[{"value":"0020-0255","type":"print"}],"subject":["Artificial Intelligence","Information Systems and Management","Computer Science Applications","Theoretical Computer Science","Control and Systems Engineering","Software"],"published":{"date-parts":[[2010,11]]}}}