{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T23:21:23Z","timestamp":1771543283180,"version":"3.50.1"},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2015,3,11]],"date-time":"2015-03-11T00:00:00Z","timestamp":1426032000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Sci. China Inf. Sci."],"published-print":{"date-parts":[[2015,7]]},"DOI":"10.1007\/s11432-014-5267-5","type":"journal-article","created":{"date-parts":[[2015,3,11]],"date-time":"2015-03-11T09:41:34Z","timestamp":1426066894000},"page":"1-15","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["A probabilistic framework for optimizing projected clusters with categorical attributes","\u4f18\u5316\u7c7b\u5c5e\u578b\u6570\u636e\u6295\u5f71\u805a\u7c7b\u7684\u6982\u7387\u6784\u67b6"],"prefix":"10.1007","volume":"58","author":[{"given":"LiFei","family":"Chen","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,3,11]]},"reference":[{"key":"5267_CR1","doi-asserted-by":"crossref","first-page":"61","DOI":"10.1145\/304181.304188","volume":"28","author":"C. C. Aggarwal","year":"1999","unstructured":"Aggarwal C C, Procopiuc C, Wolf J L, et al. Fast algorithm for projected clustering. ACM SIGMOD Rec, 1999, 28: 61\u201372","journal-title":"ACM SIGMOD Rec"},{"key":"5267_CR2","doi-asserted-by":"crossref","first-page":"273","DOI":"10.1007\/s10115-007-0090-6","volume":"14","author":"G. Moise","year":"2008","unstructured":"Moise G, Sander J, Ester M. Robust projected clustering. Knowl Inf Syst, 2008, 14: 273\u2013298","journal-title":"Knowl Inf Syst"},{"key":"5267_CR3","doi-asserted-by":"crossref","first-page":"1291","DOI":"10.1109\/TKDE.2010.256","volume":"24","author":"L. Chen","year":"2012","unstructured":"Chen L, Jiang Q, Wang S. Model-based method for projective clustering. IEEE Trans Knowl Data Eng, 2012, 24: 1291\u20131305","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"5267_CR4","doi-asserted-by":"crossref","first-page":"657","DOI":"10.1109\/TPAMI.2005.95","volume":"27","author":"J. Z. Huang","year":"2005","unstructured":"Huang J Z, Ng M K, Rong H, et al. Automated variable weighting in k-means type clustering. IEEE Trans Patt Anal Mach Intell, 2005, 27: 657\u2013668","journal-title":"IEEE Trans Patt Anal Mach Intell"},{"key":"5267_CR5","first-page":"887","volume-title":"Proceedings of the 27th International Conference on Machine Learning","author":"L. Poon","year":"2010","unstructured":"Poon L, Zhang N, Chen T, et al. Variable selection in model-based clustering: to do or to facilitate. In: Proceedings of the 27th International Conference on Machine Learning, Haifa, 2010. 887\u2013894"},{"key":"5267_CR6","doi-asserted-by":"crossref","first-page":"534","DOI":"10.1080\/01621459.1971.10482297","volume":"66","author":"R. J. Light","year":"1971","unstructured":"Light R J, Marglin B H. An analysis of variance for categorical data. J Am Stat Assoc, 1971, 66: 534\u2013544","journal-title":"J Am Stat Assoc"},{"key":"5267_CR7","first-page":"241","volume":"14","author":"O. M. San","year":"2004","unstructured":"San O M, Huynh V N, Nakamori Y. An alternative extension of the k-means algorithm for clustering categorical data. Int J Appl Math Comput Sci, 2004, 14: 241\u2013247","journal-title":"Int J Appl Math Comput Sci"},{"key":"5267_CR8","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1023\/A:1009769707641","volume":"2","author":"Z. Huang","year":"1998","unstructured":"Huang Z. Extensions to the k-means algorithm for clustering large data sets with categorical value. Data Min Knowl Discov, 1998, 2: 283\u2013304","journal-title":"Data Min Knowl Discov"},{"key":"5267_CR9","doi-asserted-by":"crossref","first-page":"943","DOI":"10.1016\/j.patcog.2003.11.003","volume":"37","author":"E. Y. Chan","year":"2004","unstructured":"Chan E Y, Ching W K, Ng M K, et al. An optimization algorithm for clustering using weighted dissimilarity measures. Patt Recogn, 2004, 37: 943\u2013952","journal-title":"Patt Recogn"},{"key":"5267_CR10","doi-asserted-by":"crossref","first-page":"2843","DOI":"10.1016\/j.patcog.2011.04.024","volume":"44","author":"L. Bai","year":"2011","unstructured":"Bai L, Liang J, Dang C, et al. A novel attribute weighting algorithm for clustering high-dimensional categorical data. Patt Recogn, 2011, 44: 2843\u20132861","journal-title":"Patt Recogn"},{"key":"5267_CR11","doi-asserted-by":"crossref","first-page":"103","DOI":"10.1007\/s10618-011-0221-2","volume":"24","author":"T. Xiong","year":"2012","unstructured":"Xiong T, Wang S, Mayers A, et al. DHCC: divisive hierarchical clustering of categorical data. Data Min Knowl Discov, 2012, 24: 103\u2013135","journal-title":"Data Min Knowl Discov"},{"key":"5267_CR12","first-page":"1260","volume-title":"Proceedings of the 23rd International Joint Conference on Artificial Intelligence","author":"L. Chen","year":"2013","unstructured":"Chen L, Wang S. Central clustering of categorical data with automated feature weighting. In: Proceedings of the 23rd International Joint Conference on Artificial Intelligence, Beijing, 2013. 1260\u20131266"},{"key":"5267_CR13","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1016\/j.neucom.2012.11.009","volume":"108","author":"F. Cao","year":"2013","unstructured":"Cao F, Liang J, Li D, et al. A Weighting k-modes algorithm for subspace clustering of categorical data. Neurocomputing, 2013, 108: 23\u201330","journal-title":"Neurocomputing"},{"key":"5267_CR14","first-page":"243","volume-title":"Proceedings of the 8th SIAM International Conference on Data Mining","author":"S. Boriah","year":"2008","unstructured":"Boriah S, Chandola V, Kumar V. Similarity measures for categorical data: a comparative evaluation. In: Proceedings of the 8th SIAM International Conference on Data Mining, Atlanta, 2008. 243\u2013254"},{"key":"5267_CR15","doi-asserted-by":"crossref","first-page":"90","DOI":"10.1145\/1007730.1007731","volume":"6","author":"L. Parsons","year":"2004","unstructured":"Parsons L, Haque E, Liu H. Subspace clustering for high dimensional data: a review. ACM SIGKDD Explor Newslett, 2004, 6: 90\u2013105","journal-title":"ACM SIGKDD Explor Newslett"},{"key":"5267_CR16","doi-asserted-by":"crossref","first-page":"87","DOI":"10.1145\/1046456.1046468","volume":"6","author":"G. Gan","year":"2004","unstructured":"Gan G, Wu J. Subspace clustering for high dimensional categorical data. ACM SIGKDD Explor Newslett, 2004, 6: 87\u201394","journal-title":"ACM SIGKDD Explor Newslett"},{"key":"5267_CR17","doi-asserted-by":"crossref","first-page":"1509","DOI":"10.1109\/TPAMI.2012.228","volume":"35","author":"L. Bai","year":"2013","unstructured":"Bai L, Liang J, Dang C, et al. The impact of cluster representatives on the convergence of the k-modes type clustering. IEEE Trans Patt Anal Mach Intell, 2013, 35: 1509\u20131522","journal-title":"IEEE Trans Patt Anal Mach Intell"},{"key":"5267_CR18","first-page":"329","volume-title":"Metron Int J Stat","author":"P. K. Sen","year":"2005","unstructured":"Sen P K. Gini diversity index, hamming distance and curse of dimensionality. Metron Int J Stat, 2005, LXIII: 329\u2013349"},{"key":"5267_CR19","doi-asserted-by":"crossref","first-page":"1983","DOI":"10.1007\/s11432-012-4611-x","volume":"55","author":"J. Tao","year":"2012","unstructured":"Tao J, Chung F, Wang S. A kernel learning framework for domain adaptation learning. Sci China Inf Sci, 2012, 55: 1983\u20132007","journal-title":"Sci China Inf Sci"},{"key":"5267_CR20","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1080\/10485250600569002","volume":"18","author":"D. Ouyang","year":"2006","unstructured":"Ouyang D, Li Q, Racine J. Cross-validation and the estimation of probability distributions with categorical data. Nonparametr Stat, 2006, 18: 69\u2013100","journal-title":"Nonparametr Stat"},{"key":"5267_CR21","volume-title":"Nonparametric Econometrics: Theory and Practice.","author":"Q. Li","year":"2007","unstructured":"Li Q, Racine J S. Nonparametric Econometrics: Theory and Practice. Princeton: Princeton University Press, 2007"},{"key":"5267_CR22","doi-asserted-by":"crossref","first-page":"413","DOI":"10.1093\/biomet\/63.3.413","volume":"63","author":"J. Aitchison","year":"1976","unstructured":"Aitchison J, Aitken C. Multivariate binary discrimination by the kernel method. Biometrika, 1976, 63: 413\u2013420","journal-title":"Biometrika"},{"key":"5267_CR23","doi-asserted-by":"crossref","first-page":"1171","DOI":"10.1214\/009053607000000677","volume":"36","author":"T. Hofmann","year":"2008","unstructured":"Hofmann T, Scholkopf B, Smola A J. Kernel methods in machine learning. Ann Stat, 2008, 36: 1171\u20131220","journal-title":"Ann Stat"},{"key":"5267_CR24","doi-asserted-by":"crossref","unstructured":"Zhou K, Fu C, Yang S. Fuzziness parameter selection in fuzzy c-means: the perspective of cluster validation. Sci China Inf Sci, 2014, 57: 112206","DOI":"10.1007\/s11432-014-5146-0"},{"key":"5267_CR25","doi-asserted-by":"crossref","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"A. K. Jain","year":"1999","unstructured":"Jain A K, Murty M N, Flynn P J. Data clustering: a review. ACM Comput Surv, 1999, 31: 264\u2013323","journal-title":"ACM Comput Surv"},{"key":"5267_CR26","first-page":"536","volume-title":"Proceedings of the 21st International Conference on Machine Learning","author":"T. Li","year":"2004","unstructured":"Li T, Ma S, Ogihara M. Entropy-based criterion in categorical clustering. In: Proceedings of the 21st International Conference on Machine Learning, Alberta, 2004. 536\u2013543"},{"key":"5267_CR27","doi-asserted-by":"crossref","first-page":"2040","DOI":"10.1007\/s11432-011-4386-5","volume":"54","author":"K. Wang","year":"2011","unstructured":"Wang K, Yan X, Chen L. Geometric double-entity model for recognizing far-near relations of clusters. Sci China Inf Sci, 2011, 54: 2040\u20132050","journal-title":"Sci China Inf Sci"}],"container-title":["Science China Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-014-5267-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11432-014-5267-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-014-5267-5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T15:38:00Z","timestamp":1559403480000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11432-014-5267-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,3,11]]},"references-count":27,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2015,7]]}},"alternative-id":["5267"],"URL":"https:\/\/doi.org\/10.1007\/s11432-014-5267-5","relation":{},"ISSN":["1674-733X","1869-1919"],"issn-type":[{"value":"1674-733X","type":"print"},{"value":"1869-1919","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,3,11]]}}}