{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T22:43:30Z","timestamp":1772923410506,"version":"3.50.1"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T00:00:00Z","timestamp":1642377600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T00:00:00Z","timestamp":1642377600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U1805263"],"award-info":[{"award-number":["U1805263"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61772004"],"award-info":[{"award-number":["61772004"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61976053"],"award-info":[{"award-number":["61976053"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100005270","name":"Fujian Provincial Department of Science and Technology","doi-asserted-by":"publisher","award":["2020H0011"],"award-info":[{"award-number":["2020H0011"]}],"id":[{"id":"10.13039\/501100005270","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Soft Comput"],"published-print":{"date-parts":[[2022,2]]},"DOI":"10.1007\/s00500-021-06600-9","type":"journal-article","created":{"date-parts":[[2022,1,16]],"date-time":"2022-01-16T19:03:47Z","timestamp":1642359827000},"page":"1249-1259","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Kernel-based data transformation model for nonlinear classification of symbolic data"],"prefix":"10.1007","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7820-8766","authenticated-orcid":false,"given":"Xuanhui","family":"Yan","sequence":"first","affiliation":[]},{"given":"Lifei","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Gongde","family":"Guo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,1,17]]},"reference":[{"key":"6600_CR1","volume-title":"An introduction to categorical data analysis","author":"A Agresti","year":"2008","unstructured":"Agresti A (2008) An introduction to categorical data analysis. Wiley, New York"},{"issue":"3","key":"6600_CR2","doi-asserted-by":"publisher","first-page":"413","DOI":"10.1093\/biomet\/63.3.413","volume":"63","author":"J Aitchison","year":"1976","unstructured":"Aitchison J, Aitken CGG (1976) Multivariate binary discrimination by the kernel method. Biometrika 63(3):413\u2013420","journal-title":"Biometrika"},{"key":"6600_CR3","first-page":"1","volume":"20","author":"MZ Alaya","year":"2017","unstructured":"Alaya MZ, Bussy S, Gaiffas S, Guilloux A (2017) Binarsity: a penalization for one-hot encoded features. J Machine Learn Res 20:1\u201334","journal-title":"J Machine Learn Res"},{"key":"6600_CR4","doi-asserted-by":"crossref","unstructured":"Boriah S, Chandola V, Kumar V (2008). Similarity measures for categorical data: a comparative evaluation. In: Proceedings of the 8th SIAM international conference on data mining, pp 243\u2013254","DOI":"10.1137\/1.9781611972788.22"},{"issue":"1","key":"6600_CR5","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Machine Learn 45(1):5\u201332","journal-title":"Machine Learn"},{"issue":"2","key":"6600_CR6","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1111\/1467-842X.00219","volume":"44","author":"AP Bremner","year":"2002","unstructured":"Bremner AP, Taplin RH (2002) Theory & methods: modified classification and regression tree splitting criteria for data with interactions. Aust & N. Z. J Stat 44(2):169\u2013176","journal-title":"Aust & N. Z. J Stat"},{"issue":"2","key":"6600_CR7","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1016\/S0167-9473(98)00032-2","volume":"28","author":"SE Buttrey","year":"1998","unstructured":"Buttrey SE (1998) Nearest-neighbor classification with categorical variables. Comput Stat Data Anal 28(2):157\u2013169","journal-title":"Comput Stat Data Anal"},{"issue":"22","key":"6600_CR8","doi-asserted-by":"publisher","first-page":"17187","DOI":"10.1007\/s00500-020-05011-6","volume":"24","author":"JP Casquilho","year":"2020","unstructured":"Casquilho JP (2020) On the weighted gini-simpson index: estimating feasible weights using the optimal point and discussing a link with possibility theory. Soft Comput 24(22):17187\u201317194","journal-title":"Soft Comput"},{"issue":"8\u201310","key":"6600_CR9","doi-asserted-by":"publisher","first-page":"1477","DOI":"10.1007\/s10994-018-5724-2","volume":"107","author":"P Cerda","year":"2018","unstructured":"Cerda P, Varoquaux G, K\u00e9gl B (2018) Similarity encoding for learning with dirty categorical variables. Machine Learn 107(8\u201310):1477\u20131494","journal-title":"Machine Learn"},{"issue":"6","key":"6600_CR10","doi-asserted-by":"publisher","first-page":"3142","DOI":"10.1016\/j.eswa.2014.12.002","volume":"42","author":"L Chen","year":"2015","unstructured":"Chen L, Guo G (2015) Nearest neighbor classification of categorical data by attributes weighting. Expert Syst Appl 42(6):3142\u20133149","journal-title":"Expert Syst Appl"},{"issue":"8","key":"6600_CR11","doi-asserted-by":"publisher","first-page":"2981","DOI":"10.1007\/s00500-015-1926-8","volume":"20","author":"L Chen","year":"2016","unstructured":"Chen L, Ye Y, Guo G, Zhu J (2016) Kernel-based linear classification on categorical data. Soft Comput 20(8):2981\u20132993","journal-title":"Soft Comput"},{"key":"6600_CR12","doi-asserted-by":"publisher","first-page":"322","DOI":"10.1016\/j.patcog.2015.09.027","volume":"51","author":"L Chen","year":"2016","unstructured":"Chen L, Wang S, Wang K, Zhu J (2016) Soft subspace clustering of categorical data with probabilistic distance. Pattern Recognit 51:322\u2013332","journal-title":"Pattern Recognit"},{"key":"6600_CR13","doi-asserted-by":"publisher","first-page":"325","DOI":"10.1016\/j.neucom.2019.07.069","volume":"365","author":"L Cheng","year":"2019","unstructured":"Cheng L, Wang Y, Ma X (2019) A neural probabilistic outlier detection method for categorical data. Neurocomputing 365:325\u2013335","journal-title":"Neurocomputing"},{"key":"6600_CR14","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016). XGBoost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining (KDD\u201916), pp 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"6600_CR15","doi-asserted-by":"crossref","unstructured":"Chen L, Guo G, Wang S, Kong X (2014b). Kernel learning method for distance-based classification of categorical data. In: Proceedings of the 14th UK workshop on computational intelligence (UKCI\u201914), pp 58\u201363","DOI":"10.1109\/UKCI.2014.6930159"},{"key":"6600_CR16","unstructured":"Chen L, Wang S (2013). Central clustering of categorical data with automated feature weighting. In: Proceedings of the 23th international joint conference on artificial intelligence (IJCAI\u201913), pp 1260\u20131266"},{"key":"6600_CR17","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes C, Vapnik V (1995) Support-vector networks. Machine Learn 20:273\u2013297","journal-title":"Machine Learn"},{"issue":"8","key":"6600_CR18","doi-asserted-by":"publisher","first-page":"1181","DOI":"10.1007\/s10851-018-0804-2","volume":"60","author":"G Deng","year":"2018","unstructured":"Deng G, Manton JH, Wang S (2018) Fast kernel smoothing by a low-rank approximation of the kernel toeplitz matrix. J Math Imaging Vis 60(8):1181\u20131195","journal-title":"J Math Imaging Vis"},{"issue":"3","key":"6600_CR19","doi-asserted-by":"publisher","first-page":"1247","DOI":"10.1016\/j.eswa.2014.09.012","volume":"42","author":"TRL Dos Santos","year":"2015","unstructured":"Dos Santos TRL, Z\u00e1rate LE (2015) Categorical data clustering: What similarity measure to recommend? Expert Syst Appl 42(3):1247\u20131260","journal-title":"Expert Syst Appl"},{"key":"6600_CR20","volume-title":"Kernel smoothing principles","author":"S Ghosh","year":"2018","unstructured":"Ghosh S (2018) Kernel smoothing principles. Wiley, Hoboken"},{"issue":"5","key":"6600_CR21","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1016\/S0306-4379(00)00022-3","volume":"25","author":"S Guha","year":"2000","unstructured":"Guha S, Rastogi R, Shim K (2000) ROCK: a robust clustering algorithm for categorical attributes. Inform Syst 25(5):345\u2013366","journal-title":"Inform Syst"},{"key":"6600_CR22","doi-asserted-by":"crossref","unstructured":"Han E, Karypis G (2000). Centroid-based document classification: analysis & experimental results. In: Proceedings of the 4th European conference on principles and practice of knowledge discovery in databases (PKDD\u201900), pp 424\u2013431","DOI":"10.1007\/3-540-45372-5_46"},{"issue":"2","key":"6600_CR23","doi-asserted-by":"publisher","first-page":"223","DOI":"10.1016\/j.inffus.2006.05.006","volume":"9","author":"Z He","year":"2008","unstructured":"He Z, Xu X, Deng S (2008) K-ANMI: a mutual information based clustering algorithm for categorical data. Inform Fusion 9(2):223\u2013233","journal-title":"Inform Fusion"},{"issue":"3","key":"6600_CR24","doi-asserted-by":"publisher","first-page":"1171","DOI":"10.1214\/009053607000000677","volume":"36","author":"T Hofmann","year":"2008","unstructured":"Hofmann T, Sch\u00f6lkopf B, Smola AJ (2008) Kernel methods in machine learning. Ann Stat 36(3):1171\u20131220","journal-title":"Ann Stat"},{"issue":"3","key":"6600_CR25","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1023\/A:1009769707641","volume":"2","author":"Z Huang","year":"1998","unstructured":"Huang Z (1998) Extensions to the K-means algorithm for clustering large data sets with categorical values. Data Mining Knowl Discovery 2(3):283\u2013304","journal-title":"Data Mining Knowl Discovery"},{"issue":"5","key":"6600_CR26","doi-asserted-by":"publisher","first-page":"657","DOI":"10.1109\/TPAMI.2005.95","volume":"27","author":"JZ Huang","year":"2005","unstructured":"Huang JZ, Ng MK, Rong H, Li Z (2005) Automated variable weighting in K-means type clustering. IEEE Trans Pattern Anal Machine Intell 27(5):657\u2013668","journal-title":"IEEE Trans Pattern Anal Machine Intell"},{"key":"6600_CR27","doi-asserted-by":"crossref","unstructured":"Jin W, Li ZJ, Wei LS, Zhen H (2000). The improvements of BP neural network learning algorithm. In: Proceedings of the 5th international conference on signal processing, pp 1647\u20131649","DOI":"10.1109\/ICOSP.2000.893417"},{"issue":"1","key":"6600_CR28","first-page":"643","volume":"13","author":"H Larochelle","year":"2012","unstructured":"Larochelle H, Mandel M, Pascanu R, Bengio Y (2012) Learning algorithms for the classification restricted boltzmann machine. J Machine Learn Res 13(1):643\u2013669","journal-title":"J Machine Learn Res"},{"key":"6600_CR29","volume-title":"Nonparametric econometrics: theory and practice","author":"Q Li","year":"2007","unstructured":"Li Q, Racine JS (2007) Nonparametric econometrics: theory and practice. Princeton University Press, Princeton"},{"key":"6600_CR30","unstructured":"Mikolov T, Chen K, Corrado G, Dean J (2013). Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781"},{"issue":"1","key":"6600_CR31","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1080\/10485250600569002","volume":"18","author":"D Ouyang","year":"2006","unstructured":"Ouyang D, Li Q, Racine JS (2006) Cross-validation and the estimation of probability distributions with categorical data. J Nonparametric Stat 18(1):69\u2013100","journal-title":"J Nonparametric Stat"},{"issue":"10","key":"6600_CR32","doi-asserted-by":"publisher","first-page":"2047","DOI":"10.1109\/TNNLS.2015.2451151","volume":"27","author":"Y Qian","year":"2016","unstructured":"Qian Y, Li F, Liang J, Liu B, Dang C (2016) Space structure and clustering of categorical data. IEEE Trans Neural Netw Learn Syst 27(10):2047\u20132059","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"6600_CR33","unstructured":"Quinlan J (1995). C4.5: Programms for machine learning. Morgan Kaufmann Publishers Inc"},{"key":"6600_CR34","doi-asserted-by":"publisher","first-page":"2323","DOI":"10.1126\/science.290.5500.2323","volume":"290","author":"S Roweis","year":"2000","unstructured":"Roweis S, Saul L (2000) Nonlinear dimensionality reduction by locally linear embedding. Science 290:2323","journal-title":"Science"},{"key":"6600_CR35","doi-asserted-by":"publisher","DOI":"10.1002\/9780470316849","volume-title":"Multivariate density estimation: theory, practice, and visualization","author":"DW Scott","year":"1992","unstructured":"Scott DW (1992) Multivariate density estimation: theory, practice, and visualization. Wiley, New York"},{"key":"6600_CR36","unstructured":"Seeger M (2006). Bayesian modeling in machine learning: a tutorial review. Tutorial, Saarland University. http:\/\/lapmal.epfl.ch\/papers\/bayes-review"},{"issue":"4","key":"6600_CR37","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1214\/aos\/1176346792","volume":"12","author":"CJ Stone","year":"1984","unstructured":"Stone CJ (1984) An asymptotically optimal window selection rule for kernel density estimates. Ann Stat 12(4):1285-1297","journal-title":"Ann Stat"},{"key":"6600_CR38","doi-asserted-by":"crossref","unstructured":"Vo KT, Sowmya A (2010). Multiple kernel learning for classification of diffuse lung disease using HRCT lung images. In: Proceedings of the 2010 annual international conference of the IEEE engineering in medicine and biology, pp 3085\u20133088","DOI":"10.1109\/IEMBS.2010.5626113"},{"key":"6600_CR39","doi-asserted-by":"crossref","unstructured":"Wang MQ, Yue XD, Gao C, Chen Y (2018). Feature selection ensemble for symbolic data classification with AHP. In: Proceedings of the 24th international conference on pattern recognition (ICPR\u201908), pp 868\u2013873","DOI":"10.1109\/ICPR.2018.8546098"},{"key":"6600_CR40","doi-asserted-by":"publisher","first-page":"107050","DOI":"10.1016\/j.patcog.2019.107050","volume":"99","author":"Z Wang","year":"2020","unstructured":"Wang Z, Zhu Z, Li D (2020) Collaborative and geometric multi-kernel learning for multi-class classification. Pattern Recognit 99:107050","journal-title":"Pattern Recognit"},{"key":"6600_CR41","doi-asserted-by":"crossref","unstructured":"Wang R, Li Z, Cao J, Chen T, Wang L (2019). Convolutional recurrent neural networks for text classification. In: Proceedings of the 2019 international joint conference on neural networks (IJCNN), pp 1\u20136","DOI":"10.1109\/IJCNN.2019.8852406"},{"key":"6600_CR42","doi-asserted-by":"crossref","unstructured":"Wang D, Tanaka T (2016). Sparse kernel principal component analysis based on elastic net regularization. In: Proceedings of the 2016 international joint conference on neural networks (IJCNN), pp 3703\u20133708","DOI":"10.1109\/IJCNN.2016.7727676"},{"issue":"5","key":"6600_CR43","doi-asserted-by":"publisher","first-page":"1032","DOI":"10.1007\/s11704-018-7186-x","volume":"12","author":"X Yan","year":"2018","unstructured":"Yan X, Chen L, Guo G (2018) Center-based clustering of categorical data using kernel smoothing methods. Front Computer Sci 12(5):1032\u20131034","journal-title":"Front Computer Sci"},{"key":"6600_CR44","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1016\/j.knosys.2013.05.013","volume":"49","author":"J Zhang","year":"2013","unstructured":"Zhang J, Chen L, Guo G (2013) Projected-prototype-based classifier for text categorization. Knowl Based Syst 49:179\u2013189","journal-title":"Knowl Based Syst"},{"key":"6600_CR45","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1016\/j.neunet.2014.05.014","volume":"57","author":"S Zhong","year":"2014","unstructured":"Zhong S, Chen T, He F, Niu Y (2014) Fast gaussian kernel learning for classification tasks based on specially structured global optimization. Neural Netw 57:51\u201362","journal-title":"Neural Netw"},{"issue":"19","key":"6600_CR46","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1016\/j.neucom.2015.09.127","volume":"198","author":"J Zhou","year":"2016","unstructured":"Zhou J, Chen L, Chen CLP, Zhang Y, Li HX (2016) Fuzzy clustering with the entropy of attribute weights. Neurocomputing 198(19):125\u2013134","journal-title":"Neurocomputing"},{"key":"6600_CR47","doi-asserted-by":"publisher","first-page":"230","DOI":"10.1016\/j.eswa.2017.12.013","volume":"96","author":"S Zhu","year":"2018","unstructured":"Zhu S, Xu L (2018) Many-objective fuzzy centroids clustering algorithm for categorical data. Expert Syst Appl 96:230\u2013248","journal-title":"Expert Syst Appl"}],"container-title":["Soft Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-021-06600-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00500-021-06600-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-021-06600-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,24]],"date-time":"2022-01-24T11:22:16Z","timestamp":1643023336000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00500-021-06600-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,1,17]]},"references-count":47,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2022,2]]}},"alternative-id":["6600"],"URL":"https:\/\/doi.org\/10.1007\/s00500-021-06600-9","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-996277\/v1","asserted-by":"object"}]},"ISSN":["1432-7643","1433-7479"],"issn-type":[{"value":"1432-7643","type":"print"},{"value":"1433-7479","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,1,17]]},"assertion":[{"value":"19 November 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 January 2022","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}