{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T13:22:41Z","timestamp":1743081761547,"version":"3.40.3"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319754284"},{"type":"electronic","value":"9783319754291"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-75429-1_10","type":"book-chapter","created":{"date-parts":[[2018,2,3]],"date-time":"2018-02-03T10:33:11Z","timestamp":1517653991000},"page":"114-125","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A New Context-Based Similarity Measure for Categorical Data Using Information Theory"],"prefix":"10.1007","author":[{"given":"Thanh-Phu","family":"Nguyen","sequence":"first","affiliation":[]},{"given":"Mina","family":"Ryoke","sequence":"additional","affiliation":[]},{"given":"Van-Nam","family":"Huynh","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,2,4]]},"reference":[{"key":"10_CR1","volume-title":"Applied Multiple Regression\/Correlation Analysis for the Behavioral Sciences","author":"J Cohen","year":"1983","unstructured":"Cohen, J., Cohen, P.: Applied Multiple Regression\/Correlation Analysis for the Behavioral Sciences. L. Erlbaum Associates, Hillsdale (1983)"},{"issue":"4","key":"10_CR2","doi-asserted-by":"publisher","first-page":"882","DOI":"10.2307\/2528080","volume":"22","author":"DW Goodall","year":"1966","unstructured":"Goodall, D.W.: A new similarity index based on probability. Biometrics 22(4), 882\u2013907 (1966)","journal-title":"Biometrics"},{"key":"10_CR3","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"251","DOI":"10.1007\/978-3-319-23528-8_16","volume-title":"Machine Learning and Knowledge Discovery in Databases","author":"M Ring","year":"2015","unstructured":"Ring, M., Otto, F., Becker, M., Niebler, T., Landes, D., Hotho, A.: ConDist: a context-driven categorical distance measure. In: Appice, A., Rodrigues, P.P., Santos Costa, V., Soares, C., Gama, J., Jorge, A. (eds.) ECML PKDD 2015. LNCS (LNAI), vol. 9284, pp. 251\u2013266. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-23528-8_16"},{"key":"10_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1007\/978-3-319-30024-5_7","volume-title":"Foundations of Information and Knowledge Systems","author":"T-HT Nguyen","year":"2016","unstructured":"Nguyen, T.-H.T., Huynh, V.-N.: A k-means-like algorithm for clustering categorical data using an information theoretic-based dissimilarity measure. In: Gyssens, M., Simari, G. (eds.) FoIKS 2016. LNCS, vol. 9616, pp. 115\u2013130. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-30024-5_7"},{"key":"10_CR5","volume-title":"Principles of Numerical Taxonomy","author":"RR Sokal","year":"1961","unstructured":"Sokal, R.R., Sneath, P.H.A.: Principles of Numerical Taxonomy. W. H. Freeman, San Francisco (1961)"},{"issue":"12","key":"10_CR6","doi-asserted-by":"publisher","first-page":"1213","DOI":"10.1145\/7902.7906","volume":"29","author":"C Stanfill","year":"1986","unstructured":"Stanfill, C., Waltz, D.: Toward memory-based reasoning. Commun. ACM 29(12), 1213\u20131228 (1986)","journal-title":"Commun. ACM"},{"key":"10_CR7","doi-asserted-by":"crossref","unstructured":"Boriah, S., Chandola, V., Kumar, V.: Similarity measures for categorical data: a comparative evaluation. In: Proceedings of the 2008 SIAM International Conference on Data Mining, pp. 243\u2013254 (2008)","DOI":"10.1137\/1.9781611972788.22"},{"issue":"12","key":"10_CR8","first-page":"47","volume":"17","author":"P Gambaryan","year":"1964","unstructured":"Gambaryan, P.: A mathematical model of taxonomy. SSR 17(12), 47\u201353 (1964)","journal-title":"SSR"},{"key":"10_CR9","doi-asserted-by":"crossref","unstructured":"Eskin, E., Arnold, A., Prerau, M., Portnoy, L., Stolfo, S.: A geometric framework for unsupervised anomaly detection: detecting intrusions in unlabeled data. In: Applications of Data Mining in Computer Security. Kluwer (2002)","DOI":"10.1007\/978-1-4615-0953-0_4"},{"issue":"1","key":"10_CR10","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1007\/BF02332078","volume":"2","author":"TP Burnaby","year":"1970","unstructured":"Burnaby, T.P.: On a method for character weighting a similarity coefficient, employing the concept of information. J. Int. Assoc. Math. Geol. 2(1), 25\u201338 (1970)","journal-title":"J. Int. Assoc. Math. Geol."},{"key":"10_CR11","unstructured":"Lin, D.: An information-theoretic definition of similarity. In: Proceedings of the 15th International Conference on Machine Learning, pp. 296\u2013304. Morgan Kaufmann (1998)"},{"issue":"1","key":"10_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2307\/2412390","volume":"17","author":"ES Smirnov","year":"1968","unstructured":"Smirnov, E.S.: On exact methods in systematics. Syst. Zool. 17(1), 1\u201313 (1968)","journal-title":"Syst. Zool."},{"key":"10_CR13","volume-title":"Cluster Analysis for Applications","author":"MR Anderberg","year":"1973","unstructured":"Anderberg, M.R.: Cluster Analysis for Applications. Academic Press, New York (1973)"},{"key":"10_CR14","doi-asserted-by":"crossref","unstructured":"Alamuri, M., Surampudi, B.R., Negi, A.: A survey of distance\/similarity measures for categorical data. In: 2014 International Joint Conference on Neural Networks (IJCNN), pp. 1907\u20131914, July 2014","DOI":"10.1109\/IJCNN.2014.6889941"},{"issue":"16","key":"10_CR15","doi-asserted-by":"publisher","first-page":"2549","DOI":"10.1016\/j.patrec.2005.06.002","volume":"26","author":"SQ Le","year":"2005","unstructured":"Le, S.Q., Ho, T.B.: An association-based dissimilarity measure for categorical data. Pattern Recogn. Lett. 26(16), 2549\u20132557 (2005)","journal-title":"Pattern Recogn. Lett."},{"issue":"1","key":"10_CR16","doi-asserted-by":"publisher","first-page":"1:1","DOI":"10.1145\/2133360.2133361","volume":"6","author":"D Ienco","year":"2012","unstructured":"Ienco, D., Pensa, R.G., Meo, R.: From context to distance: learning dissimilarity for categorical data clustering. ACM Trans. Knowl. Discov. Data 6(1), 1:1\u20131:25 (2012)","journal-title":"ACM Trans. Knowl. Discov. Data"},{"key":"10_CR17","doi-asserted-by":"crossref","unstructured":"Khorshidpour, Z., Hashemi, S., Hamzeh, A.: Distance learning for categorical attribute based on context information. In: 2010 2nd International Conference on Software Technology and Engineering, vol. 2, pp. V2-296\u2013V2-300, October 2010","DOI":"10.1109\/ICSTE.2010.5608801"},{"issue":"2","key":"10_CR18","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1007\/s00357-012-9107-2","volume":"29","author":"I Morlini","year":"2012","unstructured":"Morlini, I., Zani, S.: A new class of weighted similarity indices using polytomous variables. J. Classif. 29(2), 199\u2013226 (2012)","journal-title":"J. Classif."},{"issue":"5","key":"10_CR19","doi-asserted-by":"publisher","first-page":"1065","DOI":"10.1109\/TNNLS.2015.2436432","volume":"27","author":"H Jia","year":"2016","unstructured":"Jia, H., Cheung, Y., Liu, J.: A new distance metric for unsupervised learning of categorical data. IEEE Trans. Neural Netw. Learn. Syst. 27(5), 1065\u20131079 (2016)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10_CR20","volume-title":"Information Theory, Inference & Learning Algorithms","author":"DJC MacKay","year":"2002","unstructured":"MacKay, D.J.C.: Information Theory, Inference & Learning Algorithms. Cambridge University Press, New York (2002)"},{"issue":"2","key":"10_CR21","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1109\/TCBB.2005.17","volume":"2","author":"WH Au","year":"2005","unstructured":"Au, W.H., Chan, K.C.C., Wong, A.K.C., Wang, Y.: Attribute clustering for grouping, selection, and classification of gene expression data. IEEE\/ACM Trans. Comput. Biol. Bioinform. 2(2), 83\u2013101 (2005)","journal-title":"IEEE\/ACM Trans. Comput. Biol. Bioinform."},{"key":"10_CR22","unstructured":"Machine Learning with Python: k-Nearest Neighbor Classifier. http:\/\/www.python-course.eu\/k_nearest_neighbor_classifier.php"},{"key":"10_CR23","unstructured":"Lichman, M.: UCI machine learning repository (2013). http:\/\/archive.ics.uci.edu\/ml"},{"issue":"6","key":"10_CR24","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1109\/TKDE.2003.1245283","volume":"15","author":"MA Hall","year":"2003","unstructured":"Hall, M.A., Holmes, G.: Benchmarking attribute selection techniques for discrete class data mining. IEEE Trans. Knowl. Data Eng. 15(6), 1437\u20131447 (2003)","journal-title":"IEEE Trans. Knowl. Data Eng."}],"container-title":["Lecture Notes in Computer Science","Integrated Uncertainty in Knowledge Modelling and Decision Making"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-75429-1_10","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,7]],"date-time":"2024-03-07T15:56:58Z","timestamp":1709827018000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-75429-1_10"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319754284","9783319754291"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-75429-1_10","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"4 February 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"IUKM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Symposium on Integrated Uncertainty in Knowledge Modelling and Decision Making","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hanoi","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vietnam","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 March 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 March 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iukm2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.jaist.ac.jp\/IUKM\/IUKM2018\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}