{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T01:32:48Z","timestamp":1775266368508,"version":"3.50.1"},"publisher-location":"Cham","reference-count":29,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030010539","type":"print"},{"value":"9783030010546","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,11,9]],"date-time":"2018-11-09T00:00:00Z","timestamp":1541721600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-01054-6_71","type":"book-chapter","created":{"date-parts":[[2018,11,8]],"date-time":"2018-11-08T09:47:05Z","timestamp":1541670425000},"page":"1025-1040","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Enhancement of the K-Means Algorithm for Mixed Data in Big Data Platforms"],"prefix":"10.1007","author":[{"given":"Oded","family":"Koren","sequence":"first","affiliation":[]},{"given":"Carina Antonia","family":"Hallin","sequence":"additional","affiliation":[]},{"given":"Nir","family":"Perel","sequence":"additional","affiliation":[]},{"given":"Dror","family":"Bendet","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,11,9]]},"reference":[{"issue":"2","key":"71_CR1","doi-asserted-by":"publisher","first-page":"I","DOI":"10.17705\/1jais.00423","volume":"17","author":"Ahmed Abbasi","year":"2016","unstructured":"Abbasi, A., Sarker, S., Chiang, R.H.: Big data research in information systems: toward an inclusive research agenda. J. Assoc. Inf. Syst. 17(2) (2016)","journal-title":"Journal of the Association for Information Systems"},{"issue":"3","key":"71_CR2","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1287\/isre.2014.0546","volume":"25","author":"R Agarwal","year":"2014","unstructured":"Agarwal, R., Dhar, V.: Editorial\u2014big data, data science, and analytics: the opportunity and challenge for IS research. Inf. Syst. Res. 25(3), 443\u2013448 (2014)","journal-title":"Inf. Syst. Res."},{"issue":"2","key":"71_CR3","doi-asserted-by":"publisher","first-page":"503","DOI":"10.1016\/j.datak.2007.03.016","volume":"63","author":"A Ahmad","year":"2007","unstructured":"Ahmad, A., Dey, L.: A K-mean clustering algorithm for mixed numeric and categorical data. Data Knowl. Eng. 63(2), 503\u2013527 (2007)","journal-title":"Data Knowl. Eng."},{"key":"71_CR4","doi-asserted-by":"crossref","unstructured":"Berkhin, P.: A survey of clustering data mining techniques. In: Grouping Multidimensional Data, pp. 25\u201371. Springer, Berlin (2006)","DOI":"10.1007\/3-540-28349-8_2"},{"key":"71_CR5","unstructured":"Cai, X., Nie, F., Huang, H.: Multi-view K-means clustering on big data. IJCAI (2013)"},{"key":"71_CR6","unstructured":"Cisco: The Zettabyte era: trends and analysis. White paper (2016)"},{"issue":"3","key":"71_CR7","doi-asserted-by":"publisher","first-page":"1249","DOI":"10.1007\/s11227-014-1225-7","volume":"70","author":"X Cui","year":"2014","unstructured":"Cui, X., Zhu, P., Yang, X., Li, K., Ji, C.: Optimized big data K-means clustering using MapReduce. J. Supercomput. 70(3), 1249\u20131259 (2014)","journal-title":"J. Supercomput."},{"issue":"3","key":"71_CR8","first-page":"28","volume":"92","author":"K Cukier","year":"2013","unstructured":"Cukier, K., Mayer-Schoenberger, V.: The rise of big data: how it\u2019s changing the way we think about the world. Foreign Aff. 92(3), 28\u201340 (2013)","journal-title":"Foreign Aff."},{"issue":"1","key":"71_CR9","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008)","journal-title":"Commun. ACM"},{"key":"71_CR10","doi-asserted-by":"crossref","unstructured":"Demchenko, Y., Ngo, C., Membrey, P.: Architecture framework and components for the big data ecosystem. J. Syst. Netw. Eng. 1\u201331 (2013)\u200f","DOI":"10.1109\/CTS.2014.6867550"},{"issue":"3","key":"71_CR11","doi-asserted-by":"publisher","first-page":"49","DOI":"10.2753\/MIS0742-1222300303","volume":"30","author":"D Tullio Di","year":"2013","unstructured":"Di Tullio, D., Staples, D.S.: The governance and control of open source software projects. J. Manag. Inf. Syst. 30(3), 49\u201380 (2013)","journal-title":"J. Manag. Inf. Syst."},{"issue":"11","key":"71_CR12","first-page":"429","volume":"10","author":"G Engelberg","year":"2016","unstructured":"Engelberg, G., Koren, O., Perel, N.: Big data performance evaluation analysis using Apache Pig. Int. J. Softw. Eng. Appl. 10(11), 429\u2013440 (2016)","journal-title":"Int. J. Softw. Eng. Appl."},{"issue":"1","key":"71_CR13","doi-asserted-by":"publisher","first-page":"273","DOI":"10.2753\/MIS0742-1222310111","volume":"31","author":"J F\u00fcller","year":"2014","unstructured":"F\u00fcller, J., Hutter, K., Hautz, J., Matzler, K.: User roles and contributions in innovation-contest communities. J. Manag. Inf. Syst. 31(1), 273\u2013308 (2014)","journal-title":"J. Manag. Inf. Syst."},{"issue":"5","key":"71_CR14","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1145\/1165389.945450","volume":"37","author":"Sanjay Ghemawat","year":"2003","unstructured":"Ghemawat, S., Gobioff, H., Leung, S.T.: The Google File System, ACM SIGOPS Operating Systems Review, vol. 37, pp. 29\u201343 (2003)","journal-title":"ACM SIGOPS Operating Systems Review"},{"issue":"2","key":"71_CR15","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1080\/07421222.2017.1334480","volume":"34","author":"S Guo","year":"2017","unstructured":"Guo, S., Guo, X., Fang, Y., Vogel, D.: How doctors gain social and economic returns in online health-care communities: a professional capital perspective. J. Manag. Inf. Syst. 34(2), 487\u2013519 (2017)","journal-title":"J. Manag. Inf. Syst."},{"key":"71_CR16","unstructured":"Henschen, D.: Why Sears is going all-in on Hadoop. InformationWeek (2012)"},{"key":"71_CR17","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1023\/A:1009769707641","volume":"2","author":"Z Huang","year":"1998","unstructured":"Huang, Z.: Extensions to the k-means algorithm for clustering large data sets with categorical values. Data Min. Knowl. Discov. 2, 283\u2013304 (1998)","journal-title":"Data Min. Knowl. Discov."},{"issue":"12","key":"71_CR18","doi-asserted-by":"publisher","first-page":"267","DOI":"10.14257\/ijdta.2016.9.12.24","volume":"9","author":"D Kendal","year":"2016","unstructured":"Kendal, D., Koren, O., Perel, N.: Pig vs. hive use case analysis. Int. J. Database Theory Appl. 9(12), 267\u2013276 (2016)","journal-title":"Int. J. Database Theory Appl."},{"issue":"1","key":"71_CR19","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1186\/s40537-015-0032-1","volume":"2","author":"S Landset","year":"2015","unstructured":"Landset, S., Khoshgoftaar, T.M., Richter, A.N., Hasanin, T.: A survey of open source tools for machine learning with big data in the Apache\u2122 Hadoop\u00ae! ecosystem. J. Big Data 2(1), 24 (2015)","journal-title":"J. Big Data"},{"key":"71_CR20","unstructured":"MacQueen, J.B.: Some methods for classification and analysis of multivariate observations. In: Proceedings of the 5th Berkeley Symposium on Mathematical Statistics and Probability, pp. 281\u2013297 (1967)"},{"key":"71_CR21","unstructured":"Manyika, J., Chui, M., Brown, B., Bughin, J., Dobbs, R., Roxburgh, C., Byers, A.H.: Big data: the next frontier for innovation, competition, and productivity. McKinsey Global Institute (2011)"},{"key":"71_CR22","unstructured":"Preethi, R.A., Elavarasi, J.: Big data analytics using Hadoop tools\u2014Apache Hive vs Apache Pig. Int. J. Emerg. Technol. Comput. Sci. Electron. 24(3) (2017)"},{"key":"71_CR23","doi-asserted-by":"crossref","unstructured":"Rai, A.: Synergies between big data and theory. Manag. Inf. Syst. Q. 40(2), iii\u2013ix (2016)","DOI":"10.25300\/MISQ\/2016\/40.2.E0"},{"issue":"11","key":"71_CR24","doi-asserted-by":"publisher","first-page":"1147","DOI":"10.1016\/0167-8655(95)00075-R","volume":"16","author":"H Ralambondrain","year":"1995","unstructured":"Ralambondrain, H.: A conceptual version of the K-means algorithm. Pattern Recogn. Lett. 16(11), 1147\u20131157 (1995)","journal-title":"Pattern Recogn. Lett."},{"issue":"4","key":"71_CR25","doi-asserted-by":"publisher","first-page":"911","DOI":"10.25300\/MISQ\/2016\/40.4.06","volume":"40","author":"Alok R. Saboo","year":"2016","unstructured":"Saboo, A.R., Kumar, V., Park, I.: Using big data to model time-varying effects for marketing resource (re) allocation. MIS Q. 40(4) (2016)","journal-title":"MIS Quarterly"},{"issue":"2","key":"71_CR26","first-page":"241","volume":"14","author":"OM San","year":"2004","unstructured":"San, O.M., Huynh, V.-N., Nakamori, Y.: An alternative extension of the k-means algorithm for clustering categorical data. Int. J. Appl. Math. Comput. Sci. 14(2), 241\u2013248 (2004)","journal-title":"Int. J. Appl. Math. Comput. Sci."},{"issue":"6","key":"71_CR27","doi-asserted-by":"publisher","first-page":"1452","DOI":"10.1287\/mnsc.2014.1899","volume":"60","author":"Prasanna Tambe","year":"2014","unstructured":"Tambe, P.: Big data investment, skills, and firm value. Alok Gupta, pp. 1452\u20131469 (2014)","journal-title":"Management Science"},{"key":"71_CR28","volume-title":"Hadoop: The Definitive Guide","author":"T White","year":"2015","unstructured":"White, T.: Hadoop: The Definitive Guide, 4th edn. OReilly Media, Sebastopol (2015)","edition":"4"},{"issue":"3","key":"71_CR29","doi-asserted-by":"publisher","first-page":"645","DOI":"10.1109\/TNN.2005.845141","volume":"16","author":"R Xu","year":"2005","unstructured":"Xu, R., Wunsch, D.: Survey of clustering algorithms. IEEE Trans. Neural Netw. 16(3), 645\u2013678 (2005)","journal-title":"IEEE Trans. Neural Netw."}],"container-title":["Advances in Intelligent Systems and Computing","Intelligent Systems and Applications"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-01054-6_71","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T00:28:47Z","timestamp":1775262527000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-01054-6_71"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11,9]]},"ISBN":["9783030010539","9783030010546"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-01054-6_71","relation":{},"ISSN":["2194-5357","2194-5365"],"issn-type":[{"value":"2194-5357","type":"print"},{"value":"2194-5365","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,11,9]]},"assertion":[{"value":"IntelliSys","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Proceedings of SAI Intelligent Systems Conference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"London","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"intellisys2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/saiconference.com\/IntelliSys2018\/CallforPapers","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}