{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T23:53:37Z","timestamp":1767916417000,"version":"3.49.0"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2018,1,29]],"date-time":"2018-01-29T00:00:00Z","timestamp":1517184000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["U1509207"],"award-info":[{"award-number":["U1509207"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["61325019"],"award-info":[{"award-number":["61325019"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Soft Comput"],"published-print":{"date-parts":[[2019,6]]},"DOI":"10.1007\/s00500-018-3041-0","type":"journal-article","created":{"date-parts":[[2018,1,29]],"date-time":"2018-01-29T06:24:17Z","timestamp":1517207057000},"page":"3793-3801","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":44,"title":["Very large-scale data classification based on K-means clustering and multi-kernel SVM"],"prefix":"10.1007","volume":"23","author":[{"given":"Tinglong","family":"Tang","sequence":"first","affiliation":[]},{"given":"Shengyong","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Meng","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Jake","family":"Luo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,1,29]]},"reference":[{"key":"3041_CR1","unstructured":"Alcal\u00e1-Fdez J, Fern\u00e1ndez A, Luengo J, Derrac J, Garc\u00eda S, S\u00e1nchez L, Herrera F (2011) Keel data-mining software tool: data set repository, integration of algorithms and experimental analysis framework. J Multiple-Valued Logic Soft Comput 17:255\u2013287"},{"key":"3041_CR2","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.knosys.2016.05.056","volume":"107","author":"\u00c1 Arnaiz-Gonz\u00e1lez","year":"2016","unstructured":"Arnaiz-Gonz\u00e1lez \u00c1, D\u00edez-Pastor J-F, Rodr\u00edguez JJ, Garc\u00eda-Osorio C (2016) Instance selection of linear complexity for big data. Knowl Based Syst 107:83\u201395","journal-title":"Knowl Based Syst"},{"issue":"1","key":"3041_CR3","first-page":"301","volume":"3","author":"L Bottou","year":"2007","unstructured":"Bottou L, Lin C-J (2007) Support vector machine solvers. Large Scale Kernel Mach 3(1):301\u2013320","journal-title":"Large Scale Kernel Mach"},{"issue":"17","key":"3041_CR4","doi-asserted-by":"publisher","first-page":"6894","DOI":"10.1016\/j.eswa.2013.06.053","volume":"40","author":"GDC Cavalcanti","year":"2013","unstructured":"Cavalcanti GDC, Ren TI, Pereira CL (2013) ATISA: adaptive threshold-based instance selection algorithm. Expert Syst Appl 40(17):6894\u20136900","journal-title":"Expert Syst Appl"},{"issue":"3","key":"3041_CR5","first-page":"27","volume":"2","author":"C-C Chang","year":"2011","unstructured":"Chang C-C, Lin C-J (2011) LIBSVM: a library for support vector machines. ACM Trans Intell Syst Technol (TIST) 2(3):27","journal-title":"ACM Trans Intell Syst Technol (TIST)"},{"key":"3041_CR6","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1016\/j.jbi.2016.05.007","volume":"62","author":"H Chen","year":"2016","unstructured":"Chen H, Zhang Y, Gutman I (2016) A kernel-based clustering method for gene selection with gene expression data. J Biomed Inform 62:12\u201320","journal-title":"J Biomed Inform"},{"issue":"1","key":"3041_CR7","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean J, Ghemawat S (2008) MapReduce: simplified data processing on large clusters. Commun ACM 51(1):107\u2013113","journal-title":"Commun ACM"},{"issue":"11","key":"3041_CR8","doi-asserted-by":"publisher","first-page":"3714","DOI":"10.1016\/j.patcog.2015.05.018","volume":"48","author":"F Dornaika","year":"2015","unstructured":"Dornaika F, Aldine IK (2015) Decremental sparse modeling representative selection for prototype selection. Pattern Recogn 48(11):3714\u20133727","journal-title":"Pattern Recogn"},{"issue":"1","key":"3041_CR9","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1007\/s13042-014-0239-z","volume":"7","author":"J Hamidzadeh","year":"2016","unstructured":"Hamidzadeh J, Monsefi R, Yazdi HS (2016) Large symmetric margin instance selection algorithm. Int J Mach Learn Cybern 7(1):25\u201345","journal-title":"Int J Mach Learn Cybern"},{"issue":"3","key":"3041_CR10","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1023\/A:1009769707641","volume":"2","author":"Z Huang","year":"1998","unstructured":"Huang Z (1998) Extensions to the k-means algorithm for clustering large data sets with categorical values. Data Min Knowl Discov 2(3):283\u2013304","journal-title":"Data Min Knowl Discov"},{"key":"3041_CR11","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1016\/j.asoc.2016.06.014","volume":"47","author":"HR Khosravani","year":"2016","unstructured":"Khosravani HR, Ruano AE, Ferreira PM (2016) A convex hull-based data selection method for data driven models. Appl Soft Comput 47:515\u2013533","journal-title":"Appl Soft Comput"},{"key":"3041_CR12","doi-asserted-by":"crossref","unstructured":"Kim MS (2013) Robust, scalable anomaly detection for large collections of images. In: 2013 International conference on social computing (SocialCom), pp 1054\u20131058. IEEE","DOI":"10.1109\/SocialCom.2013.170"},{"key":"3041_CR13","unstructured":"Lichman M (2013) UCI machine learning repository. University of California, School of Information and Computer Science, Irvine, CA. \n                    http:\/\/archive.ics.uci.edu\/ml"},{"key":"3041_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.jss.2015.04.038","volume":"106","author":"W-C Lin","year":"2015","unstructured":"Lin W-C, Tsai C-F, Ke S-W, Hung C-W, Eberle W (2015) Learning to detect representative data for large scale instance selection. J Syst Softw 106:1\u20138","journal-title":"J Syst Softw"},{"key":"3041_CR15","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1016\/j.neucom.2012.01.035","volume":"89","author":"X Liu","year":"2012","unstructured":"Liu X, Wang L, Yin J, Liu L (2012) Incorporation of radius-info can be simple with SimpleMKL. Neurocomputing 89:30\u201338","journal-title":"Neurocomputing"},{"issue":"7","key":"3041_CR16","doi-asserted-by":"publisher","first-page":"2141","DOI":"10.1016\/j.patcog.2014.12.007","volume":"48","author":"X Liu","year":"2015","unstructured":"Liu X, Zhou L, Wang L, Zhang J, Yin J, Shen D (2015) An efficient radius-incorporated MKL algorithm for Alzheimer\u2019s disease prediction. Pattern Recogn 48(7):2141\u20132150","journal-title":"Pattern Recogn"},{"key":"3041_CR17","doi-asserted-by":"crossref","unstructured":"Neugebauer J, Kramer O, Sonnenschein M (2016) Improving cascade classifier precision by instance selection and outlier generation. In: ICAART, no. 2, pp 96\u2013104","DOI":"10.5220\/0005702100960104"},{"issue":"2","key":"3041_CR18","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1007\/s10044-008-0142-x","volume":"13","author":"JA Olvera-L\u00f3pez","year":"2010","unstructured":"Olvera-L\u00f3pez JA, Carrasco-Ochoa JA, Mart\u00ednez-Trinidad JF (2010) A new fast prototype selection method based on clustering. Pattern Anal Appl 13(2):131\u2013141","journal-title":"Pattern Anal Appl"},{"issue":"20","key":"3041_CR19","doi-asserted-by":"publisher","first-page":"6844","DOI":"10.1016\/j.eswa.2015.05.006","volume":"42","author":"A Onan","year":"2015","unstructured":"Onan A (2015) A fuzzy-rough nearest neighbor classifier combined with consistency-based subset evaluation and instance selection for automated diagnosis of breast cancer. Expert Syst Appl 42(20):6844\u20136852","journal-title":"Expert Syst Appl"},{"issue":"Nov","key":"3041_CR20","first-page":"2491","volume":"9","author":"A Rakotomamonjy","year":"2008","unstructured":"Rakotomamonjy A, Bach FR, Canu S, Grandvalet Y (2008) SimpleMKL. J Mach Learn Res 9(Nov):2491\u20132521","journal-title":"J Mach Learn Res"},{"key":"3041_CR21","doi-asserted-by":"publisher","first-page":"256","DOI":"10.1016\/j.neucom.2015.01.008","volume":"157","author":"M Rezaei","year":"2015","unstructured":"Rezaei M, Nezamabadi-Pour H (2015) Using gravitational search algorithm in prototype generation for nearest neighbor classification. Neurocomputing 157:256\u2013263","journal-title":"Neurocomputing"},{"key":"3041_CR22","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1016\/j.datak.2015.11.002","volume":"101","author":"DANS Silva","year":"2016","unstructured":"Silva DANS, Souza LC, Motta GHMB (2016) An instance selection method for large datasets based on Markov geometric diffusion. Data Knowl Eng 101:24\u201341","journal-title":"Data Knowl Eng"},{"key":"3041_CR23","doi-asserted-by":"publisher","first-page":"236","DOI":"10.1016\/j.neucom.2014.03.006","volume":"141","author":"MB Stojanovi\u0107","year":"2014","unstructured":"Stojanovi\u0107 MB, Bo\u017ei\u0107 MM, Stankovi\u0107 MM, Staji\u0107 ZP (2014) A methodology for training set instance selection using mutual information in time series prediction. Neurocomputing 141:236\u2013245","journal-title":"Neurocomputing"},{"issue":"3","key":"3041_CR24","doi-asserted-by":"publisher","first-page":"2566","DOI":"10.1016\/j.eswa.2010.08.046","volume":"38","author":"J Sun","year":"2011","unstructured":"Sun J, Li H (2011) Dynamic financial distress prediction using instance selection for the disposal of concept drift. Expert Syst Appl 38(3):2566\u20132576","journal-title":"Expert Syst Appl"},{"key":"3041_CR25","doi-asserted-by":"publisher","first-page":"332","DOI":"10.1016\/j.neucom.2012.06.009","volume":"97","author":"I Triguero","year":"2012","unstructured":"Triguero I, Derrac JN, Garc\u00edA S, Herrera F (2012) Integrating a differential evolution feature weighting scheme into prototype generation. Neurocomputing 97:332\u2013343","journal-title":"Neurocomputing"},{"key":"3041_CR26","doi-asserted-by":"publisher","first-page":"150","DOI":"10.1016\/j.neucom.2016.04.018","volume":"203","author":"JJ Valero-Mas","year":"2016","unstructured":"Valero-Mas JJ, Calvo-Zaragoza J, Rico-Juan JR (2016) On the suitability of prototype selection methods for kNN classification with distributed data. Neurocomputing 203:150\u2013160","journal-title":"Neurocomputing"},{"key":"3041_CR27","doi-asserted-by":"crossref","unstructured":"Whelan M, Le\u00a0Khac NA, Kechadi M-T (2010) Data reduction in very large spatio-temporal datasets. In: 2010 19th IEEE International workshop on enabling technologies: infrastructures for collaborative enterprises (WETICE). IEEE, pp 104\u2013109","DOI":"10.1109\/WETICE.2010.23"},{"issue":"3","key":"3041_CR28","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1023\/A:1007626913721","volume":"38","author":"DR Wilson","year":"2000","unstructured":"Wilson DR, Martinez TR (2000) Reduction techniques for instance-based learning algorithms. Mach Learn 38(3):257\u2013286","journal-title":"Mach Learn"},{"key":"3041_CR29","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.neucom.2014.06.094","volume":"165","author":"P Wu","year":"2015","unstructured":"Wu P, Duan F, Guo P (2015) A pre-selecting base kernel method in multiple kernel learning. Neurocomputing 165:46\u201353","journal-title":"Neurocomputing"},{"key":"3041_CR30","doi-asserted-by":"publisher","first-page":"1066","DOI":"10.1016\/j.ins.2016.07.026","volume":"367","author":"J Zhai","year":"2016","unstructured":"Zhai J, Wang X, Pang X (2016) Voting-based instance selection from large data sets with MapReduce and random weight networks. Inf Sci 367:1066\u20131077","journal-title":"Inf Sci"}],"container-title":["Soft Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00500-018-3041-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-018-3041-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-018-3041-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,4,23]],"date-time":"2019-04-23T11:19:52Z","timestamp":1556018392000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00500-018-3041-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,1,29]]},"references-count":30,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2019,6]]}},"alternative-id":["3041"],"URL":"https:\/\/doi.org\/10.1007\/s00500-018-3041-0","relation":{},"ISSN":["1432-7643","1433-7479"],"issn-type":[{"value":"1432-7643","type":"print"},{"value":"1433-7479","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,1,29]]},"assertion":[{"value":"29 January 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with ethical standards"}},{"value":"Tinglong Tang, Shengyong Chen, Meng Zhao, Wei Huang and Jake Luo declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}]}}