{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T04:58:30Z","timestamp":1764997110301,"version":"3.37.3"},"reference-count":26,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2017,2,10]],"date-time":"2017-02-10T00:00:00Z","timestamp":1486684800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100003329","name":"Ministerio de Econom\u00eda y Competitividad (ES)","doi-asserted-by":"crossref","award":["TIN 2015-67534-P"],"award-info":[{"award-number":["TIN 2015-67534-P"]}],"id":[{"id":"10.13039\/501100003329","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Prog Artif Intell"],"published-print":{"date-parts":[[2017,9]]},"DOI":"10.1007\/s13748-017-0117-5","type":"journal-article","created":{"date-parts":[[2017,2,10]],"date-time":"2017-02-10T09:22:04Z","timestamp":1486718524000},"page":"211-219","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":26,"title":["MR-DIS: democratic instance selection for big data by MapReduce"],"prefix":"10.1007","volume":"6","author":[{"given":"\u00c1lvar","family":"Arnaiz-Gonz\u00e1lez","sequence":"first","affiliation":[]},{"given":"Alejandro","family":"Gonz\u00e1lez-Rogel","sequence":"additional","affiliation":[]},{"given":"Jos\u00e9-Francisco","family":"D\u00edez-Pastor","sequence":"additional","affiliation":[]},{"given":"Carlos","family":"L\u00f3pez-Nozal","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,2,10]]},"reference":[{"key":"117_CR1","doi-asserted-by":"publisher","unstructured":"Amdahl, G.M.: Validity of the single processor approach to achieving large scale computing capabilities. In: Proceedings of the April 18\u201320, 1967, Spring Joint Computer Conference, AFIPS \u201967 (Spring), pp. 483\u2013485. ACM, New York (1967). doi: 10.1145\/1465482.1465560","DOI":"10.1145\/1465482.1465560"},{"issue":"12","key":"117_CR2","doi-asserted-by":"publisher","first-page":"1593","DOI":"10.1109\/TKDE.2007.190665","volume":"19","author":"F Angiulli","year":"2007","unstructured":"Angiulli, F., Folino, G.: Distributed nearest neighbor-based condensation of very large data sets. IEEE Trans. Knowl. Data Eng. 19(12), 1593\u20131606 (2007). doi: 10.1109\/TKDE.2007.190665","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"117_CR3","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.knosys.2016.05.056","volume":"107","author":"\u00c1 Arnaiz-Gonz\u00e1lez","year":"2016","unstructured":"Arnaiz-Gonz\u00e1lez, \u00c1., D\u00edez-Pastor, J.F., Rodr\u00edguez, J.J., Garc\u00eda-Osorio, C.I.: Instance selection of linear complexity for big data. Knowl. Based Syst. 107, 83\u201395 (2016). doi: 10.1016\/j.knosys.2016.05.056","journal-title":"Knowl. Based Syst."},{"issue":"1","key":"117_CR4","doi-asserted-by":"crossref","first-page":"128","DOI":"10.1137\/0906011","volume":"6","author":"D Asimov","year":"1985","unstructured":"Asimov, D.: The grand tour: a tool for viewing multidimensional data. SIAM J. Sci. Stat. Comput. 6(1), 128\u2013143 (1985)","journal-title":"SIAM J. Sci. Stat. Comput."},{"issue":"2","key":"117_CR5","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1023\/A:1014043630878","volume":"6","author":"H Brighton","year":"2002","unstructured":"Brighton, H., Mellish, C.: Advances in instance selection for instance-based learning algorithms. Data Min. Knowl. Discov. 6(2), 153\u2013172 (2002). doi: 10.1023\/A:1014043630878","journal-title":"Data Min. Knowl. Discov."},{"issue":"7","key":"117_CR6","doi-asserted-by":"publisher","first-page":"953","DOI":"10.1016\/j.patrec.2004.09.043","volume":"26","author":"JR Cano","year":"2005","unstructured":"Cano, J.R., Herrera, F., Lozano, M.: Stratification for scaling up evolutionary prototype selection. Pattern Recognit. Lett. 26(7), 953\u2013963 (2005). doi: 10.1016\/j.patrec.2004.09.043","journal-title":"Pattern Recognit. Lett."},{"issue":"2","key":"117_CR7","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1007\/s11036-013-0489-0","volume":"19","author":"M Chen","year":"2014","unstructured":"Chen, M., Mao, S., Liu, Y.: Big data: a survey. Mob. Netw. Appl. 19(2), 171\u2013209 (2014). doi: 10.1007\/s11036-013-0489-0","journal-title":"Mob. Netw. Appl."},{"key":"117_CR8","doi-asserted-by":"publisher","unstructured":"de Haro-Garc\u00eda, A., Garc\u00eda-Pedrajas, N.: A divide-and-conquer recursive approach for scaling up instance selection algorithms. Data Min. Knowl. Discov. 18(3), 392\u2013418 (2009). doi: 10.1007\/s10618-008-0121-2","DOI":"10.1007\/s10618-008-0121-2"},{"issue":"1","key":"117_CR9","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008). doi: 10.1145\/1327452.1327492","journal-title":"Commun. ACM"},{"issue":"3","key":"117_CR10","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1109\/TPAMI.2011.142","volume":"34","author":"S Garcia","year":"2012","unstructured":"Garcia, S., Derrac, J., Cano, J., Herrera, F.: Prototype selection for nearest neighbor classification: taxonomy and empirical study. IEEE Trans. Pattern Anal. Mach. Intell. 34(3), 417\u2013435 (2012). doi: 10.1109\/TPAMI.2011.142","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"117_CR11","doi-asserted-by":"crossref","unstructured":"Garc\u00eda, S., Luengo, J., Herrera, F.: Data Preprocessing in Data Mining. Springer, Berlin (2014)","DOI":"10.1007\/978-3-319-10247-4"},{"issue":"56","key":"117_CR12","doi-asserted-by":"publisher","first-page":"410","DOI":"10.1016\/j.artint.2010.01.001","volume":"174","author":"C Garc\u00eda-Osorio","year":"2010","unstructured":"Garc\u00eda-Osorio, C., de Haro-Garc\u00eda, A., Garc\u00eda-Pedrajas, N.: Democratic instance selection: a linear complexity instance selection algorithm based on classifier ensemble concepts. Artif. Intell. 174(56), 410\u2013441 (2010). doi: 10.1016\/j.artint.2010.01.001","journal-title":"Artif. Intell."},{"issue":"3","key":"117_CR13","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1109\/88.242438","volume":"1","author":"AY Grama","year":"1993","unstructured":"Grama, A.Y., Gupta, A., Kumar, V.: Isoefficiency: measuring the scalability of parallel algorithms and architectures. IEEE Parallel Distrib. Technol. 1(3), 12\u201321 (1993). doi: 10.1109\/88.242438","journal-title":"IEEE Parallel Distrib. Technol."},{"issue":"3","key":"117_CR14","doi-asserted-by":"crossref","first-page":"515","DOI":"10.1109\/TIT.1968.1054155","volume":"14","author":"P Hart","year":"1968","unstructured":"Hart, P.: The condensed nearest neighbor rule (corresp.). IEEE Trans. Inf. Theory 14(3), 515\u2013516 (1968)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"117_CR15","doi-asserted-by":"publisher","unstructured":"Indyk, P., Motwani, R.: Approximate nearest neighbors: towards removing the curse of dimensionality. In: Proceedings of the Thirtieth Annual ACM Symposium on Theory of Computing, STOC \u201998, pp. 604\u2013613. ACM, New York (1998). doi: 10.1145\/276698.276876","DOI":"10.1145\/276698.276876"},{"key":"117_CR16","unstructured":"Laney, D.: 3-d data management: controlling data volume, velocity and variety, Technical Report META Group Research Note (2001)"},{"issue":"4","key":"117_CR17","doi-asserted-by":"publisher","first-page":"1523","DOI":"10.1016\/j.patcog.2014.10.001","volume":"48","author":"E Leyva","year":"2015","unstructured":"Leyva, E., Gonz\u00e1lez, A., P\u00e9rez, R.: Three new instance selection methods based on local sets: a comparative study with several approaches from a bi-objective perspective. Pattern Recognit. 48(4), 1523\u20131537 (2015). doi: 10.1016\/j.patcog.2014.10.001","journal-title":"Pattern Recognit."},{"key":"117_CR18","unstructured":"Lichman, M.: UCI machine learning repository (2013). http:\/\/archive.ics.uci.edu\/ml"},{"key":"117_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2016.06.012","author":"J Maillo","year":"2016","unstructured":"Maillo, J., Ram\u00edrez, S., Triguero, I., Herrera, F.: kNN-IS: An iterative spark-based design of the k-nearest neighbors classifier for big data. Knowledge-Based Systems (2016). doi: 10.1016\/j.knosys.2016.06.012","journal-title":"Knowledge-Based Systems"},{"key":"117_CR20","doi-asserted-by":"publisher","DOI":"10.1002\/9781118562260.fmatter","volume-title":"Big Data, Big Analytics: Emerging Business Intelligence and Analytic Trends for Today\u2019s Businesses","author":"M Minelli","year":"2012","unstructured":"Minelli, M., Chambers, M., Dhiraj, A.: Big Data, Big Analytics: Emerging Business Intelligence and Analytic Trends for Today\u2019s Businesses. Wiley, London (2012). doi: 10.1002\/9781118562260.fmatter"},{"issue":"1","key":"117_CR21","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1002\/widm.1173","volume":"6","author":"S Ram\u00edrez-Gallego","year":"2016","unstructured":"Ram\u00edrez-Gallego, S., Garc\u00eda, S., Mouri\u00f1o Tal\u00edn, H., Mart\u00ednez-Rego, D., Bol\u00f3n-Canedo, V., Alonso-Betanzos, A., Ben\u00edtez, J.M., Herrera, F.: Data discretization: taxonomy and big data challenge. Wiley Interdiscip. Rev. Data Min. Knowl. Discov. 6(1), 5\u201321 (2016). doi: 10.1002\/widm.1173","journal-title":"Wiley Interdiscip. Rev. Data Min. Knowl. Discov."},{"key":"117_CR22","doi-asserted-by":"publisher","unstructured":"Triguero, I., Peralta, D., Bacardit, J., Garc\u00eda, S., Herrera, F.: Mrpr: a mapreduce solution for prototype reduction in big data classification. Neurocomputing 150 Part A, 331\u2013345 (2015). doi: 10.1016\/j.neucom.2014.04.078","DOI":"10.1016\/j.neucom.2014.04.078"},{"key":"117_CR23","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.jss.2016.09.007","volume":"122","author":"CF Tsai","year":"2016","unstructured":"Tsai, C.F., Lin, W.C., Ke, S.W.: Big data mining with parallel computing: a comparison of distributed and mapreduce methodologies. J. Syst. Softw. 122, 83\u201392 (2016). doi: 10.1016\/j.jss.2016.09.007","journal-title":"J. Syst. Softw."},{"key":"117_CR24","unstructured":"Wilson, D.R., Martinez, T.R.: Instance pruning techniques. In: Machine Learning: Proceedings of the Fourteenth International Conference (ICML97), pp. 404\u2013411. Morgan Kaufmann (1997)"},{"issue":"1","key":"117_CR25","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1109\/TKDE.2013.109","volume":"26","author":"X Wu","year":"2014","unstructured":"Wu, X., Zhu, X., Wu, G.Q., Ding, W.: Data mining with big data. IEEE Trans. Knowl. Data Eng. 26(1), 97\u2013107 (2014). doi: 10.1109\/TKDE.2013.109","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"117_CR26","first-page":"10","volume":"10","author":"M Zaharia","year":"2010","unstructured":"Zaharia, M., Chowdhury, M., Franklin, M.J., Shenker, S., Stoica, I.: Spark: cluster computing with working sets. HotCloud 10, 10\u201310 (2010)","journal-title":"HotCloud"}],"container-title":["Progress in Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s13748-017-0117-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13748-017-0117-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13748-017-0117-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,18]],"date-time":"2019-09-18T10:51:21Z","timestamp":1568803881000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s13748-017-0117-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,2,10]]},"references-count":26,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2017,9]]}},"alternative-id":["117"],"URL":"https:\/\/doi.org\/10.1007\/s13748-017-0117-5","relation":{},"ISSN":["2192-6352","2192-6360"],"issn-type":[{"type":"print","value":"2192-6352"},{"type":"electronic","value":"2192-6360"}],"subject":[],"published":{"date-parts":[[2017,2,10]]}}}