{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,30]],"date-time":"2025-12-30T17:56:21Z","timestamp":1767117381344,"version":"3.37.3"},"publisher-location":"Cham","reference-count":32,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319768915"},{"type":"electronic","value":"9783319768922"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-76892-2_8","type":"book-chapter","created":{"date-parts":[[2018,2,23]],"date-time":"2018-02-23T21:43:13Z","timestamp":1519422193000},"page":"101-115","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Feature Selection in High-Dimensional Dataset Using MapReduce"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7324-4116","authenticated-orcid":false,"given":"Claudio","family":"Reggiani","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5679-7758","authenticated-orcid":false,"given":"Yann-A\u00ebl","family":"Le Borgne","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8621-316X","authenticated-orcid":false,"given":"Gianluca","family":"Bontempi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,2,25]]},"reference":[{"key":"8_CR1","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1016\/j.knosys.2015.05.014","volume":"86","author":"V Bol\u00f3n-Canedo","year":"2015","unstructured":"Bol\u00f3n-Canedo, V., S\u00e1nchez-Maro\u00f1o, N., Alonso-Betanzos, A.: Recent advances and emerging challenges of feature selection in the context of big data. Knowl. Based Syst. 86, 33\u201345 (2015)","journal-title":"Knowl. Based Syst."},{"issue":"1","key":"8_CR2","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008)","journal-title":"Commun. ACM"},{"key":"8_CR3","doi-asserted-by":"crossref","unstructured":"Yeung, J.H., Tsang, C., Tsoi, K.H., Kwan, B.S., Cheung, C.C., Chan, A.P., Leong, P.H.: Map-reduce as a programming model for custom computing machines. In: 16th International Symposium on Field-Programmable Custom Computing Machines (FCCM 2008), pp. 149\u2013159. IEEE (2008)","DOI":"10.1109\/FCCM.2008.19"},{"issue":"2","key":"8_CR4","doi-asserted-by":"crossref","first-page":"1626","DOI":"10.14778\/1687553.1687609","volume":"2","author":"A Thusoo","year":"2009","unstructured":"Thusoo, A., Sarma, J.S., Jain, N., Shao, Z., Chakka, P., Anthony, S., Liu, H., Wyckoff, P., Murthy, R.: Hive: a warehousing solution over a map-reduce framework. Proc. VLDB Endow. 2(2), 1626\u20131629 (2009)","journal-title":"Proc. VLDB Endow."},{"key":"8_CR5","first-page":"281","volume":"19","author":"C Chu","year":"2007","unstructured":"Chu, C., Kim, S.K., Lin, Y.A., Yu, Y., Bradski, G., Ng, A.Y., Olukotun, K.: Map-reduce for machine learning on multicore. Adv. Neural Inf. Process. Syst. 19, 281 (2007)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"8_CR6","unstructured":"Apache Mahout: Scalable machine learning and data mining. https:\/\/mahout.apache.org\/"},{"issue":"34","key":"8_CR7","first-page":"1","volume":"17","author":"X Meng","year":"2016","unstructured":"Meng, X., Bradley, J., Yuvaz, B., Sparks, E., Venkataraman, S., Liu, D., Freeman, J., Tsai, D., Amde, M., Owen, S., et al.: MLlib: machine learning in apache spark. JMLR 17(34), 1\u20137 (2016)","journal-title":"JMLR"},{"key":"8_CR8","first-page":"1157","volume":"3","author":"I Guyon","year":"2003","unstructured":"Guyon, I., Elisseeff, A.: An introduction to variable and feature selection. J. Mach. Learn. Res. 3, 1157\u20131182 (2003)","journal-title":"J. Mach. Learn. Res."},{"issue":"1\u20132","key":"8_CR9","doi-asserted-by":"crossref","first-page":"273","DOI":"10.1016\/S0004-3702(97)00043-X","volume":"97","author":"R Kohavi","year":"1997","unstructured":"Kohavi, R., John, G.H.: Wrappers for feature subset selection. Artif. Intell. 97(1\u20132), 273\u2013324 (1997)","journal-title":"Artif. Intell."},{"issue":"2","key":"8_CR10","doi-asserted-by":"crossref","first-page":"477","DOI":"10.1016\/j.ejor.2004.08.010","volume":"169","author":"FG L\u00f3pez","year":"2006","unstructured":"L\u00f3pez, F.G., Torres, M.G., Batista, B.M., P\u00e9rez, J.A.M., Moreno-Vega, J.M.: Solving feature subset selection problem by a parallel scatter search. Eur. J. Oper. Res. 169(2), 477\u2013489 (2006)","journal-title":"Eur. J. Oper. Res."},{"issue":"8","key":"8_CR11","doi-asserted-by":"crossref","first-page":"1052","DOI":"10.1016\/j.jpdc.2005.11.006","volume":"66","author":"N Melab","year":"2006","unstructured":"Melab, N., Cahon, S., Talbi, E.G.: Grid computing for parallel bioinspired algorithms. J. Parallel Distrib. Comput. 66(8), 1052\u20131061 (2006)","journal-title":"J. Parallel Distrib. Comput."},{"issue":"3","key":"8_CR12","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1007\/s00453-006-1220-3","volume":"45","author":"JT Souza de","year":"2006","unstructured":"de Souza, J.T., Matwin, S., Japkowicz, N.: Parallelizing feature selection. Algorithmica 45(3), 433\u2013456 (2006)","journal-title":"Algorithmica"},{"key":"8_CR13","unstructured":"Garcia, D.J., Hall, L.O., Goldgof, D.B., Kramer, K.: A parallel feature selection algorithm from random subsets. In: Proceedings of the 17th European Conference on Machine Learning and the 10th European Conference on Principles and Practice of Knowledge Discovery in Databases, Berlin (2006)"},{"key":"8_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1224","DOI":"10.1007\/978-3-642-02478-8_153","volume-title":"Bio-Inspired Systems: Computational and Ambient Intelligence","author":"A Guill\u00e9n","year":"2009","unstructured":"Guill\u00e9n, A., Sorjamaa, A., Miche, Y., Lendasse, A., Rojas, I.: Efficient parallel feature selection for steganography problems. In: Cabestany, J., Sandoval, F., Prieto, A., Corchado, J.M. (eds.) IWANN 2009. LNCS, vol. 5517, pp. 1224\u20131231. Springer, Heidelberg (2009). https:\/\/doi.org\/10.1007\/978-3-642-02478-8_153"},{"key":"8_CR15","doi-asserted-by":"crossref","unstructured":"Singh, S., Kubica, J., Larsen, S., Sorokina, D.: Parallel large scale feature selection for logistic regression. In: SDM, pp. 1172\u20131183. SIAM (2009)","DOI":"10.1137\/1.9781611972795.100"},{"key":"8_CR16","doi-asserted-by":"crossref","unstructured":"Peralta, D., R\u00edo, S., Ram\u00edrez, S., Triguero, I., Ben\u00edtez, J.M., Herrera, F.: Evolutionary feature selection for big data classification: a MapReduce approach. In: Mathematical Problems in Engineering (2015)","DOI":"10.1155\/2015\/246139"},{"issue":"1","key":"8_CR17","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1007\/s10994-013-5373-4","volume":"92","author":"Z Zhao","year":"2013","unstructured":"Zhao, Z., Zhang, R., Cox, J., Duling, D., Sarle, W.: Massively parallel feature selection: an approach based on variance preservation. Mach. Learn. 92(1), 195\u2013220 (2013)","journal-title":"Mach. Learn."},{"key":"8_CR18","series-title":"Lecture Notes in Electrical Engineering","doi-asserted-by":"publisher","first-page":"299","DOI":"10.1007\/978-3-319-01766-2_35","volume-title":"Computer Engineering and Networking","author":"Z Sun","year":"2014","unstructured":"Sun, Z.: Parallel feature selection based on MapReduce. In: Wong, W.E., Zhu, T. (eds.) Computer Engineering and Networking. LNEE, vol. 277, pp. 299\u2013306. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-01766-2_35"},{"key":"8_CR19","series-title":"Communications in Computer and Information Science","doi-asserted-by":"publisher","first-page":"186","DOI":"10.1007\/978-3-319-23201-0_21","volume-title":"New Trends in Databases and Information Systems","author":"B Ordozgoiti","year":"2015","unstructured":"Ordozgoiti, B., G\u00f3mez Canaval, S., Mozo, A.: Massively parallel unsupervised feature selection on spark. In: Morzy, T., Valduriez, P., Bellatreche, L. (eds.) ADBIS 2015. CCIS, vol. 539, pp. 186\u2013196. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-23201-0_21"},{"key":"8_CR20","doi-asserted-by":"crossref","first-page":"136","DOI":"10.1016\/j.asoc.2015.01.035","volume":"30","author":"V Bol\u00f3n-Canedo","year":"2015","unstructured":"Bol\u00f3n-Canedo, V., S\u00e1nchez-Maro\u00f1o, N., Alonso-Betanzos, A.: Distributed feature selection: an application to microarray data classification. Appl. Soft Comput. J. 30, 136\u2013150 (2015)","journal-title":"Appl. Soft Comput. J."},{"issue":"99","key":"8_CR21","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1109\/TSMC.2017.2670926","volume":"PP","author":"S Ram\u00edrez-Gallego","year":"2017","unstructured":"Ram\u00edrez-Gallego, S., Mouri\u00f1o-Tal\u00edn, H., Mart\u00ednez-Rego, D., Bol\u00f3n-Canedo, V., Ben\u00edtez, J.M., Alonso-Betanzos, A., Herrera, F.: An information theory-based feature selection framework for big data under apache spark. IEEE Trans. Syst. Man Cybern. Syst. PP(99), 1\u201313 (2017)","journal-title":"IEEE Trans. Syst. Man Cybern. Syst."},{"key":"8_CR22","first-page":"27","volume":"13","author":"G Brown","year":"2012","unstructured":"Brown, G., Pocock, A., Ming-Jie, Z., Luj\u00e1n, M.: Conditional likelihood maximisation: a unifying framework for information theoretic feature selection. J. Mach. Learn. Res. 13, 27\u201366 (2012)","journal-title":"J. Mach. Learn. Res."},{"issue":"8","key":"8_CR23","doi-asserted-by":"crossref","first-page":"1226","DOI":"10.1109\/TPAMI.2005.159","volume":"27","author":"H Peng","year":"2005","unstructured":"Peng, H., Long, F., Ding, C.: Feature selection based on mutual information: criteria of max-dependency, max-relevance, and min-redundancy. IEEE Trans. Pattern Anal. Mach. Intell. 27(8), 1226\u20131238 (2005)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"8_CR24","doi-asserted-by":"crossref","first-page":"461","DOI":"10.1186\/1471-2105-9-461","volume":"9","author":"PE Meyer","year":"2008","unstructured":"Meyer, P.E., Lafitte, F., Bontempi, G.: minet: a R\/bioconductor package for inferring large transcriptional networks using mutual information. BMC Bioinform. 9, 461 (2008)","journal-title":"BMC Bioinform."},{"key":"8_CR25","doi-asserted-by":"crossref","unstructured":"Reggiani, C., Le Borgne, Y.A., Bontempi, G.: Feature selection in high-dimensional dataset using MapReduce. ArXiv e-prints, September 2017","DOI":"10.1007\/978-3-319-76892-2_8"},{"key":"8_CR26","doi-asserted-by":"crossref","unstructured":"Blanas, S., Patel, J.M., Ercegovac, V., Rao, J., Shekita, E.J., Tian, Y.: A comparison of join algorithms for log processing in MapReduce. In: Proceedings of the 2010 ACM SIGMOD International Conference on Management of Data (SIGMOD 2010), New York, pp. 975\u2013986. ACM (2010)","DOI":"10.1145\/1807167.1807273"},{"key":"8_CR27","doi-asserted-by":"crossref","unstructured":"Sarma, A.D., Afrati, F.N., Salihoglu, S., Ullman, J.D.: Upper and lower bounds on the cost of a map-reduce computation. In: Proceedings of the VLDB Endowment, vol. 6, pp. 277\u2013288. VLDB Endowment (2013)","DOI":"10.14778\/2535570.2488334"},{"key":"8_CR28","doi-asserted-by":"crossref","first-page":"74","DOI":"10.1016\/j.csda.2015.04.006","volume":"90","author":"J Ahn","year":"2015","unstructured":"Ahn, J., Jeon, Y.: Sparse HDLSS discrimination with constrained data piling. Comput. Stat. Data Anal. 90, 74\u201383 (2015)","journal-title":"Comput. Stat. Data Anal."},{"issue":"18","key":"8_CR29","doi-asserted-by":"crossref","first-page":"2365","DOI":"10.1093\/bioinformatics\/btt383","volume":"29","author":"ND Jay","year":"2013","unstructured":"Jay, N.D., Papillon-Cavanagh, S., Olsen, C., Hachem, N., Bontempi, G., Haibe-Kains, B.: mRMRe: an R package for parallelized mRMR ensemble feature selection. Bioinformatics 29(18), 2365\u20132368 (2013)","journal-title":"Bioinformatics"},{"key":"8_CR30","volume-title":"Learning Spark: Lightning-Fast Big Data Analytics","author":"H Karau","year":"2015","unstructured":"Karau, H., Konwinski, A., Wendell, P., Zaharia, M.: Learning Spark: Lightning-Fast Big Data Analytics, 1st edn. O\u2019Reilly Media Inc., Sebastopol (2015)","edition":"1"},{"key":"8_CR31","unstructured":"Zaharia, M., Chowdhury, M., Das, T., Dave, A., Ma, J., McCauley, M., Franklin, M.J., Shenker, S., Stoica, I.: Resilient distributed datasets: a fault-tolerant abstraction for in-memory cluster computing. In: Proceedings of the 9th USENIX Conference on Networked Systems Design and Implementation (NSDI 2012), Berkeley, p. 2. USENIX Association (2012)"},{"key":"8_CR32","series-title":"Artificial Intelligence: Foundations, Theory, and Algorithms","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-21858-8","volume-title":"Feature Selection for High-Dimensional Data","author":"V Bol\u00f3n-Canedo","year":"2015","unstructured":"Bol\u00f3n-Canedo, V., S\u00e1nchez-Maro\u00f1o, N., Alonso-Betanzos, A.: Feature Selection for High-Dimensional Data. AIFTA. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-21858-8"}],"container-title":["Communications in Computer and Information Science","Artificial Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-76892-2_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,11]],"date-time":"2019-10-11T15:39:17Z","timestamp":1570808357000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-76892-2_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319768915","9783319768922"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-76892-2_8","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2018]]}}}