{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T03:42:06Z","timestamp":1742960526095,"version":"3.40.3"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319232003"},{"type":"electronic","value":"9783319232010"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-23201-0_21","type":"book-chapter","created":{"date-parts":[[2015,8,27]],"date-time":"2015-08-27T11:57:35Z","timestamp":1440676655000},"page":"186-196","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Massively Parallel Unsupervised Feature Selection on Spark"],"prefix":"10.1007","author":[{"given":"Bruno","family":"Ordozgoiti","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sandra","family":"G\u00f3mez Canaval","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alberto","family":"Mozo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2015,8,28]]},"reference":[{"key":"21_CR1","doi-asserted-by":"crossref","unstructured":"Boutsidis, C., Mahoney, M.W., Drineas, P.: An improved approximation algorithm for the column subset selection problem. In: Proceedings of the Twentieth Annual ACM-SIAM Symposium on Discrete Algorithms, pp. 968\u2013977. Society for Industrial and Applied Mathematics, January 2009","DOI":"10.1137\/1.9781611973068.105"},{"key":"21_CR2","doi-asserted-by":"crossref","unstructured":"Boutsidis, C., Mahoney, M.W., Drineas, P.: Unsupervised feature selection for principal components analysis. In: Proceedings of the 14th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. ACM (2008)","DOI":"10.1145\/1401890.1401903"},{"key":"21_CR3","unstructured":"Pi, Y., et al.: A scalable approach to column-based low-rank matrix approximation. In: Proceedings of the Twenty-Third International Joint Conference on Artificial Intelligence. AAAI Press (2013)"},{"key":"21_CR4","doi-asserted-by":"crossref","unstructured":"Sun, Z., Li, Z.: Data intensive parallel feature selection method study. In: 2014 International Joint Conference on Neural Networks (IJCNN). IEEE (2014)","DOI":"10.1109\/IJCNN.2014.6889409"},{"key":"21_CR5","unstructured":"Reggiani, C., et al.: Minimum redundancy maximum relevance: mapreduce implementation using apache hadoop. In: BENELEARN 2014, p. 2 (2014)"},{"key":"21_CR6","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1016\/j.asoc.2015.01.035","volume":"30","author":"V Bol\u00f3n-Canedo","year":"2015","unstructured":"Bol\u00f3n-Canedo, V., S\u00e1nchez-Maro\u00f1o, N., Alonso-Betanzos, A.: Distributed feature selection: An application to microarray data classification. Applied Soft Computing 30, 136\u2013150 (2015)","journal-title":"Applied Soft Computing"},{"key":"21_CR7","doi-asserted-by":"crossref","unstructured":"Singh, S., et al.: Parallel large scale feature selection for logistic regression. In: SDM (2009)","DOI":"10.1137\/1.9781611972795.100"},{"issue":"1","key":"21_CR8","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1007\/s10994-013-5373-4","volume":"92","author":"Z Zhao","year":"2013","unstructured":"Zhao, Z., et al.: Massively parallel feature selection: an approach based on variance preservation. Machine Learning 92(1), 195\u2013220 (2013)","journal-title":"Machine Learning"},{"key":"21_CR9","doi-asserted-by":"crossref","unstructured":"Farahat, A.K., et al.: Distributed column subset selection on MapReduce. In: 2013 IEEE 13th International Conference on Data Mining (ICDM). IEEE (2013)","DOI":"10.1109\/ICDM.2013.155"},{"key":"21_CR10","doi-asserted-by":"crossref","unstructured":"He, Q., et al.: Parallel feature selection using positive approximation based on MapReduce. In: 2014 11th International Conference on Fuzzy Systems and Knowledge Discovery (FSKD). IEEE (2014)","DOI":"10.1109\/FSKD.2014.6980867"},{"issue":"1","key":"21_CR11","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1016\/S0024-3795(00)00120-8","volume":"316","author":"C-T Pan","year":"2000","unstructured":"Pan, C.-T.: On the existence and computation of rank-revealing LU factorizations. Linear Algebra and its Applications 316(1), 199\u2013222 (2000)","journal-title":"Linear Algebra and its Applications"},{"key":"21_CR12","unstructured":"Zaharia, M., et al.: Resilient distributed datasets: a fault-tolerant abstraction for in-memory cluster computing. In: Proceedings of the 9th USENIX Conference on Networked Systems Design and Implementation. USENIX Association (2012)"},{"issue":"4","key":"21_CR13","doi-asserted-by":"publisher","first-page":"783","DOI":"10.1137\/0914050","volume":"14","author":"NJ Higham","year":"1993","unstructured":"Higham, N.J.: The accuracy of floating point summation. SIAM Journal on Scientific Computing 14(4), 783\u2013799 (1993)","journal-title":"SIAM Journal on Scientific Computing"},{"key":"21_CR14","doi-asserted-by":"crossref","unstructured":"Kahan, W.: 1965. Pracniques: further remarks on reducing truncation errors. Commun. ACM 8(1), January 1965","DOI":"10.1145\/363707.363723"},{"issue":"1","key":"21_CR15","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Communications of the ACM 51(1), 107\u2013113 (2008)","journal-title":"Communications of the ACM"},{"key":"21_CR16","doi-asserted-by":"crossref","unstructured":"Shvachko, K., et al.: The hadoop distributed file system. In: 2010 IEEE 26th Symposium on Mass Storage Systems and Technologies (MSST). IEEE (2010)","DOI":"10.1109\/MSST.2010.5496972"},{"key":"21_CR17","unstructured":"Murray, D.G., et al.: CIEL: a universal execution engine for distributed data-flow computing. In: NSDI, vol. 11 (2011)"},{"key":"21_CR18","doi-asserted-by":"crossref","unstructured":"Isard, M., et al.: Dryad: distributed data-parallel programs from sequential building blocks. ACM SIGOPS Operating Systems Review 41(3) (2007)","DOI":"10.1145\/1272998.1273005"}],"container-title":["Communications in Computer and Information Science","New Trends in Databases and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-23201-0_21","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,17]],"date-time":"2023-02-17T20:42:46Z","timestamp":1676666566000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-23201-0_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319232003","9783319232010"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-23201-0_21","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2015]]},"assertion":[{"value":"28 August 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}