{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:07:01Z","timestamp":1759133221377,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":25,"publisher":"ACM","license":[{"start":{"date-parts":[[2018,7,19]],"date-time":"2018-07-19T00:00:00Z","timestamp":1531958400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100008297","name":"Cray Incorporated","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100008297","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000185","name":"Defense Advanced Research Projects Agency","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000185","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2018,7,19]]},"DOI":"10.1145\/3219819.3219927","type":"proceedings-article","created":{"date-parts":[[2018,7,19]],"date-time":"2018-07-19T13:05:12Z","timestamp":1532005512000},"page":"293-301","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":9,"title":["Accelerating Large-Scale Data Analysis by Offloading to High-Performance Computing Libraries using Alchemist"],"prefix":"10.1145","author":[{"given":"Alex","family":"Gittens","sequence":"first","affiliation":[{"name":"Rensselaer Polytechnic Institute, Troy, NY, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kai","family":"Rothauge","sequence":"additional","affiliation":[{"name":"University of California, Berkeley, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shusen","family":"Wang","sequence":"additional","affiliation":[{"name":"University of California, Berkeley, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michael W.","family":"Mahoney","sequence":"additional","affiliation":[{"name":"University of California, Berkeley, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lisa","family":"Gerhardt","sequence":"additional","affiliation":[{"name":"NERSC\/LBNL, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Prabhat","sequence":"additional","affiliation":[{"name":"NERSC\/LBNL, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jey","family":"Kottalam","sequence":"additional","affiliation":[{"name":"University of California, Berkeley, Berkeley, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michael","family":"Ringenburg","sequence":"additional","affiliation":[{"name":"Cray Inc., Seattle, WA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kristyn","family":"Maschhoff","sequence":"additional","affiliation":[{"name":"Cray Inc., Seattle, WA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2018,7,19]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.14778\/3090163.3090168"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2842602"},{"volume-title":"TIMIT Acoustic-Phonetic Continuous Speech Corpus. deftempurl%https:\/\/catalog.ldc.upenn.edu\/LDC93S1 Retrieved","year":"2018","author":"Garofolo J. S.","key":"e_1_3_2_1_3_1"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"A. Gittens A. Devarakonda E. Racah M. Ringenburg L. Gerhardt J. Kottalam J. Liu K. Maschhoff S. Canon J. Chhugani P. Sharma J. Yang J. Demmel J. Harrell V. Krishnamurthy M. W. Mahoney and Prabhat . 2016. Matrix factorizations at scale: A comparison of scientific data analytics in Spark and C  A. Gittens A. Devarakonda E. Racah M. Ringenburg L. Gerhardt J. Kottalam J. Liu K. Maschhoff S. Canon J. Chhugani P. Sharma J. Yang J. Demmel J. Harrell V. Krishnamurthy M. W. Mahoney and Prabhat . 2016. Matrix factorizations at scale: A comparison of scientific data analytics in Spark and C","DOI":"10.1109\/BigData.2016.7840606"},{"volume-title":"2016 IEEE International Conference on Big Data (Big Data). 204--213","author":"MPI","key":"e_1_3_2_1_5_1"},{"volume-title":"Alchemist: An Apache Spark <=> MPI Interface. Concurrency and Computation Practice and Experience on the Cray User Group","year":"2018","author":"Gittens A.","key":"e_1_3_2_1_6_1"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"P.-S. Huang H. Avron T. N. Sainath V. Sindhwani and B. Ramabhadran . 2014. Kernel methods match Deep Neural Networks on TIMIT 2014 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP). 205--209.  P.-S. Huang H. Avron T. N. Sainath V. Sindhwani and B. Ramabhadran . 2014. Kernel methods match Deep Neural Networks on TIMIT 2014 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP). 205--209.","DOI":"10.1109\/ICASSP.2014.6853587"},{"key":"e_1_3_2_1_8_1","unstructured":"C. Kohlhoff . 2018. Boost.Asio. deftempurl%https:\/\/www.boost.org\/ tempurl  C. Kohlhoff . 2018. Boost.Asio. deftempurl%https:\/\/www.boost.org\/ tempurl"},{"volume-title":"ARPACK: Solution of Large Scale Eigenvalue Problems with Implicitly Restarted Arnoldi Methods. deftempurl%http:\/\/www.caam.rice.edu\/software\/ARPACK\/ tempurl","year":"1997","author":"Lehoucq R. B.","key":"e_1_3_2_1_9_1"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"N. Malitsky A. Chaudhary S. Jourdain M. Cowan P. O'Leary M. Hanwell and K. K. Van Dam . 2017. Building near-real-time processing pipelines with the Spark-MPI platform 2017 New York Scientific Data Summit (NYSDS). 1--8.  N. Malitsky A. Chaudhary S. Jourdain M. Cowan P. O'Leary M. Hanwell and K. K. Van Dam . 2017. Building near-real-time processing pipelines with the Spark-MPI platform 2017 New York Scientific Data Summit (NYSDS). 1--8.","DOI":"10.1109\/NYSDS.2017.8085039"},{"volume-title":"MPI: A Message-Passing Interface Standard: Version 3.1. Technical Report. deftempurl%https:\/\/www.mpi-forum.org\/docs\/ tempurl","year":"2015","key":"e_1_3_2_1_11_1"},{"key":"e_1_3_2_1_12_1","unstructured":"MPICH 2018. MPICH: High-Performance Portable MPI. https:\/\/www.mpich.org\/  MPICH 2018. MPICH: High-Performance Portable MPI. https:\/\/www.mpich.org\/"},{"volume-title":"MPI","year":"2018","key":"e_1_3_2_1_13_1"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/2427023.2427030"},{"key":"e_1_3_2_1_15_1","unstructured":"A. Rahimi and B. Recht . 2008. Random features for large-scale kernel machines. In Advances in Neural Information Processing Systems.   A. Rahimi and B. Recht . 2008. Random features for large-scale kernel machines. In Advances in Neural Information Processing Systems."},{"volume-title":"Big data analytics in the cloud: Spark on Hadoop vs MPI\/OpenMP on Beowulf Procedia Computer Science","author":"Reyes-Ortiz J. L.","key":"e_1_3_2_1_16_1"},{"volume-title":"Alchemist: An Apache Spark $<$=$>$ MPI Interface. deftempurl%http:\/\/github.com\/project-alchemist\/ tempurl","year":"2018","author":"Rothauge K.","key":"e_1_3_2_1_17_1"},{"edition":"2","volume-title":"Iterative methods for sparse linear systems (bibinfoedition","author":"Saad Y.","key":"e_1_3_2_1_18_1"},{"volume-title":"January 1979 to","year":"2010","author":"Saha S.","key":"e_1_3_2_1_19_1"},{"volume-title":"Smart-MLlib: A High-Performance Machine-Learning Library 2016 IEEE International Conference on Cluster Computing (CLUSTER). 336--345","year":"2016","author":"Siegal D.","key":"e_1_3_2_1_20_1"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2016.93"},{"volume-title":"Large scale kernel learning using block coordinate descent. arXiv preprint arXiv:1602.05310","year":"2016","author":"Tu S.","key":"e_1_3_2_1_22_1"},{"volume-title":"et almbox","year":"2017","author":"Vishnu A.","key":"e_1_3_2_1_23_1"},{"volume-title":"Proceedings of the 9th USENIX Conference on Networked Systems Design and Implementation (NSDI). 15--28","year":"2012","author":"Zaharia M.","key":"e_1_3_2_1_24_1"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/2934664"}],"event":{"name":"KDD '18: The 24th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"],"location":"London United Kingdom","acronym":"KDD '18"},"container-title":["Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3219819.3219927","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3219819.3219927","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3219819.3219927","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T02:07:21Z","timestamp":1750212441000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3219819.3219927"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,7,19]]},"references-count":25,"alternative-id":["10.1145\/3219819.3219927","10.1145\/3219819"],"URL":"https:\/\/doi.org\/10.1145\/3219819.3219927","relation":{},"subject":[],"published":{"date-parts":[[2018,7,19]]},"assertion":[{"value":"2018-07-19","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}