{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T06:58:30Z","timestamp":1743058710080,"version":"3.40.3"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031408427"},{"type":"electronic","value":"9783031408434"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-40843-4_29","type":"book-chapter","created":{"date-parts":[[2023,8,24]],"date-time":"2023-08-24T12:02:32Z","timestamp":1692878552000},"page":"391-402","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["An Earlier Experiences Towards Optimizing Apache Spark Over\u00a0Frontera Supercomputer"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6175-4012","authenticated-orcid":false,"given":"Samuel","family":"Bernardo","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6547-714X","authenticated-orcid":false,"given":"Amit","family":"Ruhela","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6607-2152","authenticated-orcid":false,"given":"John","family":"Cazes","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5327-525X","authenticated-orcid":false,"given":"Stephen Lien","family":"Harrell","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9142-2596","authenticated-orcid":false,"given":"Jorge","family":"Gomes","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,8,25]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Al-Attar, K., Shafi, A., Abduljabbar, M., Subramoni, H., Panda, D.K.: Spark meets MPI: towards high-performance communication framework for spark using MPI. In: 2022 IEEE International Conference on Cluster Computing (CLUSTER), pp. 71\u201381. IEEE (2022)","key":"29_CR1","DOI":"10.1109\/CLUSTER51413.2022.00022"},{"unstructured":"Bernardo, S.: Distributed computing toolkit for machine learning operations\/workshops\/isc 2023 ixpug\/pi calculus $$\\cdot $$ gitlab, March 2023. https:\/\/gitlab.com\/distributed-computing-toolkit\/workshops\/isc-2023-ixpug\/pi-calculus. Accessed on 03 Mar 2023","key":"29_CR2"},{"unstructured":"Carbone, P., Katsifodimos, A., Ewen, S., Markl, V., Haridi, S., Tzoumas, K.: Apache flink: stream and batch processing in a single engine. Bull. Tech. Comm. Data Eng. 38(4) (2015). https:\/\/asterios.katsifodimos.com\/assets\/publications\/flink-deb.pdf","key":"29_CR3"},{"issue":"1","key":"29_CR4","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1177\/1094342017701278","volume":"32","author":"J Conejero","year":"2018","unstructured":"Conejero, J., Corella, S., Badia, R.M., Labarta, J.: Task-based programming in COMPSs to converge from HPC to big data. Int. J. High Perform. Comput. Appl. 32(1), 45\u201360 (2018)","journal-title":"Int. J. High Perform. Comput. Appl."},{"unstructured":"Dean, J., Ghemawat, S.: Mapreduce: simplified data processing on large clusters (2004)","key":"29_CR5"},{"doi-asserted-by":"crossref","unstructured":"Guller, M., Guller, M.: Cluster managers. Big Data Analytics with Spark: A Practitioner\u2019s Guide to Using Spark for Large-Scale Data Processing, Machine Learning, and Graph Analytics, and High-Velocity Data Stream Processing, pp. 231\u2013242 (2015)","key":"29_CR6","DOI":"10.1007\/978-1-4842-0964-6_10"},{"doi-asserted-by":"crossref","unstructured":"Hayot-Sasson, V., Glatard, T.: Evaluation of pilot jobs for apache spark applications on HPC clusters. In: 2019 15th International Conference on eScience (eScience), pp. 146\u2013155. IEEE (2019)","key":"29_CR7","DOI":"10.1109\/eScience.2019.00023"},{"unstructured":"Hindman, B., et al.: Mesos: a platform for fine-grained resource sharing in the data center. In: NSDI, vol. 11, p. 22 (2011)","key":"29_CR8"},{"doi-asserted-by":"crossref","unstructured":"Lu, X., Rahman, M.W.U., Islam, N., Shankar, D., Panda, D.K.: Accelerating spark with RDMA for big data processing: early experiences. In: 2014 IEEE 22nd Annual Symposium on High-Performance Interconnects, pp. 9\u201316. IEEE (2014)","key":"29_CR9","DOI":"10.1109\/HOTI.2014.15"},{"doi-asserted-by":"crossref","unstructured":"Lu, X., Shankar, D., Gugnani, S., Panda, D.K.: High-performance design of apache spark with RDMA and its benefits on various workloads. In: 2016 IEEE International Conference on Big Data (Big Data), pp. 253\u2013262. IEEE (2016)","key":"29_CR10","DOI":"10.1109\/BigData.2016.7840611"},{"issue":"1","key":"29_CR11","first-page":"1235","volume":"17","author":"X Meng","year":"2016","unstructured":"Meng, X., et al.: Mllib: machine learning in apache spark. J. Mach. Learn. Res. 17(1), 1235\u20131241 (2016)","journal-title":"J. Mach. Learn. Res."},{"doi-asserted-by":"crossref","unstructured":"Stanzione, D., West, J., Evans, R.T., Minyard, T., Ghattas, O., Panda, D.K.: Frontera: the evolution of leadership computing at the national science foundation. In: Practice and Experience in Advanced Research Computing, pp. 106\u2013111 (2020)","key":"29_CR12","DOI":"10.1145\/3311790.3396656"},{"unstructured":"Thiruvathukal, G.K., Christensen, C., Jin, X., Tessier, F., Vishwanath, V.: A benchmarking study to evaluate apache spark on large-scale supercomputers. arXiv preprint arXiv:1904.11812 (2019)","key":"29_CR13"},{"doi-asserted-by":"crossref","unstructured":"Vavilapalli, V.K., et al.: Apache Hadoop YARN: yet another resource negotiator. In: Proceedings of the 4th Annual Symposium on Cloud Computing, pp. 1\u201316 (2013)","key":"29_CR14","DOI":"10.1145\/2523616.2523633"},{"doi-asserted-by":"crossref","unstructured":"Verma, A., Pedrosa, L., Korupolu, M.R., Oppenheimer, D., Tune, E., Wilkes, J.: Large-scale cluster management at Google with Borg. In: Proceedings of the European Conference on Computer Systems (EuroSys). Bordeaux, France (2015)","key":"29_CR15","DOI":"10.1145\/2741948.2741964"},{"key":"29_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1007\/10968987_3","volume-title":"Job Scheduling Strategies for Parallel Processing","author":"AB Yoo","year":"2003","unstructured":"Yoo, A.B., Jette, M.A., Grondona, M.: SLURM: simple Linux utility for resource management. In: Feitelson, D., Rudolph, L., Schwiegelshohn, U. (eds.) JSSPP 2003. LNCS, vol. 2862, pp. 44\u201360. Springer, Heidelberg (2003). https:\/\/doi.org\/10.1007\/10968987_3"},{"unstructured":"Zaharia, M., et al.: Resilient distributed datasets: a fault-tolerant abstraction for in-memory cluster computing. In: Presented as part of the 9th $$\\{$$USENIX$$\\}$$ Symposium on Networked Systems Design and Implementation ($$\\{$$NSDI$$\\}$$ 12), pp. 15\u201328 (2012)","key":"29_CR17"},{"issue":"10\u201310","key":"29_CR18","first-page":"95","volume":"10","author":"M Zaharia","year":"2010","unstructured":"Zaharia, M., Chowdhury, M., Franklin, M.J., Shenker, S., Stoica, I., et al.: Spark: cluster computing with working sets. HotCloud 10(10\u201310), 95 (2010)","journal-title":"HotCloud"}],"container-title":["Lecture Notes in Computer Science","High Performance Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-40843-4_29","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,24]],"date-time":"2023-08-24T12:06:36Z","timestamp":1692878796000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-40843-4_29"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031408427","9783031408434"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-40843-4_29","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"25 August 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ISC High Performance","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on High Performance Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hamburg","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 May 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 May 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"38","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"supercomputing2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.isc-hpc.com\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Linklings","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"70","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"49","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"70% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}