{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T17:08:31Z","timestamp":1743008911898,"version":"3.40.3"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030586683"},{"type":"electronic","value":"9783030586690"}],"license":[{"start":{"date-parts":[[2020,9,20]],"date-time":"2020-09-20T00:00:00Z","timestamp":1600560000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,9,20]],"date-time":"2020-09-20T00:00:00Z","timestamp":1600560000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-58669-0_36","type":"book-chapter","created":{"date-parts":[[2020,9,19]],"date-time":"2020-09-19T07:03:35Z","timestamp":1600499015000},"page":"394-403","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Memory Management Approaches in Apache Spark: A Review"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3394-1950","authenticated-orcid":false,"given":"Maha","family":"Dessokey","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9014-5590","authenticated-orcid":false,"given":"Sherif M.","family":"Saif","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7553-4002","authenticated-orcid":false,"given":"Sameh","family":"Salem","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4662-3874","authenticated-orcid":false,"given":"Elsayed","family":"Saad","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9669-5991","authenticated-orcid":false,"given":"Hesham","family":"Eldeeb","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,9,20]]},"reference":[{"issue":"1","key":"36_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-014-0008-6","volume":"2","author":"D Singh","year":"2014","unstructured":"Singh, D., Reddy, C.K.: A survey on platforms for big data analytics. J. Big Data 2(1), 1\u201320 (2014). https:\/\/doi.org\/10.1186\/s40537-014-0008-6","journal-title":"J. Big Data"},{"issue":"1","key":"36_CR2","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008)","journal-title":"Commun. ACM"},{"issue":"10\u201310","key":"36_CR3","first-page":"95","volume":"10","author":"M Zaharia","year":"2010","unstructured":"Zaharia, M., et al.: Spark: cluster computing with working sets. HotCloud 10(10\u201310), 95 (2010)","journal-title":"HotCloud"},{"doi-asserted-by":"crossref","unstructured":"Gu, L., Li, H.: Memory or time: performance evaluation for iterative operation on Hadoop and spark. In: 2013 IEEE 10th International Conference on High Performance Computing and Communications (2013)","key":"36_CR4","DOI":"10.1109\/HPCC.and.EUC.2013.106"},{"doi-asserted-by":"crossref","unstructured":"Costa, C.H.A., et al.: Optimization of genomics analysis pipeline for scalable performance in a cloud environment. In: 2018 IEEE International Conference on Bioinformatics and Biomedicine (BIBM) (2018)","key":"36_CR5","DOI":"10.1109\/BIBM.2018.8621208"},{"doi-asserted-by":"crossref","unstructured":"Sarumi, O.A., Leung, C.K.: Exploiting anti-monotonic constraints in mining palindromic motifs from big genomic data. In: 2019 IEEE International Conference on Big Data (Big Data) (2019)","key":"36_CR6","DOI":"10.1109\/BigData47090.2019.9006397"},{"key":"36_CR7","doi-asserted-by":"publisher","first-page":"154035","DOI":"10.1109\/ACCESS.2019.2948949","volume":"7","author":"H Zhou","year":"2019","unstructured":"Zhou, H., et al.: A big data mining approach of PSO-based BP neural network for financial risk management with IoT. IEEE Access 7, 154035\u2013154043 (2019)","journal-title":"IEEE Access"},{"doi-asserted-by":"crossref","unstructured":"Zhang, Z., et al. Scientific computing meets big data technology: an astronomy use case. In: 2015 IEEE International Conference on Big Data (Big Data) (2015)","key":"36_CR8","DOI":"10.1109\/BigData.2015.7363840"},{"key":"36_CR9","volume-title":"Learning Spark: Lightning-Fast Big Data Analysis","author":"H Karau","year":"2015","unstructured":"Karau, H., et al.: Learning Spark: Lightning-Fast Big Data Analysis. O\u2019Reilly Media, Newton (2015)"},{"doi-asserted-by":"crossref","unstructured":"Zaharia, M.: An Architecture for Fast and General Data Processing on Large Clusters. Association for Computing Machinery and Morgan & Claypool Publishers (2016)","key":"36_CR10","DOI":"10.1145\/2886107"},{"unstructured":"Berger, D.S., Sitaraman, R.K., Harchol-Balter, M.: Adaptsize: orchestrating the hot object memory cache in a content delivery network. In: Proceedings of the 14th USENIX Conference on Networked Systems Design and Implementation, pp. 483\u2013498. USENIX Association, Boston (2017)","key":"36_CR11"},{"unstructured":"Megiddo, N., Modha, D.S.: ARC: a self-tuning, low overhead replacement cache. In: Proceedings of the 2nd USENIX Conference on File and Storage Technologies, pp. 115\u2013130. USENIX Association, San Francisco (2003)","key":"36_CR12"},{"issue":"1","key":"36_CR13","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1145\/511399.511340","volume":"30","author":"S Jiang","year":"2002","unstructured":"Jiang, S., Zhang, X.: LIRS: an efficient low inter-reference recency set replacement policy to improve buffer cache performance. SIGMETRICS Perform. Eval. Rev. 30(1), 31\u201342 (2002)","journal-title":"SIGMETRICS Perform. Eval. Rev."},{"issue":"8","key":"36_CR14","doi-asserted-by":"publisher","first-page":"2473","DOI":"10.1002\/cpe.3584","volume":"28","author":"M Duan","year":"2016","unstructured":"Duan, M., et al.: Selection and replacement algorithms for memory performance improvement in Spark. Concurr. Comput.: Pract. Exp. 28(8), 2473\u20132486 (2016)","journal-title":"Concurr. Comput.: Pract. Exp."},{"issue":"6","key":"36_CR15","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1007\/s10766-016-0470-1","volume":"45","author":"Y Geng","year":"2017","unstructured":"Geng, Y., et al.: LCS: an efficient data eviction strategy for Spark. Int. J. Parallel Program. 45(6), 1285\u20131297 (2017)","journal-title":"Int. J. Parallel Program."},{"issue":"9","key":"36_CR16","first-page":"27","volume":"5","author":"C Zhao","year":"2019","unstructured":"Zhao, C., et al.: Research cache replacement strategy in memory optimization of spark. Int. J. New Technol. Res. (IJNTR) 5(9), 27\u201332 (2019)","journal-title":"Int. J. New Technol. Res. (IJNTR)"},{"doi-asserted-by":"crossref","unstructured":"Yu, Y., et al. LRC: dependency-aware cache management for data analytics clusters. In: IEEE INFOCOM 2017-IEEE Conference on Computer Communications. IEEE (2017)","key":"36_CR17","DOI":"10.1109\/INFOCOM.2017.8057007"},{"doi-asserted-by":"crossref","unstructured":"Yu, Y., et al. LERC: coordinated cache management for data-parallel systems. In: GLOBECOM 2017-2017 IEEE Global Communications Conference. IEEE (2017)","key":"36_CR18","DOI":"10.1109\/GLOCOM.2017.8254999"},{"doi-asserted-by":"crossref","unstructured":"Wang, B., et al.: LCRC: a dependency-aware cache management policy for Spark. In: 2018 IEEE International Conference on Parallel and Distributed Processing with Applications. IEEE (2018)","key":"36_CR19","DOI":"10.1109\/BDCloud.2018.00140"},{"doi-asserted-by":"crossref","unstructured":"Perez, T.B.G., Zhou, X., Cheng, D.: Reference-distance eviction and prefetching for cache management in Spark. In: Proceedings of the 47th International Conference on Parallel Processing, Association for Computing Machinery, p. Article 88, Eugene (2018)","key":"36_CR20","DOI":"10.1145\/3225058.3225087"},{"doi-asserted-by":"crossref","unstructured":"Huang, S., et al.: The HiBench benchmark suite: characterization of the MapReduce-based data analysis. In: 2010 IEEE 26th International Conference on Data Engineering Workshops (ICDEW 2010). IEEE (2010)","key":"36_CR21","DOI":"10.1109\/ICDEW.2010.5452747"},{"issue":"3","key":"36_CR22","doi-asserted-by":"publisher","first-page":"2575","DOI":"10.1007\/s10586-016-0723-1","volume":"20","author":"M Li","year":"2017","unstructured":"Li, M., et al.: SparkBench: a spark benchmarking suite characterizing largescale in-memory data analytics. Cluster Comput. 20(3), 2575\u20132589 (2017)","journal-title":"Cluster Comput."},{"doi-asserted-by":"crossref","unstructured":"Yang, Z., et al.: Intermediate data caching optimization for multi-stage and parallel big data frameworks. In: 2018 IEEE 11th International Conference on Cloud Computing (CLOUD). IEEE (2018)","key":"36_CR23","DOI":"10.1109\/CLOUD.2018.00042"},{"doi-asserted-by":"crossref","unstructured":"Niu, D., et al.: The classified and active caching strategy for iterative application in Spark. In: 2018 27th International Conference on Computer Communication and Networks (ICCCN). IEEE (2018)","key":"36_CR24","DOI":"10.1109\/ICCCN.2018.8487381"},{"unstructured":"Xu, E., Saxena, M., Chiu, L.: Neutrino: revisiting memory caching for iterative data analytics. In: 8th {USENIX} Workshop on Hot Topics in Storage and File Systems (HotStorage 2016) (2016)","key":"36_CR25"},{"doi-asserted-by":"crossref","unstructured":"Zhou, P., et al. Doppio: I\/O-aware performance analysis, modeling and optimization for in-memory computing framework. IEEE. (2018)","key":"36_CR26","DOI":"10.1109\/ISPASS.2018.00011"},{"unstructured":"RubiX. https:\/\/github.com\/qubole\/rubix","key":"36_CR27"},{"unstructured":"Azure HDInsight. https:\/\/docs.microsoft.com\/en-us\/azure\/hdinsight\/spark\/apache-spark-improve-performance-iocache","key":"36_CR28"},{"unstructured":"Databricks Delta Lake. https:\/\/docs.databricks.com\/delta\/optimizations\/delta-cache.html","key":"36_CR29"},{"unstructured":"Open Cache Acceleration. https:\/\/open-cas.github.io\/","key":"36_CR30"},{"unstructured":"Alluxio. https:\/\/www.alluxio.io\/","key":"36_CR31"}],"container-title":["Advances in Intelligent Systems and Computing","Proceedings of the International Conference on Advanced Intelligent Systems and Informatics 2020"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-58669-0_36","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,2,26]],"date-time":"2021-02-26T15:51:19Z","timestamp":1614354679000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-58669-0_36"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,9,20]]},"ISBN":["9783030586683","9783030586690"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-58669-0_36","relation":{},"ISSN":["2194-5357","2194-5365"],"issn-type":[{"type":"print","value":"2194-5357"},{"type":"electronic","value":"2194-5365"}],"subject":[],"published":{"date-parts":[[2020,9,20]]},"assertion":[{"value":"20 September 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AISI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Intelligent Systems and Informatics","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Cairo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Egypt","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 October 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 October 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aisi2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/egyptscience.net\/AISI2020\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}