{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T07:52:55Z","timestamp":1768031575330,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,5,6]],"date-time":"2015-05-06T00:00:00Z","timestamp":1430870400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,5,6]]},"DOI":"10.1145\/2742854.2747283","type":"proceedings-article","created":{"date-parts":[[2015,5,11]],"date-time":"2015-05-11T16:31:04Z","timestamp":1431361864000},"page":"1-8","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":120,"title":["SparkBench"],"prefix":"10.1145","author":[{"given":"Min","family":"Li","sequence":"first","affiliation":[{"name":"IBM TJ Watson Research Center"}]},{"given":"Jian","family":"Tan","sequence":"additional","affiliation":[{"name":"IBM TJ Watson Research Center"}]},{"given":"Yandong","family":"Wang","sequence":"additional","affiliation":[{"name":"IBM TJ Watson Research Center"}]},{"given":"Li","family":"Zhang","sequence":"additional","affiliation":[{"name":"IBM TJ Watson Research Center"}]},{"given":"Valentina","family":"Salapura","sequence":"additional","affiliation":[{"name":"IBM TJ Watson Research Center"}]}],"member":"320","published-online":{"date-parts":[[2015,5,6]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"http:\/\/www.tpc.org\/tpcds\/","author":"DS.","year":"2014","unstructured":"TPC- DS. http:\/\/www.tpc.org\/tpcds\/ , 2014 . TPC-DS. http:\/\/www.tpc.org\/tpcds\/, 2014."},{"key":"e_1_3_2_1_2_1","volume-title":"http:\/\/www.tpc.org\/tpch\/","author":"H.","year":"2014","unstructured":"TPC- H. http:\/\/www.tpc.org\/tpch\/ , 2014 . TPC-H. http:\/\/www.tpc.org\/tpch\/, 2014."},{"key":"e_1_3_2_1_3_1","volume-title":"Big Data Benchmark. https:\/\/amplab.cs.berkeley.edu\/benchmark\/","year":"2013","unstructured":"AMPLab. Big Data Benchmark. https:\/\/amplab.cs.berkeley.edu\/benchmark\/ , 2013 . AMPLab. Big Data Benchmark. https:\/\/amplab.cs.berkeley.edu\/benchmark\/, 2013."},{"key":"e_1_3_2_1_4_1","unstructured":"Apache. Spark. http:\/\/spark.apache.org\/.  Apache. Spark. http:\/\/spark.apache.org\/."},{"key":"e_1_3_2_1_5_1","volume-title":"http:\/\/hadoop.apache.org\/docs\/r1.2.1\/gridmix.html","year":"2013","unstructured":"Apache. GridMix. http:\/\/hadoop.apache.org\/docs\/r1.2.1\/gridmix.html , 2013 . Apache. GridMix. http:\/\/hadoop.apache.org\/docs\/r1.2.1\/gridmix.html, 2013."},{"key":"e_1_3_2_1_6_1","volume-title":"https:\/\/cwiki.apache.org\/confluence\/display\/PIG\/PigMix","year":"2013","unstructured":"Apache. PigMix. https:\/\/cwiki.apache.org\/confluence\/display\/PIG\/PigMix , 2013 . Apache. PigMix. https:\/\/cwiki.apache.org\/confluence\/display\/PIG\/PigMix, 2013."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2465296"},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of the Hadoop Summit. Santa Clara","author":"Avery C.","year":"2011","unstructured":"C. Avery . Giraph : Large-scale graph processing infrastructure on hadoop . Proceedings of the Hadoop Summit. Santa Clara , 2011 . C. Avery. Giraph: Large-scale graph processing infrastructure on hadoop. Proceedings of the Hadoop Summit. Santa Clara, 2011."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/1807128.1807152"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/1327452.1327492"},{"key":"e_1_3_2_1_11_1","unstructured":"FaceBook. Social Network Graph. http:\/\/snap.stanford.edu\/data\/egonets-Facebook.html.  FaceBook. Social Network Graph. http:\/\/snap.stanford.edu\/data\/egonets-Facebook.html."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2150976.2150982"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2463712"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2008.22"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDEW.2010.5452747"},{"key":"e_1_3_2_1_16_1","unstructured":"IBM. Big Data and Analytics Hub. http:\/\/www.ibmbigdatahub.com\/infographic\/four-vs-big-data.  IBM. Big Data and Analytics Hub. http:\/\/www.ibmbigdatahub.com\/infographic\/four-vs-big-data."},{"key":"e_1_3_2_1_17_1","unstructured":"IBM. SoftLayer. http:\/\/www.softlayer.com\/.  IBM. SoftLayer. http:\/\/www.softlayer.com\/."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-7138-7"},{"key":"e_1_3_2_1_19_1","volume-title":"Efficient triangle counting in large graphs via degree-based vertex partitioning. Internet Mathematics, 8(1--2): 161--185","author":"Kolountzakis M. N.","year":"2012","unstructured":"M. N. Kolountzakis , G. L. Miller , R. Peng , and C. E. Tsourakakis . Efficient triangle counting in large graphs via degree-based vertex partitioning. Internet Mathematics, 8(1--2): 161--185 , 2012 . M. N. Kolountzakis, G. L. Miller, R. Peng, and C. E. Tsourakakis. Efficient triangle counting in large graphs via degree-based vertex partitioning. Internet Mathematics, 8(1--2): 161--185, 2012."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/1401890.1401944"},{"key":"e_1_3_2_1_21_1","unstructured":"M. Li J. Tan Y. Wang L. Zhang and V. Salapura. SparkBench: A Comprehensive Spark Benchmarking Suite. https:\/\/bitbucket.org\/lm0926\/sparkbench.  M. Li J. Tan Y. Wang L. Zhang and V. Salapura. SparkBench: A Comprehensive Spark Benchmarking Suite. https:\/\/bitbucket.org\/lm0926\/sparkbench."},{"key":"e_1_3_2_1_22_1","unstructured":"S. Neumann. Spark vs. Hadoop MapReduce. https:\/\/www.xplenty.com\/blog\/2014\/11\/apache-spark-vs-hadoop-mapreduce\/.  S. Neumann. Spark vs. Hadoop MapReduce. https:\/\/www.xplenty.com\/blog\/2014\/11\/apache-spark-vs-hadoop-mapreduce\/."},{"key":"e_1_3_2_1_23_1","unstructured":"C. Nyberg M. Shah and N. Govindaraju. Sort Benchmark. http:\/\/sortbenchmark.org\/ 2014.  C. Nyberg M. Shah and N. Govindaraju. Sort Benchmark. http:\/\/sortbenchmark.org\/ 2014."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/1559845.1559865"},{"key":"e_1_3_2_1_26_1","unstructured":"Twitter. Twitter4j: a Java Library for the Twitter API. http:\/\/twitter4j.org.  Twitter. Twitter4j: a Java Library for the Twitter API. http:\/\/twitter4j.org."},{"key":"e_1_3_2_1_27_1","unstructured":"L. Wang J. Zhan C. Luo Y. Zhu Q. Yang Y. He W. Gao Z. Jia Y. Shi S. Zhang C. Zheng G. Lu K. Zhan X. Li and B. Qiu. BigDataBench. http:\/\/prof.ict.ac.cn\/BigDataBench\/ 2014.  L. Wang J. Zhan C. Luo Y. Zhu Q. Yang Y. He W. Gao Z. Jia Y. Shi S. Zhang C. Zheng G. Lu K. Zhan X. Li and B. Qiu. BigDataBench. http:\/\/prof.ict.ac.cn\/BigDataBench\/ 2014."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2014.6835958"},{"key":"e_1_3_2_1_29_1","unstructured":"Wikipedia. Data Dumps. http:\/\/dumps.wikimedia.org\/enwiki\/.  Wikipedia. Data Dumps. http:\/\/dumps.wikimedia.org\/enwiki\/."},{"key":"e_1_3_2_1_30_1","unstructured":"A. Woodie. Spark Smashes MapReduce in Big Data Benchmark. http:\/\/www.datanami.com\/2014\/10\/10\/spark-smashes-mapreduce-big-data-benchmark\/.  A. Woodie. Spark Smashes MapReduce in Big Data Benchmark. http:\/\/www.datanami.com\/2014\/10\/10\/spark-smashes-mapreduce-big-data-benchmark\/."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2013.6691707"},{"key":"e_1_3_2_1_32_1","volume-title":"Proceedings of the 9th USENIX NSDI","author":"Zaharia M.","year":"2012","unstructured":"M. Zaharia , M. Chowdhury , T. Das , A. Dave , J. Ma , M. McCauley , M. J. Franklin , S. Shenker , and I. Stoica . Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing . In Proceedings of the 9th USENIX NSDI , Berkeley, CA, USA , 2012 . M. Zaharia, M. Chowdhury, T. Das, A. Dave, J. Ma, M. McCauley, M. J. Franklin, S. Shenker, and I. Stoica. Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing. In Proceedings of the 9th USENIX NSDI, Berkeley, CA, USA, 2012."}],"event":{"name":"CF'15: Computing Frontiers Conference","location":"Ischia Italy","acronym":"CF'15","sponsor":["SIGMICRO ACM Special Interest Group on Microarchitectural Research and Processing"]},"container-title":["Proceedings of the 12th ACM International Conference on Computing Frontiers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2742854.2747283","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2742854.2747283","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T06:16:34Z","timestamp":1750227394000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2742854.2747283"}},"subtitle":["a comprehensive benchmarking suite for in memory data analytic platform Spark"],"short-title":[],"issued":{"date-parts":[[2015,5,6]]},"references-count":31,"alternative-id":["10.1145\/2742854.2747283","10.1145\/2742854"],"URL":"https:\/\/doi.org\/10.1145\/2742854.2747283","relation":{},"subject":[],"published":{"date-parts":[[2015,5,6]]},"assertion":[{"value":"2015-05-06","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}