{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:07:13Z","timestamp":1750306033383,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":15,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,12,8]],"date-time":"2017-12-08T00:00:00Z","timestamp":1512691200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Science and Technology Plan of Sichuan Province","award":["2016GZ0322"],"award-info":[{"award-number":["2016GZ0322"]}]},{"name":"Natural Science Foundation of China","award":["61672136, 61650110513"],"award-info":[{"award-number":["61672136, 61650110513"]}]},{"name":"Xi Bu Zhi Guang Plan of Academy of Science","award":["R51A150Z10"],"award-info":[{"award-number":["R51A150Z10"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,12,8]]},"DOI":"10.1145\/3171592.3171610","type":"proceedings-article","created":{"date-parts":[[2018,3,16]],"date-time":"2018-03-16T12:53:36Z","timestamp":1521204816000},"page":"1-6","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["A Comparative Study of Data Skew in Hadoop"],"prefix":"10.1145","author":[{"given":"Majun","family":"He","sequence":"first","affiliation":[{"name":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"}]},{"given":"Guozhong","family":"Li","sequence":"additional","affiliation":[{"name":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"}]},{"given":"Chaojie","family":"Huang","sequence":"additional","affiliation":[{"name":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"}]},{"given":"Yufei","family":"Ye","sequence":"additional","affiliation":[{"name":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"}]},{"given":"Wenhong","family":"Tian","sequence":"additional","affiliation":[{"name":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"}]}],"member":"320","published-online":{"date-parts":[[2017,12,8]]},"reference":[{"issue":"1","key":"e_1_3_2_1_1_1","first-page":"107","volume":"51","author":"Dean J","year":"2004","unstructured":"Dean J , Ghemawat S. MapReduce : Simplified Data Processing on Large Clusters.{J}. In Proceedings of Operating Systems Design and Implementation ( OSDI , 2004 , 51 ( 1 ): 107 -- 113 . Dean J, Ghemawat S. MapReduce: Simplified Data Processing on Large Clusters.{J}. In Proceedings of Operating Systems Design and Implementation (OSDI, 2004, 51(1):107--113.","journal-title":"OSDI"},{"key":"e_1_3_2_1_2_1","volume-title":"Open Cirrus Summit","author":"Kwon Y","year":"2011","unstructured":"Kwon Y , Balazinska M , Howe B , A Study of Skew in MapReduce Applications{J} . Open Cirrus Summit , 2011 . Kwon Y, Balazinska M, Howe B, et al. A Study of Skew in MapReduce Applications{J}. Open Cirrus Summit, 2011."},{"key":"e_1_3_2_1_3_1","unstructured":"Lin J. The Curse of Zipf and Limits to Parallelization: A Look at the Stragglers Problem in MapReduce{J}. 2012:2009.  Lin J. The Curse of Zipf and Limits to Parallelization: A Look at the Stragglers Problem in MapReduce{J}. 2012:2009."},{"issue":"2","key":"e_1_3_2_1_4_1","first-page":"15","volume":"6","author":"Mount R P","year":"2005","unstructured":"Mount R P . The Office of Science Data-Management Challenge{J}. Doe Office of Advanced Scientific Computing Research March\u00cdCmay , 2005 , 6 ( 2 ): 15 -- 16 . Mount R P. The Office of Science Data-Management Challenge{J}. Doe Office of Advanced Scientific Computing Research March\u00cdCmay, 2005, 6(2):15--16.","journal-title":"Doe Office of Advanced Scientific Computing Research March\u00cdCmay"},{"key":"e_1_3_2_1_5_1","volume-title":"Nature","author":"Szalay A","year":"2020","unstructured":"Szalay A , Gray J. 2020 computing: science in an exponential world.{J} . Nature , 2006, 440(7083):413--4. Szalay A, Gray J. 2020 computing: science in an exponential world.{J}. Nature, 2006, 440(7083):413--4."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/SC.Companion.2012.254"},{"key":"e_1_3_2_1_7_1","unstructured":"http:\/\/hadoop.apache.org\/.  http:\/\/hadoop.apache.org\/."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1807128.1807140"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2213836.2213840"},{"key":"e_1_3_2_1_10_1","volume-title":"International Conference on Autonomic Computing","author":"Guo Y","year":"2013","unstructured":"Guo Y , Rao J , Zhou X. i Shuffle : Improving Hadoop Performance with Shuffle-on-Write.{J} . International Conference on Autonomic Computing , 2013 . Guo Y, Rao J, Zhou X. iShuffle: Improving Hadoop Performance with Shuffle-on-Write.{J}. International Conference on Autonomic Computing, 2013."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12083-013-0213-7"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2014.2350972"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/1989323.1989350"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/2063384.2063461"},{"key":"e_1_3_2_1_15_1","unstructured":"PUMA\n  : Purdue mapreduce benchmark suite. https:\/\/engineering.purdue.edu\/~puma\/datasets.htm.  PUMA: Purdue mapreduce benchmark suite. https:\/\/engineering.purdue.edu\/~puma\/datasets.htm."}],"event":{"name":"ICNCC 2017: 2017 VI International Conference on Network, Communication and Computing","acronym":"ICNCC 2017","location":"Kunming China"},"container-title":["Proceedings of the 2017 VI International Conference on Network, Communication and Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3171592.3171610","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3171592.3171610","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T03:02:53Z","timestamp":1750215773000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3171592.3171610"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12,8]]},"references-count":15,"alternative-id":["10.1145\/3171592.3171610","10.1145\/3171592"],"URL":"https:\/\/doi.org\/10.1145\/3171592.3171610","relation":{},"subject":[],"published":{"date-parts":[[2017,12,8]]},"assertion":[{"value":"2017-12-08","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}