{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:39:49Z","timestamp":1766219989030,"version":"3.48.0"},"publisher-location":"New York, NY, USA","reference-count":42,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,9,8]]},"DOI":"10.1145\/3754598.3754640","type":"proceedings-article","created":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:34:32Z","timestamp":1766219672000},"page":"730-740","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Decision Shuffle: Efficient Pre-scheduling System for Push-based Shuffle in DAG Computing Frameworks"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-0231-9439","authenticated-orcid":false,"given":"Shihao","family":"Zhang","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-0415-4064","authenticated-orcid":false,"given":"Chi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6882-3754","authenticated-orcid":false,"given":"Chentao","family":"Wu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4974-6116","authenticated-orcid":false,"given":"Jie","family":"Li","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0034-2302","authenticated-orcid":false,"given":"Minyi","family":"Guo","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-3728-8726","authenticated-orcid":false,"given":"Hui","family":"Li","sequence":"additional","affiliation":[{"name":"Inspur (Jinan) Data Technology Co., Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9337-0152","authenticated-orcid":false,"given":"Liqiang","family":"Zhang","sequence":"additional","affiliation":[{"name":"Inspur (Jinan) Data Technology Co., Shandong, China"}]}],"member":"320","published-online":{"date-parts":[[2025,12,20]]},"reference":[{"key":"e_1_3_3_2_2_2","first-page":"267","volume-title":"Proc. 9th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 12)","author":"Ananthanarayanan G.","year":"2012","unstructured":"G. Ananthanarayanan, A. Ghodsi, A. Warfield, D. Borthakur, S. Kandula, S. Shenker, and I. Stoica. 2012. PACMan: Coordinated Memory Caching for Parallel Jobs. In Proc. 9th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 12). 267\u2013280."},{"key":"e_1_3_3_2_3_2","volume-title":"Proc. 9th USENIX Symp. Oper. Syst. Des. Implement. (OSDI 10)","author":"Ananthanarayanan G.","year":"2010","unstructured":"G. Ananthanarayanan, S. Kandula, A. Greenberg, I. Stoica, Y. Lu, B. Saha, and E. Harris. 2010. Reining in the Outliers in Map-Reduce Clusters Using Mantri. In Proc. 9th USENIX Symp. Oper. Syst. Des. Implement. (OSDI 10)."},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/1807128.1807150"},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"publisher","DOI":"10.5220\/0005952300330043"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"crossref","unstructured":"Q. Chen J. Yao and Z. Xiao. 2014. Libra: Lightweight Data Skew Mitigation in MapReduce. IEEE Trans. Parallel Distrib. Syst. 26 9 (2014) 2520\u20132533.","DOI":"10.1109\/TPDS.2014.2350972"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/2663165.2666089"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"publisher","DOI":"10.1145\/3404397.3404430"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"M. Chowdhury and I. Stoica. 2015. Efficient Coflow Scheduling Without Prior Knowledge. ACM SIGCOMM Comput. Commun. Rev. 45 4 (2015) 393\u2013406.","DOI":"10.1145\/2829988.2787480"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"crossref","unstructured":"M. Chowdhury M. Zaharia J. Ma M.\u00a0I. Jordan and I. Stoica. 2011. Managing Data Transfers in Computer Clusters with Orchestra. ACM SIGCOMM Comput. Commun. Rev. 41 4 (2011) 98\u2013109.","DOI":"10.1145\/2043164.2018448"},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/2619239.2626315"},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"crossref","unstructured":"J. Dean and S. Ghemawat. 2008. MapReduce: Simplified Data Processing on Large Clusters. Commun. ACM 51 1 (2008) 107\u2013113.","DOI":"10.1145\/1327452.1327492"},{"key":"e_1_3_3_2_13_2","doi-asserted-by":"publisher","DOI":"10.1109\/CloudCom.2011.21"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3178487.3178510"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2012.58"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"crossref","unstructured":"Y. Guo J. Rao D. Cheng and X. Zhou. 2016. iShuffle: Improving Hadoop Performance with Shuffle-on-Write. IEEE Trans. Parallel Distrib. Syst. (TPDS) 28 6 (2016) 1649\u20131662.","DOI":"10.1109\/TPDS.2016.2587645"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDEW.2010.5452747"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.1145\/1272996.1273005"},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/1629575.1629601"},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"crossref","unstructured":"C. Kurumada S.\u00a0C. Meylan and M.\u00a0C. Frank. 2013. Zipfian Frequency Distributions Facilitate Word Segmentation in Context. Cognition 127 3 (2013) 439\u2013453.","DOI":"10.1016\/j.cognition.2013.02.002"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/2213836.2213840"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","DOI":"10.1145\/2670979.2670985"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"crossref","unstructured":"J.\u00a0X. Lin T. Ji X. Hao H. Cha Y. Le X. Yu and A. Akella. 2023. Towards Accelerating Data Intensive Application\u2019s Shuffle Process Using SmartNICs. Proc. ACM Meas. Anal. Comput. Syst. 7 2 (2023) 1\u201323.","DOI":"10.1145\/3589980"},{"key":"e_1_3_3_2_24_2","first-page":"383","volume-title":"Proc. 12th USENIX Symp. Oper. Syst. Des. Implement. (OSDI 16)","author":"Lion D.","year":"2016","unstructured":"D. Lion, A. Chiu, H. Sun, X. Zhuang, N. Grcevski, and D. Yuan. 2016. Don\u2019t Get Caught in the Cold, Warm-up Your JVM: Understand and Eliminate JVM Warm-up Overhead in Data-Parallel Systems. In Proc. 12th USENIX Symp. Oper. Syst. Des. Implement. (OSDI 16). 383\u2013400."},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1145\/3603269.3604848"},{"key":"e_1_3_3_2_26_2","first-page":"1049","volume-title":"Proc. Int. Conf. Very Large Data Bases (VLDB)","author":"Nambiar R.\u00a0O.","year":"2006","unstructured":"R.\u00a0O. Nambiar and M. Poess. 2006. The Making of TPC-DS. In Proc. Int. Conf. Very Large Data Bases (VLDB), Vol.\u00a06. 1049\u20131058."},{"key":"e_1_3_3_2_27_2","volume-title":"Proc. 14th Workshop Hot Top. Oper. Syst. (HotOS XIV)","author":"Ousterhout K.","year":"2013","unstructured":"K. Ousterhout, A. Panda, J. Rosen, S. Venkataraman, R. Xin, S. Ratnasamy, S. Shenker, and I. Stoica. 2013. The Case for Tiny Tasks in Compute Clusters. In Proc. 14th Workshop Hot Top. Oper. Syst. (HotOS XIV)."},{"key":"e_1_3_3_2_28_2","first-page":"293","volume-title":"Proc. 12th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 15)","author":"Ousterhout K.","year":"2015","unstructured":"K. Ousterhout, R. Rasti, S. Ratnasamy, S. Shenker, and B.\u00a0G. Chun. 2015. Making Sense of Performance in Data Analytics Frameworks. In Proc. 12th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 15). 293\u2013307."},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/2597652.2597684"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/2391229.2391233"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"crossref","unstructured":"M. Shen Y. Zhou and C. Singh. 2020. Magnet: Push-Based Shuffle Service for Large-Scale Data Processing. Proc. VLDB Endow. 13 12 (2020) 3382\u20133395.","DOI":"10.14778\/3415478.3415558"},{"key":"e_1_3_3_2_32_2","unstructured":"K.\u00a0V. Shvachko. 2011. Apache Hadoop. Scalability Update 36 3 (2011) 7\u201313."},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"crossref","unstructured":"P. Stuedi A. Trivedi J. Pfefferle R. Stoica B. Metzler N. Ioannou and I. Koltsidas. 2017. Crail: A High-Performance I\/O Architecture for Distributed Data Processing. IEEE Data Eng. Bull. 40 1 (2017) 38\u201349.","DOI":"10.1145\/3078468.3078477"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"crossref","unstructured":"L.\u00a0G. Valiant. 1990. A Bridging Model for Parallel Computation. Commun. ACM 33 8 (1990) 103\u2013111.","DOI":"10.1145\/79173.79181"},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-25821-3_9"},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-25821-3_9"},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"crossref","unstructured":"J.\u00a0S. Vitter. 1985. Random Sampling with a Reservoir. ACM Trans. Math. Softw. (TOMS) 11 1 (1985) 37\u201357.","DOI":"10.1145\/3147.3165"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/2063384.2063461"},{"key":"e_1_3_3_2_39_2","first-page":"1908","volume-title":"Proc. IEEE Int. Symp. Parallel Distrib. Process. Workshops (IPDPSW)","author":"Rahman M. Wasi-ur","year":"2013","unstructured":"M. Wasi-ur Rahman, N.\u00a0S. Islam, X. Lu, J. Jose, H. Subramoni, H. Wang, and D.\u00a0K. Panda. 2013. High-Performance RDMA-Based Design of Hadoop MapReduce over InfiniBand. In Proc. IEEE Int. Symp. Parallel Distrib. Process. Workshops (IPDPSW). IEEE, 1908\u20131917."},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"crossref","unstructured":"C. Xie R. Chen H. Guan B. Zang and H. Chen. 2015. Sync or Async: Time to Fuse for Distributed Graph-Parallel Computation. ACM SIGPLAN Not. 50 8 (2015) 194\u2013204.","DOI":"10.1145\/2858788.2688508"},{"key":"e_1_3_3_2_41_2","first-page":"15","volume-title":"Proc. 9th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 12)","author":"Zaharia M.","year":"2012","unstructured":"M. Zaharia, M. Chowdhury, T. Das, A. Dave, J. Ma, M. McCauly, M.\u00a0J. Franklin, S. Shenker, and I. Stoica. 2012. Resilient Distributed Datasets: A Fault-Tolerant Abstraction for In-Memory Cluster Computing. In Proc. 9th USENIX Symp. Netw. Syst. Des. Implement. (NSDI 12). 15\u201328."},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"crossref","unstructured":"M. Zaharia R.\u00a0S. Xin P. Wendell T. Das M. Armbrust A. Dave X. Meng J. Rosen S. Venkataraman M.\u00a0J. Franklin et\u00a0al. 2016. Apache Spark: A Unified Engine for Big Data Processing. Commun. ACM 59 11 (2016) 56\u201365.","DOI":"10.1145\/2934664"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"publisher","DOI":"10.1145\/3190508.3190534"}],"event":{"name":"ICPP '25: 54th International Conference on Parallel Processing","location":"San Diego CA USA","acronym":"ICPP '25"},"container-title":["Proceedings of the 54th International Conference on Parallel Processing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3754598.3754640","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:36:54Z","timestamp":1766219814000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3754598.3754640"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,8]]},"references-count":42,"alternative-id":["10.1145\/3754598.3754640","10.1145\/3754598"],"URL":"https:\/\/doi.org\/10.1145\/3754598.3754640","relation":{},"subject":[],"published":{"date-parts":[[2025,9,8]]},"assertion":[{"value":"2025-12-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}