{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T13:42:35Z","timestamp":1769694155636,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T00:00:00Z","timestamp":1769558400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["2216971"],"award-info":[{"award-number":["2216971"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Science Foundation","award":["2106699"],"award-info":[{"award-number":["2106699"]}]},{"name":"National Science Foundation","award":["2107280"],"award-info":[{"award-number":["2107280"]}]},{"DOI":"10.13039\/100008902","name":"Los Alamos National Laboratory","doi-asserted-by":"publisher","award":["541715"],"award-info":[{"award-number":["541715"]}],"id":[{"id":"10.13039\/100008902","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000005","name":"DOD U.S. Department of Defense","doi-asserted-by":"publisher","award":["FA8750-19-2-1000"],"award-info":[{"award-number":["FA8750-19-2-1000"]}],"id":[{"id":"10.13039\/100000005","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000015","name":"DOE U.S. Department of Energy","doi-asserted-by":"publisher","award":["DE- NA0003965"],"award-info":[{"award-number":["DE- NA0003965"]}],"id":[{"id":"10.13039\/100000015","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,1,28]]},"DOI":"10.1145\/3774934.3786452","type":"proceedings-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T15:25:57Z","timestamp":1769613957000},"page":"68-80","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Waste-Efficient Work Stealing"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-3588-2215","authenticated-orcid":false,"given":"Kyle","family":"Singer","sequence":"first","affiliation":[{"name":"Massachusetts Institute of Technology, Cambridge, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5882-6647","authenticated-orcid":false,"given":"Kunal","family":"Agrawal","sequence":"additional","affiliation":[{"name":"Washington University in St. Louis, St. Louis, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0198-3283","authenticated-orcid":false,"given":"Tao B.","family":"Schardl","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology, Cambridge, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2026,1,28]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","unstructured":"Kunal Agrawal and Seth Gilbert. 2018. The Power to Schedule a Parallel Program. In IPDPS. 182\u2013193. https:\/\/doi.org\/10.1109\/IPDPS.2018.00028 10.1109\/IPDPS.2018.00028","DOI":"10.1109\/IPDPS.2018.00028"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/1394441.1394443"},{"key":"e_1_3_2_2_3_1","unstructured":"Daniel Anderson. 2023. Elastic schedler. Available from. https:\/\/github.com\/cmuparlay\/parlaylib\/pull\/52"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"crossref","unstructured":"Nimar S. Arora Robert D. Blumofe and C. Greg Plaxton. 2001. Thread Scheduling for Multiprogrammed Multiprocessors. Theory of Computing Systems 115\u2013144.","DOI":"10.1007\/s002240011004"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"crossref","unstructured":"Rajkishore Barik Zoran Budimli\u0107 Vincent Cav\u00e8 Sanjay Chatterjee Yi Guo David Peixotto Raghavan Raman Jun Shirako Sa\u011fnak Ta\u015f\u0131rlar Yonghong Yan Yisheng Zhao and Vivek Sarkar. 2009. The Habanero Multicore Software Research Project. In OOPSLA. 735\u2013736.","DOI":"10.1145\/1639950.1639989"},{"key":"e_1_3_2_2_6_1","volume-title":"Jaswinder Pal Singh, and Kai Li","author":"Bienia Christian","year":"2008","unstructured":"Christian Bienia, Sanjeev Kumar, Jaswinder Pal Singh, and Kai Li. 2008. The PARSEC Benchmark Suite: Characterization and Architectural Implications. In PACT. ACM, 72\u201381."},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","unstructured":"Guy E. Blelloch Daniel Anderson and Laxman Dhulipala. 2020. ParlayLib - A Toolkit for Parallel Algorithms on Shared-Memory Multicore Machines. In SPAA. 507\u2013509. https:\/\/doi.org\/10.1145\/3350755.3400254 10.1145\/3350755.3400254","DOI":"10.1145\/3350755.3400254"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/324133.324234"},{"key":"e_1_3_2_2_9_1","volume-title":"Blumofe and Dionisios Papadopoulos","author":"Robert","year":"1998","unstructured":"Robert D. Blumofe and Dionisios Papadopoulos. 1998. Hood: A User-Level Threads Library for Multiprogrammed Multiprocessors. U. Texas at Austin."},{"key":"e_1_3_2_2_10_1","volume-title":"Blumofe and Dionisios Papadopoulos","author":"Robert","year":"1998","unstructured":"Robert D. Blumofe and Dionisios Papadopoulos. 1998. The Performance of Work Stealing in Multiprogrammed Environments. The University of Texas at Austin, Department of Computer Sciences."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"crossref","unstructured":"Yangjie Cao Hongyang Sun Depei Qian and Weiguo Wu. 2011. Stable Adaptive Work-Stealing for Concurrent Multi-core Runtime Systems. In HPCC. 108\u2013115.","DOI":"10.1109\/HPCC.2011.24"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2016.49"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"crossref","unstructured":"Vincent Cav\u00e9 Jisheng Zhao Jun Shirako and Vivek Sarkar. 2011. Habanero-Java: the new adventures of old X10. In PPPJ. 51\u201361.","DOI":"10.1145\/2093157.2093165"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3510422"},{"key":"e_1_3_2_2_15_1","volume-title":"https:\/\/google.github.io\/tcmalloc\/ Accessed","author":"Google Corporation","year":"2022","unstructured":"Google Corporation. 2022. TCMalloc. https:\/\/google.github.io\/tcmalloc\/ Accessed August 2022"},{"key":"e_1_3_2_2_16_1","unstructured":"Intel Corporation. 2022. Intel\u00ae 64 and IA-32 Architectures Software Developer\u2019s Manual."},{"key":"e_1_3_2_2_17_1","volume-title":"Theoretically Efficient Parallel Graph Algorithms Can Be Fast and Scalable. ACM TOPC, 8, 1","author":"Dhulipala Laxman","year":"2021","unstructured":"Laxman Dhulipala, Guy E. Blelloch, and Julian Shun. 2021. Theoretically Efficient Parallel Graph Algorithms Can Be Fast and Scalable. ACM TOPC, 8, 1 (2021), Article 4, 70 pages."},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/2168836.2168873"},{"key":"e_1_3_2_2_19_1","volume-title":"Randall","author":"Frigo Matteo","year":"1998","unstructured":"Matteo Frigo, Charles E. Leiserson, and Keith H. Randall. 1998. The Implementation of the Cilk-5 Multithreaded Language. In PLDI. 212\u2013223."},{"key":"e_1_3_2_2_20_1","volume-title":"Leiserson","author":"He Yuxiong","year":"2010","unstructured":"Yuxiong He, Charles E. Leiserson, and William M. Leiserson. 2010. The Cilkview Scalability Analyzer. In SPAA. 145\u2013156."},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","unstructured":"Connor Imes Huazhe Zhang Kevin Zhao and Henry Hoffmann. 2019. CoPPer: Soft Real-Time Application Performance Using Hardware Power Capping. In ICAC. 31\u201341. https:\/\/doi.org\/10.1109\/ICAC.2019.00015 10.1109\/ICAC.2019.00015","DOI":"10.1109\/ICAC.2019.00015"},{"key":"e_1_3_2_2_22_1","unstructured":"2023. Intel(R) oneAPI Threading Building Blocks (oneTBB) Documentation. Available from https:\/\/www.intel.com\/content\/www\/us\/en\/develop\/documentation\/onetbb-documentation\/top.html"},{"key":"e_1_3_2_2_23_1","unstructured":"Michael Kerrisk. 2024. sched_yield(2) \u2014 Linux manual page. Available from. https:\/\/man7.org\/linux\/man-pages\/man2\/sched_yield.2.html"},{"key":"e_1_3_2_2_24_1","unstructured":"Michael Kerrisk. 2025. clock_gettime(3) \u2014 Linux manual page. Available from. https:\/\/man7.org\/linux\/man-pages\/man3\/clock_gettime.3.html"},{"key":"e_1_3_2_2_25_1","unstructured":"Michael Kerrisk. 2025. futex(2) \u2014 Linux manual page. Available from. https:\/\/man7.org\/linux\/man-pages\/man2\/futex.2.html"},{"key":"e_1_3_2_2_26_1","unstructured":"Michael Kerrisk. 2025. getrusage(2) \u2014 Linux manual page. Available from. https:\/\/man7.org\/linux\/man-pages\/man2\/getrusage.2.html"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/337449.337465"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11227-010-0405-3"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPADS51040.2020.00018"},{"key":"e_1_3_2_2_30_1","unstructured":"Nicholas D. Matsakis. 2015. Rayon: data parallelism in Rust. Available at. http:\/\/smallcultfollowing.com\/babystep s\/blog\/2015\/12\/18\/rayon-data-parallelism-in-rust\/"},{"key":"e_1_3_2_2_31_1","unstructured":"2015. OpenMP Application Program Interface Version 4.5."},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","unstructured":"Haris Ribic and Yu David Liu. 2014. Energy-efficient work-stealing language runtimes. In ASPLOS. 513\u2013528. https:\/\/doi.org\/10.1145\/2541940.2541971 10.1145\/2541940.2541971","DOI":"10.1145\/2541940.2541971"},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/2925426.2926260"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3572848.3577509"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.5281\/zenodo.17706312"},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-60153-8_31"},{"key":"e_1_3_2_2_37_1","unstructured":"Josh Stone and Niko Matsakis. 2025. Introduction: the sleep module. Available from. https:\/\/github.com\/rayon-rs\/rayon\/tree\/main\/rayon-core\/src\/sleep"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2010.121"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","unstructured":"\u017deljko Vrba H\u00e5vard Espeland P\u00e5l Halvorsen and Carsten Griwodz. 2009. Limits of Work-Stealing Scheduling. 280\u2013299. isbn:9783642046322 https:\/\/doi.org\/10.1007\/978-3-642-04633-9_15 10.1007\/978-3-642-04633-9_15","DOI":"10.1007\/978-3-642-04633-9_15"}],"event":{"name":"PPoPP '26: 31st ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming","location":"Sydney NSW Australia","acronym":"PPoPP '26","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing","SIGPLAN ACM Special Interest Group on Programming Languages"]},"container-title":["Proceedings of the 31st ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3774934.3786452","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3774934.3786452","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T15:26:16Z","timestamp":1769613976000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3774934.3786452"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,28]]},"references-count":39,"alternative-id":["10.1145\/3774934.3786452","10.1145\/3774934"],"URL":"https:\/\/doi.org\/10.1145\/3774934.3786452","relation":{},"subject":[],"published":{"date-parts":[[2026,1,28]]},"assertion":[{"value":"2026-01-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}