{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T10:18:42Z","timestamp":1740133122391,"version":"3.37.3"},"reference-count":71,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2022,12,1]],"date-time":"2022-12-01T00:00:00Z","timestamp":1669852800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,12,1]],"date-time":"2022-12-01T00:00:00Z","timestamp":1669852800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,12,1]],"date-time":"2022-12-01T00:00:00Z","timestamp":1669852800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key R&amp;D Program of China","award":["2021YFB0300300"],"award-info":[{"award-number":["2021YFB0300300"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U20A20226","62072459","62172419"],"award-info":[{"award-number":["U20A20226","62072459","62172419"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004826","name":"Beijing Natural Science Foundation","doi-asserted-by":"publisher","award":["4202031","L192027","L192027"],"award-info":[{"award-number":["4202031","L192027","L192027"]}],"id":[{"id":"10.13039\/501100004826","id-type":"DOI","asserted-by":"publisher"}]},{"name":"SOAR fellowship"},{"name":"University of Sydney faculty startup funding"},{"DOI":"10.13039\/501100000923","name":"Australian Research Council","doi-asserted-by":"publisher","award":["DP210101984"],"award-info":[{"award-number":["DP210101984"]}],"id":[{"id":"10.13039\/501100000923","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"publisher","award":["2020TQ0169"],"award-info":[{"award-number":["2020TQ0169"]}],"id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"publisher"}]},{"name":"ShuiMu Tsinghua Scholar Fellowship","award":["2019SM131"],"award-info":[{"award-number":["2019SM131"]}]},{"name":"Tsinghua University-Peking Union Medical College Hospital Initiative Scientific Research Program","award":["20191080594"],"award-info":[{"award-number":["20191080594"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Parallel Distrib. Syst."],"published-print":{"date-parts":[[2022,12,1]]},"DOI":"10.1109\/tpds.2022.3181799","type":"journal-article","created":{"date-parts":[[2022,6,13]],"date-time":"2022-06-13T20:22:46Z","timestamp":1655151766000},"page":"4239-4255","source":"Crossref","is-referenced-by-count":2,"title":["Detecting Performance Variance for Parallel Applications Without Source Code"],"prefix":"10.1109","volume":"33","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7656-6428","authenticated-orcid":false,"given":"Jidong","family":"Zhai","sequence":"first","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7327-748X","authenticated-orcid":false,"given":"Liyan","family":"Zheng","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1983-7321","authenticated-orcid":false,"given":"Feng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering, School of Information, Renmin University of China, Beijing, China"}]},{"given":"Xiongchao","family":"Tang","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"given":"Haojie","family":"Wang","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4391-8295","authenticated-orcid":false,"given":"Teng","family":"Yu","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"given":"Yuyang","family":"Jin","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]},{"given":"Shuaiwen Leon","family":"Song","sequence":"additional","affiliation":[{"name":"School of Computer Science, University of Sydney, Sydney, NSW, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3146-656X","authenticated-orcid":false,"given":"Wenguang","family":"Chen","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}]}],"member":"263","reference":[{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1145\/2594291.2594336"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2018.2858800"},{"year":"0","key":"ref39","article-title":"The parallel PageRank program"},{"year":"0","key":"ref38","article-title":"The cuBERT framework"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.2307\/1937887"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2013.6557172"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/177424.178042"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-28349-8_2"},{"article-title":"Mrnet: A scalable infrastructure for the development of parallel tools and applications","year":"2010","author":"brim","key":"ref37"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/44483.44488"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/2024569.2024572"},{"key":"ref34","first-page":"10","article-title":"Characterizing parallel scaling of scientific applications using IPM","author":"wright","year":"2009","journal-title":"Proc 10th LCI Int Conf High-Perform Clustered Comput"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/1048935.1050204"},{"key":"ref62","first-page":"47","article-title":"IASO: A fail-slow detection and mitigation framework for distributed storage services","author":"panda","year":"2019","journal-title":"Proc USENIX Annu Tech Conf"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-96983-1_4"},{"key":"ref63","first-page":"307","article-title":"X-ray: Automating root-cause diagnosis of performance anomalies in production software","author":"attariyan","year":"2012","journal-title":"Proc 10th USENIX Symp Oper Syst Des Implementation"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/511399.511364"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1145\/2371536.2371572"},{"article-title":"Memory bandwidth: Stream benchmark performance results","year":"2018","author":"mccalpin","key":"ref27"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2016.2613524"},{"key":"ref66","first-page":"1","article-title":"Stack trace analysis for large scale applications","author":"arnold","year":"2007","journal-title":"Proc 21st IEEE Int Parallel Distrib Process Symp"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2019.2955467"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356167"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1145\/2670979.2670987"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1145\/2451116.2451131"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-011-0178-3"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/2018436.2018465"},{"year":"2018","key":"ref20","article-title":"Intel 64 and IA-32 architectures software developer manuals"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"155","DOI":"10.1016\/S0168-9274(01)00115-5","article-title":"Boomeramg: A parallel algebraic multigrid solver and preconditioner","volume":"41","author":"yang","year":"2002","journal-title":"Appl Numer Math"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2014.6844459"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2014.2314100"},{"journal-title":"The NAS Parallel Benchmarks 2 0","year":"1995","author":"bailey","key":"ref23"},{"year":"0","key":"ref26","article-title":"Stress"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3503221.3508405"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1177\/1094342006064482"},{"article-title":"Impacts of operating systems on the scalability of parallel applications","year":"2003","author":"jones","key":"ref51"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1145\/2503210.2503277"},{"key":"ref58","first-page":"1","article-title":"PAPI: A portable interface to hardware performance counters","volume":"710","author":"mucci","year":"1999","journal-title":"Proc Dept Defense HPCMP Users Group Conf"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-31476-6_7"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1145\/3514221.3526130"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2021.3059108"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2021.3119402"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-020-00636-3"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2021.3093234"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00021"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2014.85"},{"year":"0","key":"ref40","article-title":"The MapReduce framework"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3242086"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"336","DOI":"10.1145\/871656.859657","article-title":"Phase tracking and prediction","author":"sherwood","year":"2003","journal-title":"Proc ACM SIGARCH Comput Archit News"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/PACT.2001.953283"},{"journal-title":"Compilers Principles Techniques and Tools","year":"2006","author":"aho","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3503221.3508411"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2014.17"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1155\/2008\/632685"},{"year":"2022","key":"ref19","article-title":"The mpiP: tool"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.14778\/1920841.1920902"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2016.32"},{"key":"ref6","first-page":"409","article-title":"Taming performance variability","author":"maricq","year":"2018","journal-title":"Proc 13th USENIX Symp Oper Syst Des Implementation"},{"key":"ref5","article-title":"The seven deadly sins of cloud computing research","author":"schwarzkopf","year":"2012","journal-title":"Proc 4th USENIX Workshop Hot Top Cloud Comput"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTR.2006.311846"},{"key":"ref7","first-page":"124","article-title":"Vsensor: Leveraging fixed-workload snippets of programs for performance variance detection","author":"tang","year":"2018","journal-title":"Proc 23rd ACM SIGPLAN Symp Princ Pract Parallel Program"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2016.2586074"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2010.12"},{"key":"ref46","first-page":"1","article-title":"The new linux perf tools","author":"de melo","year":"2010","journal-title":"Proc Conf Slides Linux Kongress"},{"year":"2018","key":"ref45","article-title":"Addressing potential DGEMM\/HPL perf variability on 24-core intel xeon processor scalable family"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btl446"},{"year":"0","key":"ref47","article-title":"The nekbone program"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/1454115.1454128"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1175\/BAMS-D-13-00255.1"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1002\/cpe.728"},{"key":"ref43","first-page":"410","article-title":"V-measure: A conditional entropy-based external cluster evaluation measure","author":"rosenberg","year":"2007","journal-title":"Proc Joint Conf Empir Methods Natural Lang Process Comput Natural Lang Learn"}],"container-title":["IEEE Transactions on Parallel and Distributed Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/71\/9790018\/09794597.pdf?arnumber=9794597","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,19]],"date-time":"2022-09-19T19:59:33Z","timestamp":1663617573000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9794597\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,12,1]]},"references-count":71,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tpds.2022.3181799","relation":{},"ISSN":["1045-9219","1558-2183","2161-9883"],"issn-type":[{"type":"print","value":"1045-9219"},{"type":"electronic","value":"1558-2183"},{"type":"electronic","value":"2161-9883"}],"subject":[],"published":{"date-parts":[[2022,12,1]]}}}