{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T10:18:13Z","timestamp":1740133093822,"version":"3.37.3"},"reference-count":41,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62132017"],"award-info":[{"award-number":["62132017"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["226-2022-00235"],"award-info":[{"award-number":["226-2022-00235"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Visual. Comput. Graphics"],"published-print":{"date-parts":[[2024,7]]},"DOI":"10.1109\/tvcg.2023.3243228","type":"journal-article","created":{"date-parts":[[2023,2,9]],"date-time":"2023-02-09T18:33:25Z","timestamp":1675967605000},"page":"3915-3929","source":"Crossref","is-referenced-by-count":2,"title":["Visual Diagnostics of Parallel Performance in Training Large-Scale DNN Models"],"prefix":"10.1109","volume":"30","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0743-7558","authenticated-orcid":false,"given":"Yating","family":"Wei","sequence":"first","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Zhiyong","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Zhongwei","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Yong","family":"Dai","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Gongchang","family":"Ou","sequence":"additional","affiliation":[{"name":"Distributed Data Lab, Huawei Technologies Co., Ltd., Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0450-1262","authenticated-orcid":false,"given":"Han","family":"Gao","sequence":"additional","affiliation":[{"name":"Distributed Data Lab, Huawei Technologies Co., Ltd., Shenzhen, China"}]},{"given":"Haitao","family":"Yang","sequence":"additional","affiliation":[{"name":"Distributed Data Lab, Huawei Technologies Co., Ltd., Shenzhen, China"}]},{"given":"Yue","family":"Wang","sequence":"additional","affiliation":[{"name":"Distributed Data Lab, Huawei Technologies Co., Ltd., Shenzhen, China"}]},{"given":"Caleb Chen","family":"Cao","sequence":"additional","affiliation":[{"name":"Distributed Data Lab, Huawei Technologies Co., Ltd., Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4350-9141","authenticated-orcid":false,"given":"Luoxuan","family":"Weng","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Jiaying","family":"Lu","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"given":"Rongchen","family":"Zhu","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8365-4741","authenticated-orcid":false,"given":"Wei","family":"Chen","sequence":"additional","affiliation":[{"name":"State Key Lab of CAD &#x0026; CG, Zhejiang University, Hangzhou, Zhejiang, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","year":"2018","author":"Devlin","key":"ref2"},{"article-title":"A survey of deep learning techniques for neural machine translation","year":"2020","author":"Yang","key":"ref3"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref5","first-page":"173","article-title":"Deep speech 2: End-to-end speech recognition in english and mandarin","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Amodei"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref7","first-page":"1223","article-title":"Large scale distributed deep networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"25","author":"Dean"},{"key":"ref8","first-page":"1","article-title":"Mesh-tensorflow: Deep learning for supercomputers","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Shazeer","year":"2018"},{"article-title":"Megatron-LM: Training multi-billion parameter language models using model parallelism","year":"2019","author":"Shoeybi","key":"ref9"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3341301.3359646"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.48550\/arxiv.1811.06965"},{"article-title":"Yet another accelerated SGD: ResNet-50 training on ImageNet in 74.7 seconds","year":"2019","author":"Yamazaki","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2017.2744878"},{"article-title":"Improving generalization performance by switching from adam to SGD","year":"2017","author":"Keskar","key":"ref14"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2017.2744683"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3200489"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2017.2744938"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/VISUAL.2005.1532820"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2016.2598831"},{"article-title":"TensorFlow: Large-scale machine learning on heterogeneous distributed systems","year":"2016","author":"Abadi","key":"ref20"},{"key":"ref21","first-page":"91","article-title":"La VALSE: Scalable log visualization for fault characterization in supercomputers","volume-title":"Proc. Eurographics Symp. Parallel Graph. Visualization","author":"Guo"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/VAST.2017.8585646"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICCC54389.2021.9674694"},{"article-title":"A review of temporal data visualizations based on space-time cube operations","volume-title":"Proc. Eurographics Conf. Visual.","author":"Bach","key":"ref24"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1097\/01445442-198507000-00012"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2015.2467592"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2016.2598664"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/257089.257391"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2018.2858439"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2014.2346682"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2013.200"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2012.225"},{"key":"ref33","first-page":"1","article-title":"Beyond data and model parallelism for deep neural networks","volume-title":"Proc. Mach. Learn. Syst.","volume":"1","author":"Jia"},{"article-title":"PipeDream: Fast and efficient pipeline parallel DNN training","year":"2018","author":"Harlap","key":"ref34"},{"key":"ref35","first-page":"265","article-title":"TensorFlow: A. system for large-scale machine learning","volume-title":"Proc. 12th USENIX Symp. Operating Syst. Des. Implementation","author":"Abadi"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.1981.4308636"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2007.70582"},{"volume-title":"Organizing for Work","year":"1919","author":"Gantt","key":"ref38"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1364\/JOSAA.12.002305"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/IV.2007.127"},{"article-title":"PanGu-$\\alpha$\u03b1: Large-scale autoregressive pretrained chinese language models with auto-parallel computation","year":"2021","author":"Zeng","key":"ref41"}],"container-title":["IEEE Transactions on Visualization and Computer Graphics"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/2945\/10576039\/10041726.pdf?arnumber=10041726","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,29]],"date-time":"2024-06-29T05:33:37Z","timestamp":1719639217000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10041726\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7]]},"references-count":41,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tvcg.2023.3243228","relation":{},"ISSN":["1077-2626","1941-0506","2160-9306"],"issn-type":[{"type":"print","value":"1077-2626"},{"type":"electronic","value":"1941-0506"},{"type":"electronic","value":"2160-9306"}],"subject":[],"published":{"date-parts":[[2024,7]]}}}