{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T14:07:32Z","timestamp":1774534052138,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":47,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,2,21]],"date-time":"2023-02-21T00:00:00Z","timestamp":1676937600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,2,25]]},"DOI":"10.1145\/3572848.3577528","type":"proceedings-article","created":{"date-parts":[[2023,2,21]],"date-time":"2023-02-21T16:02:30Z","timestamp":1676995350000},"page":"392-404","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":26,"title":["DSP"],"prefix":"10.1145","author":[{"given":"Zhenkun","family":"Cai","sequence":"first","affiliation":[{"name":"Department of Comptuer Sicence and Engineering, The Chinese University of Hong Kong"}]},{"given":"Qihui","family":"Zhou","sequence":"additional","affiliation":[{"name":"Department of Comptuer Sicence and Engineering, The Chinese University of Hong Kong"}]},{"given":"Xiao","family":"Yan","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, Southern University of Science and Technology"}]},{"given":"Da","family":"Zheng","sequence":"additional","affiliation":[{"name":"Amazon Web Services"}]},{"given":"Xiang","family":"Song","sequence":"additional","affiliation":[{"name":"Amazon Web Services"}]},{"given":"Chenguang","family":"Zheng","sequence":"additional","affiliation":[{"name":"Department of Comptuer Sicence and Engineering, The Chinese University of Hong Kong"}]},{"given":"James","family":"Cheng","sequence":"additional","affiliation":[{"name":"Department of Comptuer Sicence and Engineering, The Chinese University of Hong Kong"}]},{"given":"George","family":"Karypis","sequence":"additional","affiliation":[{"name":"Amazon Web Services"}]}],"member":"320","published-online":{"date-parts":[[2023,2,21]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2020. Euler. https:\/\/github.com\/alibaba\/euler."},{"key":"e_1_3_2_1_2_1","unstructured":"2021. Quiver. https:\/\/github.com\/quiver-team\/torch-quiver."},{"key":"e_1_3_2_1_3_1","unstructured":"2022. NVSHMEM. https:\/\/developer.nvidia.com\/nvshmem."},{"key":"e_1_3_2_1_4_1","volume-title":"Procedure for sampling without replacement. https:\/\/anonymous.4open.science\/r\/Anonymous-593E\/CSP-layerwise-proof.pdf. [Online","year":"2023","unstructured":"anonymous. 2022. Procedure for sampling without replacement. https:\/\/anonymous.4open.science\/r\/Anonymous-593E\/CSP-layerwise-proof.pdf. [Online; accessed January-2023]."},{"key":"e_1_3_2_1_5_1","unstructured":"K. Bhatia K. Dahiya H. Jain P. Kar A. Mittal Y. Prabhu and M. Varma. 2016. The extreme classification repository: Multi-label datasets and code. http:\/\/manikvarma.org\/downloads\/XC\/XMLRepository.html"},{"key":"e_1_3_2_1_6_1","volume-title":"6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings. OpenReview.net.","author":"Chen Jie","year":"2018","unstructured":"Jie Chen, Tengfei Ma, and Cao Xiao. 2018. FastGCN: Fast Learning with Graph Convolutional Networks via Importance Sampling. In 6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings. OpenReview.net."},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the 35th International Conference on Machine Learning, ICML 2018, Stockholmsm\u00e4ssan","author":"Chen Jianfei","year":"2018","unstructured":"Jianfei Chen, Jun Zhu, and Le Song. 2018. Stochastic Training of Graph Convolutional Networks with Variance Reduction. In Proceedings of the 35th International Conference on Machine Learning, ICML 2018, Stockholmsm\u00e4ssan, Stockholm, Sweden, July 10--15, 2018. 941--949."},{"key":"e_1_3_2_1_8_1","volume-title":"Graph Neural Networks for COVID-19 Drug Discovery. In 2020 IEEE International Conference on Big Data (IEEE BigData 2020","author":"Cheung Mark","year":"2020","unstructured":"Mark Cheung and Jos\u00e9 M. F. Moura. 2020. Graph Neural Networks for COVID-19 Drug Discovery. In 2020 IEEE International Conference on Big Data (IEEE BigData 2020), Atlanta, GA, USA, December 10--13, 2020. 5646--5648."},{"key":"e_1_3_2_1_9_1","volume-title":"Fast Graph Representation Learning with PyTorch Geometric. In ICLR Workshop on Representation Learning on Graphs and Manifolds.","author":"Fey Matthias","unstructured":"Matthias Fey and Jan E. Lenssen. 2019. Fast Graph Representation Learning with PyTorch Geometric. In ICLR Workshop on Representation Learning on Graphs and Manifolds."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219947"},{"key":"e_1_3_2_1_11_1","volume-title":"Learning Graph Representations with Embedding Propagation. In Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017","author":"Garc\u00eda-Dur\u00e1n Alberto","year":"2017","unstructured":"Alberto Garc\u00eda-Dur\u00e1n and Mathias Niepert. 2017. Learning Graph Representations with Embedding Propagation. In Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4--9, 2017, Long Beach, CA, USA. 5119--5130."},{"key":"e_1_3_2_1_12_1","volume-title":"Taylor-King","author":"Gaudelet Thomas","year":"2020","unstructured":"Thomas Gaudelet, Ben Day, Arian R. Jamasb, Jyothish Soman, Cristian Regep, Gertrude Liu, Jeremy B. R. Hayter, Richard Vickers, Charles Roberts, Jian Tang, David Roblin, Tom L. Blundell, Michael M. Bronstein, and Jake P. Taylor-King. 2020. Utilising Graph Machine Learning within Drug Discovery and Development. CoRR abs\/2012.05716 (2020)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939754"},{"key":"e_1_3_2_1_14_1","volume-title":"Inductive Representation Learning on Large Graphs. In Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017","author":"Hamilton William L.","year":"2017","unstructured":"William L. Hamilton, Zhitao Ying, and Jure Leskovec. 2017. Inductive Representation Learning on Large Graphs. In Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4--9, 2017, Long Beach, CA, USA. 1024--1034."},{"key":"e_1_3_2_1_15_1","volume-title":"Open Graph Benchmark: Datasets for Machine Learning on Graphs. In Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020","author":"Hu Weihua","year":"2020","unstructured":"Weihua Hu, Matthias Fey, Marinka Zitnik, Yuxiao Dong, Hongyu Ren, Bowen Liu, Michele Catasta, and Jure Leskovec. 2020. Open Graph Benchmark: Datasets for Machine Learning on Graphs. In Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6--12, 2020, virtual."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447786.3456244"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1137\/S1064827595287997"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3476886.3477515"},{"key":"e_1_3_2_1_19_1","volume-title":"Kipf and Max Welling","author":"Thomas","year":"2017","unstructured":"Thomas N. Kipf and Max Welling. 2017. Semi-Supervised Classification with Graph Convolutional Networks. In 5th International Conference on Learning Representations, ICLR 2017, Toulon, France, April 24--26, 2017, Conference Track Proceedings. OpenReview.net."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553447"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3419111.3421281"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/JAS.2021.1004311"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9533367"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.14778\/3425879.3425883"},{"key":"e_1_3_2_1_25_1","volume-title":"Hwu","author":"Min Seungwon","year":"2021","unstructured":"Seungwon Min, Kun Wu, Mert Hidayetoglu, Jinjun Xiong, Xiang Song, and Wen-mei W. Hwu. 2021. Graph Neural Network Training with Data Tiering. CoRR abs\/2111.05894 (2021). arXiv:2111.05894 https:\/\/arxiv.org\/abs\/2111.05894"},{"key":"e_1_3_2_1_26_1","volume-title":"DGX Systems. https:\/\/www.nvidia.com\/en-sg\/data-center\/dgx-systems. [Online","author":"NVIDIA.","year":"2022","unstructured":"NVIDIA. 2022. DGX Systems. https:\/\/www.nvidia.com\/en-sg\/data-center\/dgx-systems. [Online; accessed March-2022]."},{"key":"e_1_3_2_1_27_1","volume-title":"NVIDIA Collective communications library (NCCL). https:\/\/https:\/\/developer.nvidia.com\/nccl. [Online","author":"NVIDIA.","year":"2022","unstructured":"NVIDIA. 2022. NVIDIA Collective communications library (NCCL). https:\/\/https:\/\/developer.nvidia.com\/nccl. [Online; accessed March-2022]."},{"key":"e_1_3_2_1_28_1","volume-title":"https:\/\/www.nvidia.com\/en-sg\/data-center\/nvlink. [Online","author":"Link NVIDIA.","year":"2022","unstructured":"NVIDIA. 2022. NVLink and NVSwitch. https:\/\/www.nvidia.com\/en-sg\/data-center\/nvlink. [Online; accessed March-2022]."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/SC41405.2020.00060"},{"key":"e_1_3_2_1_30_1","volume-title":"High-Performance Deep Learning Library. In Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019","author":"Paszke Adam","year":"2019","unstructured":"Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas K\u00f6pf, Edward Z. Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. 2019. Py-Torch: An Imperative Style, High-Performance Deep Learning Library. In Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8--14, 2019, Vancouver, BC, Canada. 8024--8035."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623732"},{"key":"e_1_3_2_1_32_1","volume-title":"Category-aware Graph Neural Networks for Improving E-commerce Review Helpfulness Prediction. In CIKM '20: The 29th ACM International Conference on Information and Knowledge Management","author":"Qu Xiaoru","year":"2020","unstructured":"Xiaoru Qu, Zhao Li, Jialin Wang, Zhipeng Zhang, Pengcheng Zou, Junxiao Jiang, Jiaming Huang, Rong Xiao, Ji Zhang, and Jun Gao. 2020. Category-aware Graph Neural Networks for Improving E-commerce Review Helpfulness Prediction. In CIKM '20: The 29th ACM International Conference on Information and Knowledge Management, Virtual Event, Ireland, October 19--23, 2020. 2693--2700."},{"key":"e_1_3_2_1_33_1","series-title":"Series in Machine Perception and Artificial Intelligence","volume-title":"Graph Classification and Clustering Based on Vector Space Embedding","author":"Riesen Kaspar","unstructured":"Kaspar Riesen and Horst Bunke. 2010. Graph Classification and Clustering Based on Vector Space Embedding. Series in Machine Perception and Artificial Intelligence, Vol. 77. WorldScientific."},{"key":"e_1_3_2_1_34_1","series-title":"Series in Machine Perception and Artificial Intelligence","volume-title":"Graph Classification and Clustering Based on Vector Space Embedding","author":"Riesen Kaspar","unstructured":"Kaspar Riesen and Horst Bunke. 2010. Graph Classification and Clustering Based on Vector Space Embedding. Series in Machine Perception and Artificial Intelligence, Vol. 77. WorldScientific."},{"key":"e_1_3_2_1_35_1","volume-title":"GPU Technology Conference, NVIDIA.","author":"Schroeder Tim C","year":"2011","unstructured":"Tim C Schroeder. 2011. Peer-to-peer & unified virtual addressing. In GPU Technology Conference, NVIDIA."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3469379.3469387"},{"key":"e_1_3_2_1_37_1","volume-title":"Graph Attention Networks. In 6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings. OpenReview.net.","author":"Velickovic Petar","year":"2018","unstructured":"Petar Velickovic, Guillem Cucurull, Arantxa Casanova, Adriana Romero, Pietro Li\u00f2, and Yoshua Bengio. 2018. Graph Attention Networks. In 6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings. OpenReview.net."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1162\/qss_a_00021"},{"key":"e_1_3_2_1_39_1","volume-title":"Deep Graph Library: Towards Efficient and Scalable Deep Learning on Graphs. CoRR abs\/1909.01315","author":"Wang Minjie","year":"2019","unstructured":"Minjie Wang, Lingfan Yu, Da Zheng, Quan Gan, Yu Gai, Zihao Ye, Mufei Li, Jinjing Zhou, Qi Huang, Chao Ma, Ziyue Huang, Qipeng Guo, Hao Zhang, Haibin Lin, Junbo Zhao, Jinyang Li, Alexander J. Smola, and Zheng Zhang. 2019. Deep Graph Library: Towards Efficient and Scalable Deep Learning on Graphs. CoRR abs\/1909.01315 (2019). arXiv:1909.01315 http:\/\/arxiv.org\/abs\/1909.01315"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/142"},{"key":"e_1_3_2_1_41_1","volume-title":"Defining and Evaluating Network Communities Based on Ground-Truth. In 12th IEEE International Conference on Data Mining, ICDM 2012","author":"Yang Jaewon","year":"2012","unstructured":"Jaewon Yang and Jure Leskovec. 2012. Defining and Evaluating Network Communities Based on Ground-Truth. In 12th IEEE International Conference on Data Mining, ICDM 2012, Brussels, Belgium, December 10--13, 2012. 745--754."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3492321.3519557"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3341301.3359634"},{"key":"e_1_3_2_1_44_1","volume-title":"Link Prediction Based on Graph Neural Networks. In Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018","author":"Zhang Muhan","year":"2018","unstructured":"Muhan Zhang and Yixin Chen. 2018. Link Prediction Based on Graph Neural Networks. In Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3--8, 2018, Montr\u00e9al, Canada. 5171--5181."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.14778\/3514061.3514069"},{"key":"e_1_3_2_1_46_1","volume-title":"DistDGL: Distributed Graph Neural Network Training for Billion-Scale Graphs. In 10th IEEE\/ACM Workshop on Irregular Applications: Architectures and Algorithms, IA3 2020","author":"Zheng Da","year":"2020","unstructured":"Da Zheng, Chao Ma, Minjie Wang, Jinjing Zhou, Qidong Su, Xiang Song, Quan Gan, Zheng Zhang, and George Karypis. 2020. DistDGL: Distributed Graph Neural Network Training for Billion-Scale Graphs. In 10th IEEE\/ACM Workshop on Irregular Applications: Architectures and Algorithms, IA3 2020, Atlanta, GA, USA, November 11, 2020. IEEE, 36--44."},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.14778\/3352063.3352127"}],"event":{"name":"PPoPP '23: The 28th ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming","location":"Montreal QC Canada","acronym":"PPoPP '23","sponsor":["SIGPLAN ACM Special Interest Group on Programming Languages","SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing"]},"container-title":["Proceedings of the 28th ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3572848.3577528","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3572848.3577528","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T18:08:10Z","timestamp":1750183690000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3572848.3577528"}},"subtitle":["Efficient GNN Training with Multiple GPUs"],"short-title":[],"issued":{"date-parts":[[2023,2,21]]},"references-count":47,"alternative-id":["10.1145\/3572848.3577528","10.1145\/3572848"],"URL":"https:\/\/doi.org\/10.1145\/3572848.3577528","relation":{},"subject":[],"published":{"date-parts":[[2023,2,21]]},"assertion":[{"value":"2023-02-21","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}