{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T15:42:14Z","timestamp":1771515734815,"version":"3.50.1"},"reference-count":51,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"11","license":[{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"publisher","award":["2022YFB2901103"],"award-info":[{"award-number":["2022YFB2901103"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Research fund of CIE-SmartChip","award":["20220370-0060"],"award-info":[{"award-number":["20220370-0060"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Comput.-Aided Des. Integr. Circuits Syst."],"published-print":{"date-parts":[[2024,11]]},"DOI":"10.1109\/tcad.2024.3446871","type":"journal-article","created":{"date-parts":[[2024,11,6]],"date-time":"2024-11-06T18:40:50Z","timestamp":1730918450000},"page":"3997-4008","source":"Crossref","is-referenced-by-count":2,"title":["NDPGNN: A Near-Data Processing Architecture for GNN Training and Inference Acceleration"],"prefix":"10.1109","volume":"43","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-9763-0095","authenticated-orcid":false,"given":"Haoyang","family":"Wang","sequence":"first","affiliation":[{"name":"School of Computer Science, Northwestern Polytechnical University, Xi&#x2019;an, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2854-729X","authenticated-orcid":false,"given":"Shengbing","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Computer Science, Northwestern Polytechnical University, Xi&#x2019;an, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6190-8077","authenticated-orcid":false,"given":"Xiaoya","family":"Fan","sequence":"additional","affiliation":[{"name":"School of Computer Science, Northwestern Polytechnical University, Xi&#x2019;an, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9525-2096","authenticated-orcid":false,"given":"Zhao","family":"Yang","sequence":"additional","affiliation":[{"name":"College of Future Transportation, Chang&#x2019;an University, Xi&#x2019;an, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0637-249X","authenticated-orcid":false,"given":"Meng","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Computer Science, Northwestern Polytechnical University, Xi&#x2019;an, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3419111.3421281"},{"key":"ref2","first-page":"99","article-title":"Firmament: Fast, centralized cluster scheduling at scale","volume-title":"Proc. 12th USENIX Symp. Oper. Syst. Design Implement.","author":"Gog"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3469379.3469387"},{"key":"ref4","article-title":"Fast graph representation learning with PyTorch geometric","author":"Fey","year":"2019","journal-title":"arXiv:1903.02428"},{"key":"ref5","first-page":"1","article-title":"Semi-supervised classification with graph convolutional networks","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Kipf"},{"key":"ref6","first-page":"1","article-title":"Inductive representation learning on large graphs","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Hamilton"},{"key":"ref7","article-title":"Residual gated graph ConvNets","author":"Bresson","year":"2017","journal-title":"arXiv:1711.07553"},{"key":"ref8","first-page":"5165","article-title":"Link prediction based on graph neural networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"31","author":"Zhang"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/hpca47549.2020.00012"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/micro50266.2020.00079"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/dac18072.2020.9218751"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2020.2978386"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/lca.2015.2414456"},{"key":"ref14","article-title":"Redundancy-free computation graphs for graph neural networks","author":"Jia","year":"2019","journal-title":"arXiv:1906.03707"},{"key":"ref15","first-page":"17","article-title":"PowerGraph: Distributed graph-parallel computation on natural graphs","volume-title":"Proc. Symp. Oper. Syst. Design Implement. (OSDI)","author":"Gonzalez"},{"key":"ref16","first-page":"1","article-title":"Graph attention networks","volume-title":"Proc. 6th Int. Conf. Learn. Represent. (ICLR\u201918)","author":"Velickovic"},{"key":"ref17","first-page":"1","article-title":"Few-shot learning with graph neural networks","volume-title":"Proc. 6th Int. Conf. Learn. Represent. (ICLR\u201918)","author":"Garcia"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/isca45697.2020.00044"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.23919\/date.2019.8715192"},{"key":"ref20","article-title":"How powerful are graph neural networks?","author":"Xu","year":"2018","journal-title":"arXiv:1810.00826"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00057"},{"key":"ref22","volume-title":"DGL framework","year":"2024"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3559009.3569670"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3308558.3313488"},{"key":"ref25","first-page":"120","article-title":"PyTorch-BigGraph: A large-scale graph embedding system","volume-title":"Proc. Mach. Learn. Syst.","volume":"1","author":"Lerer"},{"key":"ref26","article-title":"Joint 3D tracking and forecasting with graph neural network and diversity sampling","author":"Weng","year":"2020","journal-title":"arXiv:2003.07847v1"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401072"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.106194"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/iv51971.2022.9827230"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.4324\/9781410605337-29"},{"key":"ref33","first-page":"1263","article-title":"Neural message passing for quantum chemistry","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Gilmer"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2006.1639360"},{"key":"ref35","first-page":"1","article-title":"Distributed power-law graph computing: Theoretical and empirical analysis","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"27","author":"Xie"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/2749469.2750386"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/tcad.2018.2821565"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/hpca.2017.54"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/hpca.2018.00053"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358256"},{"key":"ref41","article-title":"FastGCN: Fast learning with graph convolutional networks via importance sampling","author":"Chen","year":"2018","journal-title":"arXiv:1801. 10247"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330925"},{"key":"ref43","article-title":"GraphSAINT: Graph sampling based inductive learning method","author":"Zeng","year":"2019","journal-title":"arXiv:1907.04931"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1145\/3447786.3456233"},{"key":"ref45","first-page":"187","article-title":"Improving the accuracy, scalability, and performance of graph neural networks with ROC","volume-title":"Proc. Mach. Learn. Syst.","volume":"2","author":"Jia"},{"key":"ref46","article-title":"DistGNN: Scalable distributed training for large-scale graph neural networks","author":"Vasimuddin","year":"2021","journal-title":"arXiv:2104.06700"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/sc41405.2020.00074"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/hpca56546.2023.10070983"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/hpca56546.2023.10071015"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/hpca56546.2023.10071102"},{"key":"ref51","article-title":"METIS: A software package for partitioning unstructured graphs, partitioning meshes, and computing fill-reducing orderings of sparse matrices","author":"Karypis","year":"1997"}],"container-title":["IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/43\/10745760\/10745796.pdf?arnumber=10745796","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T13:57:57Z","timestamp":1732715877000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10745796\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11]]},"references-count":51,"journal-issue":{"issue":"11"},"URL":"https:\/\/doi.org\/10.1109\/tcad.2024.3446871","relation":{},"ISSN":["0278-0070","1937-4151"],"issn-type":[{"value":"0278-0070","type":"print"},{"value":"1937-4151","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11]]}}}