{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T21:09:42Z","timestamp":1773436182019,"version":"3.50.1"},"reference-count":32,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62472009"],"award-info":[{"award-number":["62472009"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Key Research and Development Program of China","award":["2024YFB2906701"],"award-info":[{"award-number":["2024YFB2906701"]}]},{"DOI":"10.13039\/501100001809","name":"Joint Research Project with China Mobile Research Institute","doi-asserted-by":"publisher","award":["CMYJY-202400586"],"award-info":[{"award-number":["CMYJY-202400586"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Netw."],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/ton.2026.3668862","type":"journal-article","created":{"date-parts":[[2026,2,27]],"date-time":"2026-02-27T20:48:33Z","timestamp":1772225313000},"page":"3947-3962","source":"Crossref","is-referenced-by-count":0,"title":["INARouting: Efficient Multi-Job Routing Optimization for Hierarchical In-Network Aggregation"],"prefix":"10.1109","volume":"34","author":[{"ORCID":"https:\/\/orcid.org\/0009-0001-8492-7983","authenticated-orcid":false,"given":"Jianglong","family":"Nie","sequence":"first","affiliation":[{"name":"School of Computer Science, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8754-9150","authenticated-orcid":false,"given":"Yidan","family":"Yuan","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5765-3825","authenticated-orcid":false,"given":"Yuchen","family":"Xu","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-5427-4829","authenticated-orcid":false,"given":"Yitao","family":"Yuan","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kehan","family":"Yao","sequence":"additional","affiliation":[{"name":"China Mobile Research Institute, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-5740-9489","authenticated-orcid":false,"given":"Lu","family":"Lu","sequence":"additional","affiliation":[{"name":"China Mobile Research Institute, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaodong","family":"Duan","sequence":"additional","affiliation":[{"name":"China Mobile Research Institute, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1357-3137","authenticated-orcid":false,"given":"Wenfei","family":"Wu","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s13042-024-02443-6"},{"key":"ref2","article-title":"A survey of large language models","author":"Xin Zhao","year":"2023","journal-title":"arXiv:2303.18223"},{"key":"ref3","article-title":"Parameter-efficient tuning of large-scale multimodal foundation model","author":"Wang","year":"2023","journal-title":"arXiv:2305.08381"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3377454"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3406703"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3363554"},{"key":"ref7","article-title":"Megatron-LM: Training multi-billion parameter language models using model parallelism","author":"Shoeybi","year":"2019","journal-title":"arXiv:1909.08053"},{"key":"ref8","first-page":"745","article-title":"MegaScale: Scaling large language model training to more than 10,000 GPUs","volume-title":"Proc. 21st USENIX Symp. Networked Syst. Design Implement. (NSDI)","author":"Jiang"},{"issue":"2","key":"ref9","article-title":"Parameter server for distributed machine learning","volume-title":"Proc. Big Learn. NIPS Workshop","volume":"6","author":"Li"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.5555\/2685048.2685095"},{"key":"ref11","article-title":"Scaling distributed machine learning with in-network aggregation","author":"Sapio","year":"2019","journal-title":"arXiv:1903.06701"},{"key":"ref12","volume-title":"Intel Tofino Series","year":"2024"},{"key":"ref13","volume-title":"Trident4\/BCM56880 Series","year":"2024"},{"key":"ref14","volume-title":"Cisco Silicon One\u2014Network Processors for Unified Architecture","year":"2024"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2023.3344351"},{"key":"ref16","first-page":"741","article-title":"ATP: In-network aggregation for multi-tenant learning","volume":"21","author":"Lao","year":"2021","journal-title":"NSDI"},{"key":"ref17","first-page":"829","article-title":"In-network aggregation for shared machine learning clusters","volume":"3","author":"Gebara","year":"2021","journal-title":"Proc. Mach. Learn. Syst."},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2023.3244794"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/IPCCC59175.2023.10253874"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2024.3423380"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3589334.3645394"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2024.3414853"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TON.2025.3539430"},{"key":"ref24","volume-title":"Scalable Hierarchical Aggregation and Reduction Protocol (Sharp) Rev 3.0.0","year":"2024"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/COMHPC.2016.006"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10228956"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3617232.3624863"},{"key":"ref28","volume-title":"The Leader in Decision Intelligence Technology","year":"2024"},{"issue":"1","key":"ref29","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1016\/S0377-0427(00)00433-7","article-title":"Interior-point methods","volume":"124","author":"Potra","year":"2000","journal-title":"J. Comput. Appl. Math."},{"key":"ref30","first-page":"947","article-title":"Analysis of large-scale multi-tenant GPU clusters for DNN training workloads","volume-title":"Proc. USENIX Annu. Tech. Conf.","author":"Jeon"},{"key":"ref31","first-page":"709","article-title":"Characterization of large language model development in the datacenter","volume-title":"Proc. 21st USENIX Symp. Networked Syst. Design Implement.","author":"Hu"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.17487\/rfc2992"}],"container-title":["IEEE Transactions on Networking"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10723154\/11317935\/11417310.pdf?arnumber=11417310","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T19:52:36Z","timestamp":1773431556000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11417310\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/ton.2026.3668862","relation":{},"ISSN":["2998-4157"],"issn-type":[{"value":"2998-4157","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]}}}