{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,18]],"date-time":"2025-09-18T10:46:46Z","timestamp":1758192406715,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":40,"publisher":"ACM","funder":[{"name":"Shanghai Municipal Science and Technology Major Project","award":["2021SHZDZX0102"],"award-info":[{"award-number":["2021SHZDZX0102"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,12,18]]},"DOI":"10.1145\/3719545.3720337","type":"proceedings-article","created":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T09:38:41Z","timestamp":1758015521000},"page":"103-111","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Multi-Agent Trajectory Prediction with Scalable Diffusion Transformer"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-4843-9794","authenticated-orcid":false,"given":"Shenyu","family":"Zhang","sequence":"first","affiliation":[{"name":"Shanghai Jiaotong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-1563-3179","authenticated-orcid":false,"given":"Shixiong","family":"Kai","sequence":"additional","affiliation":[{"name":"Huawei Technologies Co.,Ltd, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-4198-3033","authenticated-orcid":false,"given":"Chang","family":"Chen","sequence":"additional","affiliation":[{"name":"Huawei Technologies Co.,Ltd, Hong Kong, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0915-0254","authenticated-orcid":false,"given":"Yuzheng","family":"Zhuang","sequence":"additional","affiliation":[{"name":"Huawei Technologies Co.,Ltd, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-9310-3598","authenticated-orcid":false,"given":"Zhengbang","family":"Zhu","sequence":"additional","affiliation":[{"name":"Shanghai Jiaotong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-5585-1746","authenticated-orcid":false,"given":"Minghuan","family":"Liu","sequence":"additional","affiliation":[{"name":"Shanghai Jiaotong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0127-2425","authenticated-orcid":false,"given":"Weinan","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Jiaotong University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2025,9,16]]},"reference":[{"key":"e_1_3_3_1_2_2","unstructured":"Anurag Ajay Yilun Du Abhi Gupta Joshua Tenenbaum Tommi Jaakkola and Pulkit Agrawal. 2022. Is conditional generative modeling all you need for decision-making? arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2211.15657 (2022)."},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.110"},{"key":"e_1_3_3_1_4_2","unstructured":"Prafulla Dhariwal and Alexander Nichol. 2021. Diffusion models beat gans on image synthesis. Advances in neural information processing systems 34 (2021) 8780\u20138794."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","unstructured":"Chen Feng Hangning Zhou Huadong Lin Zhigang Zhang Ziyao Xu Chi Zhang Boyu Zhou and Shaojie Shen. 2023. MacFormer: Map-Agent Coupled Transformer for Real-Time and Robust Trajectory Prediction. IEEE Robotics and Automation Letters 8 10 (2023) 6795\u20136802. 10.1109\/LRA.2023.3311351","DOI":"10.1109\/LRA.2023.3311351"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01660"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00240"},{"key":"e_1_3_3_1_8_2","unstructured":"Nicholas Guttenberg Nathaniel Virgo Olaf Witkowski Hidetoshi Aoki and Ryota Kanai. 2016. Permutation-equivariant neural networks applied to dynamics prediction. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1612.04530 (2016)."},{"key":"e_1_3_3_1_9_2","unstructured":"Jonathan Ho Ajay Jain and Pieter Abbeel. 2020. Denoising diffusion probabilistic models. Advances in neural information processing systems 33 (2020) 6840\u20136851."},{"key":"e_1_3_3_1_10_2","unstructured":"Jonathan Ho and Tim Salimans. 2022. Classifier-free diffusion guidance. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2207.12598 (2022)."},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00637"},{"key":"e_1_3_3_1_12_2","unstructured":"Michael Janner Yilun Du Joshua\u00a0B Tenenbaum and Sergey Levine. 2022. Planning with diffusion for flexible behavior synthesis. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2205.09991 (2022)."},{"key":"e_1_3_3_1_13_2","first-page":"2688","volume-title":"International conference on machine learning","author":"Kipf Thomas","year":"2018","unstructured":"Thomas Kipf, Ethan Fetaya, Kuan-Chieh Wang, Max Welling, and Richard Zemel. 2018. Neural relational inference for interacting systems. In International conference on machine learning. PMLR, 2688\u20132697."},{"key":"e_1_3_3_1_14_2","unstructured":"Vineet Kosaraju Amir Sadeghian Roberto Mart\u00edn-Mart\u00edn Ian Reid Hamid Rezatofighi and Silvio Savarese. 2019. Social-bigat: Multimodal trajectory forecasting using bicycle-gan and graph attention networks. Advances in Neural Information Processing Systems 32 (2019)."},{"key":"e_1_3_3_1_15_2","unstructured":"Jiachen Li Hengbo Ma Zhihao Zhang and Masayoshi Tomizuka. 2020. Social-wagdat: Interaction-aware trajectory prediction via wasserstein graph double-attention network. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2002.06241 (2020)."},{"key":"e_1_3_3_1_16_2","unstructured":"Jiachen Li Fan Yang Masayoshi Tomizuka and Chiho Choi. 2020. Evolvegraph: Multi-agent trajectory prediction with dynamic relational reasoning. Advances in neural information processing systems 33 (2020) 19783\u201319794."},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"crossref","unstructured":"Jiachen Li Wei Zhan Yeping Hu and Masayoshi Tomizuka. 2019. Generic tracking and probabilistic prediction framework and its application in autonomous driving. IEEE Transactions on Intelligent Transportation Systems 21 9 (2019) 3634\u20133649.","DOI":"10.1109\/TITS.2019.2930310"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58536-5_32"},{"key":"e_1_3_3_1_19_2","unstructured":"Kostya Linou. 2016. SportVU data. https:\/\/github.com\/linouk23\/NBA-Player-Movements"},{"key":"e_1_3_3_1_20_2","unstructured":"Cheng Lu Yuhao Zhou Fan Bao Jianfei Chen Chongxuan Li and Jun Zhu. 2022. Dpm-solver: A fast ode solver for diffusion probabilistic model sampling in around 10 steps. Advances in Neural Information Processing Systems 35 (2022) 5775\u20135787."},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00534"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01443"},{"key":"e_1_3_3_1_23_2","unstructured":"Jiquan Ngiam Benjamin Caine Vijay Vasudevan Zhengdong Zhang Hao-Tien\u00a0Lewis Chiang Jeffrey Ling Rebecca Roelofs Alex Bewley Chenxi Liu Ashish Venugopal et\u00a0al. 2021. Scene transformer: A unified architecture for predicting multiple agent trajectories. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2106.08417 (2021)."},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_3_1_25_2","unstructured":"Tim Salzmann Boris Ivanovic Punarjay Chakravarty and Marco Pavone. 2020. Trajectron++: Multi-agent generative trajectory forecasting with heterogeneous data for control. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2001.03093 2 (2020)."},{"key":"e_1_3_3_1_26_2","unstructured":"Adam Santoro David Raposo David\u00a0G Barrett Mateusz Malinowski Razvan Pascanu Peter Battaglia and Timothy Lillicrap. 2017. A simple neural network module for relational reasoning. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_3_1_27_2","first-page":"2256","volume-title":"International conference on machine learning","author":"Sohl-Dickstein Jascha","year":"2015","unstructured":"Jascha Sohl-Dickstein, Eric Weiss, Niru Maheswaranathan, and Surya Ganguli. 2015. Deep unsupervised learning using nonequilibrium thermodynamics. In International conference on machine learning. PMLR, 2256\u20132265."},{"key":"e_1_3_3_1_28_2","unstructured":"Jiaming Song Chenlin Meng and Stefano Ermon. 2020. Denoising diffusion implicit models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2010.02502 (2020)."},{"key":"e_1_3_3_1_29_2","unstructured":"Yang Song Jascha Sohl-Dickstein Diederik\u00a0P Kingma Abhishek Kumar Stefano Ermon and Ben Poole. 2020. Score-based generative modeling through stochastic differential equations. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2011.13456 (2020)."},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2018.8569453"},{"key":"e_1_3_3_1_31_2","unstructured":"Guy Tevet Sigal Raab Brian Gordon Yonatan Shafir Daniel Cohen-Or and Amit\u00a0H Bermano. 2022. Human motion diffusion model. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2209.14916 (2022)."},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00051"},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812107"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460504"},{"key":"e_1_3_3_1_35_2","unstructured":"Zhendong Wang Jonathan\u00a0J Hunt and Mingyuan Zhou. 2022. Diffusion policies as an expressive policy class for offline reinforcement learning. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2208.06193 (2022)."},{"key":"e_1_3_3_1_36_2","unstructured":"Benjamin Wilson William Qi Tanmay Agarwal John Lambert Jagjeet Singh Siddhesh Khandelwal Bowen Pan Ratnesh Kumar Andrew Hartnett Jhony\u00a0Kaesemodel Pontes et\u00a0al. 2023. Argoverse 2: Next generation datasets for self-driving perception and forecasting. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2301.00493 (2023)."},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2018.8569785"},{"key":"e_1_3_3_1_38_2","unstructured":"Mingyuan Zhang Zhongang Cai Liang Pan Fangzhou Hong Xinying Guo Lei Yang and Ziwei Liu. 2022. Motiondiffuse: Text-driven human motion generation with diffusion model. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2208.15001 (2022)."},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01713"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00862"},{"key":"e_1_3_3_1_41_2","unstructured":"Zhengbang Zhu Minghuan Liu Liyuan Mao Bingyi Kang Minkai Xu Yong Yu Stefano Ermon and Weinan Zhang. 2023. MADiff: Offline Multi-agent Learning with Diffusion Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2305.17330 (2023)."}],"event":{"name":"DAI '24: 6th International Conference on Distributed Artificial Intelligences","acronym":"DAI '24","location":"Singapore Singapore"},"container-title":["Proceedings of the 2024 Sixth International Conference on Distributed Artificial Intelligences"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3719545.3720337","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T13:12:36Z","timestamp":1758114756000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3719545.3720337"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,18]]},"references-count":40,"alternative-id":["10.1145\/3719545.3720337","10.1145\/3719545"],"URL":"https:\/\/doi.org\/10.1145\/3719545.3720337","relation":{},"subject":[],"published":{"date-parts":[[2024,12,18]]},"assertion":[{"value":"2025-09-16","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}