{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T21:05:33Z","timestamp":1780434333830,"version":"3.54.1"},"reference-count":103,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key R&#x0026;D Program of China","award":["2024YFB3213400"],"award-info":[{"award-number":["2024YFB3213400"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Artif. Intell."],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1109\/tai.2025.3639457","type":"journal-article","created":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T18:40:08Z","timestamp":1764873608000},"page":"3399-3413","source":"Crossref","is-referenced-by-count":2,"title":["SparseAD: Sparse Query-Centric Paradigm for Efficient End-to-End Autonomous Driving"],"prefix":"10.1109","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-9946-943X","authenticated-orcid":false,"given":"Runwen","family":"Zhu","sequence":"first","affiliation":[{"name":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-1255-0795","authenticated-orcid":false,"given":"Jianbo","family":"Zhao","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2004-0897","authenticated-orcid":false,"given":"Diankun","family":"Zhang","sequence":"additional","affiliation":[{"name":"Aerospace Information Research Institute, Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-1435-4291","authenticated-orcid":false,"given":"Guoan","family":"Wang","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5612-9848","authenticated-orcid":false,"given":"Xiwu","family":"Chen","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-3662-8691","authenticated-orcid":false,"given":"Siyu","family":"Zhang","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-7693-2204","authenticated-orcid":false,"given":"Jiahao","family":"Gong","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-5955-6799","authenticated-orcid":false,"given":"Qibin","family":"Zhou","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-8641-2001","authenticated-orcid":false,"given":"Wenyuan","family":"Zhang","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8794-5182","authenticated-orcid":false,"given":"Ningzi","family":"Wang","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-6029-179X","authenticated-orcid":false,"given":"Feiyang","family":"Tan","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8222-8379","authenticated-orcid":false,"given":"Ziyao","family":"Xu","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-8894-3137","authenticated-orcid":false,"given":"Hangning","family":"Zhou","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-8349-1122","authenticated-orcid":false,"given":"Haotian","family":"Yao","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-3514-2490","authenticated-orcid":false,"given":"Chi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Mach Drive, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0625-6248","authenticated-orcid":false,"given":"Lei","family":"Liu","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3399-3486","authenticated-orcid":false,"given":"Xiaojun","family":"Liu","sequence":"additional","affiliation":[{"name":"Aerospace Information Research Institute, Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5709-6862","authenticated-orcid":false,"given":"Xiaoguang","family":"Di","sequence":"additional","affiliation":[{"name":"Control and Simulation Center, Harbin Institute of Technology, Harbin, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2332-3959","authenticated-orcid":false,"given":"Bin","family":"Li","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02105"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00731"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72995-9_9"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.52202\/079017-0025"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/icra55743.2025.11128800"},{"key":"ref6","article-title":"DriveTransformer: Unified transformer for scalable end-to-end autonomous driving","author":"Jia","year":"2025"},{"key":"ref7","article-title":"DiFSD: Ego-centric fully sparse paradigm with uncertainty denoising and iterative refinement for efficient end-to-end self-driving","author":"Su","year":"2024"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01157"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58592-1_25"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460487"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00942"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.52202\/068431-0443"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01494"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01712"},{"key":"ref15","article-title":"FusionAD: Multi-modality fusion for prediction and planning tasks of autonomous driving","author":"Ye","year":"2023"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19812-0_31"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00335"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01719"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00766"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2023.3328929"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i3.28033"},{"key":"ref22","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01855"},{"key":"ref25","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Int. Conf. Mach. Learn.","author":"Radford","year":"2021"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01161"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00535"},{"key":"ref29","first-page":"3749","article-title":"DORT: Modeling dynamic objects in recurrent for multi-camera 3d object detection and tracking","volume-title":"Proc. Conf. Robot Learn. (CoRL),","author":"Lian","year":"2023"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01296"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02076"},{"key":"ref32","article-title":"BEVDet: High-performance multi-camera 3d object detection in bird-eye-view","author":"Huang","year":"2021"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_1"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TAI.2024.3492163"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25233"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00116"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160968"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01675"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58568-6_12"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01710"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/lra.2024.3401172"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25234"},{"key":"ref43","first-page":"180","article-title":"DETR3D: 3D object detection from multi-view images via 3d-to-2d queries","volume-title":"Proc. Conf. Robot Learn.","author":"Wang","year":"2022"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00302"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2023.3332608"},{"key":"ref46","article-title":"Sparse4D: Multi-view 3d object detection with sparse spatial-temporal fusion","author":"Lin","year":"2022"},{"key":"ref47","article-title":"Sparse4D v2: Recurrent temporal fusion with sparse model","author":"Lin","year":"2023"},{"key":"ref48","article-title":"Sparse4D v3: Advancing end-to-end 3d detection and tracking","author":"Lin","year":"2023"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341164"},{"key":"ref50","article-title":"Global correlation network: End-to-end joint multi-object detection and tracking","author":"Lin","year":"2021"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19812-0_38"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02112"},{"key":"ref53","article-title":"MOTRv3: Release-fetch supervision for end-to-end multi-object tracking","author":"Yu","year":"2023"},{"key":"ref54","article-title":"TransTrack: Multiple object tracking with transformer","author":"Sun","year":"2020"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-25056-9_43"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00864"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01678"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00500"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812383"},{"key":"ref60","first-page":"22352","article-title":"VectorMapNet: End-to-end vectorized HD map learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Liu","year":"2023"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01270"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00340"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00719"},{"key":"ref64","article-title":"Multipath: Multiple probabilistic anchor trajectory hypotheses for behavior prediction","author":"Chai","year":"2019"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01408"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01154"},{"key":"ref67","first-page":"895","article-title":"TNT: Target-driven trajectory prediction","volume-title":"Proc. Conf. Robot Learn.","author":"Zhao","year":"2021"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812107"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00862"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01713"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.52202\/068431-0473"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3352811"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00532"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.3390\/vehicles4020021"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.3389\/fbioe.2022.905983"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/TAI.2021.3116216"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1177\/0954407014522443"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2024.104630"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2015.2389215"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2020.12.2499"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-control-061623-094742"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793742"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2020.3024655"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysarc.2022.102505"},{"key":"ref85","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01392"},{"key":"ref89","article-title":"DEFT: Detection embeddings for tracking","author":"Chaabane","year":"2021"},{"key":"ref90","article-title":"Time will tell: New outlooks and a baseline for temporal multi-view 3d object detection","author":"Park","year":"2022"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3168781"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00496"},{"key":"ref93","article-title":"CC-3DT: Panoramic 3d object tracking via cross-camera fusion","author":"Fischer","year":"2022"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/iros58592.2024.10801741"},{"key":"ref95","article-title":"SRCN3D: Sparse R-CNN 3d surround-view camera object detection and tracking for autonomous driving","author":"Shi","year":"2022"},{"key":"ref96","article-title":"MapTR: Structured modeling and learning for online vectorized HD map construction","author":"Liao","year":"2022"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01463"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3200245"},{"key":"ref99","article-title":"VADv2: End-to-end vectorized autonomous driving via probabilistic planning","author":"Chen","year":"2024"},{"key":"ref100","article-title":"Hydra-MDP: End-to-end multimodal planning with multi-target hydra-distillation","author":"Li","year":"2024"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.01408"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.52202\/079017-0902"},{"key":"ref103","article-title":"Rethinking the open-loop evaluation of end-to-end autonomous driving in nuscenes","author":"Zhai","year":"2023"}],"container-title":["IEEE Transactions on Artificial Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/9078688\/11541276\/11278053.pdf?arnumber=11278053","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T20:10:09Z","timestamp":1780431009000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11278053\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":103,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tai.2025.3639457","relation":{},"ISSN":["2691-4581"],"issn-type":[{"value":"2691-4581","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,6]]}}}