{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T20:05:11Z","timestamp":1776888311000,"version":"3.51.2"},"reference-count":39,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100010226","name":"Department of Education of Guangdong Province","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100010226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iros60139.2025.11247519","type":"proceedings-article","created":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T18:54:45Z","timestamp":1764269685000},"page":"13162-13169","source":"Crossref","is-referenced-by-count":3,"title":["PD-VLA: Accelerating Vision-Language-Action Model Integrated with Action Chunking via Parallel Decoding"],"prefix":"10.1109","author":[{"given":"Wenxuan","family":"Song","sequence":"first","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiayi","family":"Chen","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pengxiang","family":"Ding","sequence":"additional","affiliation":[{"name":"Westlake University,AI Division, School of Engineering,Hangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Han","family":"Zhao","sequence":"additional","affiliation":[{"name":"Westlake University,AI Division, School of Engineering,Hangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei","family":"Zhao","sequence":"additional","affiliation":[{"name":"Westlake University,AI Division, School of Engineering,Hangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhide","family":"Zhong","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zongyuan","family":"Ge","sequence":"additional","affiliation":[{"name":"Monash University,Department of Data Science &#x0026; AI,Melbourne,Australia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhijun","family":"Li","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology,School of Computer Science and Technology,Harbin,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Donglin","family":"Wang","sequence":"additional","affiliation":[{"name":"Westlake University,AI Division, School of Engineering,Hangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lujia","family":"Wang","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun","family":"Ma","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haoang","family":"Li","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou),Thrust of Robotics and Autonomous Systems and Thrust of Intelligent Transportation,Guangzhou,China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","first-page":"5286","article-title":"Domain adaptive imitation learning","volume-title":"International Conference on Machine Learning","author":"Kim"},{"key":"ref2","article-title":"Openflamingo: An open-source framework for training large autoregressive vision-language models","author":"Awadalla","year":"2023"},{"key":"ref3","article-title":"Visual instruction tuning","volume":"36","author":"Liu","year":"2024","journal-title":"Advances in neural information processing systems"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2023.XIX.025"},{"key":"ref5","first-page":"2165","article-title":"Rt-2: Vision-language-action models transfer web knowledge to robotic control","volume-title":"Conference on Robot Learning","author":"Zitkovich"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.090"},{"key":"ref7","article-title":"Llarva: Vision-action instruction tuning enhances robot learning","author":"Niu","year":"2024"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/IROS58592.2024.10801816"},{"key":"ref9","article-title":"Openvla: An open-source vision-language-action model","author":"Kim","year":"2024"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10611477"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10611615"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2025.xxi.010"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2025.XXI.012"},{"key":"ref14","article-title":"Vlas: Vision-language-action model with speech instructions for customized robot manipulation","volume-title":"International Conference on Learning Representations (ICLR)","author":"Zhao"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2023.XIX.016"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/lra.2025.3544909"},{"key":"ref17","article-title":"Robomamba: Multimodal state space model for efficient robot reasoning and manipulation","author":"Liu","year":"2024"},{"key":"ref18","article-title":"Quantization-aware imitation-learning for resource-efficient robotic control","author":"Park","year":"2024"},{"key":"ref19","article-title":"Deer-vla: Dynamic inference of multimodal large language models for efficient robot execution","volume-title":"The Thirty-eighth Annual Conference on Neural Information Processing Systems","author":"Yue"},{"key":"ref20","article-title":"Sparsevlm: Visual token sparsification for efficient vision-language model inference","author":"Zhang","year":"2024"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73004-7_2"},{"key":"ref22","article-title":"Vla-cache: Towards efficient vision-language-action model via adaptive token caching in robotic manipulation","author":"Xu","year":"2025"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898719468"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72652-1_21"},{"key":"ref25","article-title":"Vision-language foundation models as effective robot imitators","volume-title":"The Twelfth International Conference on Learning Representations","author":"Li"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1177\/02783649241273668"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2024.xx.071"},{"key":"ref28","article-title":"Planning with diffusion for flexible behavior synthesis","author":"Janner","year":"2022"},{"key":"ref29","article-title":"Behavior generation with latent actions","author":"Lee","year":"2024"},{"key":"ref30","article-title":"Bidirectional decoding: Improving action chunking via closed-loop resampling","author":"Liu","year":"2024"},{"key":"ref31","first-page":"87","article-title":"Awq: Activation-aware weight quantization for on-device llm compression and acceleration","volume-title":"Proceedings of Machine Learning and Systems","volume":"6","author":"Lin"},{"key":"ref32","article-title":"Visual instruction tuning","author":"Liu","year":"2023"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.689"},{"key":"ref34","article-title":"Cllms: Consistency large language models","volume-title":"Forty-first International Conference on Machine Learning","author":"Kou"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3180108"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3196123"},{"key":"ref37","first-page":"2016","article-title":"Pybullet, a python module for physics simulation for games, robotics and machine learning","author":"Coumans"},{"key":"ref38","article-title":"Vicuna: An open-source chatbot impressing gpt-4 with 90%* chatgpt quality","author":"Chiang","year":"2023"},{"key":"ref39","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"International conference on machine learning","author":"Radford"}],"event":{"name":"2025 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Hangzhou, China","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11245651\/11245652\/11247519.pdf?arnumber=11247519","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T12:38:34Z","timestamp":1766061514000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11247519\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":39,"URL":"https:\/\/doi.org\/10.1109\/iros60139.2025.11247519","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}