{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,22]],"date-time":"2025-12-22T21:01:02Z","timestamp":1766437262244,"version":"3.48.0"},"reference-count":38,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62203147"],"award-info":[{"award-number":["62203147"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62273129"],"award-info":[{"award-number":["62273129"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Anhui Provincial Key Research and Development Project","award":["202304a05020077"],"award-info":[{"award-number":["202304a05020077"]}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["JZ2024HGTB0225"],"award-info":[{"award-number":["JZ2024HGTB0225"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Robot. Autom. Lett."],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1109\/lra.2025.3640983","type":"journal-article","created":{"date-parts":[[2025,12,5]],"date-time":"2025-12-05T18:40:34Z","timestamp":1764960034000},"page":"1626-1633","source":"Crossref","is-referenced-by-count":0,"title":["PIDiff: Integrating a High-Performance Transformer Into Diffusion Models for Robust and Efficient Imitation Learning"],"prefix":"10.1109","volume":"11","author":[{"given":"Yunzhi","family":"Huang","sequence":"first","affiliation":[{"name":"School of Electrical and Automation Engineering, Hefei University of Technology, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2832-0416","authenticated-orcid":false,"given":"Peng","family":"Jin","sequence":"additional","affiliation":[{"name":"School of Electrical and Automation Engineering, Hefei University of Technology, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7779-0280","authenticated-orcid":false,"given":"Liang","family":"Han","sequence":"additional","affiliation":[{"name":"School of Electrical and Automation Engineering, Hefei University of Technology, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5699-4097","authenticated-orcid":false,"given":"Yingzhao","family":"Li","sequence":"additional","affiliation":[{"name":"School of Mechatronics Engineering, Harbin Institute of Technology, Harbin, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-1191-3621","authenticated-orcid":false,"given":"Xudong","family":"Hou","sequence":"additional","affiliation":[{"name":"School of Mechatronics Engineering, Harbin Institute of Technology, Harbin, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160275"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2023.XIX.009"},{"key":"ref3","first-page":"2195","article-title":"Waypoint-based imitation learning for robotic manipulation","volume-title":"Conf. Robot Learn.","author":"Shi","year":"2023"},{"key":"ref4","first-page":"201","article-title":"MimicPlay: Long-horizon imitation learning by watching human play","volume-title":"Proc. Conf. Robot Learn.","author":"Wang","year":"2023"},{"key":"ref5","first-page":"4066","article-title":"Mobile Aloha: Learning bimanual mobile manipulation with low-cost whole-body teleoperation","volume-title":"Proc. Conf. Robot Learn.","author":"Fu","year":"2024"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.067"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1177\/02783649241273668"},{"key":"ref8","first-page":"5105","article-title":"PointNet++ : Deep hierarchical feature learning on point sets in a metric space","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Qi","year":"2017"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.52202\/079017-2515"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72973-7_8"},{"key":"ref11","first-page":"3766","article-title":"Scaling up and distilling down: Language-guided robot skill acquisition","volume-title":"Proc. Conf. Robot Learn.","author":"Ha","year":"2023"},{"key":"ref12","first-page":"29982","article-title":"RDT-1B: A diffusion foundation model for bimanual manipulation","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Liu","year":"2025"},{"article-title":"Equibot: Sim (3)-equivariant diffusion policy for generalizable and data efficient learning","year":"2024","author":"Yang","key":"ref13"},{"key":"ref14","first-page":"2905","article-title":"Generative skill chaining: Long-horizon skill planning with diffusion models","volume-title":"Proc. Conf. Robot Learn.","author":"Mishra","year":"2023"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610665"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.049"},{"key":"ref17","first-page":"1094","article-title":"Meta-World: A benchmark and evaluation for multi-task and meta reinforcement learning","volume-title":"Proc. Conf. Robot Learn.","author":"Yu","year":"2020"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02030"},{"article-title":"3D Diffuser Actor: Policy Diffusion with 3D Scene Representations.","year":"2024","author":"Ke","key":"ref19"},{"key":"ref20","article-title":"Diffusion policies as an expressive policy class for offline reinforcement learning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Wang","year":"2023"},{"key":"ref21","first-page":"2323","article-title":"ChainedDiffuser: Unifying trajectory diffusion and keypose prediction for robotic manipulation","volume-title":"Proc. Conf. Robot Learn.","author":"Xian","year":"2023"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.071"},{"key":"ref23","article-title":"Memory-consistent neural networks for imitation learning","volume-title":"Proc. 12th Int. Conf. Learn. Representations","author":"Sridhar","year":"2024"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/s41095-022-0274-8"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00599"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00995"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"article-title":"Denoising diffusion implicit models","year":"2020","author":"Song","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/iros60139.2025.11246340"},{"key":"ref30","article-title":"Imitating human behaviour with diffusion models","volume-title":"Proc. 11th Int. Conf. Learn. Representations","author":"Pearce","year":"2023"},{"key":"ref31","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Ho","year":"2020"},{"key":"ref32","article-title":"EquiBot: SIM(3)-equivariant diffusion policy for generalizable and data efficient learning","volume-title":"Proc. 8th Annu. Conf. Robot Learn.","author":"Yang","year":"2024"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2023.XIX.015"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.045"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01712"},{"key":"ref36","first-page":"158","article-title":"Implicit behavioral cloning","volume-title":"Proc. Conf. Robot Learn.","author":"Florence","year":"2022"},{"key":"ref37","first-page":"1678","article-title":"What matters in learning from offline human demonstrations for robot manipulation","volume-title":"Proc. Conf. Robot Learn.","author":"Mandlekar","year":"2022"},{"key":"ref38","first-page":"22955","article-title":"Behavior Transformers: Cloning $ k$ modes with one stone","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Shafiullah","year":"2022"}],"container-title":["IEEE Robotics and Automation Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7083369\/11293803\/11278644.pdf?arnumber=11278644","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,22]],"date-time":"2025-12-22T18:43:47Z","timestamp":1766429027000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11278644\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2]]},"references-count":38,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/lra.2025.3640983","relation":{},"ISSN":["2377-3766","2377-3774"],"issn-type":[{"type":"electronic","value":"2377-3766"},{"type":"electronic","value":"2377-3774"}],"subject":[],"published":{"date-parts":[[2026,2]]}}}