{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T10:51:26Z","timestamp":1766055086575,"version":"3.48.0"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iros60139.2025.11246116","type":"proceedings-article","created":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T18:54:45Z","timestamp":1764269685000},"page":"604-611","source":"Crossref","is-referenced-by-count":0,"title":["DRARL: Disengagement-Reason-Augmented Reinforcement Learning for Efficient Improvement of Autonomous Driving Policy"],"prefix":"10.1109","author":[{"given":"Weitao","family":"Zhou","sequence":"first","affiliation":[{"name":"Tsinghua University,School of Vehicle and Mobility"}]},{"given":"Bo","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Vehicle and Mobility"}]},{"given":"Zhong","family":"Cao","sequence":"additional","affiliation":[{"name":"University of Michigan,Department of Civil and Environmental Engineering"}]},{"given":"Xiang","family":"Li","sequence":"additional","affiliation":[{"name":"Tsinghua University,Lab for High Technology"}]},{"given":"Qian","family":"Cheng","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Vehicle and Mobility"}]},{"given":"Chunyang","family":"Liu","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Vehicle and Mobility"}]},{"given":"Yaqin","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University,Institute for AI Industry Research"}]},{"given":"Diange","family":"Yang","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Vehicle and Mobility"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3390\/su13147938"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/IV47402.2020.9304647"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2023.3266885"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-023-00610-y"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/tiv.2022.3184729"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341072"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793970"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.146"},{"article-title":"Uncertainty-aware reinforcement learning for collision avoidance","year":"2017","author":"Kahn","key":"ref9"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2021.3069497"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/tiv.2022.3185159"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3534678.3539391"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.52202\/079017-1255"},{"issue":"77","key":"ref14","article-title":"Analysis of accident data for test scenario definition in the assess project","author":"Fagerlind","year":"2010","journal-title":"Berichte Der Bundesanstalt Fuer Strassenwesen. Unterreihe Fahrzeugtechnik"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3177753"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.62.1805"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.3141\/1999-10"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01026"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561666"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2022.3225538"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3206157.3206174"},{"article-title":"Generalization in visual reinforcement learning with the reward sequence distribution","year":"2023","author":"Wang","key":"ref22"},{"key":"ref23","first-page":"1282","article-title":"Quantifying generalization in reinforcement learning","volume-title":"International Conference on Machine Learning","author":"Cobbe"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58523-5_40"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177704472"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2015.2503342"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1080\/00423110903365910"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.trf.2005.08.006"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6942636"},{"key":"ref30","first-page":"1","article-title":"Carla: An open urban driving simulator","volume-title":"Conference on robot learning","author":"Dosovitskiy"},{"key":"ref31","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"International conference on machine learning","author":"Haarnoja"}],"event":{"name":"2025 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","start":{"date-parts":[[2025,10,19]]},"location":"Hangzhou, China","end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11245651\/11245652\/11246116.pdf?arnumber=11246116","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T10:48:13Z","timestamp":1766054893000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11246116\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/iros60139.2025.11246116","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}