{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T18:19:45Z","timestamp":1780510785524,"version":"3.54.1"},"reference-count":29,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2022,7,1]],"date-time":"2022-07-01T00:00:00Z","timestamp":1656633600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,7,1]],"date-time":"2022-07-01T00:00:00Z","timestamp":1656633600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,7,1]],"date-time":"2022-07-01T00:00:00Z","timestamp":1656633600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Intell. Transport. Syst."],"published-print":{"date-parts":[[2022,7]]},"DOI":"10.1109\/tits.2021.3069497","type":"journal-article","created":{"date-parts":[[2021,4,6]],"date-time":"2021-04-06T19:47:45Z","timestamp":1617738465000},"page":"7419-7430","source":"Crossref","is-referenced-by-count":63,"title":["Confidence-Aware Reinforcement Learning for Self-Driving Cars"],"prefix":"10.1109","volume":"23","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2243-5705","authenticated-orcid":false,"given":"Zhong","family":"Cao","sequence":"first","affiliation":[{"name":"School of Vehicle and Mobility, Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4127-2411","authenticated-orcid":false,"given":"Shaobing","family":"Xu","sequence":"additional","affiliation":[{"name":"Department of Mechanical Engineering, University of Michigan, Ann Arbor, MI, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7684-1696","authenticated-orcid":false,"given":"Huei","family":"Peng","sequence":"additional","affiliation":[{"name":"Department of Mechanical Engineering, University of Michigan, Ann Arbor, MI, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0825-5609","authenticated-orcid":false,"given":"Diange","family":"Yang","sequence":"additional","affiliation":[{"name":"School of Vehicle and Mobility, Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Robert","family":"Zidek","sequence":"additional","affiliation":[{"name":"Toyota Research Institute, Ann Arbor, MI, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Understanding V2 V driving scenarios through traffic primitives","volume-title":"arXiv:1807.10422","author":"Wang","year":"2018"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-10-8506-2_56"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/IV47402.2020.9304647"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2019.2961739"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC45102.2020.9294275"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.tra.2016.09.010"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCPS.2018.00035"},{"key":"ref8","article-title":"Baidu apollo EM motion planner","volume-title":"arXiv:1807.08048","author":"Fan","year":"2018"},{"issue":"8","key":"ref9","volume-title":"UPDATE: Disengagement Reports 2018-Final Results","volume":"15","author":"Herger","year":"2019"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"issue":"1","key":"ref11","first-page":"1437","article-title":"A comprehensive survey on safe reinforcement learning","volume":"16","author":"Garc\u00eda","year":"2015","journal-title":"J. Mach. Learn. Res."},{"key":"ref12","first-page":"1","article-title":"Generative adversarial imitation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ho"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3054912"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2019.01.003"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/SMC.2019.8914621"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TCST.2017.2654063"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33014967"},{"key":"ref18","first-page":"2380","article-title":"High confidence policy improvement","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Thomas"},{"key":"ref19","article-title":"Safe policy improvement with an estimated baseline policy","volume-title":"arXiv:1909.05236","author":"Sim\u00e3o","year":"2019"},{"key":"ref20","first-page":"9156","article-title":"Towards safe policy improvement for non-stationary MDPs","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Chandak"},{"key":"ref21","first-page":"1","article-title":"Security analysis of safe and seldonian reinforcement learning algorithms","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Ozisik"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/10187.001.0001"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.23919\/ACC.2017.7963408"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/93605.98741"},{"key":"ref25","first-page":"1","article-title":"CARLA: An open urban driving simulator","volume-title":"Proc. 1st Annu. Conf. Robot Learn.","author":"Dosovitskiy"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2019.2892926"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2972329"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1103\/physreve.62.1805"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.3141\/1999-10"}],"container-title":["IEEE Transactions on Intelligent Transportation Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6979\/9826234\/09397429.pdf?arnumber=9397429","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,9]],"date-time":"2024-01-09T23:40:08Z","timestamp":1704843608000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9397429\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7]]},"references-count":29,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tits.2021.3069497","relation":{},"ISSN":["1524-9050","1558-0016"],"issn-type":[{"value":"1524-9050","type":"print"},{"value":"1558-0016","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,7]]}}}