{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T06:27:45Z","timestamp":1761719265912,"version":"3.28.0"},"reference-count":42,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,9,24]],"date-time":"2023-09-24T00:00:00Z","timestamp":1695513600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,9,24]],"date-time":"2023-09-24T00:00:00Z","timestamp":1695513600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,9,24]]},"DOI":"10.1109\/itsc57777.2023.10422605","type":"proceedings-article","created":{"date-parts":[[2024,2,13]],"date-time":"2024-02-13T23:32:39Z","timestamp":1707867159000},"page":"2811-2818","source":"Crossref","is-referenced-by-count":4,"title":["Safety Reinforced Model Predictive Control (SRMPC): Improving MPC with Reinforcement Learning for Motion Planning in Autonomous Driving"],"prefix":"10.1109","author":[{"given":"Johannes","family":"Fischer","sequence":"first","affiliation":[{"name":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"}]},{"given":"Marlon","family":"Steiner","sequence":"additional","affiliation":[{"name":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"}]},{"given":"\u00d6mer \u015eahin","family":"Ta\u015f","sequence":"additional","affiliation":[{"name":"FZI Research Center for Information Technology,Karlsruhe,Germany"}]},{"given":"Christoph","family":"Stiller","sequence":"additional","affiliation":[{"name":"Institute of Measurement and Control Systems, Karlsruhe Institute of Technology (KIT),Karlsruhe,Germany"}]}],"member":"263","reference":[{"key":"ref1","isbn-type":"print","doi-asserted-by":"crossref","DOI":"10.1007\/978-981-19-5053-7_7","article-title":"Advanced Driver Assistance Systems and Autonomous Vehicles: From Fundamentals to Applications","volume-title":"ser. Springer eBook Collection","author":"Li","year":"2022","ISBN":"http:\/\/id.crossref.org\/isbn\/9789811950537"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/IranianCEE.2013.6599610"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.23919\/EETA.2018.8493215"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CCDC49329.2020.9163994"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVCI56766.2022.9964888"},{"key":"ref6","article-title":"Motion planning for autonomous vehicles in partially observable environments","volume-title":"PhD thesis, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","author":"Ta\u00a7","year":"2022"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2017.8264062"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2019.8813982"},{"issue":"42","key":"ref9","first-page":"1437","article-title":"A comprehensive survey on safe reinforcement learning","volume":"16","author":"Garc\u00eda","year":"2015","journal-title":"Journal of Machine Learning Research"},{"journal-title":"Benchmarking safe exploration in deep reinforcement learning","year":"2019","author":"Ray","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2023.3348422"},{"journal-title":"Learning safe multi-agent control with decentralized neural barrier certificates","year":"2021","author":"Qin","key":"ref12"},{"key":"ref13","first-page":"97","article-title":"Joint synthesis of safety certificate and safe control policy using constrained reinforcement learning","volume-title":"Proceedings of The 4th Annual Learning for Dynamics and Control Conference","volume":"168","author":"Ma","year":"2022"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/IROS51168.2021.9636672"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/IROS51168.2021.9636847"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC55140.2022.9921907"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989202"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.23919\/ACC.2019.8814476"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2013.02.003"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1177\/0278364916645661"},{"journal-title":"Learning-based model predictive control for safe exploration and reinforcement learning","year":"2019","author":"Koller","key":"ref21"},{"journal-title":"Differentiable MPC for end-to-end planning and control","year":"2018","author":"Amos","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.3389\/fbuil.2020.562239"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2021.08.518"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2021.118346"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-019-09829-4"},{"key":"ref27","isbn-type":"print","volume-title":"Reinforcement Learning: An Introduction, Second, ser. Adaptive computation and machine learning","author":"Sutton","year":"2018","ISBN":"http:\/\/id.crossref.org\/isbn\/9780262039246"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1201\/9781315140223"},{"journal-title":"Constrained policy optimization","year":"2017","author":"Achiam","key":"ref29"},{"journal-title":"Constrained variational policy optimization for safe reinforcement learning","year":"2022","author":"Liu","key":"ref30"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CDC40024.2019.9029720"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2021.11.200"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2017.7995816"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/lra.2019.2929976"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-01094-1_32"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s12532-020-00179-2"},{"key":"ref37","article-title":"Control in a safe set: Addressing safety in human-robot interactions","volume-title":"Proceedings of the ASME 2014 Dynamic Systems and Control Conference, V003T42A003","volume":"3","author":"Liu","year":"2014"},{"journal-title":"Feasible actor-critic: Constrained reinforcement learning for ensuring statewise safety","year":"2021","author":"Ma","key":"ref38"},{"journal-title":"Proximal policy optimization algorithms","year":"2017","author":"Schulman","key":"ref39"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2015.7225909"},{"volume-title":"An environment for autonomous driving decision-making","year":"2018","author":"Leurent","key":"ref41"},{"key":"ref42","article-title":"On a formal model of safe and scalable self-driving cars","volume":"abs\/1708.06374","author":"Shalev-Shwartz","year":"2017","journal-title":"CoRR"}],"event":{"name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","start":{"date-parts":[[2023,9,24]]},"location":"Bilbao, Spain","end":{"date-parts":[[2023,9,28]]}},"container-title":["2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10420842\/10420843\/10422605.pdf?arnumber=10422605","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,3]],"date-time":"2024-03-03T11:55:57Z","timestamp":1709466957000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10422605\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,9,24]]},"references-count":42,"URL":"https:\/\/doi.org\/10.1109\/itsc57777.2023.10422605","relation":{},"subject":[],"published":{"date-parts":[[2023,9,24]]}}}