{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T22:45:31Z","timestamp":1774305931730,"version":"3.50.1"},"reference-count":33,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,10]]},"DOI":"10.1109\/iros.2018.8593420","type":"proceedings-article","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T02:33:30Z","timestamp":1548297210000},"page":"1-6","source":"Crossref","is-referenced-by-count":51,"title":["Safe Reinforcement Learning on Autonomous Vehicles"],"prefix":"10.1109","author":[{"given":"David","family":"Isele","sequence":"first","affiliation":[]},{"given":"Alireza","family":"Nakhaei","sequence":"additional","affiliation":[]},{"given":"Kikuo","family":"Fujimura","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","article-title":"Lecture 6.5-rmsprop, coursera: Neural networks for machine learning","author":"tieleman","year":"2012","journal-title":"University of Toronto Tech Rep"},{"key":"ref32","author":"krauss","year":"1998","journal-title":"Microscopic Modeling of Traffic Flow Investigation of Collision Free Vehicle Dynamics"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.62.1805"},{"key":"ref30","article-title":"Recent development and applications of SUMO-simulation of urban mobility","volume":"5","author":"krajzewicz","year":"2012","journal-title":"International Journal on Advances in Systems and Measurements"},{"key":"ref10","author":"shalev-shwartz","year":"2016","journal-title":"Safe multiagent reinforcement learning for autonomous driving"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"81","DOI":"10.7551\/mitpress\/9816.003.0016","article-title":"Reducing conservativeness in safety guarantees by learning disturbances online: iterated guaranteed safe online learning","author":"gillula","year":"2013","journal-title":"Robotics Science and Systems VIII"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8461233"},{"key":"ref13","author":"moldovan","year":"2012","journal-title":"Safe exploration in markov decision processes"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-335-6.50027-1"},{"key":"ref15","first-page":"1039","article-title":"Nash q-learning for general-sum stochastic games","volume":"4","author":"hu","year":"2003","journal-title":"Journal of Machine Learning Research"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1186\/s40648-014-0001-z"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2015.113"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ARSO.2015.7428204"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2011.6082928"},{"key":"ref28","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.11595","article-title":"Selective experience replay for lifelong learning","author":"isele","year":"2018","journal-title":"AAAI Conference on Artificial Intelligence (AAAI)"},{"key":"ref4","author":"lipton","year":"2016","journal-title":"Combinating reinforcement learning's sisyphean curse with intrinsic fear"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2013.6728484"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-335-6.50021-0"},{"key":"ref6","first-page":"143","article-title":"Safe exploration for reinforcement learning","author":"hans","year":"2008","journal-title":"ESANN"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2017.7995818"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1666"},{"key":"ref8","first-page":"3630","article-title":"Probably approximately correct learning in stochastic games with temporal logic specifications","author":"wen","year":"2016","journal-title":"IJCAI"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2015.7354078"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1287\/mnsc.18.7.356"},{"key":"ref9","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.11797","article-title":"Safe reinforcement learning via shielding","author":"alshiekh","year":"2018","journal-title":"AAAI Conference on Artificial Intelligence (AAAI)"},{"key":"ref1","first-page":"1437","article-title":"A comprehensive survey on safe reinforcement learning","volume":"16","author":"garcia","year":"2015","journal-title":"Journal of Machine Learning Research"},{"key":"ref20","first-page":"1","article-title":"Comparison and evaluation of advanced motion models for vehicle tracking","author":"schubert","year":"2008","journal-title":"Information Fusion"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.2514\/6.2011-1512"},{"key":"ref21","article-title":"Stochastic predictive control of autonomous vehicles in uncertain environments","author":"carvalho","year":"2014","journal-title":"Int Symposium on Advanced Vehicle Control"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"855","DOI":"10.1109\/TRO.2012.2195829","article-title":"Estimation of multivehicle dynamics by considering contextual information","volume":"28","author":"agamennoni","year":"2012","journal-title":"IEEE Transactions on Robotics"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2014.6856508"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1155\/2016\/1025349"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2017.7995721"}],"event":{"name":"2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Madrid","start":{"date-parts":[[2018,10,1]]},"end":{"date-parts":[[2018,10,5]]}},"container-title":["2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8574473\/8593358\/08593420.pdf?arnumber=8593420","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,13]],"date-time":"2023-09-13T03:52:12Z","timestamp":1694577132000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8593420\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/iros.2018.8593420","relation":{},"subject":[],"published":{"date-parts":[[2018,10]]}}}