{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,11]],"date-time":"2026-07-11T15:44:00Z","timestamp":1783784640789,"version":"3.55.0"},"reference-count":26,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,9,27]],"date-time":"2021-09-27T00:00:00Z","timestamp":1632700800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,9,27]],"date-time":"2021-09-27T00:00:00Z","timestamp":1632700800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,9,27]],"date-time":"2021-09-27T00:00:00Z","timestamp":1632700800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100004608","name":"Natural Science Foundation of Jiangsu Province","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004608","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,9,27]]},"DOI":"10.1109\/iros51168.2021.9636468","type":"proceedings-article","created":{"date-parts":[[2021,12,16]],"date-time":"2021-12-16T20:45:38Z","timestamp":1639687538000},"page":"4552-4559","source":"Crossref","is-referenced-by-count":48,"title":["Model-based Constrained Reinforcement Learning using Generalized Control Barrier Function"],"prefix":"10.1109","author":[{"given":"Haitong","family":"Ma","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jianyu","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shengbo","family":"Eben","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ziyu","family":"Lin","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yang","family":"Guan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yangang","family":"Ren","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Sifa","family":"Zheng","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref10","article-title":"Benchmarking safe exploration in deep reinforcement learning","author":"ray","year":"2019"},{"key":"ref11","article-title":"Deep adaptive dynamic programming for nonaffine nonlinear optimal control problem with state constraints","author":"duan","year":"2019"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/j.strusafe.2019.04.003"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2018.8619572"},{"key":"ref14","first-page":"1889","article-title":"Trust region policy optimization","author":"schulman","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCCR49711.2021.9349412"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2005.08.007"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2017.XIII.073"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2016.7524935"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.23919\/ECC.2019.8796030"},{"key":"ref4","first-page":"1","article-title":"Risk-constrained reinforcement learning with percentile risk criteria","volume":"18","author":"chow","year":"2018","journal-title":"Journal of Machine Learning Research"},{"key":"ref3","first-page":"22","article-title":"Constrained policy optimization","volume":"70","author":"achiam","year":"2017","journal-title":"Proceedings of the 34th International Conference on Machine Learning"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/DEVLRN.2007.4354030"},{"key":"ref5","first-page":"1437","article-title":"A comprehensive survey on safe reinforcement learning","volume":"16","author":"garc\u00eda","year":"2015","journal-title":"Journal of Machine Learning Research"},{"key":"ref8","author":"jorion","year":"2007","journal-title":"Value at Risk The New Benchmark for Managing Financial Risk"},{"key":"ref7","article-title":"Reward constrained policy optimization","author":"tessler","year":"2018"},{"key":"ref2","article-title":"Concrete problems in AI safety","author":"amodei","year":"2016"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/S0378-4266(02)00271-6"},{"key":"ref1","author":"li","year":"2020","journal-title":"Reinforcement learning and control"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICPS49255.2021.9468220"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2014.2354052"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TCST.2010.2049203"},{"key":"ref24","first-page":"1","article-title":"Improving generalization of reinforcement learning with minimax distributional soft actorcritic","author":"ren","year":"2020","journal-title":"2020 IEEE 23rd International Conference on Intelligent Transportation Systems (ITSC)"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3026111"},{"key":"ref26","article-title":"Integrated decision and control: Towards interpretable and efficient driving intelligence","author":"guan","year":"2021"},{"key":"ref25","article-title":"Numerically stable dynamic bicycle model for discrete-time control","author":"ge","year":"2020"}],"event":{"name":"2021 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Prague, Czech Republic","start":{"date-parts":[[2021,9,27]]},"end":{"date-parts":[[2021,10,1]]}},"container-title":["2021 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9635848\/9635849\/09636468.pdf?arnumber=9636468","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T16:54:51Z","timestamp":1652201691000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9636468\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,9,27]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/iros51168.2021.9636468","relation":{},"subject":[],"published":{"date-parts":[[2021,9,27]]}}}