{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T11:06:54Z","timestamp":1730200014470,"version":"3.28.0"},"reference-count":16,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.1109\/besc.2018.8697262","type":"proceedings-article","created":{"date-parts":[[2019,4,26]],"date-time":"2019-04-26T00:13:19Z","timestamp":1556237599000},"page":"115-120","source":"Crossref","is-referenced-by-count":4,"title":["Ship Collision Avoidance Using Constrained Deep Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Rui","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Xiao","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Kezhong","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Xiaolie","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Tianyou","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Chao","family":"Zhaohui","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/JOE.2014.2304793"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2017.08.2525"},{"key":"ref12","article-title":"Towards vision-based deep reinforcement learning for robotic motion control","author":"zhang","year":"2015","journal-title":"Computer Science"},{"key":"ref13","article-title":"End to end learning for self-driving cars","volume":"abs 1604 7316","author":"bojarski","year":"2016","journal-title":"CoRR"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.2352\/ISSN.2470-1173.2017.19.AVM-023"},{"key":"ref15","article-title":"Virtual to real reinforcement learning for autonomous driving","author":"you","year":"2017","journal-title":"British Machine Vision Conference"},{"key":"ref16","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","author":"mnih","year":"2016","journal-title":"International Conference on Machine Learning"},{"key":"ref4","article-title":"Continuous control with deep reinforcement learning","volume":"8","author":"lillicrap","year":"2015","journal-title":"Computer Science"},{"key":"ref3","first-page":"834","article-title":"Improving stochastic policy gradients in continuous control with deep reinforcement learning using the beta distribution","author":"chou","year":"2017","journal-title":"International Conference on Machine Learning"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref5","first-page":"2322","article-title":"Where to add actions in human-in-the-loop reinforcement learning","author":"mandel","year":"2017","journal-title":"AAAI"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2016.10.315"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2016.2551780"},{"key":"ref2","first-page":"1719","article-title":"Multi-objective pomdps with lexicographic reward preferences","author":"wray","year":"2015","journal-title":"IlCAI"},{"key":"ref1","first-page":"2891","article-title":"Query-efficient imitation learning for end-to-end simulated driving","author":"zhang","year":"2017","journal-title":"AAAI"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2016.10.344"}],"event":{"name":"2018 5th International Conference on Behavioral, Economic, and Socio-Cultural Computing (BESC)","start":{"date-parts":[[2018,11,12]]},"location":"Kaohsiung, Taiwan","end":{"date-parts":[[2018,11,14]]}},"container-title":["2018 5th International Conference on Behavioral, Economic, and Socio-Cultural Computing (BESC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8683941\/8697225\/08697262.pdf?arnumber=8697262","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,13]],"date-time":"2019-05-13T19:11:01Z","timestamp":1557774661000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8697262\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":16,"URL":"https:\/\/doi.org\/10.1109\/besc.2018.8697262","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}