{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T06:42:12Z","timestamp":1730270532658,"version":"3.28.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,10,24]]},"DOI":"10.1109\/iros45743.2020.9341620","type":"proceedings-article","created":{"date-parts":[[2021,2,13]],"date-time":"2021-02-13T02:26:48Z","timestamp":1613183208000},"page":"6061-6068","source":"Crossref","is-referenced-by-count":17,"title":["Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path"],"prefix":"10.1109","author":[{"given":"Kei","family":"Ota","sequence":"first","affiliation":[]},{"given":"Yoko","family":"Sasaki","sequence":"additional","affiliation":[]},{"given":"Devesh K.","family":"Jha","sequence":"additional","affiliation":[]},{"given":"Yusuke","family":"Yoshiyasu","sequence":"additional","affiliation":[]},{"given":"Asako","family":"Kanezaki","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6386109"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793611"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1038\/nature24270"},{"key":"ref12","first-page":"1889","article-title":"Trust region policy optimization","volume":"37","author":"schulman","year":"2015","journal-title":"ICML"},{"article-title":"Continuous control with deep reinforcement learning","year":"2015","author":"lillicrap","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8461096"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460696"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2019.2899918"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8968010"},{"key":"ref18","article-title":"Probabilistic roadmaps for path planning in high-dimensional configuration spaces","volume":"12","author":"kavralu","year":"1996","journal-title":"IEEE Trans Robotics and Automation"},{"key":"ref19","first-page":"1","article-title":"Guided policy search","author":"levine","year":"2013","journal-title":"Proceedings of International Conference on Machine Learning (ICML)"},{"key":"ref28","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","author":"haarnoja","year":"2018","journal-title":"Proceedings of International Conference on Machine Learning (ICML)"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.mcm.2004.05.001"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TSSC.1968.300136"},{"key":"ref3","article-title":"Optimal and Efficient Path Planning for Partially-Known Environments","author":"stentz","year":"1994","journal-title":"Technical Report"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511546877"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1126\/science.aab3050"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8593871"},{"article-title":"Benchmarking Safe Exploration in Deep Reinforcement Learning","year":"2019","author":"ray","key":"ref1"},{"article-title":"Combining optimal control and learning for visual navigation in novel environments","year":"2019","author":"bansal","key":"ref20"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2017.2783400"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2017\/700"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8593772"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2019.XV.031"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2018.07.006"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793889"}],"event":{"name":"2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","start":{"date-parts":[[2020,10,24]]},"location":"Las Vegas, NV, USA","end":{"date-parts":[[2021,1,24]]}},"container-title":["2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9340668\/9340635\/09341620.pdf?arnumber=9341620","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,28]],"date-time":"2022-06-28T21:54:47Z","timestamp":1656453287000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9341620\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10,24]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/iros45743.2020.9341620","relation":{},"subject":[],"published":{"date-parts":[[2020,10,24]]}}}