{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T17:46:12Z","timestamp":1772300772046,"version":"3.50.1"},"reference-count":37,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561188","type":"proceedings-article","created":{"date-parts":[[2021,10,19]],"date-time":"2021-10-19T20:28:35Z","timestamp":1634675315000},"page":"1088-1094","source":"Crossref","is-referenced-by-count":45,"title":["Deep Reinforcement Learning for Mapless Navigation of a Hybrid Aerial Underwater Vehicle with Medium Transition"],"prefix":"10.1109","author":[{"given":"Ricardo B.","family":"Grando","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junior C.","family":"de Jesus","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Victor A.","family":"Kich","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alisson H.","family":"Kolling","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nicolas P.","family":"Bortoluzzi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pedro M.","family":"Pinheiro","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Armando A.","family":"Neto","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Paulo L. J.","family":"Drews","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRev.36.823"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/OCEANS.2016.7761080"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2970433"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8967612"},{"key":"ref37","first-page":"1587","article-title":"Addressing function approximation error in actor-critic methods","author":"fujimoto","year":"2018","journal-title":"International Conference on Machine Learning"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICAR46387.2019.8981667"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2010.5717652"},{"key":"ref34","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume":"80","author":"haarnoja","year":"0"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2015.7139029"},{"key":"ref11","first-page":"7460","article-title":"A comparative study on sigmapoint kalman filters for trajectory estimation of hybrid aerial-aquatic vehicles","author":"da rosa","year":"2018","journal-title":"IEEE\/RSJ Int Conf on Intelligent Robots and Systems (IROS)"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202261"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793985"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1177\/1729881418770531"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-018-0820-x"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-08338-4_112"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2016.2591587"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913495721"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.3390\/robotics2030122"},{"key":"ref4","first-page":"2829","article-title":"Continuous deep q-learning with model-based acceleration","author":"gu","year":"2016","journal-title":"Int Conf on Machine Learning"},{"key":"ref28","first-page":"1","article-title":"Deep reinforcement learning for mapless navigation of unmanned aerial vehicles","author":"grando","year":"2020"},{"key":"ref3","article-title":"Continuous control with deep reinforcement learning","author":"lillicrap","year":"0"},{"key":"ref27","article-title":"Using Soft Actor-Critic for Low-Level UAV Control","author":"barros","year":"2020"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202134"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989381"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.23919\/ChiCC.2017.8028138"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/OCEANS.2018.8604791"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594472"},{"key":"ref2","article-title":"Prioritized experience replay","author":"schaul","year":"2016"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6943220"},{"key":"ref1","article-title":"Playing atari with deep reinforcement learning","author":"mnih","year":"2013","journal-title":"NIPS Deep Learning Workshop"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202133"},{"key":"ref22","doi-asserted-by":"crossref","DOI":"10.1109\/IROS45743.2020.9341620","article-title":"Efficient exploration in constrained environments with goal-oriented reference path","author":"ota","year":"2020"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202312"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"595","DOI":"10.1007\/978-3-319-26054-9_23","article-title":"Rotors&#x2014;a modular gazebo mav simulator framework","author":"furrer","year":"2016","journal-title":"Robot Operating System (ROS)"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICAR46387.2019.8981638"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793735"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-018-0898-1"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","location":"Xi'an, China","start":{"date-parts":[[2021,5,30]]},"end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561188.pdf?arnumber=9561188","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,12]],"date-time":"2023-01-12T17:54:49Z","timestamp":1673546089000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561188\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":37,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561188","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}