{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T17:48:49Z","timestamp":1775152129680,"version":"3.50.1"},"reference-count":38,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"Key Digital Technologies Joint Undertaking (KDT JU), in collaboration with the Horizon Europe (HORIZON) Framework Program and National Authorities under Agreement","award":["101112306"],"award-info":[{"award-number":["101112306"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/access.2024.3508031","type":"journal-article","created":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T19:41:56Z","timestamp":1732736516000},"page":"178209-178221","source":"Crossref","is-referenced-by-count":6,"title":["Adaptive Deep Reinforcement Learning for Efficient 3D Navigation of Autonomous Underwater Vehicles"],"prefix":"10.1109","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8795-5560","authenticated-orcid":false,"given":"Elena","family":"Politi","sequence":"first","affiliation":[{"name":"Department of Informatics and Telematics, Harokopio University of Athens, Athens, Greece"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2059-7429","authenticated-orcid":false,"given":"Artemis","family":"Stefanidou","sequence":"additional","affiliation":[{"name":"Department of Informatics and Telematics, Harokopio University of Athens, Athens, Greece"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2768-7119","authenticated-orcid":false,"given":"Christos","family":"Chronis","sequence":"additional","affiliation":[{"name":"Department of Informatics and Telematics, Harokopio University of Athens, Athens, Greece"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7424-8557","authenticated-orcid":false,"given":"George","family":"Dimitrakopoulos","sequence":"additional","affiliation":[{"name":"Department of Informatics and Telematics, Harokopio University of Athens, Athens, Greece"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0876-8167","authenticated-orcid":false,"given":"and","family":"Iraklis Varlamis","sequence":"additional","affiliation":[{"name":"Department of Informatics and Telematics, Harokopio University of Athens, Athens, Greece"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"crossref","DOI":"10.1016\/j.oceaneng.2022.112421","article-title":"Dynamic path planning of a three-dimensional underwater AUV based on an adaptive genetic algorithm","volume":"263","author":"Hao","year":"2022","journal-title":"Ocean Eng."},{"key":"ref2","doi-asserted-by":"crossref","DOI":"10.1016\/j.oceaneng.2024.116846","article-title":"An AUV collision avoidance algorithm in unknown environment with multiple constraints","volume":"294","author":"Dai","year":"2024","journal-title":"Ocean Eng."},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2024.117911"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2024.118498"},{"key":"ref5","doi-asserted-by":"crossref","DOI":"10.1016\/j.apor.2022.103326","article-title":"Deep reinforcement learning for adaptive path planning and control of an autonomous underwater vehicle","volume":"129","author":"Hadi","year":"2022","journal-title":"Appl. Ocean Res."},{"key":"ref6","doi-asserted-by":"crossref","first-page":"61","DOI":"10.1016\/j.robot.2016.03.011","article-title":"A comparison of optimization techniques for AUV path planning in environments with ocean currents","volume":"82","author":"Zeng","year":"2016","journal-title":"Robot. Auto. Syst."},{"key":"ref7","doi-asserted-by":"crossref","DOI":"10.1016\/j.cie.2022.108123","article-title":"Global path planning based on a bidirectional alternating search a algorithm for mobile robots","volume":"168","author":"Li","year":"2022","journal-title":"Comput. Ind. Eng."},{"issue":"2","key":"ref8","doi-asserted-by":"crossref","first-page":"223","DOI":"10.3390\/jmse12020223","article-title":"Collaborative path planning of multiple AUVs based on adaptive multi-population PSO","volume":"12","author":"Zhi","year":"2024","journal-title":"J. Mar. Sci. Eng."},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2021.109355"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3203072"},{"key":"ref11","doi-asserted-by":"crossref","DOI":"10.1016\/j.apor.2023.103591","article-title":"Integrated path planning and control through proximal policy optimization for a marine current turbine","volume":"137","author":"Hasankhani","year":"2023","journal-title":"Appl. Ocean Res."},{"key":"ref12","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv:1509.02971"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.3233\/JIFS-192171"},{"issue":"10","key":"ref14","first-page":"81","article-title":"Autonomous navigation of UAV in multi-obstacle environments based on a deep reinforcement learning approach","volume":"115","author":"Sitong","year":"2022","journal-title":"Appl. Soft Comput. J."},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3390\/s23136101"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3249966"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"929","DOI":"10.1016\/j.asoc.2017.10.025","article-title":"Online path planning for AUV rendezvous in dynamic cluttered undersea environment using evolutionary algorithms","volume":"70","author":"MahmoudZadeh","year":"2018","journal-title":"Appl. Soft Comput."},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/s00500-016-2474-6"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-022-01794-y"},{"key":"ref20","doi-asserted-by":"crossref","DOI":"10.1016\/j.oceaneng.2022.113391","article-title":"Motion planning for an under-actuated autonomous underwater vehicle based on fast marching nonlinear model-predictive quantum particle swarm optimization","volume":"268","author":"Chen","year":"2023","journal-title":"Ocean Eng."},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2022.108905"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.2200\/s00268ed1v01y201005aim009"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2024.117547"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1016\/j.neucom.2017.06.066","article-title":"Concise deep reinforcement learning obstacle avoidance for underactuated unmanned marine vessels","volume":"272","author":"Cheng","year":"2018","journal-title":"Neurocomputing"},{"issue":"3","key":"ref25","doi-asserted-by":"crossref","first-page":"252","DOI":"10.3390\/jmse9030252","article-title":"A 2D optimal path planning algorithm for autonomous underwater vehicle driving in unknown underwater canyons","volume":"9","author":"Sun","year":"2021","journal-title":"J. Mar. Sci. Eng."},{"key":"ref26","article-title":"Addressing function approximation error in actor-critic methods","author":"Fujimoto","year":"2018","journal-title":"arXiv:1802.09477"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1155\/2021\/8847863"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2024.119111"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/JOE.2023.3278290"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2023.116216"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2024.117287"},{"key":"ref32","article-title":"Bridging the gap between value and policy based reinforcement learning","author":"Nachum","year":"2017","journal-title":"arXiv:1702.08892"},{"key":"ref33","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv:1707.06347"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3326435"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1575\/1912\/3040"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1017\/S0890060420000141"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/INMIC50486.2020.9318195"},{"issue":"1","key":"ref38","doi-asserted-by":"crossref","first-page":"38","DOI":"10.47992\/IJAEML.2581.7000.0091","article-title":"A custom robotic ARM in coppeliasim","volume":"5","author":"Chakraborty","year":"2021","journal-title":"Int. J. Appl. Eng. Manag. Lett."}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10380310\/10770217.pdf?arnumber=10770217","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,11]],"date-time":"2024-12-11T02:11:59Z","timestamp":1733883119000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10770217\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/access.2024.3508031","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}