{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T16:02:55Z","timestamp":1772553775941,"version":"3.50.1"},"reference-count":47,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2021,12,1]],"date-time":"2021-12-01T00:00:00Z","timestamp":1638316800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,12,1]],"date-time":"2021-12-01T00:00:00Z","timestamp":1638316800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,12,1]],"date-time":"2021-12-01T00:00:00Z","timestamp":1638316800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Plan of China","doi-asserted-by":"publisher","award":["2018AAA0102504"],"award-info":[{"award-number":["2018AAA0102504"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U1913204"],"award-info":[{"award-number":["U1913204"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61991411"],"award-info":[{"award-number":["61991411"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U19B2038"],"award-info":[{"award-number":["U19B2038"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100017445","name":"Natural Science Foundation of Shandong Province for Distinguished Young Scholars","doi-asserted-by":"publisher","award":["ZR2020JQ29"],"award-info":[{"award-number":["ZR2020JQ29"]}],"id":[{"id":"10.13039\/100017445","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100018532","name":"Shandong Major Scientific and Technological Innovation Project","doi-asserted-by":"publisher","award":["2018CXGC1503"],"award-info":[{"award-number":["2018CXGC1503"]}],"id":[{"id":"10.13039\/501100018532","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Neural Netw. Learning Syst."],"published-print":{"date-parts":[[2021,12]]},"DOI":"10.1109\/tnnls.2021.3057424","type":"journal-article","created":{"date-parts":[[2021,3,5]],"date-time":"2021-03-05T20:31:53Z","timestamp":1614976313000},"page":"5445-5455","source":"Crossref","is-referenced-by-count":47,"title":["Visual Navigation With Multiple Goals Based on Deep Reinforcement Learning"],"prefix":"10.1109","volume":"32","author":[{"given":"Zhenhuan","family":"Rao","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5615-8016","authenticated-orcid":false,"given":"Yuechen","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Zifei","family":"Yang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4960-3190","authenticated-orcid":false,"given":"Wei","family":"Zhang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6766-2506","authenticated-orcid":false,"given":"Shijian","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Weizhi","family":"Lu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2510-8993","authenticated-orcid":false,"given":"ZhengJun","family":"Zha","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","first-page":"4190","article-title":"A unified game-theoretic approach to multiagent reinforcement learning","author":"lanctot","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2020.2994002"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2910188"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2817340"},{"key":"ref31","first-page":"1312","article-title":"Universal value function approximators","author":"schaul","year":"2015","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref30","first-page":"5048","article-title":"Hindsight experience replay","author":"andrychowicz","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2955699"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2852711"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2020.2966319"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2016.2557349"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/86"},{"key":"ref40","article-title":"Generalization and regularization in DQN","author":"farebrother","year":"2018","journal-title":"arXiv 1810 00123"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989381"},{"key":"ref12","first-page":"2419","article-title":"Learning to navigate in cities without a map","author":"mirowski","year":"2018","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-008-9235-4"},{"key":"ref14","article-title":"Semi-parametric topological memory for navigation","author":"savinov","year":"2018","journal-title":"arXiv 1803 00653"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2927869"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2020.2977924"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2017.7965896"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.769"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-44188-7_1"},{"key":"ref28","article-title":"Prioritized experience replay","author":"schaul","year":"2015","journal-title":"arXiv 1511 05952"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00387"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2018.00278"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2934906"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"484","DOI":"10.1038\/nature16961","article-title":"Mastering the game of go with deep neural networks and tree search","volume":"529","author":"silver","year":"2016","journal-title":"Nature"},{"key":"ref29","article-title":"Learning to reinforcement learn","author":"wang","year":"2016","journal-title":"arXiv 1611 05763"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref8","article-title":"Learning to navigate in complex environments","author":"mirowski","year":"2016","journal-title":"arXiv 1611 03673"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2017.2672989"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2015.2424032"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-018-0102-6"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2805379"},{"key":"ref46","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","author":"mnih","year":"2016","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref20","article-title":"Building generalizable agents with a realistic and rich 3D environment","author":"wu","year":"2018","journal-title":"arXiv 1801 02209"},{"key":"ref45","author":"sutton","year":"2018","journal-title":"Reinforcement Learning An Introduction"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594352"},{"key":"ref47","article-title":"AI2-THOR: An interactive 3D environment for visual AI","author":"kolve","year":"2017","journal-title":"arXiv 1712 05474"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.70"},{"key":"ref42","article-title":"Assessing generalization in deep reinforcement learning","author":"packer","year":"2018","journal-title":"arXiv 1810 12282"},{"key":"ref24","article-title":"Reinforcement learning with unsupervised auxiliary tasks","author":"jaderberg","year":"2016","journal-title":"arXiv 1611 05397"},{"key":"ref41","article-title":"Robust reinforcement learning for continuous control with model misspecification","author":"mankowitz","year":"2019","journal-title":"arXiv 1906 07516"},{"key":"ref23","article-title":"Learning to act by predicting the future","author":"dosovitskiy","year":"2016","journal-title":"arXiv 1611 01779"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2869978"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00077"},{"key":"ref43","article-title":"A study on overfitting in deep reinforcement learning","author":"zhang","year":"2018","journal-title":"arXiv 1804 06893"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.13"}],"container-title":["IEEE Transactions on Neural Networks and Learning Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5962385\/9629429\/09370169.pdf?arnumber=9370169","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T14:53:13Z","timestamp":1652194393000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9370169\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,12]]},"references-count":47,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tnnls.2021.3057424","relation":{},"ISSN":["2162-237X","2162-2388"],"issn-type":[{"value":"2162-237X","type":"print"},{"value":"2162-2388","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,12]]}}}