{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,29]],"date-time":"2026-05-29T09:44:18Z","timestamp":1780047858679,"version":"3.53.1"},"reference-count":221,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/100016171","name":"Maroun Semaan Faculty of Engineering and Architecture, American University of Beirut","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100016171","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/access.2023.3236801","type":"journal-article","created":{"date-parts":[[2023,1,13]],"date-time":"2023-01-13T21:48:17Z","timestamp":1673646497000},"page":"19941-19968","source":"Crossref","is-referenced-by-count":52,"title":["Reinforcement Learning in the Sky: A Survey on Enabling Intelligence in NTN-Based Communications"],"prefix":"10.1109","volume":"11","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0049-9318","authenticated-orcid":false,"given":"Tarek","family":"Naous","sequence":"first","affiliation":[{"name":"Electrical and Computer Engineering Department, American University of Beirut, Beirut, Lebanon"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0738-0822","authenticated-orcid":false,"given":"May","family":"Itani","sequence":"additional","affiliation":[{"name":"Mathematics and Computer Science Department, Beirut Arab University, Beirut, Lebanon"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4815-6894","authenticated-orcid":false,"given":"Mariette","family":"Awad","sequence":"additional","affiliation":[{"name":"Electrical and Computer Engineering Department, American University of Beirut, Beirut, Lebanon"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Sanaa","family":"Sharafeddine","sequence":"additional","affiliation":[{"name":"Department of Computer Science, American University of Beirut, Beirut, Lebanon"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3390\/s22093136"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MCOMSTD.011.2100038"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2016.7470933"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2018.1700643"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/MVT.2019.2917363"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2929241"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.12676\/j.cc.2018.12.009"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-33039-2"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3022981"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.cja.2021.12.013"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2022.3169690"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2022.3151028"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2021.3093110"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/5GWF.2019.8911669"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.011.2000493"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2963223"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2019.2895263"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107588"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2020.3028247"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2020.04.020"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ComNet47917.2020.9306090"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.3389\/frcmn.2021.716265"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2021.07.014"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.array.2022.100142"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107212"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.23919\/ICN.2021.0015"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2019.2952892"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2018.2864423"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.csi.2020.103451"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2019.2902862"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107451"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2019.2906228"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2018.2887086"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2020.2968311"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2994494"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2015.2495297"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2019.10.014"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2018.05.033"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2016.2612119"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2019.2919613"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.3390\/s19235170"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1002\/9781119471509.w5gref231"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2981430"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.2018.1800155"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107478"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ojcoms.2021.3075201"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2019.2916583"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.23919\/JCIN.2019.8917870"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.23919\/JCIN.2019.8917869"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2021.3063822"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2020.2988367"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2021.3073036"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/tnn.1998.712192"},{"key":"ref54","volume-title":"Cs234: Reinforcement Learning Winter 2022","author":"Brunskill","year":"2022"},{"key":"ref55","first-page":"1126","article-title":"Model-agnostic meta-learning for fast adaptation of deep networks","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Finn"},{"key":"ref56","article-title":"A simple neural attentive meta-learner","author":"Mishra","year":"2017","journal-title":"arXiv:1707.03141"},{"key":"ref57","article-title":"ProMP: Proximal meta-policy search","author":"Rothfuss","year":"2018","journal-title":"arXiv:1810.06784"},{"key":"ref58","first-page":"387","article-title":"Deterministic policy gradient algorithms","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Silver"},{"key":"ref59","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Mnih"},{"key":"ref60","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv:1707.06347"},{"key":"ref61","article-title":"Maximum a posteriori policy optimisation","volume-title":"arXiv:1806.06920","author":"Abdolmaleki"},{"key":"ref62","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv:1509.02971"},{"key":"ref63","article-title":"Multiagent actor-critic for mixed cooperative-competitive environments","volume-title":"Advances in Neural Information Processing Systems","volume":"30","author":"Lowe","year":"2017"},{"key":"ref64","first-page":"1861","article-title":"Soft actor-critic: Offpolicy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Haarnoja"},{"key":"ref65","article-title":"Playing atari with deep reinforcement learning","volume-title":"arXiv:1312.5602","author":"Mnih"},{"key":"ref66","first-page":"449","article-title":"Adistributional perspective on reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Bellemare"},{"key":"ref67","article-title":"Hindsight experience replay","volume-title":"Advances in Neural Information Processing Systems","volume":"30","author":"Andrychowicz","year":"2017"},{"key":"ref68","article-title":"Recurrent experience replay in distributed reinforcement learning","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Kapturowski"},{"key":"ref69","first-page":"507","article-title":"Agent57: Outperforming the Atari human benchmark","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Badia"},{"key":"ref70","article-title":"Never give up: Learning directed exploration strategies","author":"Badia","year":"2020","journal-title":"arXiv:2002.06038"},{"key":"ref71","article-title":"Imagination-augmented agents for deep reinforcement learning","volume-title":"Advances in Neural Information Processing Systems","volume":"30","author":"Racani\u00e8re","year":"2017"},{"key":"ref72","article-title":"Recurrent world models facilitate policy evolution","volume-title":"Advances in Neural Information Processing Systems","volume":"31","author":"Ha","year":"2018"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8463189"},{"key":"ref74","article-title":"Model-based value estimation for efficient model-free reinforcement learning","author":"Feinberg","year":"2018","journal-title":"arXiv:1803.00101"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-020-03051-4"},{"key":"ref76","article-title":"Modelbased reinforcement learning for Atari","author":"Kaiser","year":"2019","journal-title":"arXiv:1903.00374"},{"key":"ref77","article-title":"Mastering chess and shogi by self-play with a general reinforcement learning algorithm","author":"Silver","year":"2017","journal-title":"arXiv:1712.01815"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.4249\/scholarpedia.3698"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC51071.2022.9771555"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3118322"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/MVT.2019.2921208"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3189552"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.2018.1800023"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2018.2880468"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2016.7470932"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2017.1700442"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/GLOCOMW.2017.8269068"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2018.8422685"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/VTC2020-Spring48590.2020.9129453"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3182908"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1007\/s42452-021-04658-6"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2019.2952549"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/ICCS.2018.8689249"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/ICC40277.2020.9149258"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2018.2864373"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2019.2908171"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2022.3166961"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2019.2923214"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/SPAWC.2018.8445768"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/VTC2021-Fall52928.2021.9625395"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/ICOIN53446.2022.9687270"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOMWKSHPS51825.2021.9484490"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/ICC40277.2020.9149151"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2935201"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2022.3142018"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.3390\/s22082979"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2019.2922849"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1109\/GLOCOMW.2018.8644345"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2020.3004197"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2936025"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3031959"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM38437.2019.9013626"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/tmc.2022.3200998"},{"key":"ref114","volume-title":"Study on Integrated Access and Backhaul (Release 16)","year":"2019"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.3390\/s21061960"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2020.3041347"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM42002.2020.9348105"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1109\/GCWkshps45667.2019.9024685"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/ICCWorkshops49005.2020.9145423"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3082862"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.2017.1700015"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.001.1900207"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1109\/ICCWorkshops53468.2022.9814506"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2785414"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/WCSP.2018.8555700"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1155\/2020\/8825120"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC45663.2020.9120592"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3014788"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref130","article-title":"Neural machine translation by jointly learning to align and translate","volume-title":"Proc. 3rd Int. Conf. Learn. Represent. (ICLR)","author":"Bahdanau"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1109\/iccworkshops50388.2021.9473714"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/INFCOM.2012.6195689"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1109\/INFCOMW.2018.8406973"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2019.2925796"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1109\/globecom38437.2019.9013924"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1109\/jsac.2021.3065049"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2020.3042925"},{"key":"ref138","doi-asserted-by":"publisher","DOI":"10.1109\/tvt.2021.3063953"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOMWKSHPS50562.2020.9162896"},{"key":"ref140","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2020.3039617"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM38437.2019.9014214"},{"key":"ref142","article-title":"UAVto- device underlay communications: Age of information minimization by multi-agent deep reinforcement learning","author":"Wu","year":"2020","journal-title":"arXiv:2003.05830"},{"key":"ref143","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2020.3013599"},{"key":"ref144","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3063953"},{"key":"ref145","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2022.3179987"},{"key":"ref146","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2021.107607"},{"key":"ref147","doi-asserted-by":"publisher","DOI":"10.1109\/ICNP52444.2021.9651962"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2022.04.013"},{"key":"ref149","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2021.3091164"},{"key":"ref150","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2022.06.017"},{"key":"ref151","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3082862"},{"key":"ref152","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2022.109075"},{"key":"ref153","doi-asserted-by":"publisher","DOI":"10.1109\/ICC42927.2021.9500978"},{"key":"ref154","doi-asserted-by":"publisher","DOI":"10.3390\/s21238111"},{"key":"ref155","doi-asserted-by":"publisher","DOI":"10.1016\/j.jksuci.2022.03.025"},{"key":"ref156","doi-asserted-by":"publisher","DOI":"10.1186\/s13638-019-1463-8"},{"key":"ref157","doi-asserted-by":"publisher","DOI":"10.23919\/JCC.2020.10.009"},{"key":"ref158","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2021.3131556"},{"key":"ref159","doi-asserted-by":"publisher","DOI":"10.1109\/ICCW.2018.8403623"},{"key":"ref160","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2910112"},{"key":"ref161","doi-asserted-by":"publisher","DOI":"10.1109\/ICUAS.2017.7991402"},{"key":"ref162","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM38437.2019.9014041"},{"key":"ref163","doi-asserted-by":"publisher","DOI":"10.1109\/twc.2021.3056573"},{"key":"ref164","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2022.3143230"},{"key":"ref165","doi-asserted-by":"publisher","DOI":"10.1145\/3325421.3329770"},{"key":"ref166","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC45663.2020.9120595"},{"key":"ref167","article-title":"A deep reinforcement learning approach to efficient drone mobility support","author":"Chen","year":"2020","journal-title":"arXiv:2005.05229"},{"key":"ref168","doi-asserted-by":"publisher","DOI":"10.1109\/GCWkshps50303.2020.9367580"},{"key":"ref169","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2018.1800087"},{"key":"ref170","doi-asserted-by":"publisher","DOI":"10.1109\/49.345884"},{"key":"ref171","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM38437.2019.9013281"},{"key":"ref172","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2020.2973376"},{"key":"ref173","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2021.3086503"},{"key":"ref174","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2020.3048399"},{"key":"ref175","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2016.7470934"},{"key":"ref176","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2016.2531652"},{"key":"ref177","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2018.8422706"},{"key":"ref178","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2900035"},{"key":"ref179","article-title":"Adaptive height optimisation for cellular-connected UAVs using reinforcement learning","author":"Fonseca","year":"2020","journal-title":"arXiv:2007.13695"},{"key":"ref180","doi-asserted-by":"publisher","DOI":"10.1109\/WCNCW48565.2020.9124759"},{"key":"ref181","doi-asserted-by":"publisher","DOI":"10.1016\/j.vehcom.2021.100391"},{"key":"ref182","doi-asserted-by":"publisher","DOI":"10.1016\/j.cja.2020.12.027"},{"key":"ref183","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196540"},{"key":"ref184","first-page":"1859","article-title":"Domain adaptation for reinforcement learning on the Atari","volume-title":"Proc. 18th Int. Conf. Auto. Agents MultiAgent Syst.","author":"Carr"},{"key":"ref185","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2020.3028078"},{"key":"ref186","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01291"},{"key":"ref187","doi-asserted-by":"publisher","DOI":"10.1145\/3396864.3400304"},{"key":"ref188","doi-asserted-by":"publisher","DOI":"10.1145\/3325421.3329765"},{"key":"ref189","doi-asserted-by":"publisher","DOI":"10.3390\/drones6060147"},{"key":"ref190","doi-asserted-by":"publisher","DOI":"10.3390\/drones6070154"},{"key":"ref191","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2021.3136444"},{"key":"ref192","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2021.3136444"},{"key":"ref193","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2022.3154401"},{"key":"ref194","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2022.3161970"},{"key":"ref195","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2022.3142674"},{"key":"ref196","doi-asserted-by":"publisher","DOI":"10.1109\/ICC45855.2022.9838676"},{"key":"ref197","doi-asserted-by":"publisher","DOI":"10.1145\/3536221.3558174"},{"key":"ref198","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2011.159"},{"key":"ref199","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2015.7353711"},{"key":"ref200","doi-asserted-by":"publisher","DOI":"10.1109\/AERO.2016.7500855"},{"key":"ref201","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2017.10.037"},{"key":"ref202","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2906088"},{"key":"ref203","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2019.2947929"},{"key":"ref204","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2019.2961993"},{"key":"ref205","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3010896"},{"key":"ref206","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.104.2100351"},{"key":"ref207","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3102230"},{"key":"ref208","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2022.3173211"},{"key":"ref209","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.2982508"},{"key":"ref210","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2019.2923702"},{"key":"ref211","doi-asserted-by":"publisher","DOI":"10.1109\/AIM.2018.8452263"},{"key":"ref212","doi-asserted-by":"publisher","DOI":"10.1109\/MSPEC.2020.9126102"},{"key":"ref213","doi-asserted-by":"publisher","DOI":"10.1109\/SEC.2018.00038"},{"key":"ref214","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2981430"},{"key":"ref215","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.111.2100044"},{"key":"ref216","doi-asserted-by":"publisher","DOI":"10.1109\/ICOIN50884.2021.9333960"},{"key":"ref217","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2022.3150176"},{"key":"ref218","doi-asserted-by":"publisher","DOI":"10.1016\/j.adhoc.2017.09.001"},{"key":"ref219","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3135632"},{"key":"ref220","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3104875"},{"key":"ref221","doi-asserted-by":"publisher","DOI":"10.1109\/access.2022.3205426"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6287639\/10005208\/10016705.pdf?arnumber=10016705","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,14]],"date-time":"2024-03-14T04:31:20Z","timestamp":1710390680000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10016705\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":221,"URL":"https:\/\/doi.org\/10.1109\/access.2023.3236801","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}