{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T04:17:18Z","timestamp":1779164238946,"version":"3.51.4"},"reference-count":41,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61625101"],"award-info":[{"award-number":["61625101"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61829101"],"award-info":[{"award-number":["61829101"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61941101"],"award-info":[{"award-number":["61941101"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Key Research and Development Project of China","award":["SQ2020AAA010062"],"award-info":[{"award-number":["SQ2020AAA010062"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Commun."],"published-print":{"date-parts":[[2020,7]]},"DOI":"10.1109\/tcomm.2020.2986289","type":"journal-article","created":{"date-parts":[[2020,4,7]],"date-time":"2020-04-07T21:57:08Z","timestamp":1586296628000},"page":"4175-4189","source":"Crossref","is-referenced-by-count":71,"title":["Cellular UAV-to-Device Communications: Trajectory Design and Mode Selection by Multi-Agent Deep Reinforcement Learning"],"prefix":"10.1109","volume":"68","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8766-0885","authenticated-orcid":false,"given":"Fanyi","family":"Wu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3393-8612","authenticated-orcid":false,"given":"Hongliang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jianjun","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8644-8241","authenticated-orcid":false,"given":"Lingyang","family":"Song","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","first-page":"1057","article-title":"Policy gradient methods for reinforcement learning with function approximation","author":"sutton","year":"1999","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/INFCOM.2013.6567124"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2018.2876513"},{"key":"ref32","author":"rappaport","year":"1996","journal-title":"Wireless Communications Principles and Practice"},{"key":"ref31","author":"marcum","year":"1950","journal-title":"Table of Q functions"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1944.tb00874.x"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref36","first-page":"440","article-title":"Deep reinforcement learning based distributed resource allocation for V2 V broadcasting","author":"ye","year":"2018","journal-title":"Proc 14th Int Wireless Commun Mobile Comput Conf (IWCMC)"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/BF00993306"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/BF00992698"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.2019.1800591"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639346"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/IEMCON.2017.8117160"},{"key":"ref12","article-title":"Reinforcement learning for a cellular Internet of UAVs: Protocol design, trajectory control, and resource management","author":"hu","year":"2019","journal-title":"arXiv 1911 08771"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2017.2743240"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/MVT.2019.2903655"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2018.2868075"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2892131"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2017.2763135"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2017.2680898"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2019.2913631"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICUAS.2013.6564694"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2013.2260147"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MVT.2016.2645481"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/AERO.2017.7943593"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-33039-2"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/AERO.2013.6496959"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/DASC.2013.6712625"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICUAS.2017.7991306"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CC.2017.8246341"},{"key":"ref9","year":"2017","journal-title":"Enhanced LTE Support for Aerial Vehicles Release 15"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM38437.2019.9013973"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.001.1900095"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2017.2778242"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2017.2779483"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2900035"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2010.5718053"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2018.2874230"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2017.2766089"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2891629"}],"container-title":["IEEE Transactions on Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/26\/9139896\/09058679.pdf?arnumber=9058679","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T13:47:10Z","timestamp":1651067230000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9058679\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7]]},"references-count":41,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tcomm.2020.2986289","relation":{},"ISSN":["0090-6778","1558-0857"],"issn-type":[{"value":"0090-6778","type":"print"},{"value":"1558-0857","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7]]}}}