{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T16:22:46Z","timestamp":1779380566164,"version":"3.53.1"},"reference-count":35,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2025,6,1]],"date-time":"2025-06-01T00:00:00Z","timestamp":1748736000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,6,1]],"date-time":"2025-06-01T00:00:00Z","timestamp":1748736000000},"content-version":"am","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,6,1]],"date-time":"2025-06-01T00:00:00Z","timestamp":1748736000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,1]],"date-time":"2025-06-01T00:00:00Z","timestamp":1748736000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-2430773"],"award-info":[{"award-number":["CNS-2430773"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["OIA-2417062"],"award-info":[{"award-number":["OIA-2417062"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-2323050"],"award-info":[{"award-number":["CNS-2323050"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-2148178"],"award-info":[{"award-number":["CNS-2148178"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-2148178"],"award-info":[{"award-number":["CNS-2148178"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Intelligent NextG Systems"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Mobile Comput."],"published-print":{"date-parts":[[2025,6]]},"DOI":"10.1109\/tmc.2025.3532204","type":"journal-article","created":{"date-parts":[[2025,1,21]],"date-time":"2025-01-21T18:29:59Z","timestamp":1737484199000},"page":"5482-5495","source":"Crossref","is-referenced-by-count":11,"title":["Hybrid Transformer Based Multi-Agent Reinforcement Learning for Multiple Unpiloted Aerial Vehicle Coordination in Air Corridors"],"prefix":"10.1109","volume":"24","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4062-2499","authenticated-orcid":false,"given":"Liangkun","family":"Yu","sequence":"first","affiliation":[{"name":"Department of Electrical and Computer Engineering, SECNet Laboratory, University of New Mexico, Albuquerque, NM, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-3538-7975","authenticated-orcid":false,"given":"Zhirun","family":"Li","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, SECNet Laboratory, University of New Mexico, Albuquerque, NM, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8541-3565","authenticated-orcid":false,"given":"Nirwan","family":"Ansari","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computing Engineering, Advanced Networking Laboratory, New Jersey Institute of Technology, Newark, NJ, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6954-7018","authenticated-orcid":false,"given":"Xiang","family":"Sun","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, SECNet Laboratory, University of New Mexico, Albuquerque, NM, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Urban Air Mobility (UAM): Concept of Operations","year":"2023"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/PIMRC56721.2023.10294054"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/vtc2020-spring48590.2020.9128488"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11071128"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3390\/s22145437"},{"key":"ref6","first-page":"1814","article-title":"Multiagent rollout and policy iteration for POMDP with application to multi-robot repair problems","volume-title":"Proc. 2020 Conf. Robot Learn.","author":"Bhattacharya"},{"key":"ref7","first-page":"1458","article-title":"Learning in observable POMDPs, without computationally intractable oracles","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Golowich"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3142743"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2020.3013599"},{"issue":"9","key":"ref10","article-title":"A low-altitude obstacle avoidance method for UAVs based on polyhedral flight corridor","volume-title":"Drones","volume":"7","author":"Ma","year":"2023"},{"issue":"22","key":"ref11","article-title":"Air corridors: Concept, design, simulation, and rules of engagement","volume-title":"Sensors","volume":"21","author":"Muna","year":"2021"},{"key":"ref12","doi-asserted-by":"crossref","DOI":"10.1109\/ISCAS45731.2020.9181245","article-title":"Autonomous UAV navigation: A DDPG-based deep reinforcement learning approach","author":"Bouhamed","year":"2020"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICUAS48674.2020.9213856"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/mwc.003.2400047"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2971780"},{"key":"ref17","article-title":"A reinforcement learning approach to vehicle coordination for structured advanced air mobility","volume-title":"Green Energy Intell. Transp.","volume":"3","author":"Deniz","year":"2024"},{"issue":"11","key":"ref18","doi-asserted-by":"crossref","DOI":"10.3390\/info12110442","article-title":"Analysis of gradient vanishing of RNNs and performance comparison","volume":"12","author":"Noh","year":"2021","journal-title":"Information"},{"key":"ref19","first-page":"3394","article-title":"Deep sets","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Zaheer"},{"key":"ref20","article-title":"Learning safe multi-agent control with decentralized neural barrier certificates","author":"Qin","year":"2021"},{"issue":"178","key":"ref21","first-page":"1","article-title":"Monotonic value function factorisation for deep multi-agent reinforcement learning","volume":"21","author":"Rashid","year":"2020","journal-title":"J. Mach. Learn. Res."},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-51497-5_28"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3298601"},{"key":"ref24","first-page":"3744","article-title":"Set transformer: A framework for attention-based permutation-invariant neural networks","volume-title":"Proc. 36th Int. Conf. Mach. Learn.","author":"Lee"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/IROS51168.2021.9636344"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/iccworkshops59551.2024.10615924"},{"key":"ref27","article-title":"Efficient memory-based learning for robot control","author":"Moore","year":"1990"},{"key":"ref28","first-page":"482","article-title":"Reverse curriculum generation for reinforcement learning","volume-title":"Proc. 1st Annu. Conf. Robot Learn.","author":"Florensa"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2020.3041159"},{"key":"ref30","first-page":"387","article-title":"Deterministic policy gradient algorithms","volume-title":"Proc. 31st Int. Conf. Mach. Learn.","author":"Silver"},{"key":"ref31","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"ref32","article-title":"High-dimensional continuous control using generalized advantage estimation","author":"Schulman","year":"2015"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3069908"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3103715"}],"container-title":["IEEE Transactions on Mobile Computing"],"original-title":[],"link":[{"URL":"https:\/\/ieeexplore.ieee.org\/ielam\/7755\/10990048\/10848344-aam.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7755\/10990048\/10848344.pdf?arnumber=10848344","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,8]],"date-time":"2025-05-08T04:25:09Z","timestamp":1746678309000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10848344\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6]]},"references-count":35,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tmc.2025.3532204","relation":{},"ISSN":["1536-1233","1558-0660","2161-9875"],"issn-type":[{"value":"1536-1233","type":"print"},{"value":"1558-0660","type":"electronic"},{"value":"2161-9875","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,6]]}}}