{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,15]],"date-time":"2026-07-15T15:58:17Z","timestamp":1784131097685,"version":"3.55.0"},"reference-count":48,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["623B2060"],"award-info":[{"award-number":["623B2060"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62127801"],"award-info":[{"award-number":["62127801"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U24A20213"],"award-info":[{"award-number":["U24A20213"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Singapore Ministry of Education (MOE) Tier 1","award":["RG87\/22"],"award-info":[{"award-number":["RG87\/22"]}]},{"name":"Singapore Ministry of Education (MOE) Tier 1","award":["RG24\/24"],"award-info":[{"award-number":["RG24\/24"]}]},{"name":"NTU Centre for Computational Technologies in Finance"},{"name":"RIE2025 Industry Alignment Fund - Industry Collaboration Projects","award":["I2301E0026"],"award-info":[{"award-number":["I2301E0026"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Mobile Comput."],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1109\/tmc.2025.3607882","type":"journal-article","created":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T17:34:55Z","timestamp":1757439295000},"page":"2091-2106","source":"Crossref","is-referenced-by-count":2,"title":["Is FISHER All You Need in the Multi-AUV Underwater Target Tracking Task?"],"prefix":"10.1109","volume":"25","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-2410-2878","authenticated-orcid":false,"given":"Guanwen","family":"Xie","sequence":"first","affiliation":[{"name":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-2860-5203","authenticated-orcid":false,"given":"Jingzehua","family":"Xu","sequence":"additional","affiliation":[{"name":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ziqi","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Engineering, WestLake University, Zhejiang, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9449-4854","authenticated-orcid":false,"given":"Xiangwang","family":"Hou","sequence":"additional","affiliation":[{"name":"Department of Electronic Engineering, Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9334-1570","authenticated-orcid":false,"given":"Dongfang","family":"Ma","sequence":"additional","affiliation":[{"name":"Ocean College, Zhejiang University, Zhoushan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shuai","family":"Zhang","sequence":"additional","affiliation":[{"name":"Department of Data Science, New Jersey Institute of Technology, Newark, NJ, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0312-9371","authenticated-orcid":false,"given":"Yong","family":"Ren","sequence":"additional","affiliation":[{"name":"Department of Electronic Engineering, Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7442-7416","authenticated-orcid":false,"given":"Dusit","family":"Niyato","sequence":"additional","affiliation":[{"name":"College of Computing and Data Science, Nanyang Technological University, Singapore"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2020.3029369"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.011.2000684"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2022.3202225"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3129504"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM46510.2021.9685323"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2022.3230916"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3395568"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i28.35316"},{"key":"ref9","first-page":"1","article-title":"The effects of reward misspecification: Mapping and mitigating misaligned models","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Pan","year":"2022"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3240671"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2023.3345393"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/tit.2022.3185139"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2024.3414628"},{"key":"ref14","first-page":"4572","article-title":"Generative adversarial imitation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ho","year":"2016"},{"key":"ref15","article-title":"Offline reinforcement learning: Tutorial, review, and perspectives on open problems","author":"Levine","year":"2020"},{"key":"ref16","first-page":"23851","article-title":"Rorl: Robust offline reinforcement learning via conservative smoothing","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Yang","year":"2022"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/NIR50484.2020.9290189"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2022.3152829"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3057068"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2015.2482501"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3377226"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2023.3325580"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAR57134.2023.10151768"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2022.3146976"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3521889"},{"key":"ref26","article-title":"Multi-UAV pursuit-evasion with online planning in unknown environments by deep reinforcement learning","author":"Chen","year":"2024"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8461203"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1002\/int.22778"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2856922"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2023.110604"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.3390\/cmsf2024009004"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/21.61218"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1177\/027836498600500106"},{"key":"ref34","first-page":"1889","article-title":"Trust region policy optimization","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Schulman","year":"2015"},{"key":"ref35","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"ref36","first-page":"1","article-title":"Discriminator-actor-critic: Addressing sample inefficiency and reward bias in adversarial imitation learning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kostrikov","year":"2019"},{"key":"ref37","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Haarnoja","year":"2018"},{"key":"ref38","first-page":"1587","article-title":"Addressing function approximation error in actor-critic methods","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Fujimoto","year":"2018"},{"key":"ref39","first-page":"1","article-title":"Improved training of Wasserstein GANs","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Gulrajani","year":"2017"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1802.05957"},{"key":"ref41","volume-title":"Reinforcement Learning: An Introduction","volume":"22447","author":"Sutton","year":"2018"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4612-4054-9"},{"key":"ref43","article-title":"A study of gradient descent schemes for general-sum stochastic games","author":"Prasad","year":"2015"},{"key":"ref44","first-page":"1","article-title":"Multi-agent generative adversarial imitation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Song","year":"2018"},{"key":"ref45","first-page":"15084","article-title":"Decision transformer: Reinforcement learning via sequence modeling","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Chen","year":"2021"},{"key":"ref46","first-page":"1","article-title":"Generalized decision transformer for offline hindsight information matching","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Furuta","year":"2022"},{"key":"ref47","article-title":"Efficient exploration via state marginal matching","author":"Lee","year":"2019"},{"key":"ref48","first-page":"1179","article-title":"Conservative q-learning for offline reinforcement learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Kumar","year":"2020"}],"container-title":["IEEE Transactions on Mobile Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7755\/11345503\/11153860.pdf?arnumber=11153860","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,12]],"date-time":"2026-05-12T19:51:20Z","timestamp":1778615480000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11153860\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2]]},"references-count":48,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/tmc.2025.3607882","relation":{},"ISSN":["1536-1233","1558-0660","2161-9875"],"issn-type":[{"value":"1536-1233","type":"print"},{"value":"1558-0660","type":"electronic"},{"value":"2161-9875","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2]]}}}