{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,6]],"date-time":"2026-01-06T13:53:02Z","timestamp":1767707582317,"version":"3.28.0"},"reference-count":21,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,9]],"date-time":"2024-06-09T00:00:00Z","timestamp":1717891200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,9]],"date-time":"2024-06-09T00:00:00Z","timestamp":1717891200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62272194,62172186"],"award-info":[{"award-number":["62272194,62172186"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,9]]},"DOI":"10.1109\/icc51166.2024.10622564","type":"proceedings-article","created":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T15:34:42Z","timestamp":1724168082000},"page":"4985-4990","source":"Crossref","is-referenced-by-count":4,"title":["Enabling Urban MmWave Communications with UAV-Carried IRS via Deep Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Geng","family":"Sun","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, Jilin University,Changchun,China,130012"}]},{"given":"Bei","family":"Liu","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Jilin University,Changchun,China,130012"}]},{"given":"Jiahui","family":"Li","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Jilin 
University,Changchun,China,130012"}]},{"given":"Shuang","family":"Liang","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Northeast Normal University,Changchun,China,130012"}]},{"given":"Hongyang","family":"Pan","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Jilin University,Changchun,China,130012"}]},{"given":"Xiaoya","family":"Zheng","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Jilin University,Changchun,China,130012"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2023.3249835"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2022.3171800"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2023.3245669"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3350885"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2022.3229014"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3232856"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2021.3051897"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2022.3206884"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2022.3201122"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2023.3273293"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3200998"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2023.3277809"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/tmc.2023.3298888"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/SECON55815.2022.9918588"},{"key":"ref15","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv preprint"},{"key":"ref16","article-title":"Neural episodic control with state abstraction","volume-title":"Proc. 
ICLR","author":"Li","year":"2023"},{"key":"ref17","article-title":"Mogrifier LSTM","volume-title":"Proc. ICLR","author":"Melis","year":"2020"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.3042977"},{"key":"ref19","article-title":"Continuous control with deep reinforcement learning","volume-title":"Proc. ICLR","author":"Lillicrap","year":"2016"},{"issue":"2018","key":"ref20","first-page":"1582","article-title":"Addressing function approximation error in actor-critic methods","volume-title":"Proc. ICML","volume":"80","author":"Fujimoto"},{"key":"ref21","first-page":"1856","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"Proc. ICML","volume":"80","author":"Haarnoja","year":"2018"}],"event":{"name":"ICC 2024 - IEEE International Conference on Communications","start":{"date-parts":[[2024,6,9]]},"location":"Denver, CO, USA","end":{"date-parts":[[2024,6,13]]}},"container-title":["ICC 2024 - IEEE International Conference on Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10622104\/10622158\/10622564.pdf?arnumber=10622564","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,29]],"date-time":"2024-08-29T20:18:56Z","timestamp":1724962736000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10622564\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,9]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/icc51166.2024.10622564","relation":{},"subject":[],"published":{"date-parts":[[2024,6,9]]}}}