{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T18:13:51Z","timestamp":1764785631943,"version":"3.40.5"},"reference-count":17,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,3,24]],"date-time":"2025-03-24T00:00:00Z","timestamp":1742774400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,3,24]],"date-time":"2025-03-24T00:00:00Z","timestamp":1742774400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,3,24]]},"DOI":"10.1109\/wcnc61545.2025.10978561","type":"proceedings-article","created":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T17:53:33Z","timestamp":1746813213000},"page":"1-6","source":"Crossref","is-referenced-by-count":1,"title":["Accelerated Constrained Reinforcement Learning Based Energy-Efficient Power Scheduling Algorithm for Extended Reality Transmission"],"prefix":"10.1109","author":[{"given":"Kexuan","family":"Wang","sequence":"first","affiliation":[{"name":"College of Information Science and Electronic Engineering, Zhejiang University"}]},{"given":"An","family":"Liu","sequence":"additional","affiliation":[{"name":"College of Information Science and Electronic Engineering, Zhejiang University"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.23919\/ETR.2021.9904681"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2024.3370441"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/18.995554"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2022.3158737"},{"key":"ref5","article-title":"A single-loop deep actor-critic algorithm for constrained reinforcement learning with provable convergence","author":"Wang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/313256.313273"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/INFCOM.2004.1354603"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2018.8422088"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/NOMS56928.2023.10154267"},{"journal-title":"Benchmarking safe exploration in deep reinforcement learning","year":"2019","author":"Achiam","key":"ref10"},{"key":"ref11","first-page":"22","article-title":"Constrained policy optimization","author":"Achiam","year":"2017","journal-title":"ICML. PMLR"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3105407"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/1160633.1160762"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2011.2177770"},{"key":"ref15","article-title":"Reward shaping via metalearning","author":"Zou","year":"2019","journal-title":"arXiv preprint"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2018.8422088"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2019.8761721"}],"event":{"name":"2025 IEEE Wireless Communications and Networking Conference (WCNC)","start":{"date-parts":[[2025,3,24]]},"location":"Milan, Italy","end":{"date-parts":[[2025,3,27]]}},"container-title":["2025 IEEE Wireless Communications and Networking Conference (WCNC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10978109\/10978116\/10978561.pdf?arnumber=10978561","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,10]],"date-time":"2025-05-10T06:49:01Z","timestamp":1746859741000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10978561\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,24]]},"references-count":17,"URL":"https:\/\/doi.org\/10.1109\/wcnc61545.2025.10978561","relation":{},"subject":[],"published":{"date-parts":[[2025,3,24]]}}}