{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,7]],"date-time":"2026-01-07T06:15:16Z","timestamp":1767766516146,"version":"3.48.0"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/vtc2025-fall65116.2025.11310705","type":"proceedings-article","created":{"date-parts":[[2026,1,6]],"date-time":"2026-01-06T18:33:45Z","timestamp":1767724425000},"page":"1-6","source":"Crossref","is-referenced-by-count":0,"title":["Optimized Power Allocation in Multi-cell 4G\/5G Systems using Multi-Agent Deep Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Nadia Yoza","family":"Mitsuishi","sequence":"first","affiliation":[{"name":"National Institute of Standards and Technology,Communications Technology Laboratory,Boulder,CO,USA,80305"}]},{"given":"Yao","family":"Ma","sequence":"additional","affiliation":[{"name":"National Institute of Standards and Technology,Communications Technology Laboratory,Boulder,CO,USA,80305"}]},{"given":"Jason B.","family":"Coder","sequence":"additional","affiliation":[{"name":"National Institute of Standards and Technology,Communications Technology Laboratory,Boulder,CO,USA,80305"}]}],"member":"263","reference":[{"year":"2022","key":"ref1","article-title":"NR dynamic spectrum sharing in Rel-17"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/25.120145"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/49.414651"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2005.850045"},{"volume-title":"Reinforcement Learning: An Introduction.","year":"2018","author":"Sutton","key":"ref5"},{"key":"ref6","article-title":"Q-learning","author":"Watkins","year":"2010","journal-title":"Machine Learning"},{"key":"ref7","article-title":"Double Q-learning","author":"Van Hasselt","year":"2010","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"article-title":"An introduction to centralized training for decentralized execution in cooperative multi-agent reinforcement learning","year":"2024","author":"Amato","key":"ref9"},{"article-title":"Proximal policy optimization algorithms","year":"2017","author":"Schulman","key":"ref10"},{"key":"ref11","first-page":"24611","article-title":"The surprising effectiveness of PPO in cooperative, multi-agent games","author":"Yu","year":"2022","journal-title":"Advances in neural information processing systems"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2017.7997440"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2019.2933973"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2019.8761431"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICC40277.2020.9149157"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.3001736"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC61545.2025.10978810"},{"year":"2018","key":"ref18","article-title":"TR 38.901: Study on channel model for frequencies from 0.5 to 100 GHz (Release 15)"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICC51166.2024.10622536"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/PIMRC54779.2022.9977746"},{"key":"ref21","article-title":"B210 USRP"},{"key":"ref22","article-title":"Software Radio Systems (SRS) project, release 23.04"},{"key":"ref23","article-title":"OpenAirInterface (OAI) project"},{"year":"2021","key":"ref24","article-title":"TS 36.214: Evolved universal terrestrial radio access (E-UTRA); Physical layer; Measurements (Release 16)"}],"event":{"name":"2025 IEEE 102nd Vehicular Technology Conference (VTC2025-Fall)","start":{"date-parts":[[2025,10,19]]},"location":"Chengdu, China","end":{"date-parts":[[2025,10,22]]}},"container-title":["2025 IEEE 102nd Vehicular Technology Conference (VTC2025-Fall)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11309821\/11309345\/11310705.pdf?arnumber=11310705","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,7]],"date-time":"2026-01-07T06:09:26Z","timestamp":1767766166000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11310705\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/vtc2025-fall65116.2025.11310705","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}