{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T05:42:37Z","timestamp":1757569357087,"version":"3.37.3"},"reference-count":19,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,8,26]],"date-time":"2023-08-26T00:00:00Z","timestamp":1693008000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,8,26]],"date-time":"2023-08-26T00:00:00Z","timestamp":1693008000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001729","name":"Swedish Foundation for Strategic Research","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001729","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004270","name":"KTH Royal Institute of Technology","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004270","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,8,26]]},"DOI":"10.1109\/case56687.2023.10260368","type":"proceedings-article","created":{"date-parts":[[2023,9,28]],"date-time":"2023-09-28T17:32:23Z","timestamp":1695922343000},"page":"1-7","source":"Crossref","is-referenced-by-count":1,"title":["Network Parameter Control in Cellular Networks through Graph-Based Multi-Agent Constrained Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Albin Larsson","family":"Forsberg","sequence":"first","affiliation":[{"name":"Ericsson Research, Research Area Artificial Intelligence (AI),Stockholm,Sweden"}]},{"given":"Alexandros","family":"Nikou","sequence":"additional","affiliation":[{"name":"KTH,Division of Robotics, Perception and Learning,Department of Electrical Engineering and Computer Science,Stockholm,Sweden"}]},{"given":"Aneta Vulgarakis","family":"Feljan","sequence":"additional","affiliation":[{"name":"KTH,Division of Robotics, Perception and Learning,Department of Electrical Engineering and Computer Science,Stockholm,Sweden"}]},{"given":"Jana","family":"Tumova","sequence":"additional","affiliation":[{"name":"Ericsson Research, Research Area Artificial Intelligence (AI),Stockholm,Sweden"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2014.6979983"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/VETECS.2011.5956370"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2914040"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3033325"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC.2012.6214281"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1186\/1687-1499-2014-57"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/PIMRC.2010.5671622"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/s11277-016-3849-9"},{"key":"ref9","article-title":"Coordinated reinforcement learning for optimizing mobile networks","author":"Bouton","year":"2021","journal-title":"arXiv preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/6GNet54646.2022.9830258"},{"journal-title":"Ericsson Mobility Report","article-title":"Ai: enhancing customer experience in a complex 5g world","year":"2021","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/PIMRC50174.2021.9569387"},{"key":"ref13","doi-asserted-by":"crossref","DOI":"10.1109\/ICCA54724.2022.9831850","article-title":"Symbolic reinforcement learning for safe ran control","volume-title":"International Conference of Autonomous Agents and Multi-agent Systems (AAMAS), Link","author":"Nikou"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICCA54724.2022.9831850"},{"key":"ref15","first-page":"1179","article-title":"Conservative q-learning for offline reinforcement learning","volume":"33","author":"Kumar","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref16","article-title":"Conservative safety critics for exploration","author":"Bharadhwaj","year":"2020","journal-title":"arXiv preprint"},{"key":"ref17","first-page":"980","article-title":"Deep coordination graphs","volume-title":"International Conference on Machine Learning","author":"B\u00f6hmer"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/11780519_1"},{"key":"ref19","article-title":"Safe multi-agent reinforcement learning via shielding","author":"ElSayed-Aly","year":"2021","journal-title":"arXiv preprint"}],"event":{"name":"2023 IEEE 19th International Conference on Automation Science and Engineering (CASE)","start":{"date-parts":[[2023,8,26]]},"location":"Auckland, New Zealand","end":{"date-parts":[[2023,8,30]]}},"container-title":["2023 IEEE 19th International Conference on Automation Science and Engineering (CASE)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10260321\/10260291\/10260368.pdf?arnumber=10260368","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T06:09:12Z","timestamp":1709359752000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10260368\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,26]]},"references-count":19,"URL":"https:\/\/doi.org\/10.1109\/case56687.2023.10260368","relation":{},"subject":[],"published":{"date-parts":[[2023,8,26]]}}}