{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,12]],"date-time":"2025-06-12T04:25:13Z","timestamp":1749702313656},"reference-count":9,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,10,31]],"date-time":"2021-10-31T00:00:00Z","timestamp":1635638400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,10,31]],"date-time":"2021-10-31T00:00:00Z","timestamp":1635638400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,10,31]]},"DOI":"10.1109\/ieeeconf53345.2021.9723284","type":"proceedings-article","created":{"date-parts":[[2022,3,4]],"date-time":"2022-03-04T15:26:46Z","timestamp":1646407606000},"page":"1477-1481","source":"Crossref","is-referenced-by-count":1,"title":["Multi-agent Policy Optimization for Pilot Selection in Delay-constrained Grant-free Multiple Access"],"prefix":"10.1109","author":[{"given":"Jianan","family":"Bai","sequence":"first","affiliation":[{"name":"Link&#x00F6;ping University,Department of Electrical Engineering (ISY),Link&#x00F6;ping,Sweden,58183"}]},{"given":"Zheng","family":"Chen","sequence":"additional","affiliation":[{"name":"Link&#x00F6;ping University,Department of Electrical Engineering (ISY),Link&#x00F6;ping,Sweden,58183"}]},{"given":"Erik G.","family":"Larsson","sequence":"additional","affiliation":[{"name":"Link&#x00F6;ping University,Department of Electrical Engineering (ISY),Link&#x00F6;ping,Sweden,58183"}]}],"member":"263","reference":[{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2017.2743240"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2776868"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref5","article-title":"Playing atari with deep reinforcement learning","author":"mnih","year":"2013","journal-title":"arXiv preprint arXiv 1312 5602"},{"key":"ref8","first-page":"1","article-title":"Throughput optimization for grant-free multiple access with multiagent deep reinforcement learning","author":"huang","year":"2020","journal-title":"IEEE Transactions on Wireless Communications"},{"article-title":"Continuous control with deep reinforcement learning","year":"2015","author":"lillicrap","key":"ref7"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2018.2844952"},{"article-title":"Dynamic power control for time-critical networking with heterogeneous traffic","year":"2020","author":"fountoulakis","key":"ref9"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2018.1700232"}],"event":{"name":"2021 55th Asilomar Conference on Signals, Systems, and Computers","start":{"date-parts":[[2021,10,31]]},"location":"Pacific Grove, CA, USA","end":{"date-parts":[[2021,11,3]]}},"container-title":["2021 55th Asilomar Conference on Signals, Systems, and Computers"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9723034\/9723086\/09723284.pdf?arnumber=9723284","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T17:20:16Z","timestamp":1655745616000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9723284\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,31]]},"references-count":9,"URL":"https:\/\/doi.org\/10.1109\/ieeeconf53345.2021.9723284","relation":{},"subject":[],"published":{"date-parts":[[2021,10,31]]}}}