{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,17]],"date-time":"2026-01-17T22:47:37Z","timestamp":1768690057982,"version":"3.49.0"},"reference-count":25,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,10,30]],"date-time":"2023-10-30T00:00:00Z","timestamp":1698624000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,30]],"date-time":"2023-10-30T00:00:00Z","timestamp":1698624000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,10,30]]},"DOI":"10.1109\/milcom58377.2023.10356356","type":"proceedings-article","created":{"date-parts":[[2023,12,25]],"date-time":"2023-12-25T14:37:01Z","timestamp":1703515021000},"page":"464-470","source":"Crossref","is-referenced-by-count":1,"title":["Learning Technique to Solve Periodic Markov Decision Process for Network Resource Allocation"],"prefix":"10.1109","author":[{"given":"Zheyu","family":"Chen","sequence":"first","affiliation":[{"name":"Imperial College London,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kin K.","family":"Leung","sequence":"additional","affiliation":[{"name":"Imperial College London,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shiqiang","family":"Wang","sequence":"additional","affiliation":[{"name":"IBM T.J. Watson Research Center,Yorktown Heights,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Leandros","family":"Tassiulas","sequence":"additional","affiliation":[{"name":"Yale University,New Haven,CT,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kevin","family":"Chan","sequence":"additional","affiliation":[{"name":"DEVCOM Army Research Laboratory,Adelphi,MD,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Patrick J.","family":"Baker","sequence":"additional","affiliation":[{"name":"UK Royal Air Force and Dstl,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","first-page":"533","article-title":"On the diversity of cluster workloads and its impact on research results","volume-title":"2018 USENIX Annual Technical Conference (USENIXATC 18)","author":"Amvrosiadis"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2014.6848013"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MASCOTS.2018.00025"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2018.2799945"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3326285.3329074"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1287\/opre.13.6.920"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/BF01720020"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/BF01068380"},{"key":"ref9","first-page":"1167","article-title":"Efficient Policy Iteration for Periodic Markov Decision Processes","volume-title":"Proceedings of the Twenty-First European Conference on Artificial Intelligence","author":"Osogami"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ADPRL.2014.7010627"},{"key":"ref11","article-title":"Proximal Policy Optimization Algorithms","author":"Schulman","year":"2017"},{"key":"ref12","volume-title":"Introduction to reinforcement learning","volume":"135","author":"Sutton","year":"1998"},{"key":"ref13","article-title":"High-dimensional continuous control using generalized advantage estimation","author":"Schulman","year":"2015"},{"key":"ref14","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","volume-title":"International conference on machine learning","author":"Mnih"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1038\/nature16961"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2018.00159"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2020.3000371"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TNSM.2020.3036911"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2020.3017751"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOMWKSHPS50562.2020.9162720"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2019.8761385"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/PCCC.2018.8710960"},{"key":"ref24","article-title":"Part 3: Intro to Policy Optimization"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2019.00021"}],"event":{"name":"MILCOM 2023 - 2023 IEEE Military Communications Conference (MILCOM)","location":"Boston, MA, USA","start":{"date-parts":[[2023,10,30]]},"end":{"date-parts":[[2023,11,3]]}},"container-title":["MILCOM 2023 - 2023 IEEE Military Communications Conference (MILCOM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10356123\/10356124\/10356356.pdf?arnumber=10356356","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,12]],"date-time":"2024-01-12T15:43:27Z","timestamp":1705074207000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10356356\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,30]]},"references-count":25,"URL":"https:\/\/doi.org\/10.1109\/milcom58377.2023.10356356","relation":{},"subject":[],"published":{"date-parts":[[2023,10,30]]}}}