{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T18:06:18Z","timestamp":1776881178350,"version":"3.51.2"},"reference-count":62,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100003845","name":"Indian Institute of Technology Madras","doi-asserted-by":"publisher","award":["RF\/23-24\/1327\/EE\/NFIG\/009056"],"award-info":[{"award-number":["RF\/23-24\/1327\/EE\/NFIG\/009056"]}],"id":[{"id":"10.13039\/501100003845","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001843","name":"Science and Engineering Research Board","doi-asserted-by":"publisher","award":["EEQ\/2021\/000812"],"award-info":[{"award-number":["EEQ\/2021\/000812"]}],"id":[{"id":"10.13039\/501100001843","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/access.2024.3510558","type":"journal-article","created":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T18:41:02Z","timestamp":1733164862000},"page":"182274-182295","source":"Crossref","is-referenced-by-count":3,"title":["Constrained Restless Bandits for Dynamic Scheduling in Cyber-Physical Systems"],"prefix":"10.1109","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9051-4624","authenticated-orcid":false,"given":"Kesav Ram","family":"Kaza","sequence":"first","affiliation":[{"name":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rahul H.","family":"Meshram","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Indian Institute of Technology Madras, Chennai, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5087-8175","authenticated-orcid":false,"given":"Varunkumar","family":"Mehta","sequence":"additional","affiliation":[{"name":"Aerospace Research Centre, National Research Council Canada, Ottawa, ON, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9119-6795","authenticated-orcid":false,"given":"Shabbir N.","family":"Merchant","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICC56513.2022.10093670"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2010.2068950"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2019.2898000"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC.2018.8377345"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1002\/9780470980033"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2019.2912492"},{"issue":"1","key":"ref7","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1007\/s001860200257","article-title":"Whittle\u2019s index policy for a multi-class queueing system with convex holding costs","volume":"57","author":"Ansell","year":"2003","journal-title":"Math. Methods Oper. Res."},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1239\/aap\/999187898"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/s11750-007-0025-0"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TCNS.2016.2619066"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-67235-9_19"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2008.4587156"},{"key":"ref13","first-page":"2440","article-title":"Maintenance of a collection of machines under partial observability: Indexability and computation of whittle index","volume":"711","author":"Akbarzadeh","year":"2021","journal-title":"Les Cahiers du GERAD ISSN"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2018.2856883"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i11.21460"},{"issue":"3","key":"ref16","first-page":"341","article-title":"An overview and some challenges in cyber-physical systems","volume":"93","author":"Kim","year":"2013","journal-title":"J. Indian Inst. Sci."},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JAS.2016.7373757"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.2307\/3214163"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1239\/aap\/1214950209"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2018.2799521"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2871054"},{"key":"ref22","article-title":"Simulation based algorithms for Markov decision processes and multi-action restless bandits","author":"Meshram","year":"2020","journal-title":"arXiv:2007.12933"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CDC51059.2022.9992898"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i10.26427"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/s00186-024-00868-x"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2019.108759"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1111\/j.2517-6161.1979.tb01068.x"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.2307\/3214547"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/INFCOM.2012.6195483"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2017.2715329"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CDC45484.2021.9683132"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/NGI.2005.1431640"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/s11134-006-9002-9"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1287\/opre.35.5.736"},{"key":"ref35","volume-title":"Markov Decision Processes: Discrete Stochastic Dynamic Programming","author":"Puterman","year":"2014"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1287\/moor.24.2.293"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-93-86279-38-5"},{"key":"ref38","first-page":"1","article-title":"Finite sample analysis of two-timescale stochastic approximation with applications to reinforcement learning","volume-title":"Proc. 31st Conf. Learn. Theory","volume":"75","author":"Dalal"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ALLERTON.2018.8636078"},{"key":"ref40","first-page":"2144","article-title":"Finite time analysis of linear two-timescale stochastic approximation with Markovian noise","volume-title":"Proc. 33rd Conf. Learn. Theory","volume":"125","author":"Kaledin"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1137\/20M1322649"},{"key":"ref42","first-page":"1","article-title":"Finite-time analysis of asynchronous stochastic approximation and Q-learning","volume-title":"Proc. 33rd Annu. Conf. Learn. Theory","volume":"125","author":"Qu"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1002\/nav.21992"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2021.3057299"},{"key":"ref45","first-page":"394","article-title":"On the complexity of solving Markov decision problems","volume-title":"Proc. 11th Conf. Uncertainty Artif. Intell.","author":"Littman"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/JSAIT.2021.3081108"},{"key":"ref47","volume-title":"Numerical Optimization","author":"Nocedal","year":"2006"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysconle.2004.08.007"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/COMSNETS51098.2021.9352741"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CDC45484.2021.9683132"},{"key":"ref51","article-title":"A Lagrangian decomposition approach to weakly coupled dynamic optimization problems and its applications","author":"Hawkins","year":"2003"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1287\/opre.1070.0445"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.2737\/RMRS-RP-4"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.3138\/infor.45.1.001"},{"key":"ref55","article-title":"Dynamic model for fire behaviour prediction","author":"Rossa","year":"2009"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/s10694-018-0774-3"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.22499\/2.5801.005"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.5558\/tfc65450-6"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/s11027-006-9043-8"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.3390\/fire2010003"},{"key":"ref61","volume-title":"Rollout, Policy Iteration, and Distributed Reinforcement Learning","author":"Bertsekas","year":"2021"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(69)90163-2"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10380310\/10772464.pdf?arnumber=10772464","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T06:36:25Z","timestamp":1733985385000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10772464\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":62,"URL":"https:\/\/doi.org\/10.1109\/access.2024.3510558","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}