{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T21:46:08Z","timestamp":1767995168754,"version":"3.49.0"},"reference-count":15,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"J. C. Bose Fellowship from DRDO through DIA-RCOE","award":["DFTM\/02\/3125\/M\/04\/AIR-04"],"award-info":[{"award-number":["DFTM\/02\/3125\/M\/04\/AIR-04"]}]},{"name":"Project from DST-ICPS"},{"name":"RBCCPS, IISc"},{"DOI":"10.13039\/501100001412","name":"S. S. Bhatnagar Fellowship from the Council of Scientific and Industrial Research, Government of India","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001412","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Control Syst. Lett."],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/lcsys.2023.3288931","type":"journal-article","created":{"date-parts":[[2023,6,24]],"date-time":"2023-06-24T06:17:47Z","timestamp":1687587467000},"page":"2671-2676","source":"Crossref","is-referenced-by-count":5,"title":["Actor\u2013Critic or Critic\u2013Actor? A Tale of Two Time Scales"],"prefix":"10.1109","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7644-3914","authenticated-orcid":false,"given":"Shalabh","family":"Bhatnagar","sequence":"first","affiliation":[{"name":"Department of Computer Science and Automation, Indian Institute of Science, Bengaluru, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0756-5402","authenticated-orcid":false,"given":"Vivek S.","family":"Borkar","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2327-3549","authenticated-orcid":false,"given":"Soumyajit","family":"Guin","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Automation, Indian Institute of Science, Bengaluru, India"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref13","first-page":"1057","article-title":"Policy gradient methods for reinforcement learning with function approximation","author":"sutton","year":"1999","journal-title":"Proc NeurIPS"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/BF00115009"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/BF00992698"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/9.580874"},{"key":"ref11","author":"puterman","year":"2014","journal-title":"Markov Decision Processes Discrete Stochastic Dynamic Programming"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1137\/S0363012901385691"},{"key":"ref2","author":"berstekas","year":"2019","journal-title":"REINFORCEMENT LEARNING AND OPTIMAL CONTROL"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.1983.6313077"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-81-951961-1-1"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1137\/S0363012995282784"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1137\/S036301299731669X"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s10626-015-0216-z"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2007.09.009"},{"key":"ref6","article-title":"Actor-critic or critic-actor? a tale of two time scales","author":"bhatnagar","year":"2022","journal-title":"arXiv 2212 10477"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2009.07.008"}],"container-title":["IEEE Control Systems Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7782633\/9828546\/10160088.pdf?arnumber=10160088","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,1]],"date-time":"2023-08-01T18:29:21Z","timestamp":1690914561000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10160088\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":15,"URL":"https:\/\/doi.org\/10.1109\/lcsys.2023.3288931","relation":{},"ISSN":["2475-1456"],"issn-type":[{"value":"2475-1456","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}