{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,10]],"date-time":"2025-10-10T06:48:13Z","timestamp":1760078893597,"version":"3.28.0"},"reference-count":11,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1109\/cdc.2002.1184811","type":"proceedings-article","created":{"date-parts":[[2003,8,27]],"date-time":"2003-08-27T11:38:00Z","timestamp":1061984280000},"page":"1940-1945","source":"Crossref","is-referenced-by-count":10,"title":["Self learning control of constrained Markov chains - a gradient approach"],"prefix":"10.1109","volume":"2","author":[{"given":"F.V.","family":"Abad","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"V.","family":"Krishnamurthy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"K.","family":"Martin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"I.","family":"Baltcheva","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"article-title":"Direct gradient-based reinforcement learning: I. Gradient estimation algorithms","year":"1999","author":"baxter","key":"3"},{"journal-title":"Constrained Markov Decision Processes","year":"1999","author":"altman","key":"2"},{"journal-title":"Self-Learning Control of Finite Markov Chains","year":"2000","author":"poznyak","key":"10"},{"key":"1","article-title":"Self learning control of constrained Markov decision processes- a measure valued gradient approach","author":"abad","year":"2002","journal-title":"IEEE Trans Automatic Control"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1117\/12.319338"},{"key":"6","first-page":"71","article-title":"The relations amongst potentials, perturbation analysis and Markov decision processes","volume":"8","author":"cao","year":"1998","journal-title":"J DEDS"},{"journal-title":"Neuro-Dynamic Programming","year":"1996","author":"bertsekas","key":"5"},{"journal-title":"Nonlinear Programming","year":"2000","author":"bertsekas","key":"4"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1137\/S0363012994263743"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/78.489036"},{"key":"11","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316887","author":"puterman","year":"1994","journal-title":"Markov Decision Processes"}],"event":{"name":"IEEE Conference on Decision and Control","acronym":"CDC-02","location":"Las Vegas, NV, USA"},"container-title":["Proceedings of the 41st IEEE Conference on Decision and Control, 2002."],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/8437\/26567\/01184811.pdf?arnumber=1184811","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,15]],"date-time":"2017-06-15T20:09:12Z","timestamp":1497557352000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/1184811\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/cdc.2002.1184811","relation":{},"subject":[]}}