{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T06:41:35Z","timestamp":1729665695024,"version":"3.28.0"},"reference-count":16,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009,3]]},"DOI":"10.1109\/adprl.2009.4927531","type":"proceedings-article","created":{"date-parts":[[2009,5,19]],"date-time":"2009-05-19T15:50:44Z","timestamp":1242748244000},"page":"96-100","source":"Crossref","is-referenced-by-count":2,"title":["Adaptive computation of optimal nonrandomized policies in constrained average-reward MDPs"],"prefix":"10.1109","author":[{"given":"Eugene A.","family":"Feinberg","sequence":"first","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]}],"member":"263","reference":[{"key":"15","doi-asserted-by":"publisher","DOI":"10.1287\/opre.37.3.474"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1016\/j.orl.2006.06.005"},{"key":"13","article-title":"linear programming and finite markovian control problems","author":"kallenberg","year":"1983","journal-title":"Mathematical Center Tracts 148"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1287\/moor.27.3.545.316"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1287\/moor.21.4.922"},{"key":"12","doi-asserted-by":"crossref","first-page":"527","DOI":"10.1016\/j.orl.2008.06.002","article-title":"on polynomial classification problems for markov decision processes","volume":"36","author":"feinberg","year":"2008","journal-title":"Oper Res Lett"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1007\/BF02055577"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1137\/0329043"},{"key":"1","article-title":"constrained markov decision processes","author":"altman","year":"1999","journal-title":"Chapman & Hall\/Crc"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1007\/s00186-005-0443-4"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2008.4739426"},{"key":"6","article-title":"splitting randomized stationary policies in total-reward markov decision processes","author":"denardo","year":"2008","journal-title":"Preprint Department of Applied Mathematics and Statistics"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1287\/opre.41.6.1116"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1109\/9.75103"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-69532-5_8"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1007\/BF01435458"}],"event":{"name":"2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning (ADPRL)","start":{"date-parts":[[2009,3,30]]},"location":"Nashville, TN, USA","end":{"date-parts":[[2009,4,2]]}},"container-title":["2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/4910084\/4927513\/04927531.pdf?arnumber=4927531","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,18]],"date-time":"2017-06-18T16:02:34Z","timestamp":1497801754000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/4927531\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,3]]},"references-count":16,"URL":"https:\/\/doi.org\/10.1109\/adprl.2009.4927531","relation":{},"subject":[],"published":{"date-parts":[[2009,3]]}}}