{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T03:24:51Z","timestamp":1729653891057,"version":"3.28.0"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013,10]]},"DOI":"10.1109\/allerton.2013.6736508","type":"proceedings-article","created":{"date-parts":[[2014,2,13]],"date-time":"2014-02-13T22:46:12Z","timestamp":1392331572000},"page":"78-84","source":"Crossref","is-referenced-by-count":3,"title":["Approximation of stationary control policies by quantized control in Markov decision processes"],"prefix":"10.1109","author":[{"given":"Naci","family":"Saldi","sequence":"first","affiliation":[]},{"given":"Tamas","family":"Linder","sequence":"additional","affiliation":[]},{"given":"Serdar","family":"Yuksel","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4612-0729-0"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/Allerton.2013.6736508"},{"key":"18","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1214\/lnms\/1215453563","article-title":"On measurability and representation of strategic measures in Markov decision processes","volume":"30","author":"feinberg","year":"1996","journal-title":"Statistics Probability and Game Theory"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2007.09.013"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2009.2033848"},{"key":"13","doi-asserted-by":"publisher","DOI":"10.1007\/BF01442225"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(86)90311-2"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(80)90128-6"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(82)90271-2"},{"key":"21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-0348-8024-4"},{"key":"20","doi-asserted-by":"publisher","DOI":"10.1137\/1127058"},{"key":"22","doi-asserted-by":"publisher","DOI":"10.1016\/0304-4149(75)90031-9"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1016\/0304-4149(89)90058-6"},{"key":"24","first-page":"181","article-title":"On the weak topology on a space of probability measures induced by policies","volume":"36","author":"nowak","year":"1988","journal-title":"Bull Polish Acad Sci Math"},{"key":"25","first-page":"380","article-title":"Convergence of Lebesgue integrals with varying measures","author":"serfozo","year":"1982","journal-title":"Sankhya Ser A"},{"key":"26","doi-asserted-by":"publisher","DOI":"10.1007\/BF02055573"},{"key":"27","article-title":"Ergodic properties of Markov processes","author":"hairer","year":"2006","journal-title":"Lecture notes"},{"key":"28","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4419-8714-3","author":"herna?ndez-lerma","year":"1989","journal-title":"Adaptive Markov Control Processes"},{"key":"3","article-title":"Error propagation for approximate policy and value iteration","author":"farahmand","year":"2010","journal-title":"Advances in neural information processing systems"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6911(94)90060-4"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(71)90106-5"},{"key":"1","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4615-0805-2_11","article-title":"Convex analytic methods in markov decision processes","author":"borkar","year":"2002","journal-title":"Handbook of Markov Decision Processes"},{"key":"7","article-title":"State aggregation in Markov decision processes","author":"ren","year":"2002","journal-title":"CDC"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1007\/BF00114724"},{"journal-title":"Neuro-Dynamic Programming Athena Scientific","year":"1996","author":"bertsekas","key":"5"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2010.02.006"},{"key":"9","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-540-75225-7_30","article-title":"Pseudometrics for state aggregation in average reward Markov decision processes","author":"ortner","year":"2007","journal-title":"Algorithmic Learning Theory"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2009.5400343"}],"event":{"name":"2013 51st Annual Allerton Conference on Communication, Control, and Computing (Allerton)","start":{"date-parts":[[2013,10,2]]},"location":"Monticello, IL","end":{"date-parts":[[2013,10,4]]}},"container-title":["2013 51st Annual Allerton Conference on Communication, Control, and Computing (Allerton)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6725831\/6736491\/06736508.pdf?arnumber=6736508","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,22]],"date-time":"2017-06-22T07:51:32Z","timestamp":1498117892000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6736508\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,10]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/allerton.2013.6736508","relation":{},"subject":[],"published":{"date-parts":[[2013,10]]}}}