{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T23:03:25Z","timestamp":1743980605972},"publisher-location":"Berlin, Heidelberg","reference-count":10,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540407201"},{"type":"electronic","value":"9783540451679"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2003]]},"DOI":"10.1007\/978-3-540-45167-9_42","type":"book-chapter","created":{"date-parts":[[2010,7,22]],"date-time":"2010-07-22T23:10:53Z","timestamp":1279840253000},"page":"581-594","source":"Crossref","is-referenced-by-count":5,"title":["Approximate Equivalence of Markov Decision Processes"],"prefix":"10.1007","author":[{"given":"Eyal","family":"Even-Dar","sequence":"first","affiliation":[]},{"given":"Yishay","family":"Mansour","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"42_CR1","unstructured":"Allender, E., Arora, S., Kearns, M., Moore, C., Russell, A.: Note on the representational incompatabilty of function approximation and factored dynamics. In: Advances in Neural Information Processing Systems 15 (2002)"},{"key":"42_CR2","volume-title":"Neuro-Dynamic Programming","author":"D.P. Bertsekas","year":"1996","unstructured":"Bertsekas, D.P., Tsitsiklis, J.N.: Neuro-Dynamic Programming. Athena Scientific, Belmont (1996)"},{"issue":"3","key":"42_CR3","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1111\/j.1467-8640.1989.tb00324.x","volume":"5","author":"T. Dean","year":"1989","unstructured":"Dean, T., Kanazawa, K.: A model for reasoning about persistence and causation. Computational Intelligence\u00a05(3), 142\u2013150 (1989)","journal-title":"Computational Intelligence"},{"key":"42_CR4","doi-asserted-by":"crossref","unstructured":"Dean, T., Givan, R., Leach, S.: Model reduction techniques for computing approximately optimal solutions for Markov decision processes. In: UAI, pp. 124\u2013131 (1997)","DOI":"10.1007\/3-540-63912-8_89"},{"key":"42_CR5","doi-asserted-by":"crossref","unstructured":"Givan, R., Dean, T., Greig, M.: Equivalence notions and model minimization in markov decision processes. Artificial Intelligence (2003) (to appear)","DOI":"10.1016\/S0004-3702(02)00376-4"},{"key":"42_CR6","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1016\/0304-3975(85)90224-5","volume":"38","author":"T.F. Gonzalez","year":"1985","unstructured":"Gonzalez, T.F.: Clustering to minimize the maximum inter-cluster distance. Theoretical Computer Science\u00a038, 293\u2013306 (1985)","journal-title":"Theoretical Computer Science"},{"key":"42_CR7","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1016\/S0004-3702(00)00047-3","volume":"122","author":"R. Givan","year":"2000","unstructured":"Givan, R., Leach, S., Dean, T.: Bounded parameter markov decision processes. Artificial Intelligence\u00a0122, 71\u2013109 (2000)","journal-title":"Artificial Intelligence"},{"key":"42_CR8","doi-asserted-by":"crossref","first-page":"83","DOI":"10.1613\/jair.714","volume":"14","author":"C. Lusena","year":"2001","unstructured":"Lusena, C., Goldsmith, J., Mundhenk, M.: Nonapproximability results for partially observable markov decision processes. Journal of Artificial Intelligence Research\u00a014, 83\u2013103 (2001)","journal-title":"Journal of Artificial Intelligence Research"},{"key":"42_CR9","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316887","volume-title":"Markov Decision Processes : Discrete Stochastic Dynamic Programming.","author":"M. Puterman","year":"1994","unstructured":"Puterman, M.: Markov Decision Processes: Discrete Stochastic Dynamic Programming. John Wiley & Sons, Chichester (1994)"},{"key":"42_CR10","volume-title":"Reinforcement Learning.","author":"R. Sutton","year":"1998","unstructured":"Sutton, R., Barto, A.: Reinforcement Learning. MIT Press, Cambridge (1998)"}],"container-title":["Lecture Notes in Computer Science","Learning Theory and Kernel Machines"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-45167-9_42","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T04:57:11Z","timestamp":1635742631000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-45167-9_42"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003]]},"ISBN":["9783540407201","9783540451679"],"references-count":10,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-45167-9_42","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2003]]}}}