{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T21:01:09Z","timestamp":1761512469443},"publisher-location":"Berlin, Heidelberg","reference-count":17,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540440369"},{"type":"electronic","value":"9783540367550"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2002]]},"DOI":"10.1007\/3-540-36755-1_33","type":"book-chapter","created":{"date-parts":[[2007,11,13]],"date-time":"2007-11-13T21:03:29Z","timestamp":1194987809000},"page":"391-404","source":"Crossref","is-referenced-by-count":5,"title":["Characterizing Markov Decision Processes"],"prefix":"10.1007","author":[{"given":"Bohdana","family":"Ratitch","sequence":"first","affiliation":[]},{"given":"Doina","family":"Precup","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2002,9,20]]},"reference":[{"key":"33_CR1","volume-title":"Neuro-Dynamic Programming","author":"D. P. Bertsekas","year":"1996","unstructured":"Bertsekas, D. P., Tsitsiklis, J. N.: Neuro-Dynamic Programming. Belmont, MA: Athena Scientific (1996)"},{"key":"33_CR2","volume-title":"Empirical Methods for Artificial Intelligence","author":"P. R. Cohen","year":"1995","unstructured":"Cohen, P. R.: Empirical Methods for Artificial Intelligence. Cambridge, MA: The MIT Press (1995)"},{"issue":"1","key":"33_CR3","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1016\/0004-3702(94)00086-G","volume":"76","author":"T. Dean","year":"1995","unstructured":"Dean, T., Kaelbling, L., Kirman, J., Nicholson, A.: Planning under Time Constraints in Stochastic Domains. Artificial Intelligence 76(1\u20132) (1995) 35\u201374","journal-title":"Artificial Intelligence"},{"key":"33_CR4","unstructured":"Dearden, R., Friedman, N., Andre, D.: Model-Based Bayesian Exploration. In Uncertainty in Artificial Intelligence: Proceedings of the Fifteenth Conference (UAI-1999) 150\u2013159"},{"key":"33_CR5","first-page":"1040","volume":"13","author":"J. G. Gordon","year":"2001","unstructured":"Gordon, J. G.: Reinforcement Learning with Function Approximation Converges to a Region. Advances in Neural Information Processing Systems 13 (2001) 1040\u20131046","journal-title":"Advances in Neural Information Processing Systems"},{"key":"33_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/0004-3702(95)00044-5","volume":"81","author":"T. Hogg","year":"1996","unstructured":"Hogg, T., Huberman, B. A., Williams, C. P.: Phase Transitions and the Search Problem (Editorial). Artificial Intelligence, 81 (1996) 1\u201316","journal-title":"Artificial Intelligence"},{"key":"33_CR7","doi-asserted-by":"publisher","first-page":"421","DOI":"10.1023\/A:1006350622830","volume":"24","author":"H. H. Hoos","year":"2000","unstructured":"Hoos, H. H., Stutzle, T.: Local Search Algorithms for SAT: An Empirical Evaluation. Journal of Automated Reasoning, 24 (2000) 421\u2013481.","journal-title":"Journal of Automated Reasoning"},{"key":"33_CR8","unstructured":"Kearns, M., Singh, S.: Near-Optimal Reinforcement Learning in Polynomial Time. In Proceedings of the 15th International Conference on Machine Learning (1998) 260\u2013268"},{"key":"33_CR9","unstructured":"Kirman, J.: Predicting Real-Time Planner Performance by Domain Characterization. Ph.D. Thesis, Brown University (1995)"},{"key":"33_CR10","unstructured":"Lagoudakis, M., Littman, M. L.: Algorithm Selection using Reinforcement Learning Proceedings of the 17th International Conference on Machine Learning (2000) 511\u2013518"},{"issue":"2","key":"33_CR11","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1023\/A:1007541107674","volume":"35","author":"N. Meuleau","year":"1999","unstructured":"Meuleau, N., Bourgine, P.: Exploration of Multi-State Environments: Local Measures and Back-Propagation of Uncertainty. Machine Learning 35(2) (1999) 117\u2013154","journal-title":"Machine Learning"},{"key":"33_CR12","first-page":"103","volume":"13","author":"A. W. Moore","year":"1993","unstructured":"Moore, A. W., Atkeson, C. G.: Prioritized Sweeping: Reinforcement Learning with Less Data and Less Time. Machine Learning, 13 (1993) 103\u2013130","journal-title":"Machine Learning"},{"key":"33_CR13","unstructured":"Papadimitriou, C. H., Steiglitz, K: Combinatorial Optimization: Algorithms and Complexity. Prentice Hall (1982)"},{"issue":"3","key":"33_CR14","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1287\/moor.12.3.441","volume":"12","author":"C. H. Papadimitriou","year":"1987","unstructured":"Papadimitriou, C. H., Tsitsiklis, J. N.: The Complexity of Markov Chain Decision Processes. Mathematics of Operations Research 12(3) (1987) 441\u2013450","journal-title":"Mathematics of Operations Research"},{"key":"33_CR15","doi-asserted-by":"crossref","unstructured":"Puterman, M. L.: Markov Decision Processes: Discrete Stochastic Dynamic Programming. Wiley (1994)","DOI":"10.1002\/9780470316887"},{"key":"33_CR16","first-page":"361","volume":"7","author":"S. P. Singh","year":"1995","unstructured":"Singh, S. P., Jaakkola, T., Jordan, M. I.: Reinforcement Learning with Soft State Aggregation. Advances in Neural Information Processing Systems, 7 (1995) 361\u2013368","journal-title":"Advances in Neural Information Processing Systems"},{"key":"33_CR17","volume-title":"Reinforcement Learning. An Introduction","author":"R. S. Sutton","year":"1998","unstructured":"Sutton, R. S., Barto, A. G.: Reinforcement Learning. An Introduction. Cambridge, MA: The MIT Press (1998)"}],"container-title":["Lecture Notes in Computer Science","Machine Learning: ECML 2002"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-36755-1_33","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,2,25]],"date-time":"2019-02-25T07:13:11Z","timestamp":1551078791000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-36755-1_33"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2002]]},"ISBN":["9783540440369","9783540367550"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/3-540-36755-1_33","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2002]]}}}