{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T00:16:59Z","timestamp":1743034619536,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":15,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642041792"},{"type":"electronic","value":"9783642041808"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-04180-8_64","type":"book-chapter","created":{"date-parts":[[2009,8,27]],"date-time":"2009-08-27T08:11:20Z","timestamp":1251360680000},"page":"721-735","source":"Crossref","is-referenced-by-count":0,"title":["Considering Unseen States as Impossible in Factored Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Olga","family":"Kozlova","sequence":"first","affiliation":[]},{"given":"Olivier","family":"Sigaud","sequence":"additional","affiliation":[]},{"given":"Pierre-Henri","family":"Wuillemin","sequence":"additional","affiliation":[]},{"given":"Christophe","family":"Meyer","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"64_CR1","unstructured":"Boutilier, C.: Correlated action effects in decision theoretic regression. In: Proceedings of the 13th International Conference on Uncertainty in Artificial Intelligence, pp. 30\u201337. AUAI Press (1997)"},{"key":"64_CR2","unstructured":"Boutilier, C., Dearden, R., Goldszmidt, M.: Exploiting structure in policy construction. In: Proceedings of the 14th International Joint Conference on Artificial Intelligence, Montreal, pp. 1104\u20131111 (1995)"},{"key":"64_CR3","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/S0004-3702(00)00033-3","volume":"121","author":"C. Boutilier","year":"2000","unstructured":"Boutilier, C., Dearden, R., Goldszmidt, M.: Stochastic dynamic programming with factored representations. Artificial Intelligence\u00a0121, 49\u2013100 (2000)","journal-title":"Artificial Intelligence"},{"key":"64_CR4","doi-asserted-by":"publisher","first-page":"427","DOI":"10.1023\/A:1021330114221","volume":"1","author":"M.V. Butz","year":"2002","unstructured":"Butz, M.V., Goldberg, D.E., Stolzmann, W.: The Anticipatory Classifier System and Genetic Generalization. Natural Computing\u00a01, 427\u2013467 (2002)","journal-title":"Natural Computing"},{"key":"64_CR5","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1111\/j.1467-8640.1989.tb00324.x","volume":"5","author":"T. Dean","year":"1989","unstructured":"Dean, T., Kanazawa, K.: A model for reasoning about persistence and causation. Computational Intelligence\u00a05, 142\u2013150 (1989)","journal-title":"Computational Intelligence"},{"key":"64_CR6","first-page":"122","volume-title":"Proceedings of the 22nd International Conference on Uncertainty in Artificial Intelligence","author":"T. Degris","year":"2006","unstructured":"Degris, T., Sigaud, O., Wuillemin, P.-H.: Chi-square tests driven method for learning the structure of factored MDPs. In: Proceedings of the 22nd International Conference on Uncertainty in Artificial Intelligence, Massachusetts Institute of Technology, pp. 122\u2013129. AUAI Press, Cambridge (2006a)"},{"key":"64_CR7","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1145\/1143844.1143877","volume-title":"Proceedings of the 23rd International Conference on Machine Learning","author":"T. Degris","year":"2006","unstructured":"Degris, T., Sigaud, O., Wuillemin, P.-H.: Learning the structure of factored markov decision processes in reinforcement learning problems. In: Proceedings of the 23rd International Conference on Machine Learning, pp. 257\u2013264. ACM Press, Pittsburgh (2006b)"},{"key":"64_CR8","doi-asserted-by":"crossref","first-page":"399","DOI":"10.1613\/jair.1000","volume":"19","author":"C. Guestrin","year":"2003","unstructured":"Guestrin, C., Koller, D., Parr, R., Venkataraman, S.: Efficient Solution Algorithms for Factored MDPs. Journal of Artificial Intelligence Research\u00a019, 399\u2013468 (2003)","journal-title":"Journal of Artificial Intelligence Research"},{"key":"64_CR9","unstructured":"Hoey, J., St-Aubin, R., Hu, A., Boutilier, C.: SPUDD: Stochastic planning using decision diagrams. In: Proceedings of the 15th Conference on International Conference on Uncertainty in Artificial Intelligence, Stockholm, pp. 279\u2013288 (1999)"},{"key":"64_CR10","series-title":"LNAI","volume-title":"ABiALS 2008","author":"O. Sigaud","year":"2009","unstructured":"Sigaud, O., Butz, M.V., Kozlova, O., Meyer, C.: Anticipatory Learning Classifier Systems and Factored Reinforcement Learning. In: ABiALS 2008. LNCS (LNAI), vol.\u00a05499, Springer. Heidelberg (2009)"},{"key":"64_CR11","doi-asserted-by":"publisher","first-page":"1065","DOI":"10.1007\/s00500-007-0164-0","volume":"11","author":"O. Sigaud","year":"2007","unstructured":"Sigaud, O., Wilson, S.W.: Learning Classifier Systems: a survey. Journal of Soft Computing\u00a011, 1065\u20131078 (2007)","journal-title":"Journal of Soft Computing"},{"key":"64_CR12","doi-asserted-by":"crossref","unstructured":"Sutton, R.S.: DYNA, an integrated architecture for learning, planning and reacting. In: Working Notes of the AAAI Spring Symposium on Integrated Intelligent Architectures (1991)","DOI":"10.1145\/122344.122377"},{"key":"64_CR13","volume-title":"Reinforcement learning: An introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement learning: An introduction. MIT Press, Cambridge (1998)"},{"key":"64_CR14","doi-asserted-by":"publisher","first-page":"1048","DOI":"10.1145\/1390156.1390288","volume-title":"ICML 2008: Proceedings of the 25th international conference on Machine learning","author":"I. Szita","year":"2008","unstructured":"Szita, I., L\u0151rincz, A.: The many faces of optimism: a unifying approach. In: ICML 2008: Proceedings of the 25th international conference on Machine learning, pp. 1048\u20131055. ACM Press, New York (2008)"},{"key":"64_CR15","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1023\/A:1022699900025","volume":"4","author":"P.E. Utgoff","year":"1989","unstructured":"Utgoff, P.E.: Incremental induction of decision trees. Machine Learning\u00a04, 161\u2013186 (1989)","journal-title":"Machine Learning"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-04180-8_64","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,10]],"date-time":"2021-10-10T03:23:42Z","timestamp":1633836222000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-04180-8_64"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642041792","9783642041808"],"references-count":15,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-04180-8_64","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}