{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T19:49:12Z","timestamp":1725565752283},"publisher-location":"Berlin, Heidelberg","reference-count":15,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642151927"},{"type":"electronic","value":"9783642151934"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2010]]},"DOI":"10.1007\/978-3-642-15193-4_46","type":"book-chapter","created":{"date-parts":[[2010,9,15]],"date-time":"2010-09-15T08:34:37Z","timestamp":1284539677000},"page":"489-500","source":"Crossref","is-referenced-by-count":1,"title":["TeXDYNA: Hierarchical Reinforcement Learning in Factored MDPs"],"prefix":"10.1007","author":[{"given":"Olga","family":"Kozlova","sequence":"first","affiliation":[]},{"given":"Olivier","family":"Sigaud","sequence":"additional","affiliation":[]},{"given":"Christophe","family":"Meyer","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"46_CR1","volume-title":"Reinforcement Learning: An Introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"key":"46_CR2","unstructured":"Boutilier, C., Dearden, R., Goldszmidt, M.: Exploiting structure in policy construction. In: Proceedings of the 14th International Joint Conference on Artificial Intelligence, pp. 1104\u20131111 (1995)"},{"key":"46_CR3","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1023\/A:1022140919877","volume":"13","author":"A. Barto","year":"2003","unstructured":"Barto, A., Mahadevan, S.: Recent advances in hierarchical reinforcement learning. Discrete Event Systems Journal\u00a013, 41\u201377 (2003)","journal-title":"Discrete Event Systems Journal"},{"key":"46_CR4","unstructured":"Hengst, B.: Discovering hierarchy in reinforcement learning with HEXQ. In: Proceedings of the 19th International Conference on Machine Learning, pp. 243\u2013250 (2002)"},{"key":"46_CR5","first-page":"2259","volume":"7","author":"A. Jonsson","year":"2006","unstructured":"Jonsson, A., Barto, A.: Causal graph based decomposition of factored MDPs. Journal of Machine Learning Research\u00a07, 2259\u20132301 (2006)","journal-title":"Journal of Machine Learning Research"},{"key":"46_CR6","first-page":"257","volume-title":"Proceedings of the 23rd International Conference on Machine Learning, Pittsburgh, Pennsylvania","author":"T. Degris","year":"2006","unstructured":"Degris, T., Sigaud, O., Wuillemin, P.H.: Learning the structure of factored markov decision processes in reinforcement learning problems. In: Proceedings of the 23rd International Conference on Machine Learning, Pittsburgh, Pennsylvania, pp. 257\u2013264. ACM, New York (2006)"},{"issue":"1-2","key":"46_CR7","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/S0004-3702(00)00033-3","volume":"121","author":"C. Boutilier","year":"2000","unstructured":"Boutilier, C., Dearden, R., Goldszmidt, M.: Stochastic dynamic programming with factored representations. Artificial Intelligence\u00a0121(1-2), 49\u2013107 (2000)","journal-title":"Artificial Intelligence"},{"key":"46_CR8","doi-asserted-by":"crossref","unstructured":"Sutton, R.S.: DYNA, an integrated architecture for learning, planning and reacting. In: Working Notes of the AAAI Spring Symposium on Integrated Intelligent Architectures (1991)","DOI":"10.1145\/122344.122377"},{"key":"46_CR9","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1016\/S0004-3702(99)00052-1","volume":"112","author":"R. Sutton","year":"1999","unstructured":"Sutton, R., Precup, D., Singh, S.: Between MDPs and semi-MDPs: A framework for temporal abstraction in reinforcement learning. Artificial Intelligence\u00a0112, 181\u2013211 (1999)","journal-title":"Artificial Intelligence"},{"key":"46_CR10","doi-asserted-by":"crossref","unstructured":"Jonsson, A.: A causal approach to hierarchical decomposition in reinforcement learning. PhD thesis, University of Massachusetts Amherst (2006)","DOI":"10.1145\/1102351.1102402"},{"key":"46_CR11","unstructured":"Vigorito, C.M., Barto, A.G.: Autonomous Hierarchical Skill Acquisition in Factored MDPs. In: Yale Workshop on Adaptive and Learning Systems, New Haven, Connecticut (2008)"},{"key":"46_CR12","unstructured":"Vigorito, C., Barto, A.: Hierarchical Representations of Behavior for Efficient Creative Search. In: AAAI Spring Symposium on Creative Intelligent Systems, Palo Alto, CA (2008)"},{"key":"46_CR13","first-page":"1281","volume":"18","author":"S. Singh","year":"2004","unstructured":"Singh, S., Barto, A., Chentanez, N.: Intrinsically motivated reinforcement learning. Advances in Neural Information Processing Systems\u00a018, 1281\u20131288 (2004)","journal-title":"Advances in Neural Information Processing Systems"},{"key":"46_CR14","doi-asserted-by":"publisher","first-page":"1048","DOI":"10.1145\/1390156.1390288","volume-title":"Proceedings of the 25th International Conference on Machine Learning","author":"I. Szita","year":"2008","unstructured":"Szita, I., L\u00f6rincz, A.: The many faces of optimism: a unifying approach. In: Proceedings of the 25th International Conference on Machine Learning, pp. 1048\u20131055. ACM, New York (2008)"},{"key":"46_CR15","doi-asserted-by":"crossref","unstructured":"Oudeyer, P.Y., Kaplan, F., Hafner, V.: Intrinsic motivation systems for autonomous mental development. IEEE Transactions on Evolutionary Computation\u00a011 (2007)","DOI":"10.1109\/TEVC.2006.890271"}],"container-title":["Lecture Notes in Computer Science","From Animals to Animats 11"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-15193-4_46.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,24]],"date-time":"2020-11-24T03:02:19Z","timestamp":1606186939000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-15193-4_46"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010]]},"ISBN":["9783642151927","9783642151934"],"references-count":15,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-15193-4_46","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2010]]}}}