{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T09:36:29Z","timestamp":1742981789038,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":10,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642392498"},{"type":"electronic","value":"9783642392504"}],"license":[{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-39250-4_14","type":"book-chapter","created":{"date-parts":[[2013,6,9]],"date-time":"2013-06-09T22:21:00Z","timestamp":1370816460000},"page":"141-153","source":"Crossref","is-referenced-by-count":8,"title":["Towards a Principled Solution to Simulated Robot Soccer"],"prefix":"10.1007","author":[{"given":"Aijun","family":"Bai","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Feng","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoping","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"14_CR1","unstructured":"Bai, A., Wu, F., Chen, X.: Online planning for large MDPs with MAXQ decomposition (extended abstract). In: Proc. of 11th Int. Conf. on Autonomous Agents and Multiagent Systems, Valencia, Spain (June 2012)"},{"key":"14_CR2","unstructured":"Barry, J.: Fast Approximate Hierarchical Solution of MDPs. Ph.D. thesis, Massachusetts Institute of Technology (2009)"},{"key":"14_CR3","unstructured":"Barry, J., Kaelbling, L., Lozano-Perez, T.: Deth*: Approximate hierarchical solution of large markov decision processes. In: International Joint Conference on Artificial Intelligence, pp. 1928\u20131935 (2011)"},{"key":"14_CR4","doi-asserted-by":"crossref","unstructured":"Dietterich, T.G.: Hierarchical reinforcement learning with the MAXQ value function decomposition. Journal of Machine Learning Research 13(1), 63 (May 1999)","DOI":"10.1613\/jair.639"},{"key":"14_CR5","series-title":"LNAI","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1007\/978-3-642-20217-9_4","volume-title":"RoboCup 2010: Robot Soccer World Cup XIV","author":"T. Gabel","year":"2011","unstructured":"Gabel, T., Riedmiller, M.: On progress in roboCup: The simulation league showcase. In: Ruiz-del-Solar, J. (ed.) RoboCup 2010. LNCS (LNAI), vol.\u00a06556, pp. 36\u201347. Springer, Heidelberg (2011)"},{"key":"14_CR6","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1007\/978-3-540-74024-7_7","volume-title":"RoboCup 2006: Robot Soccer World Cup X","author":"S. Kalyanakrishnan","year":"2007","unstructured":"Kalyanakrishnan, S., Liu, Y., Stone, P.: Half field offense in roboCup soccer: A multiagent reinforcement learning case study. In: Lakemeyer, G., Sklar, E., Sorrenti, D.G., Takahashi, T. (eds.) RoboCup 2006. LNCS (LNAI), vol.\u00a04434, pp. 72\u201385. Springer, Heidelberg (2007)"},{"issue":"1","key":"14_CR7","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1007\/s10514-009-9120-4","volume":"27","author":"M. Riedmiller","year":"2009","unstructured":"Riedmiller, M., Gabel, T., Hafner, R., Lange, S.: Reinforcement learning for robot soccer. Autonomous Robots\u00a027(1), 55\u201373 (2009)","journal-title":"Autonomous Robots"},{"key":"14_CR8","doi-asserted-by":"crossref","unstructured":"Stone, P.: Layered learning in multiagent systems: A winning approach to robotic soccer. The MIT press (2000)","DOI":"10.7551\/mitpress\/4151.001.0001"},{"issue":"3","key":"14_CR9","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1177\/105971230501300301","volume":"13","author":"P. Stone","year":"2005","unstructured":"Stone, P., Sutton, R., Kuhlmann, G.: Reinforcement learning for robocup soccer keepaway. Adaptive Behavior\u00a013(3), 165\u2013188 (2005)","journal-title":"Adaptive Behavior"},{"issue":"1-2","key":"14_CR10","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1016\/S0004-3702(01)00069-8","volume":"128","author":"S. Thrun","year":"2001","unstructured":"Thrun, S., Fox, D., Burgard, W., Dellaert, F.: Robust monte carlo localization for mobile robots. Artificial Intelligence\u00a0128(1-2), 99\u2013141 (2001)","journal-title":"Artificial Intelligence"}],"container-title":["Lecture Notes in Computer Science","RoboCup 2012: Robot Soccer World Cup XVI"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-39250-4_14","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,19]],"date-time":"2019-05-19T21:45:51Z","timestamp":1558302351000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-39250-4_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642392498","9783642392504"],"references-count":10,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-39250-4_14","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2013]]}}}