{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T16:15:54Z","timestamp":1774455354083,"version":"3.50.1"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030275433","type":"print"},{"value":"9783030275440","type":"electronic"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-27544-0_7","type":"book-chapter","created":{"date-parts":[[2019,8,5]],"date-time":"2019-08-05T23:06:44Z","timestamp":1565046404000},"page":"83-95","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Learning Skills for Small Size League RoboCup"],"prefix":"10.1007","author":[{"given":"Devin","family":"Schwab","sequence":"first","affiliation":[]},{"given":"Yifeng","family":"Zhu","sequence":"additional","affiliation":[]},{"given":"Manuela","family":"Veloso","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,8,4]]},"reference":[{"key":"7_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"346","DOI":"10.1007\/3-540-48422-1_28","volume-title":"RoboCup-98: Robot Soccer World Cup II","author":"D Andre","year":"1999","unstructured":"Andre, D., Teller, A.: Evolving team Darwin united. In: Asada, M., Kitano, H. (eds.) RoboCup 1998. LNCS, vol. 1604, pp. 346\u2013351. Springer, Heidelberg (1999). https:\/\/doi.org\/10.1007\/3-540-48422-1_28"},{"key":"7_CR2","unstructured":"Ba, J.L., Kiros, J.R., Hinton, G.E.: Layer normalization. arXiv preprint arXiv:1607.06450 (2016)"},{"key":"7_CR3","first-page":"33","volume":"219","author":"B Browning","year":"2005","unstructured":"Browning, B., Bruce, J., Bowling, M., Veloso, M.: STP: skills, tactics and plays for multi-robot control in adversarial environments. J. Syst. Control Eng. 219, 33\u201352 (2005). The 2005 Professional Engineering Publishing Award","journal-title":"J. Syst. Control Eng."},{"key":"7_CR4","doi-asserted-by":"publisher","first-page":"866","DOI":"10.1016\/j.robot.2010.03.007","volume":"58","author":"F Fernandez","year":"2009","unstructured":"Fernandez, F., Garcia, J., Veloso, M.: Probabilistic policy reuse for inter-task transfer learning. Robot. Auton. Syst. 58, 866\u2013871 (2009). Special Issue on Advances in Autonomous Robots for Service and Entertainment","journal-title":"Robot. Auton. Syst."},{"key":"7_CR5","unstructured":"Hausknecht, M., Chen, Y., Stone, P.: Deep imitation learning for parameterized action spaces. In: AAMAS Adaptive Learning Agents (ALA) Workshop, May 2016"},{"key":"7_CR6","unstructured":"Hausknecht, M., Stone, P.: Deep reinforcement learning in parameterized action space. In: Proceedings of the International Conference on Learning Representations (ICLR), May 2016"},{"key":"7_CR7","unstructured":"Heess, N., et al.: Emergence of locomotion behaviours in rich environments. CoRR (2017). http:\/\/arxiv.org\/abs\/1707.02286v2"},{"key":"7_CR8","unstructured":"Hsu, W.H., Gustafson, S.M.: Genetic programming and multi-agent layered learning by reinforcements. In: GECCO, pp. 764\u2013771 (2002)"},{"issue":"5","key":"7_CR9","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1177\/02783640122067453","volume":"20","author":"SM LaValle","year":"2001","unstructured":"LaValle, S.M., Kuffner Jr., J.J.: Randomized kinodynamic planning. Int. J. Robot. Res. 20(5), 378\u2013400 (2001)","journal-title":"Int. J. Robot. Res."},{"key":"7_CR10","unstructured":"Lillicrap, T.P., et al.: Continuous control with deep reinforcement learning. In: Internal Conference on Learning Representations (2016). http:\/\/arxiv.org\/abs\/1509.02971v5"},{"key":"7_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"398","DOI":"10.1007\/3-540-64473-3_76","volume-title":"RoboCup-97: Robot Soccer World Cup I","author":"S Luke","year":"1998","unstructured":"Luke, S., Hohn, C., Farris, J., Jackson, G., Hendler, J.: Co-evolving soccer softbot team coordination with genetic programming. In: Kitano, H. (ed.) RoboCup 1997. LNCS, vol. 1395, pp. 398\u2013411. Springer, Heidelberg (1998). https:\/\/doi.org\/10.1007\/3-540-64473-3_76"},{"key":"7_CR12","unstructured":"Mnih, V., et al.: Asynchronous methods for deep reinforcement learning (2016). http:\/\/arxiv.org\/abs\/1602.01783v2"},{"key":"7_CR13","unstructured":"Mnih, V., et al.: Playing atari with deep reinforcement learning (2013). http:\/\/arxiv.org\/abs\/1312.5602v1"},{"issue":"7540","key":"7_CR14","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih, V., et al.: Human-level control through deep reinforcement learning. Nature 518(7540), 529\u2013533 (2015)","journal-title":"Nature"},{"key":"7_CR15","unstructured":"Schulman, J., Levine, S., Moritz, P., Jordan, M.I., Abbeel, P.: Trust region policy optimization. CoRR, abs\/1502.05477 (2015)"},{"key":"7_CR16","unstructured":"Schulman, J., Wolski, F., Dhariwal, P., Radford, A., Klimov, O.: Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347 (2017)"},{"issue":"7587","key":"7_CR17","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1038\/nature16961","volume":"529","author":"D Silver","year":"2016","unstructured":"Silver, D., et al.: Mastering the game of go with deep neural networks and tree search. Nature 529(7587), 484\u2013489 (2016). https:\/\/doi.org\/10.1038\/nature16961","journal-title":"Nature"},{"issue":"7676","key":"7_CR18","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1038\/nature24270","volume":"550","author":"D Silver","year":"2017","unstructured":"Silver, D., et al.: Mastering the game of go without human knowledge. Nature 550(7676), 354 (2017)","journal-title":"Nature"},{"key":"7_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"212","DOI":"10.1007\/3-540-45622-8_16","volume-title":"Abstraction, Reformulation, and Approximation","author":"M Stolle","year":"2002","unstructured":"Stolle, M., Precup, D.: Learning options in reinforcement learning. In: Koenig, S., Holte, R.C. (eds.) SARA 2002. LNCS, vol. 2371, pp. 212\u2013223. Springer, Heidelberg (2002). https:\/\/doi.org\/10.1007\/3-540-45622-8_16"},{"key":"7_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1007\/11780519_9","volume-title":"RoboCup 2005: Robot Soccer World Cup IX","author":"P Stone","year":"2006","unstructured":"Stone, P., Kuhlmann, G., Taylor, M.E., Liu, Y.: Keepaway soccer: from machine learning testbed to benchmark. In: Bredenfeld, A., Jacoff, A., Noda, I., Takahashi, Y. (eds.) RoboCup 2005. LNCS, vol. 4020, pp. 93\u2013105. Springer, Heidelberg (2006). https:\/\/doi.org\/10.1007\/11780519_9"},{"issue":"3","key":"7_CR21","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1177\/105971230501300301","volume":"13","author":"P Stone","year":"2005","unstructured":"Stone, P., Sutton, R.S., Kuhlmann, G.: Reinforcement learning for RoboCup soccer keepaway. Adapt. Behav. 13(3), 165\u2013188 (2005). https:\/\/doi.org\/10.1177\/105971230501300301","journal-title":"Adapt. Behav."},{"key":"7_CR22","unstructured":"The RoboCup Federation: RoboCup (2017). http:\/\/www.robocup.org\/"},{"key":"7_CR23","unstructured":"Uchibe, E.: Cooperative behavior acquisition by learning and evolution in a multi-agent environment for mobile robots. Ph.D. thesis. Osaka University (1999)"},{"key":"7_CR24","unstructured":"Vecerik, M., et al.: Leveraging demonstrations for deep reinforcement learning on robotics problems with sparse rewards. CoRR (2017). http:\/\/arxiv.org\/abs\/1707.08817"}],"container-title":["Lecture Notes in Computer Science","RoboCup 2018: Robot World Cup XXII"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-27544-0_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,6]],"date-time":"2023-08-06T00:02:36Z","timestamp":1691280156000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-27544-0_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030275433","9783030275440"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-27544-0_7","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"4 August 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"RoboCup","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Robot World Cup","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Montr\u00e9al, QC","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Canada","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18 June 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 June 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"robocup2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.robocup2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}