{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,11]],"date-time":"2026-04-11T13:06:31Z","timestamp":1775912791107,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":19,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783540292432","type":"print"},{"value":"9783540316923","type":"electronic"}],"license":[{"start":{"date-parts":[[2005,1,1]],"date-time":"2005-01-01T00:00:00Z","timestamp":1104537600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2005]]},"DOI":"10.1007\/11564096_40","type":"book-chapter","created":{"date-parts":[[2005,11,9]],"date-time":"2005-11-09T06:54:27Z","timestamp":1131519267000},"page":"412-424","source":"Crossref","is-referenced-by-count":38,"title":["Using Advice to Transfer Knowledge Acquired in One Reinforcement Learning Task to Another"],"prefix":"10.1007","author":[{"given":"Lisa","family":"Torrey","sequence":"first","affiliation":[]},{"given":"Trevor","family":"Walker","sequence":"additional","affiliation":[]},{"given":"Jude","family":"Shavlik","sequence":"additional","affiliation":[]},{"given":"Richard","family":"Maclin","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"40_CR1","unstructured":"Andre, D., Russell, S.: Programmable reinforcement learning agents. In: NIPS (2001)"},{"key":"40_CR2","doi-asserted-by":"crossref","unstructured":"Clouse, J., Utgoff, P.: A teaching method for reinforcement learning. In: Proc. ICML 1992 (1992)","DOI":"10.1016\/B978-1-55860-247-2.50017-6"},{"key":"40_CR3","first-page":"331","volume":"17","author":"D. Gordon","year":"1994","unstructured":"Gordon, D., Subramanian, D.: A multistrategy learning scheme for agent knowledge acquisition. Informatica\u00a017, 331\u2013346 (1994)","journal-title":"Informatica"},{"key":"40_CR4","unstructured":"Kuhlmann, G., Stone, P., Mooney, R., Shavlik, J.: Guiding a reinforcement learner with natural language advice: Initial results in RoboCup soccer. In: AAAI Workshop on Supervisory Control of Learning and Adaptive Systems (2004)"},{"key":"40_CR5","unstructured":"Laud, A., DeJong, G.: Reinforcement learning and shaping: Encouraging intended behaviors. In: ICML (2002)"},{"key":"40_CR6","first-page":"293","volume":"8","author":"L. Lin","year":"1992","unstructured":"Lin, L.: Self-improving reactive agents based on reinforcement learning, planning, and teaching. Machine Learning\u00a08, 293\u2013321 (1992)","journal-title":"Machine Learning"},{"key":"40_CR7","first-page":"251","volume":"22","author":"R. Maclin","year":"1996","unstructured":"Maclin, R., Shavlik, J.: Creating advice-taking reinforcement learners. Machine Learning\u00a022, 251\u2013281 (1996)","journal-title":"Machine Learning"},{"key":"40_CR8","unstructured":"Maclin, R., Shavlik, J., Torrey, L., Walker, T.: Knowledge-based support vector regression for reinforcement learning. In: IJCAI Workshop on Reasoning, Representation, and Learning in Computer Games (2005)"},{"key":"40_CR9","unstructured":"Maclin, R., Shavlik, J., Torrey, L., Walker, T., Wild, E.: Giving advice about preferred actions to reinforcement learners via knowledge-based kernel regression. In: AAAI (2005)"},{"key":"40_CR10","first-page":"1127","volume":"5","author":"O. Mangasarian","year":"2004","unstructured":"Mangasarian, O., Shavlik, J., Wild, E.: Knowledge-based kernel approximation. JMLR\u00a05, 1127\u20131141 (2004)","journal-title":"JMLR"},{"key":"40_CR11","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1080\/088395198117848","volume":"12","author":"I. Noda","year":"1998","unstructured":"Noda, I., Matsubara, H., Hiraki, K., Frank, I.: Soccer server: A tool for research on multiagent systems. Applied Artificial Intelligence\u00a012, 233\u2013250 (1998)","journal-title":"Applied Artificial Intelligence"},{"key":"40_CR12","unstructured":"Price, B., Boutilier, C.: Implicit imitation in multiagent reinforcement learning. In: ICML (1999)"},{"key":"40_CR13","unstructured":"Selfridge, O., Sutton, R., Barto, A.: Training and tracking in robotics. In: IJCAI (1985)"},{"key":"40_CR14","unstructured":"Sherstov, A., Stone, P.: Improving action selection in MDP\u2019s via knowledge transfer. In: AAAI (2005)"},{"issue":"3-4","key":"40_CR15","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1007\/BF00992700","volume":"8","author":"S. Singh","year":"1992","unstructured":"Singh, S.: Transfer of learning by composing solutions of elemental sequential tasks. Machine Learning\u00a08(3-4), 323\u2013339 (1992)","journal-title":"Machine Learning"},{"key":"40_CR16","unstructured":"Stone, P., Sutton, R.: Scaling reinforcement learning toward RoboCup soccer. In: ICML (2001)"},{"key":"40_CR17","volume-title":"Reinforcement Learning: An Introduction","author":"R. Sutton","year":"1998","unstructured":"Sutton, R., Barto, A.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"key":"40_CR18","doi-asserted-by":"crossref","unstructured":"Taylor, M., Stone, P.: Behavior transfer for value-function-based reinforcement learning. In: 4th Int. Joint Conf. on Autonomous Agents and Multiagent Sys. (2005)","DOI":"10.1145\/1082473.1082482"},{"key":"40_CR19","doi-asserted-by":"crossref","unstructured":"Thrun, S., Mitchell, T.: Learning one more thing. In: IJCAI (1995)","DOI":"10.21236\/ADA285342"}],"container-title":["Lecture Notes in Computer Science","Machine Learning: ECML 2005"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/11564096_40","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,19]],"date-time":"2019-05-19T16:42:03Z","timestamp":1558284123000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/11564096_40"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005]]},"ISBN":["9783540292432","9783540316923"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/11564096_40","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2005]]}}}