{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,16]],"date-time":"2026-01-16T10:14:49Z","timestamp":1768558489270,"version":"3.49.0"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"3-4","license":[{"start":{"date-parts":[[1992,5,1]],"date-time":"1992-05-01T00:00:00Z","timestamp":704678400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[1992,5]]},"DOI":"10.1007\/bf00992700","type":"journal-article","created":{"date-parts":[[2005,1,9]],"date-time":"2005-01-09T16:35:16Z","timestamp":1105288516000},"page":"323-339","source":"Crossref","is-referenced-by-count":123,"title":["Transfer of learning by composing solutions of elemental sequential tasks"],"prefix":"10.1007","volume":"8","author":[{"given":"Satinder Pal","family":"Singh","sequence":"first","affiliation":[]}],"member":"297","reference":[{"key":"CR1","series-title":"Technical Report","volume-title":"Real-time learning and control using asynchronous dynamic programming","author":"A.G. Barto","year":"1991","unstructured":"Barto, A.G., Bradtke, S.J., & Singh, S.P. (1991).Real-time learning and control using asynchronous dynamic programming. (Technical Report 91-57). Amherst, MA: University of Massachusetts, COINS Dept."},{"key":"CR2","volume-title":"Proceedings of the 1990 Connectionist Models Summer School","author":"A.G. Barto","year":"1990","unstructured":"Barto, A.G. & Singh, S.P. (1990). On the computational economics of reinforcement learning.Proceedings of the 1990 Connectionist Models Summer School. San Mateo, CA: Morgan Kaufmann."},{"key":"CR3","first-page":"835","volume":"13","author":"A.G. Barto","year":"1983","unstructured":"Barto, A.G., Sutton, R.S., & Anderson, C.W. (1983). Neuronlike elements that can solve difficult learning control problems.IEEE SMC, 13, 835?846.","journal-title":"IEEE SMC"},{"key":"CR4","volume-title":"Advances in neural information processing systems 2","author":"A.G. Barto","year":"1990","unstructured":"Barto, A.G., Sutton, R.S., & Watkins, C.J.C.H. (1990). Sequential decision problems and neural networks. In D.S. Touretzky, (Ed.),Advances in neural information processing systems 2, San Mateo, CA: Morgan Kaufmann."},{"key":"CR5","volume-title":"Dynamic programming: Deterministic and stochastic models","author":"D.P. Bertsekas","year":"1987","unstructured":"Bertsekas, D.P. (1987).Dynamic programming: Deterministic and stochastic models. Englewood Cliffs, NJ: Prentice-Hall."},{"key":"CR6","doi-asserted-by":"crossref","first-page":"253","DOI":"10.1162\/neco.1989.1.2.253","volume":"1","author":"R. Brooks","year":"1989","unstructured":"Brooks, R. (1989). A robot that walks: Emergent behaviors from a carefully evolved network.Neural Computation, 1, 253?262.","journal-title":"Neural Computation"},{"key":"CR7","volume-title":"Pattern classification and scene analysis","author":"R.O. Duda","year":"1973","unstructured":"Duda, R.O. & Hart, P.E. (1973).Pattern classification and scene analysis. New York: Wiley."},{"key":"CR8","first-page":"285","volume":"3","author":"G.A. Iba","year":"1989","unstructured":"Iba, G.A. (1989). A heuristic approach to the discovery of macro-operators.Machine Learning, 3, 285?317.","journal-title":"Machine Learning"},{"key":"CR9","volume-title":"Task decomposition through competition in a modular connectionist architecture","author":"R.A. Jacobs","year":"1990","unstructured":"Jacobs, R.A. (1990).Task decomposition through competition in a modular connectionist architecture. Ph.D. Thesis, COINS Dept., Univ. of Massachusetts, Amherst, Mass."},{"key":"CR10","unstructured":"Jacobs, R.A. & Jordan, M.I. (1991). A competitive modular connectionist architecture.Advances in neural information processing systems, 3."},{"key":"CR11","doi-asserted-by":"crossref","unstructured":"Jacobs, R.A., Jordan, M.I., Nowlan, S.J., & Hinton, G.E. (1991). Adaptive mixtures of local experts.Neural Computation, 3.","DOI":"10.1162\/neco.1991.3.1.79"},{"key":"CR12","series-title":"Technical Report","volume-title":"Learning in embedded systems","author":"L.P. Kaelbling","year":"1990","unstructured":"Kaelbling, L.P. (1990).Learning in embedded systems. Ph.D. Thesis, Stanford University, Department of Computer Science, Stanford CA. Technical Report TR-90-04."},{"key":"CR13","first-page":"35","volume":"26","author":"R.E. Korf","year":"1985","unstructured":"Korf, R.E. (1985). Macro-operators: A weak method for learning.Artificial Learning, 26, 35?77.","journal-title":"Artificial Learning"},{"key":"CR14","unstructured":"Maes, P. & Brooks, R. (1990). Learning to coordinate behaviours.Proceedings of the Eighth AAAI (pp. 796?802). Morgan Kaufmann."},{"key":"CR15","series-title":"Technical Report","volume-title":"Automatic programming of behavior-based robots using reinforcement learning","author":"S. Mahadevan","year":"1990","unstructured":"Mahadevan, S. & Connell, J. (1990). Automatic programming of behavior-based robots using reinforcement learning. (Technical Report) Yorktown Heights, NY: IBM Research Division, T.J. Watson Research Center."},{"key":"CR16","series-title":"Technical Report","volume-title":"Competing experts: An experimental investigation of associative mixture models","author":"S.J. Nowlan","year":"1990","unstructured":"Nowlan, S.J. (1990). Competing experts: An experimental investigation of associative mixture models. (Technical Report CRG-TR-90-5). Toronto, Canada: Univ. of Toronto, Department of Computer Science."},{"key":"CR17","volume-title":"Introduction to stochastic dynamic programming","author":"S. Ross","year":"1983","unstructured":"Ross, S. (1983).Introduction to stochastic dynamic programming. New York: Academic Press."},{"key":"CR18","volume-title":"Advances in neural information processing systems 4","author":"S.P. Singh","year":"1992","unstructured":"Singh, S.P. (1992a). On the efficient learning of multiple sequential tasks. In J. Moody, S.J. Hanson, & R.P. Lippman, (Eds.),Advances in neural information processing systems 4, San Mateo, CA: Morgan Kaufmann."},{"key":"CR19","unstructured":"Singh, S.P. (1992b). Solving multiple sequential tasks using a hierarchy of variable temporal resolution models. Submitted to Machine Learning Conference, 1992."},{"key":"CR20","volume-title":"The behavior of organisms: An experimental analysis","author":"B.F. Skinner","year":"1938","unstructured":"Skinner, B.F. (1938).The behavior of organisms: An experimental analysis. New York: D. Appleton Century."},{"key":"CR21","first-page":"9","volume":"3","author":"R.S. Sutton","year":"1988","unstructured":"Sutton, R.S. (1988). Learning to predict by the methods of temporal differences.Machine Learning, 3, 9?44.","journal-title":"Machine Learning"},{"key":"CR22","first-page":"216","volume-title":"Proceedings of the Seventh International Workshop on Machine Learning","author":"R.S. Sutton","year":"1990","unstructured":"Sutton, R.S. (1990). Integrating architectures for learning, planning, and reacting based on approximating dynamic programming.Proceedings of the Seventh International Workshop on Machine Learning (pp. 216?224). San Mateo, CA: Morgan Kaufmann"},{"key":"CR23","volume-title":"Learning from delayed rewards","author":"C.J.C.H. Watkins","year":"1989","unstructured":"Watkins, C.J.C.H. (1989).Learning from delayed rewards. Ph.D. Thesis, Cambridge Univ., Cambridge, England."},{"key":"CR24","first-page":"279","volume":"8","author":"C.J.C.H. Watkins","year":"1992","unstructured":"Watkins, C.J.C.H. & Dayan, P. (1992). Q-learning.Machine Learning, 8, 279?292.","journal-title":"Machine Learning"},{"key":"CR25","doi-asserted-by":"crossref","unstructured":"Whitehead, S.D. & Ballard, D.H. (1990). Active perception and reinforcement learning.Proceedings of the Seventh International Conference on Machine Learning. Austin, TX.","DOI":"10.1016\/B978-1-55860-141-3.50025-0"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/BF00992700.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/BF00992700\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/BF00992700","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,4,29]],"date-time":"2019-04-29T22:58:34Z","timestamp":1556578714000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/BF00992700"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1992,5]]},"references-count":25,"journal-issue":{"issue":"3-4","published-print":{"date-parts":[[1992,5]]}},"alternative-id":["BF00992700"],"URL":"https:\/\/doi.org\/10.1007\/bf00992700","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[1992,5]]}}}