{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T02:38:49Z","timestamp":1776220729706,"version":"3.50.1"},"reference-count":7,"publisher":"Elsevier","isbn-type":[{"value":"9781558602007","type":"print"}],"license":[{"start":{"date-parts":[[1991,1,1]],"date-time":"1991-01-01T00:00:00Z","timestamp":662688000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[1991,1,1]],"date-time":"1991-01-01T00:00:00Z","timestamp":662688000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"}],"funder":[{"DOI":"10.13039\/100000104","name":"National Aeronautics and Space Administration","doi-asserted-by":"publisher","award":["NAGW-1175"],"award-info":[{"award-number":["NAGW-1175"]}],"id":[{"id":"10.13039\/100000104","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1991]]},"DOI":"10.1016\/b978-1-55860-200-7.50067-2","type":"book-chapter","created":{"date-parts":[[2014,6,30]],"date-time":"2014-06-30T06:11:49Z","timestamp":1404108709000},"page":"323-327","source":"Crossref","is-referenced-by-count":12,"title":["Self-improvement Based On Reinforcement Learning, Planning and Teaching"],"prefix":"10.1016","author":[{"given":"Long-Ji","family":"Lin","sequence":"first","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib1","doi-asserted-by":"crossref","unstructured":"Lin, Long-Ji. Self-improving Reactive Agents: Case Studies of Reinforcement Learning Frameworks. In Proceedings of the First International Conference on Simulation of Adaptive Behavior: From Animals to Animats, 297\u2013305. Also Tech. Report CMU-CS-90\u2013109, Carnegie Mellon University.","DOI":"10.7551\/mitpress\/3115.003.0041"},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib2","unstructured":"Lin, Long-Ji. Programming Robots Using Reinforcement Learning and Teaching. In Proceedings of AAAI-91."},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib3","unstructured":"Pomerleau, D.A. ALVINN: An Autonomous Land Vehicle in a Neural Network. Tech Report CMU-CS-89\u2013107, Carnegie Mellon University."},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib4","unstructured":"Sutton, R.S. Temporal Credit Assignment in Reinforcement Learning. Ph.D. diss., Dept. of Computer and Information Science, University of Massachusetts."},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib5","doi-asserted-by":"crossref","unstructured":"Sutton, R.S. Learning to predict by the methods of temporal differences. In Machine Learning, 3:9\u201344.","DOI":"10.1023\/A:1022633531479"},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib6","doi-asserted-by":"crossref","unstructured":"Sutton, R.S. Integrated architectures for learning, planning, and reacting based on approximating dynamic programming. In Proceedings of the Seventh International Conference on Machine Learning, 216\u2013224.","DOI":"10.1016\/B978-1-55860-141-3.50030-4"},{"key":"10.1016\/B978-1-55860-200-7.50067-2_bib7","unstructured":"Watkins, C.J.C.H. Learning with Delayed Rewards. Ph.D. diss., Psychology Department, Cambridge University."}],"container-title":["Machine Learning Proceedings 1991"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:B9781558602007500672?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:B9781558602007500672?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,11,13]],"date-time":"2025-11-13T10:03:05Z","timestamp":1763028185000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/B9781558602007500672"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1991]]},"ISBN":["9781558602007"],"references-count":7,"URL":"https:\/\/doi.org\/10.1016\/b978-1-55860-200-7.50067-2","relation":{},"subject":[],"published":{"date-parts":[[1991]]}}}