{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T00:01:14Z","timestamp":1725494474279},"publisher-location":"Berlin, Heidelberg","reference-count":11,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540767183"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-76719-0_12","type":"book-chapter","created":{"date-parts":[[2007,11,12]],"date-time":"2007-11-12T14:38:05Z","timestamp":1194878285000},"page":"85-91","source":"Crossref","is-referenced-by-count":3,"title":["Convergence Analysis on Approximate Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Jinsong","family":"Leng","sequence":"first","affiliation":[]},{"given":"Lakhmi","family":"Jain","sequence":"additional","affiliation":[]},{"given":"Colin","family":"Fyfe","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"unstructured":"Teambots (2000), http:\/\/www.cs.cmu.edu\/~trb\/Teambots\/Domains\/SoccerBots","key":"12_CR1"},{"key":"12_CR2","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/0025-5564(71)90051-4","volume":"10","author":"J.S. Albus","year":"1971","unstructured":"Albus, J.S.: A Theory of Cerebellar Function. Mathematical Biosciences\u00a010, 25\u201361 (1971)","journal-title":"Mathematical Biosciences"},{"doi-asserted-by":"crossref","unstructured":"Bellman, R.: A Markovian Decision Process. Journal of Mathematics and Mechanics 6 (1957)","key":"12_CR3","DOI":"10.1512\/iumj.1957.6.56038"},{"key":"12_CR4","volume-title":"Dynamic Programming","author":"R. Bellman","year":"1957","unstructured":"Bellman, R.: Dynamic Programming. Princeton University Press, Princeton, NJ (1957)"},{"issue":"1","key":"12_CR5","first-page":"295","volume":"14","author":"P. Dayan","year":"1994","unstructured":"Dayan, P., Sejnowski, T.J.: TD(\u03bb) Converges with Probability 1. Machine Learning\u00a014(1), 295\u2013301 (1994)","journal-title":"Machine Learning"},{"key":"12_CR6","volume-title":"Dynamic Programming and Markov Processes","author":"R.A. Howard","year":"1960","unstructured":"Howard, R.A.: Dynamic Programming and Markov Processes. MIT Press, Cambridge (1960)"},{"key":"12_CR7","volume-title":"Journal of Multiagent and Grid systems","author":"J. Leng","year":"2008","unstructured":"Leng, J., Jain, L., Fyfe, C.: Simulation and Reinforcement Learning with Soccer Agents. In: Journal of Multiagent and Grid systems, vol.\u00a04(4), IOS Press, The Netherlands (to be published in 2008)"},{"key":"12_CR8","first-page":"9","volume":"3","author":"R.S. Sutton","year":"1988","unstructured":"Sutton, R.S.: Learning to Predict by the Method of Temporal Differences. Machine Learning\u00a03, 9\u201344 (1988)","journal-title":"Machine Learning"},{"key":"12_CR9","volume-title":"Reinforcement Learning: An Introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"unstructured":"Watkins, C.J.C.H.: Learning from Delayed Rewards. PhD thesis, Cambridge University, Cambridge, England (1989)","key":"12_CR10"},{"issue":"2","key":"12_CR11","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1017\/S0269888900008122","volume":"10","author":"M. Wooldridge","year":"1995","unstructured":"Wooldridge, M., Jennings, N.: Intelligent Agents: Theory and Practice. Knowledge Engineering Review\u00a010(2), 115\u2013152 (1995)","journal-title":"Knowledge Engineering Review"}],"container-title":["Lecture Notes in Computer Science","Knowledge Science, Engineering and Management"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-76719-0_12.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,27]],"date-time":"2021-04-27T11:00:32Z","timestamp":1619521232000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-76719-0_12"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540767183"],"references-count":11,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-76719-0_12","relation":{},"subject":[]}}