{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T05:04:12Z","timestamp":1725426252675},"reference-count":14,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2007,8]]},"DOI":"10.1109\/ijcnn.2007.4370979","type":"proceedings-article","created":{"date-parts":[[2007,11,6]],"date-time":"2007-11-06T20:35:49Z","timestamp":1194381349000},"page":"338-343","source":"Crossref","is-referenced-by-count":1,"title":["Optimality of LSTD and its Relation to MC"],"prefix":"10.1109","author":[{"given":"Steffen","family":"Grunewalder","sequence":"first","affiliation":[]},{"given":"Sepp","family":"Hochreiter","sequence":"additional","affiliation":[]},{"given":"Klaus","family":"Obermayer","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-585-33656-5_7"},{"journal-title":"Kendall's Advanced Theory of Statistics","year":"1991","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/BF00115009"},{"journal-title":"Reinforcement Learning An Introduction","year":"1998","author":"sutton","key":"ref13"},{"key":"ref14","article-title":"Q-learning","author":"chris","year":"1992","journal-title":"Machines Learning"},{"key":"ref4","article-title":"On the convergence of stochastic iterative dynamic programming algorithms","author":"tommi","year":"1994","journal-title":"Neural Computation"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1023\/A:1018056104778"},{"key":"ref6","article-title":"Bias-variance error bounds for temporal difference updates","author":"kearns","year":"2000","journal-title":"Conference on Computational Learning Theory"},{"journal-title":"Fundamentals of Statistical Signal Processing Estimation Theory","year":"1993","author":"kay","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/1015330.1015402"},{"key":"ref7","article-title":"Theory of PointEstimation","author":"leo lehmann","year":"1998","journal-title":"Springer Texts in Statistics"},{"key":"ref2","article-title":"Least-squares temporal difference learning","author":"boyan","year":"1999","journal-title":"International Conference Machine Learning"},{"journal-title":"Learning evaluation functions for global optimization","year":"1998","author":"boyan","key":"ref1"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007495401240"}],"event":{"name":"International Joint Conference on Neural Networks","start":{"date-parts":[[2007,8,12]]},"location":"Orlando, FL","end":{"date-parts":[[2007,8,17]]}},"container-title":["2007 International Joint Conference on Neural Networks"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/4370890\/4370891\/04370979.pdf?arnumber=4370979","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,17]],"date-time":"2020-04-17T06:55:34Z","timestamp":1587106534000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/4370979\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2007,8]]},"references-count":14,"URL":"https:\/\/doi.org\/10.1109\/ijcnn.2007.4370979","relation":{},"subject":[],"published":{"date-parts":[[2007,8]]}}}