{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T15:50:48Z","timestamp":1729612248714,"version":"3.28.0"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009,3]]},"DOI":"10.1109\/adprl.2009.4927519","type":"proceedings-article","created":{"date-parts":[[2009,5,19]],"date-time":"2009-05-19T19:50:44Z","timestamp":1242762644000},"page":"8-15","source":"Crossref","is-referenced-by-count":0,"title":["Efficient data reuse in value function approximation"],"prefix":"10.1109","author":[{"family":"Hirotaka Hachiya","sequence":"first","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"family":"Takayuki Akiyama","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Masashi","family":"Sugiyama","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Jan","family":"Peters","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]}],"member":"263","reference":[{"journal-title":"Reinforcement Learning An Introduction","year":"1998","author":"sutton","key":"17"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1109\/91.481841"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1016\/S0378-3758(00)00115-4"},{"key":"16","first-page":"985","article-title":"covariate shift adaptation by importance weighted cross validation","volume":"8","author":"sugiyama","year":"2007","journal-title":"Journal of Machine Learning Research"},{"key":"13","first-page":"1555","article-title":"optimality of reinforcement learning algorithms with linear function approximation","volume":"15","author":"schoknecht","year":"2003","journal-title":"Neural Information Processing Systems"},{"key":"14","first-page":"496","article-title":"policy improvement for pomdps using normalized importance sampling","author":"shelton","year":"2001","journal-title":"Proceedings of Uncertainty in Artificial Intelligence"},{"key":"11","first-page":"759","article-title":"eligibility traces for offpolicy policy evaluation","author":"precup","year":"2000","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"12","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316436","author":"rao","year":"1973","journal-title":"Linear Statistical Inference and its Applications"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1109\/EURCON.2003.1248235"},{"key":"2","article-title":"neuro-dynamic programming","author":"bertsekas","year":"1996","journal-title":"Athena Scientific"},{"key":"1","article-title":"policy search by dynamic programming","volume":"16","author":"bagnell","year":"2003","journal-title":"Neural Information Processing Systems"},{"key":"10","first-page":"417","article-title":"off-policy temporaldifference learning with function approximation","author":"precup","year":"2001","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"7","first-page":"498","article-title":"learning from scarce experience","author":"peshkin","year":"2002","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1162\/jmlr.2003.4.6.1107"},{"key":"5","first-page":"1531","article-title":"a natural policy gradient","volume":"14","author":"kakade","year":"2002","journal-title":"Neural Information Processing Systems"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-2553-7"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2008.02.003"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1145\/1273496.1273590"}],"event":{"name":"2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning (ADPRL)","start":{"date-parts":[[2009,3,30]]},"location":"Nashville, TN, USA","end":{"date-parts":[[2009,4,2]]}},"container-title":["2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/4910084\/4927513\/04927519.pdf?arnumber=4927519","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,18]],"date-time":"2017-06-18T20:02:34Z","timestamp":1497816154000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/4927519\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,3]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/adprl.2009.4927519","relation":{},"subject":[],"published":{"date-parts":[[2009,3]]}}}