{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:05:25Z","timestamp":1755907525502,"version":"3.44.0"},"reference-count":18,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,7,8]],"date-time":"2025-07-08T00:00:00Z","timestamp":1751932800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,7,8]],"date-time":"2025-07-08T00:00:00Z","timestamp":1751932800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,7,8]]},"DOI":"10.23919\/acc63710.2025.11107856","type":"proceedings-article","created":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T18:17:51Z","timestamp":1755800271000},"page":"3533-3538","source":"Crossref","is-referenced-by-count":0,"title":["Maximum A Posteriori Least-Squares Temporal Difference"],"prefix":"10.23919","author":[{"given":"R.A.C.","family":"van Zuijlen","sequence":"first","affiliation":[{"name":"Eindhoven University of Technology,Control Systems Technology Section,Dep. of Mechanical Eng.,The Netherlands"}]},{"given":"D.J.","family":"Antunes","sequence":"additional","affiliation":[{"name":"Eindhoven University of Technology,Control Systems Technology Section,Dep. of Mechanical Eng.,The Netherlands"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Dynamic Programming and Optimal Control","volume":"2","author":"Bertsekas","year":"2018"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1023\/A:1018056104778"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1023\/A:1017936530646"},{"volume-title":"Reinforcement Learning: An Introduction.","year":"2018","author":"Sutton","key":"ref4"},{"key":"ref5","first-page":"809","article-title":"Policy evaluation with temporal differences: A survey and comparison","volume":"15","author":"Dann","year":"2014","journal-title":"Journal of Machine Learning Research"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/1390156.1390251"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-021-05961-4"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1561\/2200000049"},{"volume-title":"Optimal Learning: Computational procedures for Bayes-adaptive Markov decision processes.","year":"2002","author":"Duff","key":"ref9"},{"issue":"5","key":"ref10","article-title":"A bayesian approach for learning and planning in partially observable markov decision processes","volume":"12","author":"Ross","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref11","article-title":"Efficient bayes-adaptive reinforcement learning using sample-based search","volume":"25","author":"Guez","year":"2012","journal-title":"Advances in neural information processing systems"},{"volume-title":"Deep learning.","year":"2016","author":"Goodfellow","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/89.279278"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1140\/epjds\/s13688-023-00416-3"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177707039"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1002\/SERIES1345"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.cam.2008.07.037"},{"key":"ref18","volume-title":"Efficient Reinforcement Learning using Gaussian Processes","volume":"9","author":"Deisenroth","year":"2010"}],"event":{"name":"2025 American Control Conference (ACC)","start":{"date-parts":[[2025,7,8]]},"location":"Denver, CO, USA","end":{"date-parts":[[2025,7,10]]}},"container-title":["2025 American Control Conference (ACC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11107441\/11107442\/11107856.pdf?arnumber=11107856","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T05:46:13Z","timestamp":1755841573000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11107856\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,8]]},"references-count":18,"URL":"https:\/\/doi.org\/10.23919\/acc63710.2025.11107856","relation":{},"subject":[],"published":{"date-parts":[[2025,7,8]]}}}