{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T07:25:42Z","timestamp":1778657142328,"version":"3.51.4"},"reference-count":17,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009,3]]},"DOI":"10.1109\/adprl.2009.4927541","type":"proceedings-article","created":{"date-parts":[[2009,5,19]],"date-time":"2009-05-19T15:50:44Z","timestamp":1242748244000},"page":"169-176","source":"Crossref","is-referenced-by-count":6,"title":["Learning continuous-action control policies"],"prefix":"10.1109","author":[{"given":"Jason","family":"Pazis","sequence":"first","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Michail G.","family":"Lagoudakis","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]}],"member":"263","reference":[{"key":"17","first-page":"463","article-title":"learning to drive a bicycle using reinforcement learning and shaping","author":"randl\ufffdv","year":"1998","journal-title":"Proceedings of the Fifteenth International Conference on Machine Learning"},{"key":"15","article-title":"application of a self-learning controller with continuous control signals based on the doe-approach","author":"riedmiller","year":"1997","journal-title":"Proceedings of the European Symposium on Neural Networks"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1109\/91.481841"},{"key":"13","first-page":"1063","article-title":"reinforcement learning with factored states and actions","volume":"5","author":"sallans","year":"2004","journal-title":"Journal of Machine Learning Research"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1177\/105971239700600201"},{"key":"11","first-page":"833","article-title":"reinforcement learning in continuous action spaces through sequential monte carlo methods","volume":"20","author":"lazaric","year":"2008","journal-title":"Advances in neural information processing systems"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1023\/A:1022685208277"},{"key":"3","article-title":"tree-based batch mode reinforcement learning","volume":"6","author":"ernst","year":"2005","journal-title":"Journal of Machine Learning Research"},{"key":"2","author":"watkins","year":"1989","journal-title":"Learning from delayed rewards"},{"key":"1","author":"sutton","year":"1998","journal-title":"Reinforcement Learning An Introduction"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1016\/S0921-8890(97)00042-0"},{"key":"7","first-page":"417","article-title":"q-learning in continuous state and action spaces","author":"gaskett","year":"1999","journal-title":"Proceedings of the 5th Australian Joint conference on Artificial Intelligence"},{"key":"6","author":"proakis","year":"2001","journal-title":"Communication Systems Engineering"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1162\/jmlr.2003.4.6.1107"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1023\/A:1017928328829"},{"key":"9","article-title":"reinforcement learning in continuous state and action space","author":"stro?sslin","year":"2003","journal-title":"International Conference on Artificial Neural Networks"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.1998.687165"}],"event":{"name":"2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning (ADPRL)","location":"Nashville, TN, USA","start":{"date-parts":[[2009,3,30]]},"end":{"date-parts":[[2009,4,2]]}},"container-title":["2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/4910084\/4927513\/04927541.pdf?arnumber=4927541","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,17]],"date-time":"2017-03-17T16:13:56Z","timestamp":1489767236000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/4927541\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,3]]},"references-count":17,"URL":"https:\/\/doi.org\/10.1109\/adprl.2009.4927541","relation":{},"subject":[],"published":{"date-parts":[[2009,3]]}}}