{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T05:26:33Z","timestamp":1730265993302,"version":"3.28.0"},"reference-count":7,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2010,7]]},"DOI":"10.1109\/ijcnn.2010.5596516","type":"proceedings-article","created":{"date-parts":[[2010,10,19]],"date-time":"2010-10-19T18:58:15Z","timestamp":1287514695000},"page":"1-8","source":"Crossref","is-referenced-by-count":2,"title":["Multi-resolution state-space discretization for Q-Learning with pseudo-randomized discretization"],"prefix":"10.1109","author":[{"given":"Amanda","family":"Lampton","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"John","family":"Valasek","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mrinal","family":"Kumar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref4","first-page":"2008","article-title":"Reinforcement learning of a morphing airfoil-policy and discrete learning analysis","year":"2008","journal-title":"Proceedings of the AIAA Guidance Navigation and Control Conference"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.2514\/1.35793"},{"key":"ref6","first-page":"51","volume":"9","author":"sutton","year":"1998","journal-title":"Reinforcement Learning - An Introduction"},{"key":"ref5","first-page":"2008","article-title":"Morphing airfoil with reinforcement learning of four shape changing parameters","year":"2008","journal-title":"Proceedings of the AIAA Guidance Navigation and Control Conference"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611970081"},{"key":"ref2","article-title":"Multi-resolution state-space discretization method for q-learning applied to highly reconfigurable systems","author":"lampton","year":"0","journal-title":"Journal of Machine Learning Research"},{"article-title":"Learning from delayed rewards","year":"1989","author":"watkins","key":"ref1"}],"event":{"name":"2010 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2010,7,18]]},"location":"Barcelona, Spain","end":{"date-parts":[[2010,7,23]]}},"container-title":["The 2010 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/5581822\/5595732\/05596516.pdf?arnumber=5596516","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,19]],"date-time":"2017-03-19T05:45:29Z","timestamp":1489902329000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5596516\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,7]]},"references-count":7,"URL":"https:\/\/doi.org\/10.1109\/ijcnn.2010.5596516","relation":{},"subject":[],"published":{"date-parts":[[2010,7]]}}}