{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T10:06:15Z","timestamp":1729677975386,"version":"3.28.0"},"reference-count":23,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012,9]]},"DOI":"10.1109\/is.2012.6335136","type":"proceedings-article","created":{"date-parts":[[2012,10,24]],"date-time":"2012-10-24T20:32:39Z","timestamp":1351110759000},"page":"202-207","source":"Crossref","is-referenced-by-count":3,"title":["Simultaneous discovery of multiple alternative optimal policies by reinforcement learning"],"prefix":"10.1109","author":[{"given":"Petar","family":"Kormushev","sequence":"first","affiliation":[]},{"given":"Darwin G.","family":"Caldwell","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1109\/FUZZY.2011.6007337"},{"key":"22","first-page":"644","author":"bishop","year":"2006","journal-title":"Pattern Recognition and Machine Learning"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/CRV.2006.25"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1049\/ip-f-2.1993.0015"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1177\/0278364906072250"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2003.1242022"},{"key":"16","first-page":"1151","article-title":"Fastslam 2. 0: An improved particle filtering algorithm for simultaneous localization and mapping that provably converges","volume":"18","author":"montemerlo","year":"2003","journal-title":"International Joint Conference on Artificial Intelligence"},{"key":"13","doi-asserted-by":"publisher","DOI":"10.1145\/504729.504754"},{"key":"14","first-page":"343","article-title":"Monte carlo localization: Efficient position estimation for mobile robots","author":"fox","year":"1999","journal-title":"Proceedings of the National Conference on Artificial Intelligence"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1023\/A:1008935410038"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-3437-9"},{"key":"21","first-page":"1335","article-title":"Estimating internal variables and parameters of a learning agent by a particle filter","volume":"16","author":"samejima","year":"2004","journal-title":"Advances in neural information processing systems"},{"key":"3","doi-asserted-by":"crossref","first-page":"14","DOI":"10.2478\/s13230-010-0002-4","article-title":"Exploring parameter space in reinforcement learning","volume":"1","author":"r?uckstie\ufffd","year":"2010","journal-title":"Paladyn Journal of Behavioral Robotics"},{"key":"20","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2011.75"},{"key":"2","first-page":"839","article-title":"Robot weightlifting by direct policy search","volume":"17","author":"rosenstein","year":"2001","journal-title":"International Joint Conference on Artificial Intelligence"},{"journal-title":"Reinforcement Learning An Introduction Ser Adaptive Computation and Machine Learning","year":"1998","author":"sutton","key":"1"},{"key":"10","article-title":"PILCO: A model-based and data-efficient approach to policy search","author":"deisenroth","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-009-9132-0"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2009.5152577"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1007\/BF00992696"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2007.11.026"},{"key":"9","first-page":"288","article-title":"Locally weighted projection regression: An O(n) algorithm for incremental real time learning in high dimensional spaces","author":"vijayakumar","year":"2000","journal-title":"Proc Intl Conf on Machine Learning (ICML)"},{"key":"8","first-page":"3137","article-title":"A generalized path integral control approach to reinforcement learning","volume":"11","author":"theodorou","year":"2010","journal-title":"The Journal of Machine Learning Research"}],"event":{"name":"2012 6th IEEE International Conference Intelligent Systems (IS)","start":{"date-parts":[[2012,9,6]]},"location":"Sofia, Bulgaria","end":{"date-parts":[[2012,9,8]]}},"container-title":["2012 6th IEEE INTERNATIONAL CONFERENCE INTELLIGENT SYSTEMS"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/6320720\/6335103\/06335136.pdf?arnumber=6335136","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,30]],"date-time":"2024-04-30T18:11:43Z","timestamp":1714500703000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6335136\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,9]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/is.2012.6335136","relation":{},"subject":[],"published":{"date-parts":[[2012,9]]}}}