{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T22:34:06Z","timestamp":1761518046651},"reference-count":45,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2011,10,1]],"date-time":"2011-10-01T00:00:00Z","timestamp":1317427200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Automat. Sci. Eng."],"published-print":{"date-parts":[[2011,10]]},"DOI":"10.1109\/tase.2011.2159708","type":"journal-article","created":{"date-parts":[[2011,7,11]],"date-time":"2011-07-11T19:47:48Z","timestamp":1310413668000},"page":"835-845","source":"Crossref","is-referenced-by-count":10,"title":["Model-Assisted Stochastic Learning for Robotic Applications"],"prefix":"10.1109","volume":"8","author":[{"given":"Jeremy A.","family":"Marvel","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wyatt S.","family":"Newman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"crossref","first-page":"385","DOI":"10.1007\/978-3-642-00196-3_45","article-title":"Autonomous autorotation of an RC helicopter","volume":"54","author":"abbeel","year":"2009","journal-title":"Exp 
Robotics"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2010.5509181"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2005.1545358"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2003.1249251"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.1984.1087155"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICET.2006.335941"},{"key":"ref37","first-page":"2845","article-title":"Bayesian reinforcement learning in continuous POMDPs with application to robot navigation","author":"ross","year":"2008","journal-title":"Proc IEEE Int Conf Robot Autom"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1090\/S0273-0979-1985-15365-0"},{"key":"ref35","author":"lay","year":"1999","journal-title":"Linear Algebra and its Applications"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCC.2003.813149"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1162\/089976605774320557"},{"key":"ref40","first-page":"283","article-title":"Autonomous transfer for reinforcement learning","volume":"1","author":"taylor","year":"2008","journal-title":"Proc 7th Int Joint Conf Autom Agents and Multiagent Syst"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICNN.1988.23980"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/64.506755"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4615-3184-5_2"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2001.932611"},{"key":"ref15","author":"goldberg","year":"1989","journal-title":"Genetic Algorithms in Search Optimization and Machine 
Learning"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ETFA.1995.496663"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ISATP.1999.782993"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1080\/00207540110056135"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.5772\/5622"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"481","DOI":"10.1016\/S0360-8352(99)00123-0","article-title":"A feature-based prototype system for the evaluation and optimization of manufacturing processes","volume":"37","author":"gayretli","year":"1999","journal-title":"Proc 24th Int Conf Comp Ind Eng"},{"key":"ref4","first-page":"406","article-title":"PEGASUS: A policy search method for large MDPs and POMDPs","author":"ng","year":"2000","journal-title":"Proc 16th Conf Uncertainty Artif Intell"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1023\/A:1008912429442"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2007.4399185"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2000.844871"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/S0736-5845(00)00014-4"},{"key":"ref5","first-page":"799","article-title":"Autonomous helicopter flight via reinforcement learning","author":"ng","year":"2004","journal-title":"Adv Neural Inf Process 
Syst"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2000.844072"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/37.257895"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.1990.126068"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1023\/A:1013258808932"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/WCICA.2008.4592982"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1243\/09544054JEM359"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TEPRA.2009.5339647"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.1997.614389"},{"key":"ref21","author":"wei","year":"2001","journal-title":"Intelligent Robotic Learning using Guided Evolutionary Simulated Annealing"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICEC.1994.349986"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2003.1249229"},{"key":"ref41","first-page":"3303","article-title":"Improving robotic assembly performance through autonomous exploration","author":"wei","year":"2002","journal-title":"Proc IEEE Int Conf Robot Autom"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2001.976256"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2006.1688566"},{"key":"ref26","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1007\/BF02136832","article-title":"Artificial intelligence in simulation","volume":"53","author":"ren","year":"1994","journal-title":"Ann Oper Res"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ROBIO.2009.4913000"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2003.1249250"}],"container-title":["IEEE Transactions on Automation Science and 
Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/8856\/6025294\/05937024.pdf?arnumber=5937024","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T16:53:29Z","timestamp":1642006409000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5937024\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,10]]},"references-count":45,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/tase.2011.2159708","relation":{},"ISSN":["1545-5955"],"issn-type":[{"value":"1545-5955","type":"print"}],"subject":[],"published":{"date-parts":[[2011,10]]}}}