{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T15:16:35Z","timestamp":1774538195341,"version":"3.50.1"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,10]]},"DOI":"10.1109\/iros.2018.8593894","type":"proceedings-article","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T02:33:30Z","timestamp":1548297210000},"page":"4635-4640","source":"Crossref","is-referenced-by-count":29,"title":["Setting up a Reinforcement Learning Task with a Real-World Robot"],"prefix":"10.1109","author":[{"given":"A.","family":"Rupam Mahmood","sequence":"first","affiliation":[]},{"given":"Dmytro","family":"Korenkevych","sequence":"additional","affiliation":[]},{"given":"Brent J.","family":"Komer","sequence":"additional","affiliation":[]},{"given":"James","family":"Bergstra","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"735","DOI":"10.1007\/978-3-642-35289-8_39","article-title":"10 steps and some tricks to set up neural reinforcement controllers","author":"riedmiller","year":"2012","journal-title":"Neural Networks Tricks of the Trade"},{"key":"ref11","first-page":"262","article-title":"Sim-to-Real robot learning from pixels with progressive nets","author":"rusu","year":"2017","journal-title":"Conference on Robot Learning"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2010.5650765"},{"key":"ref13","first-page":"1889","article-title":"Trust region policy optimization","author":"schulman","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2012.2210294"},{"key":"ref15","author":"sutton","year":"2018","journal-title":"Reinforcement Learning An Introduction"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6386109"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s10458-008-9056-7"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202141"},{"key":"ref4","first-page":"1329","article-title":"Benchmarking deep reinforcement learning for continuous control","author":"duan","year":"2016","journal-title":"International Conference on Machine Learning"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2012.6315022"},{"key":"ref6","author":"henderson","year":"2017","journal-title":"Deep reinforcement learning that matters"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2003.809799"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-012-5322-7"},{"key":"ref2","author":"brockman","year":"2016","journal-title":"OpenAI Gym"},{"key":"ref1","first-page":"281","article-title":"Random search for hyper-parameter optimization","author":"bergstra","year":"2012","journal-title":"Journal of Machine Learning Research"},{"key":"ref9","first-page":"1334","article-title":"End-to-end training of deep visuomotor policies","volume":"17","author":"levine","year":"2016","journal-title":"The Journal of Machine Learning Research"}],"event":{"name":"2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Madrid","start":{"date-parts":[[2018,10,1]]},"end":{"date-parts":[[2018,10,5]]}},"container-title":["2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8574473\/8593358\/08593894.pdf?arnumber=8593894","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T06:05:24Z","timestamp":1598249124000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8593894\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/iros.2018.8593894","relation":{},"subject":[],"published":{"date-parts":[[2018,10]]}}}