{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T13:42:04Z","timestamp":1765546924195,"version":"3.28.0"},"reference-count":11,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,12,27]],"date-time":"2021-12-27T00:00:00Z","timestamp":1640563200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,12,27]],"date-time":"2021-12-27T00:00:00Z","timestamp":1640563200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,12,27]]},"DOI":"10.1109\/robio54168.2021.9739340","type":"proceedings-article","created":{"date-parts":[[2022,3,28]],"date-time":"2022-03-28T21:20:39Z","timestamp":1648502439000},"page":"595-600","source":"Crossref","is-referenced-by-count":3,"title":["Training a Robotic Arm Movement with Deep Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Xiaohan","family":"Ni","sequence":"first","affiliation":[{"name":"Waseda University,Graduate School of Information, Production and Systems,Fukuoka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xin","family":"He","sequence":"additional","affiliation":[{"name":"Waseda University,Graduate School of Information, Production and Systems,Fukuoka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Takafumi","family":"Matsumaru","sequence":"additional","affiliation":[{"name":"Waseda University,Graduate School of Information, Production and Systems,Fukuoka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref4","DOI":"10.1146\/annurev-psych-122414-033625"},{"doi-asserted-by":"publisher","key":"ref3","DOI":"10.1109\/ICCV.2017.321"},{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"ref6","first-page":"1805","article-title":"Simple random search of static linear policies is competitive for reinforcement learning","author":"mania","year":"2018","journal-title":"Proceedings of the 32Nd International Conference on Neural Information Processing Systems"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.1109\/IROS.2018.8594353"},{"key":"ref5","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.11694","article-title":"Deep reinforcement learning that matters","volume":"32","author":"henderson","year":"2018","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"doi-asserted-by":"publisher","key":"ref8","DOI":"10.1038\/nature16961"},{"key":"ref7","first-page":"176","article-title":"Averaged-dqn: Variance reduction and stabilization for deep reinforcement learning","author":"anschel","year":"2017","journal-title":"International Conference on Machine Learning"},{"year":"2018","author":"sutton","journal-title":"Reinforcement Learning An Introduction","key":"ref2"},{"doi-asserted-by":"publisher","key":"ref9","DOI":"10.1109\/IROS40897.2019.8967946"},{"year":"2015","author":"lillicrap","article-title":"Continuous control with deep reinforcement learning","key":"ref1"}],"event":{"name":"2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)","start":{"date-parts":[[2021,12,27]]},"location":"Sanya, China","end":{"date-parts":[[2021,12,31]]}},"container-title":["2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9739207\/9739208\/09739340.pdf?arnumber=9739340","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,30]],"date-time":"2023-01-30T14:10:07Z","timestamp":1675087807000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9739340\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,12,27]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/robio54168.2021.9739340","relation":{},"subject":[],"published":{"date-parts":[[2021,12,27]]}}}