{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,4]],"date-time":"2025-09-04T14:24:50Z","timestamp":1756995890202,"version":"3.28.0"},"reference-count":36,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561030","type":"proceedings-article","created":{"date-parts":[[2021,10,19]],"date-time":"2021-10-19T20:28:35Z","timestamp":1634675315000},"page":"6657-6663","source":"Crossref","is-referenced-by-count":3,"title":["Multi-Step Recurrent Q-Learning for Robotic Velcro Peeling"],"prefix":"10.1109","author":[{"given":"Jiacheng","family":"Yuan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nicolai","family":"Hani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Volkan","family":"Isler","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"crossref","first-page":"279","DOI":"10.1007\/BF00992698","article-title":"Q-learning","volume":"8","author":"watkins","year":"1992","journal-title":"Machine Learning"},{"journal-title":"Reinforcement Learning An Introduction","year":"2018","author":"sutton","key":"ref32"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6943119"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2018.2830405"},{"key":"ref36","first-page":"1587","article-title":"Addressing function approximation error in actor-critic methods","author":"fujimoto","year":"2018","journal-title":"International Conference on Machine Learning"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-019-13073-w"},{"key":"ref34","article-title":"Deep recurrent q-learning for partially observable mdps","author":"hausknecht","year":"2015","journal-title":"2015 AAAI Fall Symposium Series"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6386002"},{"key":"ref11","first-page":"734","article-title":"Sim-to-real reinforcement learning for deformable object manipulation","author":"matas","year":"2018","journal-title":"Conference on Robot Learning"},{"article-title":"Learning to manipulate deformable objects without demonstrations","year":"2019","author":"wu","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1177\/0278364918779698"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref15","article-title":"Continuous control with deep reinforcement learning","volume":"abs 1509 2971","author":"lillicrap","year":"2015","journal-title":"CoRR"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793485"},{"key":"ref17","article-title":"Grasping pomdps: Theory and experiments","author":"glashan","year":"2007","journal-title":"RSS Workshop manip for human env"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487754"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989326"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1177\/0278364917710318"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01086"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.021"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2008.4543737"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.sna.2011.02.038"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8593986"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-013-9344-1"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2974439"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1177\/0278364919887447"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487517"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1177\/027836499601500302"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2016.2533639"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-32520-6_14"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6943202"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/70.880799"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2011.2139150"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989543"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2010.5653949"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793520"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2021,5,30]]},"location":"Xi'an, China","end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561030.pdf?arnumber=9561030","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T11:47:17Z","timestamp":1652183237000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561030\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":36,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561030","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}