{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T00:44:20Z","timestamp":1768005860259,"version":"3.49.0"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,10,23]],"date-time":"2022-10-23T00:00:00Z","timestamp":1666483200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,10,23]],"date-time":"2022-10-23T00:00:00Z","timestamp":1666483200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,10,23]]},"DOI":"10.1109\/iros47612.2022.9981185","type":"proceedings-article","created":{"date-parts":[[2022,12,26]],"date-time":"2022-12-26T19:38:15Z","timestamp":1672083495000},"page":"2476-2482","source":"Crossref","is-referenced-by-count":4,"title":["A Contact-Safe Reinforcement Learning Framework for Contact-Rich Robot Manipulation"],"prefix":"10.1109","author":[{"given":"Xiang","family":"Zhu","sequence":"first","affiliation":[{"name":"institute for interdisciplinary information sciences, Tsinghua University,Beijing,China"}]},{"given":"Shucheng","family":"Kang","sequence":"additional","affiliation":[{"name":"institute for interdisciplinary information sciences, Tsinghua University,Beijing,China"}]},{"given":"Jianyu","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai Qizhi Insitute,Shanghai,China"}]}],"member":"263","reference":[{"key":"ref1","first-page":"651","article-title":"Scalable deep reinforcement learning for vision-based robotic manipulation","volume-title":"Conference on Robot Learning","author":"Kalashnikov","year":"2018"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1177\/0278364917710318"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.3010739"},{"key":"ref4","article-title":"Deep reinforcement learning for contact-rich skills using compliant movement primitives","author":"Spector","year":"2020","journal-title":"arXiv preprint"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460696"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793506"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"key":"ref8","article-title":"Exploration by random network distillation","author":"Burda","year":"2018","journal-title":"arXiv preprint"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1115\/1.3140702"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2020.590681"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8968201"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-020-01183-3"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ECMR50962.2021.9568848"},{"key":"ref14","article-title":"Rmps for safe impedance control in contact-rich manipulation","author":"Shaw","year":"2021","journal-title":"arXiv preprint"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3088091"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196924"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1177\/0278364914559753"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/JRA.1987.1087068"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1177\/027836498700600201"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1177\/0278364914566516"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2009.2017135"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2005.1570247"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2017.2723903"},{"key":"ref24","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv preprint"},{"key":"ref25","author":"Higgins","year":"2016","journal-title":"beta-vae: Learning basic visual concepts with a constrained variational framework"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793691"},{"key":"ref27","volume-title":"Pybullet, a python module for physics simulation for games, robotics and machine learning"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2015.7363472"}],"event":{"name":"2022 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Kyoto, Japan","start":{"date-parts":[[2022,10,23]]},"end":{"date-parts":[[2022,10,27]]}},"container-title":["2022 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9981026\/9981028\/09981185.pdf?arnumber=9981185","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T08:35:32Z","timestamp":1709368532000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9981185\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,10,23]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/iros47612.2022.9981185","relation":{},"subject":[],"published":{"date-parts":[[2022,10,23]]}}}