{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,11]],"date-time":"2025-11-11T13:44:22Z","timestamp":1762868662506,"version":"3.37.3"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003977","name":"Israel Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003977","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561097","type":"proceedings-article","created":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:28:35Z","timestamp":1634689715000},"page":"4650-4656","source":"Crossref","is-referenced-by-count":4,"title":["Efficient Self-Supervised Data Collection for Offline Robot Learning"],"prefix":"10.1109","author":[{"given":"Shadi","family":"Endrawis","sequence":"first","affiliation":[{"name":"Technion &#x2013; Israel Institute of Technology"}]},{"given":"Gal","family":"Leibovich","sequence":"additional","affiliation":[{"name":"Intel Labs"}]},{"given":"Guy","family":"Jacob","sequence":"additional","affiliation":[{"name":"Intel Labs"}]},{"given":"Gal","family":"Novik","sequence":"additional","affiliation":[{"name":"Intel Labs"}]},{"given":"Aviv","family":"Tamar","sequence":"additional","affiliation":[{"name":"Technion &#x2013; Israel Institute of Technology"}]}],"member":"263","reference":[{"key":"ref10","first-page":"1471","article-title":"Unifying count-based exploration and intrinsic motivation","author":"bellemare","year":"2016","journal-title":"NIPS"},{"key":"ref11","first-page":"6","article-title":"What is intrinsic motivation? a typology of computational approaches","volume":"1","author":"oudeyer","year":"2009","journal-title":"Frontiers in Neurorobotics"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-32375-1_2"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.70"},{"key":"ref14","article-title":"Large-scale study of curiosity-driven learning","author":"burda","year":"2018","journal-title":"CoRR"},{"key":"ref15","article-title":"Exploration by random network distillation","author":"burda","year":"2018","journal-title":"CoRR"},{"key":"ref16","article-title":"Addressing function approximation error in actor-critic methods","author":"fujimoto","year":"2018","journal-title":"CoRR"},{"key":"ref17","article-title":"Count-based exploration with neural density models","author":"ostrovski","year":"2017","journal-title":"CoRR"},{"key":"ref18","first-page":"1312","article-title":"Universal value function approximators","author":"schaul","year":"0"},{"key":"ref19","first-page":"5055","article-title":"Hindsight experience replay","author":"andrychowicz","year":"0","journal-title":"Advances in Neural Information Processing Systems 30 Annual Conference on Neural Information Processing Systems 2017"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1007\/978-3-642-27645-3_2","article-title":"Batch reinforcement learning","author":"lange","year":"2012","journal-title":"Reinforcement Learning"},{"key":"ref3","article-title":"Qt-opt: Scalable deep reinforcement learning for vision-based robotic manipulation","author":"kalashnikov","year":"2018","journal-title":"CoRR"},{"key":"ref27","article-title":"Off-policy deep reinforcement learning without exploration","author":"fujimoto","year":"2018","journal-title":"CoRR"},{"key":"ref6","first-page":"5074","article-title":"Learning to poke by poking: Experiential learning of intuitive physics","author":"agrawal","year":"2016","journal-title":"Advances in neural information processing systems"},{"article-title":"Offline reinforcement learning: Tutorial, review, and perspectives on open problems","year":"2020","author":"levine","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989324"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2019.XV.074"},{"key":"ref2","first-page":"1334","article-title":"End-to-end training of deep visuomotor policies","volume":"17","author":"levine","year":"2016","journal-title":"The Journal of Machine Learning Research"},{"key":"ref9","doi-asserted-by":"crossref","DOI":"10.1109\/TRO.2020.2988642","article-title":"Tossingbot: Learning to throw arbitrary objects with residual physics","author":"zeng","year":"2020","journal-title":"IEEE Transactions on Robotics"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913495721"},{"key":"ref20","article-title":"Intrinsically motivated goal exploration processes with automatic curriculum learning","author":"forestier","year":"2017","journal-title":"CoRR"},{"key":"ref22","article-title":"Directed exploration for reinforcement learning","author":"guo","year":"2019","journal-title":"CoRR"},{"key":"ref21","article-title":"Go-explore: a new approach for hard-exploration problems","author":"ecoffet","year":"2019","journal-title":"CoRR"},{"article-title":"robosuite: A modular simulation framework and benchmark for robot learning","year":"2020","author":"zhu","key":"ref24"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1023\/A:1017984413808"},{"key":"ref26","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"article-title":"Reinforcement learning coach","year":"2017","author":"caspi","key":"ref25"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2021,5,30]]},"location":"Xi'an, China","end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561097.pdf?arnumber=9561097","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,12]],"date-time":"2023-01-12T22:49:09Z","timestamp":1673563749000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561097\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561097","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}