{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T12:11:04Z","timestamp":1725711064973},"reference-count":45,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,10,23]],"date-time":"2022-10-23T00:00:00Z","timestamp":1666483200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,10,23]],"date-time":"2022-10-23T00:00:00Z","timestamp":1666483200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,10,23]]},"DOI":"10.1109\/iros47612.2022.9981614","type":"proceedings-article","created":{"date-parts":[[2022,12,26]],"date-time":"2022-12-26T14:38:15Z","timestamp":1672065495000},"page":"9259-9265","source":"Crossref","is-referenced-by-count":0,"title":["Noisy Agents: Self-supervised Exploration by Predicting Auditory Events"],"prefix":"10.1109","volume":"529","author":[{"given":"Chuang","family":"Gan","sequence":"first","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Xiaoyu","family":"Chen","sequence":"additional","affiliation":[{"name":"Tsinghua University"}]},{"given":"Phillip","family":"Isola","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Antonio","family":"Torralba","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Joshua B.","family":"Tenenbaum","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.73"},{"key":"ref35","first-page":"17","article-title":"Soundspaces: Audio-visual navigation in 3d environments","author":"chen","year":"2020","journal-title":"ECCV"},{"key":"ref12","first-page":"892","article-title":"Soundnet: Learning sound representations from unlabeled video","author":"aytar","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197008"},{"key":"ref15","article-title":"Audio-visual scene analysis with self-supervised multisensory features","author":"owens","year":"2018","journal-title":"ECCV"},{"key":"ref37","article-title":"Swoosh! rattle! thump! - actions that sound","author":"dhiraj","year":"2020","journal-title":"IROS"},{"key":"ref14","article-title":"Co-training of audio and video representations from self-supervised temporal synchronization","author":"korbar","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01027"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.264"},{"key":"ref30","first-page":"8388","article-title":"Learning to play with intrinsically-motivated, self-aware agents","author":"haber","year":"2018","journal-title":"NIPS"},{"key":"ref11","first-page":"801","article-title":"Ambient sound provides supervision for visual learning","author":"owens","year":"0","journal-title":"European Conference on Computer Vision"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00361"},{"key":"ref10","article-title":"Threedworld: A platform for interactive multi-modal physical simulation","author":"gan","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00790"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"484","DOI":"10.1038\/nature16961","article-title":"Mastering the game of go with deep neural networks and tree search","volume":"529","author":"silver","year":"2016","journal-title":"Nature"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref17","first-page":"222","article-title":"A possibility for implementing curiosity and boredom in model-building neural controllers","author":"schmidhuber","year":"0","journal-title":"Proc of the International Conference on Simulation of Adaptive Behavior From Animals to Animats"},{"key":"ref39","first-page":"139","article-title":"Crossmodal attentive skill learner","author":"omidshafiei","year":"0","journal-title":"Proceedings of the 17th International Conference on Autonomous Agents and MultiAgent Systems International Foundation for Autonomous Agents and Multiagent Systems"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3389\/fncir.2013.00037"},{"key":"ref38","first-page":"2930","article-title":"Playing hard exploration games by watching youtube","author":"aytar","year":"2018","journal-title":"NIPS"},{"key":"ref19","first-page":"2753","article-title":"# exploration: A study of count-based exploration for deep reinforcement learning","author":"tang","year":"2017","journal-title":"NIPS"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TAMD.2010.2056368"},{"journal-title":"Deep Exploration via Randomized Value Functions","year":"2019","author":"osband","key":"ref24"},{"key":"ref23","article-title":"Self-supervised exploration via disagreement","author":"pathak","year":"2019","journal-title":"ICML"},{"key":"ref45","article-title":"Proximal policy optimization algorithms","author":"schulman","year":"2017","journal-title":"ArXiv Preprint"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcss.2007.08.009"},{"key":"ref25","first-page":"4026","article-title":"Deep exploration via bootstrapped dqn","author":"osband","year":"2016","journal-title":"NIPS"},{"key":"ref20","first-page":"1471","article-title":"Unifying count-based exploration and intrinsic motivation","author":"bellemare","year":"2016","journal-title":"NIPS"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1982.1056489"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuron.2011.06.032"},{"key":"ref22","article-title":"Large-scale study of curiosity-driven learning","author":"burda","year":"2018","journal-title":"ICLRE"},{"key":"ref44","article-title":"The replica dataset: A digital replica of indoor spaces","author":"straub","year":"2019","journal-title":"ArXiv Preprint"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2005.1554676"},{"key":"ref43","article-title":"Gotta learn fast: A new benchmark for generalization in rl","author":"nichol","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2017\/344"},{"key":"ref27","first-page":"2721","article-title":"Count-based exploration with neural density models","author":"ostrovski","year":"2017","journal-title":"ICML"},{"key":"ref29","article-title":"Incentivizing exploration in reinforcement learning with deep predictive models","author":"stadie","year":"2015","journal-title":"ArXiv Preprint"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1613\/jair.3912"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"746","DOI":"10.1038\/264746a0","article-title":"Hearing lips and seeing voices","volume":"264","author":"mcgurk","year":"1976","journal-title":"Nature"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00943"},{"key":"ref4","article-title":"Exploration by random network distillation","author":"burda","year":"2018","journal-title":"ICLRE"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989381"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/0010-0285(76)90018-9"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.70"},{"key":"ref40","article-title":"See, hear, explore: Curiosity via audio-visual association","author":"dean","year":"2020","journal-title":"ArXiv Preprint"}],"event":{"name":"2022 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","start":{"date-parts":[[2022,10,23]]},"location":"Kyoto, Japan","end":{"date-parts":[[2022,10,27]]}},"container-title":["2022 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9981026\/9981028\/09981614.pdf?arnumber=9981614","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,29]],"date-time":"2023-11-29T15:13:53Z","timestamp":1701270833000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9981614\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,10,23]]},"references-count":45,"URL":"https:\/\/doi.org\/10.1109\/iros47612.2022.9981614","relation":{},"subject":[],"published":{"date-parts":[[2022,10,23]]}}}