{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T13:36:16Z","timestamp":1762522576824,"version":"3.28.0"},"reference-count":39,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,10,24]],"date-time":"2020-10-24T00:00:00Z","timestamp":1603497600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,10,24]]},"DOI":"10.1109\/iros45743.2020.9341049","type":"proceedings-article","created":{"date-parts":[[2021,3,15]],"date-time":"2021-03-15T14:49:56Z","timestamp":1615819796000},"page":"1637-1644","source":"Crossref","is-referenced-by-count":36,"title":["Learning Visuomotor Policies for Aerial Navigation Using Cross-Modal Representations"],"prefix":"10.1109","author":[{"given":"Rogerio","family":"Bonatti","sequence":"first","affiliation":[{"name":"Carnegie Mellon University,The Robotics Institute,Pittsburgh,PA"}]},{"given":"Ratnesh","family":"Madaan","sequence":"additional","affiliation":[{"name":"Microsoft Corporation,Redmond,WA"}]},{"given":"Vibhav","family":"Vineet","sequence":"additional","affiliation":[{"name":"Microsoft Corporation,Redmond,WA"}]},{"given":"Sebastian","family":"Scherer","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,The Robotics Institute,Pittsburgh,PA"}]},{"given":"Ashish","family":"Kapoor","sequence":"additional","affiliation":[{"name":"Microsoft Corporation,Redmond,WA"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1177\/0278364919870227"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1561\/2300000053"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.2514\/6.2018-2138"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2808368"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1002\/rob.21743"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-28872-7_37"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2015.7353622"},{"article-title":"Disentangling by factorising","year":"2018","author":"kim","key":"ref36"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"article-title":"Stochastic backpropagation and approximate inference in deep generative models","year":"2014","author":"rezende","key":"ref34"},{"article-title":"Deep drone racing: From simulation to reality with domain randomization","year":"2019","author":"loquercio","key":"ref10"},{"key":"ref11","article-title":"Airsim: High-fidelity visual and physical simulation for autonomous vehicles","author":"shah","year":"2017","journal-title":"Field and Service Robotics"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00017"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460664"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385773"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2011.5980409"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2016.7759784"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8968163"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2013.6630809"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2795643"},{"key":"ref28","first-page":"689","article-title":"Multimodal deep learning","author":"ngiam","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning (ICML-11)"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202134"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2753232"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793735"},{"article-title":"(CAD)2RL: Real single-image flight without a single real image","year":"2016","author":"sadeghi","key":"ref6"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.439"},{"key":"ref5","article-title":"Visual object networks: Image generation with disentangled 3d representation","volume":"abs 1812 2725","author":"zhu","year":"2018","journal-title":"CoRR"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202133"},{"key":"ref7","first-page":"2096","article-title":"Domain-adversarial training of neural networks","volume":"17","author":"ganin","year":"2016","journal-title":"The Journal of Machine Learning Research"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793631"},{"article-title":"Building generalizable agents with a realistic and rich 3d environment","year":"2018","author":"wu","key":"ref9"},{"article-title":"Deep drone racing: Learning agile flight in dynamic environments","year":"2018","author":"kaufmann","key":"ref1"},{"article-title":"World models","year":"2018","author":"ha","key":"ref20"},{"article-title":"Learning latent dynamics for planning from pixels","year":"2018","author":"hafner","key":"ref22"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2018.07.006"},{"key":"ref24","article-title":"beta-vae: Learning basic visual concepts with a constrained variational framework","author":"higgins","year":"2017","journal-title":"5th International Conference on Learning Representations - ICLR 2017"},{"key":"ref23","article-title":"Autoencoding variational bayes","author":"diederik kingma","year":"2014","journal-title":"ICLRE"},{"key":"ref26","article-title":"Monet: Unsupervised scene decomposition and representation","author":"burgess","year":"2019","journal-title":"CoRR"},{"article-title":"Disentangling by factorising","year":"2018","author":"kim","key":"ref25"}],"event":{"name":"2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","start":{"date-parts":[[2020,10,24]]},"location":"Las Vegas, NV, USA","end":{"date-parts":[[2021,1,24]]}},"container-title":["2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9340668\/9340635\/09341049.pdf?arnumber=9341049","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,28]],"date-time":"2022-06-28T21:51:45Z","timestamp":1656453105000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9341049\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10,24]]},"references-count":39,"URL":"https:\/\/doi.org\/10.1109\/iros45743.2020.9341049","relation":{},"subject":[],"published":{"date-parts":[[2020,10,24]]}}}