{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T13:42:25Z","timestamp":1765546945250,"version":"3.37.3"},"reference-count":31,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2022,10,1]],"date-time":"2022-10-01T00:00:00Z","timestamp":1664582400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,10,1]],"date-time":"2022-10-01T00:00:00Z","timestamp":1664582400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,10,1]],"date-time":"2022-10-01T00:00:00Z","timestamp":1664582400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003725","name":"National Research Foundation of Korea","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003725","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Ministry of Science and ICT","award":["2021R1A2C1093957","2017R1E1A1A01075171"],"award-info":[{"award-number":["2021R1A2C1093957","2017R1E1A1A01075171"]}]},{"name":"Institute of Engineering Research at Seoul National University"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Robot. Autom. Lett."],"published-print":{"date-parts":[[2022,10]]},"DOI":"10.1109\/lra.2022.3189447","type":"journal-article","created":{"date-parts":[[2022,7,8]],"date-time":"2022-07-08T19:24:54Z","timestamp":1657308294000},"page":"9099-9106","source":"Crossref","is-referenced-by-count":3,"title":["UNICON: Uncertainty-Conditioned Policy for Robust Behavior in Unfamiliar Scenarios"],"prefix":"10.1109","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1642-6789","authenticated-orcid":false,"given":"Chan","family":"Kim","sequence":"first","affiliation":[{"name":"Seoul National University, Seoul, South Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1835-534X","authenticated-orcid":false,"given":"Jae-Kyung","family":"Cho","sequence":"additional","affiliation":[{"name":"Seoul National University, Seoul, South Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9976-139X","authenticated-orcid":false,"given":"Hyung-Suk","family":"Yoon","sequence":"additional","affiliation":[{"name":"Seoul National University, Seoul, South Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4890-8563","authenticated-orcid":false,"given":"Seung-Woo","family":"Seo","sequence":"additional","affiliation":[{"name":"Seoul National University, Seoul, South Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1633-573X","authenticated-orcid":false,"given":"Seong-Woo","family":"Kim","sequence":"additional","affiliation":[{"name":"Seoul National University, Seoul, South Korea"}]}],"member":"263","reference":[{"key":"ref1","article-title":"High-dimensional continuous control using generalized advantage estimation","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Schulman","year":"2016"},{"article-title":"Emergence of locomotion behaviours in rich environments","year":"2017","author":"Heess","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.05.008"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.5555\/3045390.3045502"},{"key":"ref6","first-page":"1613","article-title":"Weight uncertainty in neural network","volume-title":"Proc. 32nd Int. Conf. Mach. Learn.","volume":"37","author":"Blundell","year":"2015"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.5555\/2986459.2986721"},{"key":"ref8","first-page":"1708","article-title":"Structured and efficient variational deep learning with matrix gaussian posteriors","volume-title":"Proc. 33rd Int. Conf. Mach. Learn.","volume":"48","author":"Louizos","year":"2016"},{"key":"ref9","article-title":"Simple and scalable predictive uncertainty estimation using deep ensembles","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"30","author":"Lakshminarayanan","year":"2017"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793611"},{"article-title":"Uncertainty aware reinforcement learning for collision avoidance","year":"2017","author":"Kahn","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196785"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1126\/science.1115327"},{"key":"ref14","article-title":"Continuous control with deep reinforcement learning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Lillicrap","year":"2016"},{"key":"ref15","first-page":"387","article-title":"Deterministic policy gradient algorithms","volume-title":"Proc. 31st Int. Conf. Mach. Learn.","volume":"32","author":"Silver","year":"2014"},{"key":"ref16","first-page":"1587","article-title":"Addressing function approximation error in actor-critic methods","volume-title":"Proc. 35th Int. Conf. Mach. Learn.","volume":"80","author":"Fujimoto","year":"2018"},{"key":"ref17","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"Proc. 35th Int. Conf. Mach. Learn.","volume":"80","author":"Haarnoja","year":"2018"},{"key":"ref18","first-page":"3686","article-title":"Deep reinforcement and infomax learning","volume":"33","author":"Mazoure","year":"2020","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref19","article-title":"Diversity is all you need: Learning skills without a reward function","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Eysenbach","year":"2019"},{"key":"ref20","first-page":"3815","article-title":"Infogail: Interpretable imitation learning from visual demonstrations","volume":"30","author":"Li","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/IV47402.2020.9304614"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2020.xvi.064"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-42553-1_3"},{"key":"ref24","first-page":"2172","article-title":"InfoGAN: Interpretable representation learning by information maximizing generative adversarial nets","volume":"29","author":"Chen","year":"2016","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref25","first-page":"531","article-title":"Mutual information neural estimation","volume-title":"Proc. 35th Int. Conf. Mach. Learn.","volume":"80","author":"Belghazi","year":"2018"},{"key":"ref26","article-title":"Learning deep representations by mutual information estimation and maximization","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Hjelm","year":"2019"},{"key":"ref27","first-page":"5949","article-title":"Exploring generalization in deep learning","volume":"30","author":"Neyshabur","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.5555\/3295222.3295309"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2019.8917306"},{"key":"ref30","first-page":"2817","article-title":"Robust adversarial reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Pinto","year":"2017"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202133"}],"container-title":["IEEE Robotics and Automation Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7083369\/9831196\/09822401.pdf?arnumber=9822401","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T04:17:57Z","timestamp":1706761077000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9822401\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,10]]},"references-count":31,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/lra.2022.3189447","relation":{},"ISSN":["2377-3766","2377-3774"],"issn-type":[{"type":"electronic","value":"2377-3766"},{"type":"electronic","value":"2377-3774"}],"subject":[],"published":{"date-parts":[[2022,10]]}}}