{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,4]],"date-time":"2025-11-04T06:03:36Z","timestamp":1762236216089,"version":"build-2065373602"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,8,25]],"date-time":"2025-08-25T00:00:00Z","timestamp":1756080000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,8,25]],"date-time":"2025-08-25T00:00:00Z","timestamp":1756080000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,8,25]]},"DOI":"10.1109\/ro-man63969.2025.11217576","type":"proceedings-article","created":{"date-parts":[[2025,11,3]],"date-time":"2025-11-03T18:42:29Z","timestamp":1762195349000},"page":"251-258","source":"Crossref","is-referenced-by-count":0,"title":["Maximizing Query Diversity for Terrain Cost Preference Learning in Robot Navigation"],"prefix":"10.1109","author":[{"given":"Jordan","family":"Sinclair","sequence":"first","affiliation":[{"name":"Ritchie School of Computer Science and Engineering, University of Denver,Department of Computer Science,USA"}]},{"given":"Elijah","family":"Alabi","sequence":"additional","affiliation":[{"name":"Ritchie School of Computer Science and Engineering, University of Denver,Department of Computer Science,USA"}]},{"given":"Maggie","family":"Wigness","sequence":"additional","affiliation":[{"name":"DEVCOM Army Research Laboratory,Adelphi,MD,USA"}]},{"given":"Brian","family":"Reily","sequence":"additional","affiliation":[{"name":"DEVCOM Army Research Laboratory,Adelphi,MD,USA"}]},{"given":"Christopher","family":"Reardon","sequence":"additional","affiliation":[{"name":"The MITRE Corporation,McLean,VA,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-control-100819-063206"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1177\/0278364910369715"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/SMC53654.2022.9945333"},{"article-title":"Reward learning from human preferences and demonstrations in atari","volume-title":"International Conference on Neural Information Processing Systems","author":"Ibarz","key":"ref4"},{"key":"ref5","article-title":"Auto-encoding variational bayes","volume-title":"CoRR","volume":"abs\/1312.6114","author":"Kingma","year":"2013"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/HRI53351.2022.9889650"},{"key":"ref7","first-page":"1177","article-title":"Asking easy questions: A user-friendly approach to active reward learning","volume-title":"Proceedings of the Conference on Robot Learning","volume":"100","author":"Biyik"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3649885"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10342081"},{"article-title":"Data driven reward initialization for preference-based reinforcement learning","volume-title":"AAAI Workshop on Representation Learning for Responsible Human-Centric AI","author":"Verma","key":"ref10"},{"article-title":"Pebble: Feedback-efficient interactive reinforcement learning via relabeling experience and unsupervised pre-training","volume-title":"International Conference on Machine Learning","author":"Lee","key":"ref11"},{"article-title":"Few-shot preference learning for human-in-the-loop RL","volume-title":"6th Annual Conference on Robot Learning","author":"H","key":"ref12"},{"article-title":"Provable offline preference-based reinforcement learning","volume-title":"International Conference on Learning Representations","author":"Zhan","key":"ref13"},{"article-title":"SURF: Semi-supervised reward learning with data augmentation for feedback-efficient preference-based reinforcement learning","volume-title":"International Conference on Learning Representations","author":"Park","key":"ref14"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ROBIO58561.2023.10355039"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN60168.2024.10731470"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161081"},{"article-title":"Flow to better: Offline preference-based reinforcement learning via preferred trajectory generation","volume-title":"International Conference on Learning Representations","author":"Zhang","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/cdc40024.2019.9030169"},{"key":"ref20","doi-asserted-by":"crossref","DOI":"10.15607\/RSS.2019.XV.023","article-title":"Learning reward functions by integrating human demonstrations and preferences","author":"Palan","year":"2019"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3194068"},{"article-title":"Query-policy misalignment in preference-based reinforcement learning","volume-title":"ICML 2023 Workshop The Many Facets of Preference-Based Learning","author":"Hu","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10341795"},{"key":"ref24","article-title":"Terrain cost learning from human preferences for robot path planning using a visual user interface","volume-title":"Master\u2019s thesis","author":"Velagapudi","year":"2023"},{"key":"ref25","article-title":"Terrain and adversary-aware autonomous robot navigation","volume-title":"Master\u2019s thesis","author":"Inyang","year":"2023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10611472"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.25080\/TCWV9851"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/DASC43569.2019.9081648"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2017.XIII.053"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196661"}],"event":{"name":"2025 34th IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","start":{"date-parts":[[2025,8,25]]},"location":"Eindhoven, Netherlands","end":{"date-parts":[[2025,8,29]]}},"container-title":["2025 34th IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11217544\/11217526\/11217576.pdf?arnumber=11217576","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,4]],"date-time":"2025-11-04T06:00:09Z","timestamp":1762236009000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11217576\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,25]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/ro-man63969.2025.11217576","relation":{},"subject":[],"published":{"date-parts":[[2025,8,25]]}}}