{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T07:11:32Z","timestamp":1779347492425,"version":"3.51.4"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T00:00:00Z","timestamp":1776816000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T00:00:00Z","timestamp":1776816000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,4,22]]},"DOI":"10.1109\/icarsc70216.2026.11523235","type":"proceedings-article","created":{"date-parts":[[2026,5,20]],"date-time":"2026-05-20T19:50:30Z","timestamp":1779306630000},"page":"3-8","source":"Crossref","is-referenced-by-count":0,"title":["Interactive Construction of Multi-Grid MDPs: Bridging Natural Language and Real-Time Policy Visualization"],"prefix":"10.1109","author":[{"given":"Tiago","family":"Caldeira","sequence":"first","affiliation":[{"name":"University of Lisbon,Instituto Superior T&#x00E9;cnico,Portugal"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tiago","family":"Antunes","sequence":"additional","affiliation":[{"name":"University of Coimbra,Portugal"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Majid","family":"Khonji","sequence":"additional","affiliation":[{"name":"Khalifa University,Abu Dhabi,U.A.E"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jorge","family":"Dias","sequence":"additional","affiliation":[{"name":"Khalifa University,Abu Dhabi,U.A.E"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pedro U.","family":"Lima","sequence":"additional","affiliation":[{"name":"University of Lisbon,Instituto Superior T&#x00E9;cnico,Portugal"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1090\/S0002-9904-1954-09848-8"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-97051-1_17"},{"key":"ref3","volume-title":"Reinforcement Learning: An Introduction","author":"Sutton","year":"2018"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.5040\/9781501365072.2213"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s10458-022-09552-y"},{"key":"ref6","article-title":"Evaluating large language models trained on code","author":"Chen","year":"2021"},{"issue":"5","key":"ref7","first-page":"1","article-title":"Gpt-4 technical report. arxiv 2303.08774","volume":"2","year":"2023","journal-title":"View in Article"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1098\/rsta.2022.0050"},{"key":"ref9","article-title":"Draft, sketch, and prove: Guiding formal theorem provers with informal proofs","author":"Jiang","year":"2022"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/1597735.1597738"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/604045.604056"},{"key":"ref12","article-title":"Active learning literature survey","author":"Settles","year":"2009"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2016.2578706"},{"key":"ref14","first-page":"1","article-title":"Carla: An open urban driving simulator","volume-title":"Proceedings of the Conference on Robot Learning (CoRL)","author":"Dosovitskiy"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00052-1"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1613\/jair.639"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1080\/24725854.2021.1895454"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341496"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1126\/science.abq1158"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1177\/02783649211046285"},{"key":"ref21","article-title":"Inverse reward design","volume":"30","author":"Hadfield-Menell","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref22","volume-title":"Interpretable machine learning","author":"Molnar","year":"2020"},{"key":"ref23","article-title":"How hard is my mdp?","volume":"27","author":"Maillard","year":"2014","journal-title":"the distribution-norm to the rescue\",\" Advances in Neural Information Processing Systems"},{"key":"ref24","article-title":"Multigrid mdp using llm","author":"Antunes","year":"2026"}],"event":{"name":"2026 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC)","location":"Barcelos, Portugal","start":{"date-parts":[[2026,4,22]]},"end":{"date-parts":[[2026,4,23]]}},"container-title":["2026 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11523214\/11523222\/11523235.pdf?arnumber=11523235","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T06:34:24Z","timestamp":1779345264000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11523235\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4,22]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/icarsc70216.2026.11523235","relation":{},"subject":[],"published":{"date-parts":[[2026,4,22]]}}}