{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T05:03:37Z","timestamp":1729659817450,"version":"3.28.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,8,17]],"date-time":"2021-08-17T00:00:00Z","timestamp":1629158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,8,17]],"date-time":"2021-08-17T00:00:00Z","timestamp":1629158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,8,17]],"date-time":"2021-08-17T00:00:00Z","timestamp":1629158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,8,17]]},"DOI":"10.1109\/cog52621.2021.9618999","type":"proceedings-article","created":{"date-parts":[[2021,12,7]],"date-time":"2021-12-07T20:53:06Z","timestamp":1638910386000},"page":"01-08","source":"Crossref","is-referenced-by-count":2,"title":["Interactive Explanations: Diagnosis and Repair of Reinforcement Learning Based Agent Behaviors"],"prefix":"10.1109","author":[{"given":"Christian Arzate","family":"Cruz","sequence":"first","affiliation":[]},{"given":"Takeo","family":"Igarashi","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1017\/S0269888919000079"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TG.2018.2808198"},{"key":"ref11","first-page":"1","article-title":"Interactive design exploration of game stages using adjustable synthetic testers","author":"suetake","year":"0","journal-title":"International Conference on the Foundations of Digital Games"},{"key":"ref12","article-title":"Customizing scripted bots: Sample efficient imitation learning for human-like behavior in minecraft","author":"broll","year":"0","journal-title":"AAMAS Workshop on Adaptive and Learning Agents 2019"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2019.8847995"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1609\/aiide.v16i1.7416","article-title":"Pcgrl: Procedural content generation via reinforcement learning","volume":"16","author":"khalifa","year":"0","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence and Interactive Digital Entertainment"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/DISA.2018.8490530"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3328485"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CoG47356.2020.9231843"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3332165.3347899"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/1166253.1166275"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3383668.3419938"},{"key":"ref4","first-page":"7","article-title":"Interestingness elements for explainable reinforcement learning through introspection","author":"sequeira","year":"0","journal-title":"IUI Workshops"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1000209"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CoG47356.2020.9231687"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2909824.3020233"},{"key":"ref29","first-page":"278","article-title":"Policy invariance under reward transformations: Theory and application to reward shaping","volume":"99","author":"ng","year":"1999","journal-title":"ICML"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.29007\/k3nd"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1106"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460937"},{"key":"ref2","first-page":"1","article-title":"Teaching on a budget in multiagent deep reinforcement learning","author":"ilhan","year":"0","journal-title":"2019 IEEE Conference on Games (COG)"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.11263"},{"key":"ref1","article-title":"Scalable agent alignment via reward modeling: a research direction","author":"leike","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3357236.3395525"},{"key":"ref22","article-title":"Interactive grounded language acquisition and generalization in a 2d world","author":"yu","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ROMAN.2011.6005223"},{"key":"ref24","article-title":"Guiding a reinforcement learner with natural language advice: Initial results in robocup soccer","author":"kuhlmann","year":"0","journal-title":"The AAAI-2004 Workshop on Supervisory Control of Learning and Adaptive Systems"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/985692.985712"},{"key":"ref26","article-title":"Metrics and continuity in reinforcement learning","author":"lan","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref25","article-title":"A survey of reinforcement learning informed by natural language","author":"whiteson","year":"0","journal-title":"International Joint Conferences on Artificial Intelligence"}],"event":{"name":"2021 IEEE Conference on Games (CoG)","start":{"date-parts":[[2021,8,17]]},"location":"Copenhagen, Denmark","end":{"date-parts":[[2021,8,20]]}},"container-title":["2021 IEEE Conference on Games (CoG)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9618888\/9618891\/09618999.pdf?arnumber=9618999","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,17]],"date-time":"2023-01-17T15:42:34Z","timestamp":1673970154000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9618999\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,17]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/cog52621.2021.9618999","relation":{},"subject":[],"published":{"date-parts":[[2021,8,17]]}}}