{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,18]],"date-time":"2026-01-18T03:09:50Z","timestamp":1768705790249,"version":"3.49.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,9,8]],"date-time":"2021-09-08T00:00:00Z","timestamp":1631059200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,9,8]],"date-time":"2021-09-08T00:00:00Z","timestamp":1631059200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,9,8]],"date-time":"2021-09-08T00:00:00Z","timestamp":1631059200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100005762","name":"National Taiwan University Hospital","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100005762","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,9,8]]},"DOI":"10.1109\/ichms53169.2021.9582667","type":"proceedings-article","created":{"date-parts":[[2021,10,27]],"date-time":"2021-10-27T20:07:19Z","timestamp":1635365239000},"page":"1-6","source":"Crossref","is-referenced-by-count":7,"title":["Human-Centered AI using Ethical Causality and Learning Representation for Multi-Agent Deep Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Joshua","family":"Ho","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chien-Min","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref32","article-title":"Causality for machine learning","author":"bernhard","year":"2019","journal-title":"arXiv preprint arXiv 1911 12945"},{"key":"ref31","year":"2021","journal-title":"Learning from Human P"},{"key":"ref30","author":"naumov","year":"2021","journal-title":"Ethical Dilemmas in Strategic Games"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"12487e","DOI":"10.1111\/exsy.12487","article-title":"Situation? centered goal reinforcement of activities of daily living in smart home environments","volume":"37 1","author":"oyeleke","year":"2020","journal-title":"Expert Systems"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3035728"},{"key":"ref12","article-title":"Interactive learning from policy-dependent human feedback","author":"macglashan","year":"2017","journal-title":"International Conference on Machine Learning"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3029798.3038381"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3390\/app10165574"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-57321-8_5"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ROMAN.2012.6343862"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-39077-2_13"},{"key":"ref19","year":"2021","journal-title":"Fast reinforcement learning through the composition of behaviours"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5887"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/JAS.2017.7510604"},{"key":"ref27","article-title":"Scaling data-driven robotics with reward sketching and batch reinforcement learning","author":"cabi","year":"2019","journal-title":"arXiv preprint arXiv 1909 11324"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3277904"},{"key":"ref6","doi-asserted-by":"crossref","DOI":"10.1609\/aiide.v15i1.5237","article-title":"Improving deep reinforcement learning in minecraft with action advice","volume":"15","author":"frazier","year":"2019","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence and Interactive Digital Entertainment"},{"key":"ref29","article-title":"Toward causal representation learning","author":"bernhard","year":"2021","journal-title":"Proceedings of the IEEE"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3434074.3446361"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376701"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/AIKE48582.2020.00031"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/THMS.2019.2912447"},{"key":"ref9","article-title":"Human-centered collaborative robots with deep reinforcement learning","author":"ghadirzadeh","year":"2020","journal-title":"IEEE l of Robotics and Automation"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3414472"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5955"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICHMS49158.2020.9209525"},{"key":"ref21","article-title":"Transfer in deep reinforcement learning using successor features and generalised policy improvement","author":"barreto","year":"2018","journal-title":"International Conference on Machine Learning"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3377325.3377512"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICHMS49158.2020.9209555"},{"key":"ref26","article-title":"Acme: A research framework for distributed reinforcement learning","author":"hoffman","year":"2020","journal-title":"arXiv preprint arXiv 2006 04989"},{"key":"ref25","author":"lu","year":"2021","journal-title":"Decentralized Policy Gradient Descent Ascent for Safe Multi-Agent Reinforcement Learning"}],"event":{"name":"2021 IEEE 2nd International Conference on Human-Machine Systems (ICHMS)","location":"Magdeburg, Germany","start":{"date-parts":[[2021,9,8]]},"end":{"date-parts":[[2021,9,10]]}},"container-title":["2021 IEEE 2nd International Conference on Human-Machine Systems (ICHMS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9582416\/9582443\/09582667.pdf?arnumber=9582667","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,11]],"date-time":"2023-11-11T20:57:45Z","timestamp":1699736265000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9582667\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,9,8]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/ichms53169.2021.9582667","relation":{},"subject":[],"published":{"date-parts":[[2021,9,8]]}}}