{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:12:54Z","timestamp":1740100374855,"version":"3.37.3"},"reference-count":11,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:00:00Z","timestamp":1634688000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:00:00Z","timestamp":1634688000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:00:00Z","timestamp":1634688000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003561","name":"Ministry of Culture, Sports and Tourism (MCST)","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003561","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006465","name":"Korea Creative Content Agency (KOCCA)","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100006465","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,10,20]]},"DOI":"10.1109\/ictc52510.2021.9620856","type":"proceedings-article","created":{"date-parts":[[2021,12,7]],"date-time":"2021-12-07T20:49:57Z","timestamp":1638910197000},"page":"283-286","source":"Crossref","is-referenced-by-count":0,"title":["An Efficient Policy Improvement in Human Interactive Learning Using Entropy"],"prefix":"10.1109","author":[{"given":"Sung-Yun","family":"Park","sequence":"first","affiliation":[]},{"given":"Dae-Wook","family":"Kim","sequence":"additional","affiliation":[]},{"given":"Sang-Kwang","family":"Lee","sequence":"additional","affiliation":[]},{"given":"Seong-Il","family":"Yang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"journal-title":"Learning from Human-generated Reward","year":"2012","author":"knox","key":"ref3"},{"key":"ref10","article-title":"Openai gym","author":"brockman","year":"0","journal-title":"ArXiv Preprint"},{"key":"ref6","first-page":"5","article-title":"Combining manual feedback with subsequent MDP reward signals for reinforcement learning","volume":"1","author":"knox","year":"0","journal-title":"IEEE International Conference on Autonomous Agents and Multiagent Systems"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/1597735.1597738"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4419-7970-4"},{"key":"ref8","article-title":"Deep tamer: Interactive agent shaping in high-dimensional state spaces","volume":"32","author":"warnell","year":"0","journal-title":"32nd AAAI Conference on Artificial Intelligence AAAI 2018"},{"key":"ref7","first-page":"4","article-title":"Reinforcement Learning from Simultaneous Human and MDP Reward","author":"knox","year":"0","journal-title":"2012 11th International Conference on Autonomous Agents and Multiagent Systems"},{"key":"ref2","first-page":"10","article-title":"On the numeric stability of gaussian processes regression for relational reinforcement learning","author":"ramon","year":"0","journal-title":"ICML-2004 Workshop on Relational Reinforcement Learning"},{"key":"ref9","article-title":"Deep q-learning from demonstrations","volume":"32","author":"hester","year":"0","journal-title":"32nd AAAI Conference on Artificial Intelligence AAAI 2018"},{"key":"ref1","first-page":"292","article-title":"TAMER: Training an Agent Manually via Evaluative Reinforcement","author":"knox","year":"0","journal-title":"2008 7th IEEE International Conference on Development and Learning"}],"event":{"name":"2021 International Conference on Information and Communication Technology Convergence (ICTC)","start":{"date-parts":[[2021,10,20]]},"location":"Jeju Island, Korea, Republic of","end":{"date-parts":[[2021,10,22]]}},"container-title":["2021 International Conference on Information and Communication Technology Convergence (ICTC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9620727\/9620211\/09620856.pdf?arnumber=9620856","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T16:53:37Z","timestamp":1652201617000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9620856\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,20]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/ictc52510.2021.9620856","relation":{},"subject":[],"published":{"date-parts":[[2021,10,20]]}}}