{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T10:05:09Z","timestamp":1729677909612,"version":"3.28.0"},"reference-count":19,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013,12]]},"DOI":"10.1109\/asru.2013.6707714","type":"proceedings-article","created":{"date-parts":[[2014,1,10]],"date-time":"2014-01-10T20:07:23Z","timestamp":1389384443000},"page":"108-113","source":"Crossref","is-referenced-by-count":5,"title":["Expert-based reward shaping and exploration scheme for boosting policy learning of dialogue management"],"prefix":"10.1109","author":[{"given":"Emmanuel","family":"Ferreira","sequence":"first","affiliation":[]},{"given":"Fabrice","family":"Lefevre","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2011-302","article-title":"User simulation in dialogue systems using inverse reinforcement learning","author":"chandramohan","year":"2011","journal-title":"InterSpeech"},{"key":"17","doi-asserted-by":"crossref","first-page":"483","DOI":"10.1613\/jair.3077","article-title":"Kalman temporal differences","volume":"39","author":"geist","year":"2010","journal-title":"Journal of Artificial Intelligence Research (JAIR)"},{"key":"18","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2011-434","article-title":"Uncertainty management for on-line optimisation of a pomdp-based large-scale spoken dialogue system","author":"daubigney","year":"2011","journal-title":"InterSpeech"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(98)00023-X"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1115\/1.3662552"},{"key":"13","first-page":"617","article-title":"Integrating reinforcement learning with human demonstrations of varying ability","author":"taylor","year":"0","journal-title":"The 10th International Conference on Autonomous Agents and Multiagent Systems 2011 AAMAS '11"},{"key":"14","article-title":"Integrating expert knowledge into pomdp optimization for spoken dialog systems","author":"williams","year":"2008","journal-title":"Proceedings of the AAAI-08 Workshop on Advancements in POMDP Solvers"},{"key":"11","article-title":"Policy invariance under reward transformations: Theory and application to reward shaping","author":"ng","year":"1999","journal-title":"ICML"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1162\/coli.2008.07-028-R2-05-82"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2009.04.001"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.1997.658989"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2012.2229257"},{"key":"7","article-title":"Effects of the user model on simulation-based learning of dialogue strategies","author":"schatztnann","year":"2005","journal-title":"ASRU"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1017\/S0269888906000944"},{"key":"5","article-title":"Unsupervised clustering of probability distributions of semantic graphs for pomdp based spoken dialogue systems with summary space","author":"pinault","year":"2011","journal-title":"Proc IJCAI Workshop Knowledge and Reasoning in Practical Dialogue Systems"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2009.07.003"},{"key":"9","doi-asserted-by":"crossref","first-page":"903","DOI":"10.1109\/JSTSP.2012.2229963","article-title":"Incremental sparse bayesian method for online dialog strategy learning","volume":"6","author":"sungjin","year":"2012","journal-title":"Journal on Selected Topics in Signal Processing"},{"key":"8","article-title":"Gaussian processes for fast policy optimisation of pomdp-based dialogue managers","author":"gasic","year":"2010","journal-title":"SIGdial"}],"event":{"name":"2013 IEEE Workshop on Automatic Speech Recognition & Understanding (ASRU)","start":{"date-parts":[[2013,12,8]]},"location":"Olomouc, Czech Republic","end":{"date-parts":[[2013,12,12]]}},"container-title":["2013 IEEE Workshop on Automatic Speech Recognition and Understanding"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6695806\/6707689\/06707714.pdf?arnumber=6707714","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,3,23]],"date-time":"2022-03-23T01:01:36Z","timestamp":1647997296000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6707714\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,12]]},"references-count":19,"URL":"https:\/\/doi.org\/10.1109\/asru.2013.6707714","relation":{},"subject":[],"published":{"date-parts":[[2013,12]]}}}