{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T04:28:52Z","timestamp":1754108932011,"version":"3.28.0"},"reference-count":29,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T00:00:00Z","timestamp":1639353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T00:00:00Z","timestamp":1639353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,12,13]]},"DOI":"10.1109\/asru51503.2021.9688234","type":"proceedings-article","created":{"date-parts":[[2022,2,3]],"date-time":"2022-02-03T15:31:00Z","timestamp":1643902260000},"page":"954-961","source":"Crossref","is-referenced-by-count":10,"title":["Multitask Generative Adversarial Imitation Learning for Multi-Domain Dialogue System"],"prefix":"10.1109","author":[{"given":"Chuan-En","family":"Hsu","sequence":"first","affiliation":[{"name":"National Yang Ming Chiao Tung University,Dept of Electrical and Computer Engineering,Taiwan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mahdin","family":"Rohmatillah","sequence":"additional","affiliation":[{"name":"National Yang Ming Chiao Tung University,Dept of Electrical and Computer Engineering,Taiwan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jen-Tzung","family":"Chien","sequence":"additional","affiliation":[{"name":"National Yang Ming Chiao Tung University,Dept of Electrical and Computer Engineering,Taiwan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","first-page":"297","article-title":"Is your goal-oriented dialog model performing really well? empirical analysis of system-wise evaluation","author":"takanobu","year":"0","journal-title":"Proc of Annual Meeting of the Special Interest Group on Discourse and Dialogue"},{"key":"ref11","first-page":"4572","article-title":"Generative adversarial imitation learning","volume":"29","author":"ho","year":"0","journal-title":"Advances in neural information processing systems"},{"key":"ref12","first-page":"3675","article-title":"Hierarchical deep reinforcement learning: Integrating temporal abstraction and intrinsic motivation","volume":"29","author":"kulkarni","year":"0","journal-title":"Advances in neural information processing systems"},{"key":"ref13","article-title":"MGAN: Training generative adversarial nets with multiple generators","author":"hoang","year":"0","journal-title":"Proc of International Conference on Learning Representations"},{"key":"ref14","article-title":"MultiWOZ 2.1: Multi-domain dialogue state corrections and state tracking baselines","author":"eric","year":"2019","journal-title":"ArXiv Preprint"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-demos.19"},{"key":"ref16","first-page":"4496","article-title":"Distral: Robust multitask reinforcement learning","author":"teh","year":"0","journal-title":"Advances in neural information processing systems"},{"key":"ref17","first-page":"1407","article-title":"IMPALA: Scalable distributed deep-RL with importance weighted actor-learner architectures","author":"espeholt","year":"0","journal-title":"Proc of International Conference on Machine Learning"},{"key":"ref18","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","author":"mnih","year":"0","journal-title":"Proc of International Conference on Machine Learning"},{"key":"ref19","first-page":"2672","article-title":"Generative adversarial nets","volume":"27","author":"goodfellow","year":"0","journal-title":"Advances in neural information processing systems"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1313"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.59"},{"key":"ref27","first-page":"4171","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"devlin","year":"0","journal-title":"Proc of Conference of North American Chapter of Association for Computational Linguistics Human Language Technologies"},{"key":"ref3","article-title":"Proximal policy optimization algorithms","author":"schulman","year":"2017","journal-title":"ArXiv Preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.273"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1383"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.209"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-534"},{"key":"ref7","article-title":"Personalizing a dialogue system with transfer reinforcement learning","author":"mo","year":"0","journal-title":"Proc of AAAI Conference on Artificial Intelligence"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1010"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482333"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s11431-020-1692-3"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2019.8903084"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/MLSP.2017.8168121"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2019.8903147"},{"key":"ref24","first-page":"1611","article-title":"Multiple target prediction for deep reinforcement learning","author":"chien","year":"0","journal-title":"Proc of Asia-Pacific Signal and Information Processing Association Annual Summit and Conference"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.23919\/Eusipco47968.2020.9287440"},{"key":"ref26","article-title":"Algorithms for inverse reinforcement learning","author":"ng","year":"0","journal-title":"Proc of International Conference on Machine Learning"},{"key":"ref25","first-page":"3540","article-title":"FeUdal networks for hierarchical reinforcement learning","author":"vezhnevets","year":"0","journal-title":"Proc of International Conference on Machine Learning"}],"event":{"name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","start":{"date-parts":[[2021,12,13]]},"location":"Cartagena, Colombia","end":{"date-parts":[[2021,12,17]]}},"container-title":["2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9687821\/9687855\/09688234.pdf?arnumber=9688234","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,16]],"date-time":"2022-05-16T16:41:45Z","timestamp":1652719305000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9688234\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,12,13]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/asru51503.2021.9688234","relation":{},"subject":[],"published":{"date-parts":[[2021,12,13]]}}}