{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T22:21:59Z","timestamp":1777501319251,"version":"3.51.4"},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1109\/apsipa.2017.8282005","type":"proceedings-article","created":{"date-parts":[[2018,2,14]],"date-time":"2018-02-14T15:31:33Z","timestamp":1518622293000},"page":"076-082","source":"Crossref","is-referenced-by-count":5,"title":["An integrated framework for multimodal human-robot interaction"],"prefix":"10.1109","author":[{"given":"Luis Fernando","family":"D'Haro","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andreea I.","family":"Niculescu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Caixia","family":"Cai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Suraj","family":"Nair","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rafael E.","family":"Banchs","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alois","family":"Knoll","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haizhou","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref30","article-title":"Strategies to cope with errors in human-machine spoken interactions: using chatbots as back-off mechanism for task-oriented dialogues","author":"niculescu","year":"2015","journal-title":"Proceedings ERRARE 2015-Errors by Humans and Machines in multimedia multimodal and multilingual data processing"},{"key":"ref10","author":"van den oord","year":"2016","journal-title":"WaveNet A Generative Model for Raw Audio"},{"key":"ref11","author":"arik","year":"2017","journal-title":"Deep Voice Real-time neural text-to-speech"},{"key":"ref12","article-title":"CMU's robust spoken language understanding system","volume":"93","author":"sunil","year":"1993","journal-title":"Proceedings of EUROSPEECH"},{"key":"ref13","article-title":"Stochastic Representation of Conceptual Structure in the ATIS Task","author":"roberto","year":"0","journal-title":"HLT 1991"},{"key":"ref14","first-page":"2205","article-title":"Natural language understanding using statistical machine translation","author":"klaus","year":"2001","journal-title":"InterSpeech"},{"key":"ref15","first-page":"4077","article-title":"Recurrent conditional random field for language understanding","author":"kaisheng","year":"2014","journal-title":"Proceedings IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP) 2014"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2303296"},{"key":"ref17","author":"jaech","year":"2016","journal-title":"Domain adaptation of recurrent neural networks for natural language understanding"},{"key":"ref18","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1109\/89.817450","article-title":"A stochastic model of human-machine interaction for learning dialog strategies","volume":"8","author":"esther","year":"2000","journal-title":"IEEE Transactions on Speech and Audio Processing"},{"key":"ref19","first-page":"716","article-title":"Automating spoken dialogue management design using machine learning: An industry perspective","author":"tim","year":"2008","journal-title":"Speech communication 50"},{"key":"ref28","first-page":"840","article-title":"Configuration of dialogue agent with multiple knowledge sources","author":"ridong","year":"2015","journal-title":"Signal and Information Processing Association Annual Summit and Conference (APSIPA) 2015 Asia-Pacific"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2011.05.008"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1109\/79.536824","article-title":"A review of large-vocabulary continuous-speech","volume":"13","author":"young","year":"1996","journal-title":"Signal Processing Magazine"},{"key":"ref6","article-title":"Which ASR should I choose for my dialogue system?","author":"morbini","year":"2013","journal-title":"Proc SIGDial"},{"key":"ref29","article-title":"A configurable dialogue platform for ASORO robots","author":"ridong","year":"2011","journal-title":"Asia Pacific Signal and Information Processing Association Annual Summit and Conference APSIPA ASC"},{"key":"ref5","author":"wayne","year":"2016","journal-title":"Achieving human parity in conversational speech recognition"},{"key":"ref8","volume":"33","author":"ehud","year":"2000","journal-title":"Building Natural Language Generation Systems"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-299"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2974804.2974805"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1996.541110"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCIS.2015.7274565"},{"key":"ref20","first-page":"67","article-title":"OpenDial: A toolkit for developing spoken dialogue systems with probabilistic rules","author":"pierre","year":"2016","journal-title":"ACL 2016"},{"key":"ref22","article-title":"trindikit.py: An open-source Python library for developing ISU-based dialogue systems","author":"peter","year":"2009","journal-title":"Proc of IWSDS 9"},{"key":"ref21","first-page":"931","article-title":"GALAXY-II: a reference architecture for conversational system development","volume":"98","year":"1998","journal-title":"ICSLP"},{"key":"ref24","article-title":"When industrial robots become more social: on the desihn and evaluation of a multimodal interface for welding robots","year":"2017","journal-title":"APSIPA"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IUSER.2014.7002667"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-85729-414-2_8"},{"key":"ref25","first-page":"47","article-title":"A robust spoken Q&A system with scarce in-domain resources","author":"luis fernando","year":"2015","journal-title":"Signal and Information Processing Association Annual Summit and Conference (APSIPA) 2015 Asia-Pacific"}],"event":{"name":"2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","location":"Kuala Lumpur","start":{"date-parts":[[2017,12,12]]},"end":{"date-parts":[[2017,12,15]]}},"container-title":["2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8270695\/8281978\/08282005.pdf?arnumber=8282005","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,10]],"date-time":"2019-10-10T20:20:15Z","timestamp":1570738815000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/8282005\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/apsipa.2017.8282005","relation":{},"subject":[],"published":{"date-parts":[[2017,12]]}}}