{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T11:12:37Z","timestamp":1762341157733,"version":"3.28.0"},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,7]]},"DOI":"10.1109\/hsi.2018.8431232","type":"proceedings-article","created":{"date-parts":[[2018,8,13]],"date-time":"2018-08-13T18:11:17Z","timestamp":1534183877000},"page":"50-56","source":"Crossref","is-referenced-by-count":53,"title":["A Vision and Speech Enabled, Customizable, Virtual Assistant for Smart Environments"],"prefix":"10.1109","author":[{"given":"Giancarlo","family":"Iannizzotto","sequence":"first","affiliation":[]},{"given":"Lucia Lo","family":"Bello","sequence":"additional","affiliation":[]},{"given":"Andrea","family":"Nucita","sequence":"additional","affiliation":[]},{"given":"Giorgio Mario","family":"Grasso","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ETFA.2008.4638508"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/HSI.2010.5514504"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2016.2527299"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298682"},{"journal-title":"Natural TTS Synthesis by Conditioning WaveNet on Mel Spectrogram Predictions","year":"2017","author":"shen","key":"ref12"},{"key":"ref13","article-title":"Deep speech: Scaling up end-to-end speech recognition","volume":"abs 1412 5567","author":"hannun","year":"2014","journal-title":"CoRR"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1023\/A:1025708916924"},{"key":"ref15","first-page":"204","article-title":"Flite: a small fast run-time synthesis engine","author":"black","year":"2001","journal-title":"4th ITRW on Speech Synthesis"},{"key":"ref16","first-page":"509","article-title":"Festival speaks italian!","author":"cosi","year":"2001","journal-title":"EUROSPEECH 2001 Scandinavia 7th European Conference on Speech Communication and Technology 2nd INTERSPEECH Event"},{"journal-title":"Snowboy hotword detection","year":"2018","key":"ref17"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2006.1659988"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000013087.49260.fb"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/HSI.2010.5514566"},{"journal-title":"Embodied Conversational Agents","year":"2000","key":"ref4"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3174042"},{"key":"ref3","first-page":"359","article-title":"The persona effect: Affective impact of animated pedagogical agents","author":"lester","year":"1997","journal-title":"Proceedings of the ACM SIGCHI Conference on Human Factors in Computing Systems CHI '97"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1186\/s40469-015-0006-9"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1142\/S021800141455009X"},{"key":"ref5","first-page":"123","author":"andr\u00e9","year":"2010","journal-title":"Interacting with Embodied Conversational Agents"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/T-AFFC.2011.34"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-3628"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1007\/978-3-540-74997-4_12","article-title":"Creating rapport with virtual agents","author":"gratch","year":"2007","journal-title":"Intelligent Virtual Agents"},{"key":"ref9","first-page":"63","author":"martinez","year":"2016","journal-title":"Advances Challenges and Opportunities in Automatic Facial Expression Recognition"},{"key":"ref1","article-title":"The insecurity of home digital voice assistants - amazon alexa as a case study","volume":"abs 1712 3327","author":"lei","year":"2017","journal-title":"CoRR"},{"journal-title":"Open Source Computer Vision Library","year":"2015","key":"ref20"},{"journal-title":"High quality face recognition with deep metric learning","year":"2017","author":"king","key":"ref22"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref24","first-page":"189","author":"learned-miller","year":"2016","journal-title":"Labeled faces in the wild A survey"},{"key":"ref23","first-page":"1755","article-title":"Dlib-ml: A machine learning toolkit","volume":"10","author":"king","year":"2009","journal-title":"Journal of Machine Learning Research"},{"key":"ref26","first-page":"33","article-title":"Bukimi no tani [The uncanny valley]","volume":"7","author":"mori","year":"1970","journal-title":"Energy"},{"journal-title":"Mycroft an open source artificial intelligence for everyone","article-title":"MycroftAI","year":"2018","key":"ref25"}],"event":{"name":"2018 11th International Conference on Human System Interaction (HSI)","start":{"date-parts":[[2018,7,4]]},"location":"Gdansk","end":{"date-parts":[[2018,7,6]]}},"container-title":["2018 11th International Conference on Human System Interaction (HSI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8417135\/8430754\/08431232.pdf?arnumber=8431232","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T08:19:50Z","timestamp":1643185190000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8431232\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,7]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/hsi.2018.8431232","relation":{},"subject":[],"published":{"date-parts":[[2018,7]]}}}