{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,16]],"date-time":"2026-04-16T11:30:58Z","timestamp":1776339058195,"version":"3.51.2"},"reference-count":33,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,10]]},"DOI":"10.1109\/sped.2019.8906584","type":"proceedings-article","created":{"date-parts":[[2019,11,25]],"date-time":"2019-11-25T14:12:33Z","timestamp":1574691153000},"page":"1-8","source":"Crossref","is-referenced-by-count":10,"title":["Towards End-to-End spoken intent recognition in smart home"],"prefix":"10.1109","author":[{"given":"Thierry","family":"Desot","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Francois","family":"Portet","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michel","family":"Vacher","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1986.1169172"},{"key":"ref32","first-page":"1389","article-title":"The CIRDO corpus: comprehensive audio\/video database of domestic falls of elderly people","author":"vacher","year":"2016","journal-title":"Proceedings of the 10th International Conference on Language Resources and Evaluation (LREC 2016)"},{"key":"ref31","first-page":"707","article-title":"Etude de la performance des mod&#x00E8;les acoustiques pour des voix de personnes a?g&#x00E9;es en vue de l&#x2019;adaptation des syst&#x00E8;mes de RAP (assessment of the acoustic models performance in the ageing voice case for ASR system adaptation)[in French]","author":"aman","year":"2012","journal-title":"Actes de la conf&#x00E9;rence conjointe JEP-TALN-RECITAL 2012 volume 1 JEP ATALA\/AFCP"},{"key":"ref30","first-page":"1610","article-title":"A French non-native corpus for automatic speech recognition","volume":"6","author":"tan","year":"0","journal-title":"Proc Int Conference on Language Resources and Evaluation (LREC)"},{"key":"ref10","article-title":"The Kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"Tech Rep"},{"key":"ref11","article-title":"Parallel training of deep neural networks with natural gradient and parameter averaging","author":"povey","year":"2014"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2383614"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W17-5514"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-1352"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1274"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2008.925143"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"509","DOI":"10.1007\/978-3-030-00794-2_55","article-title":"Towards a French Smart-Home Voice Command Corpus: Design and NLU Experiments","author":"desot","year":"2018","journal-title":"International Conference on Text Speech and Dialogue"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/PERCOMW.2019.8730721"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1456"},{"key":"ref28","article-title":"A large reference corpus for spoken French: Eslo 1 and 2 and its variations","author":"serpollet","year":"2007","journal-title":"Proceedings from The Corpus Linguistics Conference Series"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.3115\/1613984.1613994"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1613\/jair.5477"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2018.8639513"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-1178"},{"key":"ref29","first-page":"1","article-title":"Analysis of disfluent repetitions in spontaneous speech recognition","author":"rangarajan","year":"2006","journal-title":"Signal Processing Conference 2006 14th European"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3115\/1220175.1220253"},{"key":"ref8","article-title":"Deep speech: Scaling up end-to-end speech recognition","author":"hannun","year":"2014"},{"key":"ref7","first-page":"3732","article-title":"Incorporating named entity recognition into the speech transcription process","author":"hatmi","year":"2013","journal-title":"Proc of Annual Conference of the International Speech Communication Association (Interspeech)"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461785"},{"key":"ref9","article-title":"Training neural speech recognition systems with synthetic speech augmentation","author":"li","year":"2018"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/9781119992691.ch3"},{"key":"ref20","first-page":"1","article-title":"Chainer: a next-generation open source framework for deep learning","volume":"5","author":"tokui","year":"2015","journal-title":"Proceedings of Workshop on Machine Learning Systems (LearningSys) in The Twenty-ninth Annual Conference on Neural Information Processing Systems (NIPS)"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"ref21","article-title":"Automatic differentiation in PyTorch","author":"paszke","year":"2017","journal-title":"NIPS-W"},{"key":"ref24","first-page":"4499","article-title":"The Sweet-Home speech and multimodal corpus for home automation interaction","author":"vacher","year":"2014","journal-title":"9th edition of the Language Resources and Evaluation Conference (LREC)"},{"key":"ref23","first-page":"173","article-title":"Deep speech 2: End-to-end speech recognition in English and Mandarin","author":"amodei","year":"2016","journal-title":"Proceedings of the International Conference on Machine Learning"},{"key":"ref26","first-page":"1234","article-title":"Sequence-to-sequence data augmentation for dialogue language understanding","author":"hou","year":"2018","journal-title":"Proceedings of the 27th International Conference on Computational Linguistics"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/DASC\/PiCom\/CBDCom\/CyberSciTech.2019.00149"}],"event":{"name":"2019 International Conference on Speech Technology and Human-Computer Dialogue (SpeD)","location":"Timisoara, Romania","start":{"date-parts":[[2019,10,10]]},"end":{"date-parts":[[2019,10,12]]}},"container-title":["2019 International Conference on Speech Technology and Human-Computer Dialogue (SpeD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8895628\/8906276\/08906584.pdf?arnumber=8906584","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,14]],"date-time":"2022-07-14T23:15:59Z","timestamp":1657840559000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8906584\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/sped.2019.8906584","relation":{},"subject":[],"published":{"date-parts":[[2019,10]]}}}