{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T07:24:02Z","timestamp":1730273042486,"version":"3.28.0"},"reference-count":26,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.1109\/iscslp.2018.8706581","type":"proceedings-article","created":{"date-parts":[[2019,5,20]],"date-time":"2019-05-20T22:58:35Z","timestamp":1558393115000},"page":"280-284","source":"Crossref","is-referenced-by-count":4,"title":["From Speech Signals to Semantics \u2014 Tagging Performance at Acoustic, Phonetic and Word Levels"],"prefix":"10.1109","author":[{"given":"Yao","family":"Qian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rutuja","family":"Ubale","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Patrick","family":"Lange","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Keelan","family":"Evanini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Frank","family":"Soong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.1109\/ASRU.2011.6163899"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.1109\/ASRU.2015.7404790"},{"doi-asserted-by":"publisher","key":"ref12","DOI":"10.1109\/ICASSP.2016.7472618"},{"key":"ref13","first-page":"6","article-title":"Architectures for deep neural network based acoustic models defined over windowed speech waveforms","author":"bhargava","year":"2015","journal-title":"Proc of Interspeech"},{"doi-asserted-by":"publisher","key":"ref14","DOI":"10.1109\/ICASSP.2016.7472652"},{"doi-asserted-by":"publisher","key":"ref15","DOI":"10.21437\/Interspeech.2016-686"},{"doi-asserted-by":"publisher","key":"ref16","DOI":"10.1109\/ICASSP.2017.7953076"},{"key":"ref17","article-title":"Exploring ASR-free end-to-end modeling to improve spoken language understanding in a cloud-based dialog system","author":"qian","year":"2017","journal-title":"Proc of ASRU"},{"key":"ref18","article-title":"Towards end-to-end modeling of spoken language understanding in a cloud-based spoken dialog system","author":"qian","year":"2017","journal-title":"Proc of SemDial"},{"doi-asserted-by":"publisher","key":"ref19","DOI":"10.1109\/ICASSP.2018.8461785"},{"doi-asserted-by":"publisher","key":"ref4","DOI":"10.1016\/j.specom.2005.06.001"},{"doi-asserted-by":"publisher","key":"ref3","DOI":"10.1109\/ICASSP.2011.5947636"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.3115\/1073445.1073446"},{"key":"ref5","article-title":"Learning spoken language without transcriptions","volume":"99","author":"gorin","year":"1999","journal-title":"Proc of ASRU"},{"key":"ref8","first-page":"1764","article-title":"Towards end-to-end speech recognition with recurrent neural networks","volume":"14","author":"graves","year":"2015","journal-title":"Proc of ICML"},{"key":"ref7","first-page":"553","article-title":"Speech utterance classification model training without manual transcriptions","volume":"1","author":"wang","year":"2006","journal-title":"Proc of ICASSP"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/ASRU.2013.6707709"},{"doi-asserted-by":"publisher","key":"ref9","DOI":"10.1109\/ICASSP.2011.5947700"},{"doi-asserted-by":"publisher","key":"ref1","DOI":"10.1109\/TASLP.2014.2383614"},{"doi-asserted-by":"publisher","key":"ref20","DOI":"10.1007\/978-3-319-42816-1_13"},{"doi-asserted-by":"publisher","key":"ref22","DOI":"10.1109\/ICASSP.2016.7472621"},{"doi-asserted-by":"publisher","key":"ref21","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref24","article-title":"The Kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"Prof of ASRU"},{"doi-asserted-by":"publisher","key":"ref23","DOI":"10.21437\/Interspeech.2016-82"},{"doi-asserted-by":"publisher","key":"ref26","DOI":"10.21437\/Interspeech.2016-291"},{"key":"ref25","first-page":"788798","article-title":"Front end factor analysis for speaker verification","volume":"19","author":"dehak","year":"2011","journal-title":"IEEE Transactions on Acoustics Speech and Signal Processing"}],"event":{"name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","start":{"date-parts":[[2018,11,26]]},"location":"Taipei City, Taiwan","end":{"date-parts":[[2018,11,29]]}},"container-title":["2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8701133\/8706262\/08706581.pdf?arnumber=8706581","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T00:18:49Z","timestamp":1598228329000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8706581\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/iscslp.2018.8706581","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}