{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T15:08:49Z","timestamp":1725808129800},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6,6]]},"DOI":"10.1109\/icassp39728.2021.9414029","type":"proceedings-article","created":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T15:53:45Z","timestamp":1620921225000},"page":"7493-7497","source":"Crossref","is-referenced-by-count":9,"title":["RNN Transducer Models for Spoken Language Understanding"],"prefix":"10.1109","author":[{"given":"Samuel","family":"Thomas","sequence":"first","affiliation":[{"name":"IBM Research AI"}]},{"given":"Hong-Kwang J.","family":"Kuo","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"George","family":"Saon","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"Zoltan","family":"Tuske","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"Brian","family":"Kingsbury","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"Gakuto","family":"Kurata","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"Zvi","family":"Kons","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]},{"given":"Ron","family":"Hoory","sequence":"additional","affiliation":[{"name":"IBM Research AI"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref31","DOI":"10.21437\/Interspeech.2019-1705"},{"doi-asserted-by":"publisher","key":"ref30","DOI":"10.21236\/ADA460245"},{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.1109\/ICASSP40776.2020.9054417"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.21437\/Interspeech.2020-1963"},{"doi-asserted-by":"publisher","key":"ref12","DOI":"10.21437\/Interspeech.2020-1160"},{"doi-asserted-by":"publisher","key":"ref13","DOI":"10.21437\/Interspeech.2020-0059"},{"doi-asserted-by":"publisher","key":"ref14","DOI":"10.21437\/Interspeech.2020-2924"},{"doi-asserted-by":"publisher","key":"ref15","DOI":"10.1109\/ICASSP40776.2020.9054314"},{"doi-asserted-by":"publisher","key":"ref16","DOI":"10.1109\/ICASSP.2005.1415176"},{"doi-asserted-by":"publisher","key":"ref17","DOI":"10.1109\/TASL.2008.2001106"},{"year":"2012","author":"graves","article-title":"Sequence transduction with recurrent neural networks","key":"ref18"},{"doi-asserted-by":"publisher","key":"ref19","DOI":"10.1109\/ICASSP.2019.8682336"},{"doi-asserted-by":"publisher","key":"ref28","DOI":"10.21437\/Interspeech.2019-2841"},{"doi-asserted-by":"publisher","key":"ref4","DOI":"10.1109\/ICASSP.2018.8461718"},{"key":"ref27","article-title":"Audio augmentation for speech recognition","author":"ko","year":"2015","journal-title":"Proc INTERSPEECH"},{"key":"ref3","article-title":"Exploring ASR-free end-to-end modeling to improve spoken language understanding in a cloud-based dialog system","author":"qian","year":"2017","journal-title":"Proc IEEE ASRU Workshop"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.21437\/Interspeech.2019-2396"},{"doi-asserted-by":"publisher","key":"ref29","DOI":"10.21437\/Interspeech.2019-1952"},{"doi-asserted-by":"publisher","key":"ref5","DOI":"10.1109\/SLT.2018.8639513"},{"doi-asserted-by":"publisher","key":"ref8","DOI":"10.1109\/ICASSP40776.2020.9053281"},{"doi-asserted-by":"publisher","key":"ref7","DOI":"10.21437\/Interspeech.2019-1832"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/SLT.2018.8639043"},{"doi-asserted-by":"publisher","key":"ref9","DOI":"10.1109\/ICASSP40776.2020.9053063"},{"doi-asserted-by":"publisher","key":"ref1","DOI":"10.1109\/ICASSP.2018.8461785"},{"key":"ref20","article-title":"Exploring architectures, data and units for streaming end-to-end speech recognition with RNN-transducer","author":"rao","year":"2017","journal-title":"Proc IEEE ASRU Workshop"},{"doi-asserted-by":"publisher","key":"ref22","DOI":"10.21437\/Interspeech.2019-1943"},{"doi-asserted-by":"publisher","key":"ref21","DOI":"10.1109\/ASRU46091.2019.9003906"},{"key":"ref24","article-title":"Advancing RNN transducer technology for speech recognition","author":"saon","year":"2021","journal-title":"Proc ICASSP"},{"doi-asserted-by":"publisher","key":"ref23","DOI":"10.1109\/ICASSP40776.2020.9054419"},{"doi-asserted-by":"publisher","key":"ref26","DOI":"10.3115\/116580.116613"},{"doi-asserted-by":"publisher","key":"ref25","DOI":"10.1145\/1553374.1553380"}],"event":{"name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2021,6,6]]},"location":"Toronto, ON, Canada","end":{"date-parts":[[2021,6,11]]}},"container-title":["ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9413349\/9413350\/09414029.pdf?arnumber=9414029","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T20:18:42Z","timestamp":1659471522000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9414029\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,6]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/icassp39728.2021.9414029","relation":{},"subject":[],"published":{"date-parts":[[2021,6,6]]}}}