{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,24]],"date-time":"2025-10-24T13:15:55Z","timestamp":1761311755088},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,1,19]]},"DOI":"10.1109\/slt48900.2021.9383623","type":"proceedings-article","created":{"date-parts":[[2021,3,25]],"date-time":"2021-03-25T20:46:54Z","timestamp":1616705214000},"source":"Crossref","is-referenced-by-count":12,"title":["Benchmarking LF-MMI, CTC And RNN-T Criteria For Streaming ASR"],"prefix":"10.1109","author":[{"given":"Xiaohui","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Frank","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chunxi","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kjell","family":"Schubert","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Julian","family":"Chan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pradyot","family":"Prakash","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ching-Feng","family":"Yeh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fuchun","family":"Peng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yatharth","family":"Saraf","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Geoffrey","family":"Zweig","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref31","article-title":"Dual application of speech enhancement for automatic speech recognition","author":"pandey","year":"2021","journal-title":"Proc SLT"},{"key":"ref30","article-title":"Improving RNN transducer based ASR with auxiliary tasks","author":"liu","year":"2021","journal-title":"Proc SLT"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003854"},{"key":"ref11","article-title":"Multilingual graphemic hybrid ASR with massive data augmentation","author":"liu","year":"2020","journal-title":"Proc of the 1st Joint Workshop on Spoken Language Technologies for Under-resourced languages (SLTU) and Collaboration and Computing for Under-Resourced Languages (CCURL)"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1344"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-595"},{"key":"ref14","article-title":"Exploring neural transducers for end-to-end speech recognition","author":"battenberg","year":"2017","journal-title":"Proc ASRU"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2846"},{"key":"ref16","article-title":"Rnn-t for latency controlled asr with improved beam search","author":"jain","year":"2019"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462682"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003972"},{"key":"ref19","article-title":"Efficient dynamic wfst decoding for personalized language models","author":"liu","year":"2019"},{"key":"ref28","article-title":"Alignment restricted streaming recurrent neural network transducer","author":"mahadeokar","year":"2021","journal-title":"Proc SLT"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"ref27","article-title":"Minimum latency training strategies for streaming sequence-to-sequence ASR","author":"inaguma","year":"2020","journal-title":"Proc ICASSP"},{"key":"ref3","article-title":"Attention-based models for speech recognition","author":"chorowski","year":"2015","journal-title":"Proc NueralIPS"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054345"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9052964"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707758"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1995"},{"key":"ref2","article-title":"Sequence Transduction with Recurrent Neural Networks","author":"graves","year":"2012","journal-title":"Proc ICML"},{"key":"ref9","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2017-1566","article-title":"Neural speech recognizer: Acoustic-to-word LSTM model for large vocabulary speech recognition","author":"soltau","year":"2017","journal-title":"Proc INTERSPEECH"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143891"},{"key":"ref20","article-title":"Audio augmentation for speech recognition","author":"ko","year":"2015","journal-title":"Proc INTERSPEECH"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2460"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2680"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003906"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2840"},{"key":"ref26","article-title":"Advancing Acoustic-to-Word CTC Model with Attention and Mixed-Units","author":"das","year":"2018","journal-title":"IEEE TASLP"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003834"}],"event":{"name":"2021 IEEE Spoken Language Technology Workshop (SLT)","location":"Shenzhen, China","start":{"date-parts":[[2021,1,19]]},"end":{"date-parts":[[2021,1,22]]}},"container-title":["2021 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9383468\/9383452\/09383623.pdf?arnumber=9383623","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,31]],"date-time":"2021-05-31T21:30:42Z","timestamp":1622496642000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9383623\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,19]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/slt48900.2021.9383623","relation":{},"subject":[],"published":{"date-parts":[[2021,1,19]]}}}