{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,23]],"date-time":"2026-02-23T21:45:03Z","timestamp":1771883103838,"version":"3.50.1"},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1109\/slt.2018.8639655","type":"proceedings-article","created":{"date-parts":[[2019,2,14]],"date-time":"2019-02-14T23:36:34Z","timestamp":1550187394000},"page":"521-527","source":"Crossref","is-referenced-by-count":69,"title":["Multilingual Sequence-to-Sequence Speech Recognition: Architecture, Transfer Learning, and Language Modeling"],"prefix":"10.1109","author":[{"given":"Jaejin","family":"Cho","sequence":"first","affiliation":[]},{"given":"Murali Karthick","family":"Baskar","sequence":"additional","affiliation":[]},{"given":"Ruizhi","family":"Li","sequence":"additional","affiliation":[]},{"given":"Matthew","family":"Wiesner","sequence":"additional","affiliation":[]},{"given":"Sri Harish","family":"Mallidi","sequence":"additional","affiliation":[]},{"given":"Nelson","family":"Yalta","sequence":"additional","affiliation":[]},{"given":"Martin","family":"Karafiat","sequence":"additional","affiliation":[]},{"given":"Shinji","family":"Watanabe","sequence":"additional","affiliation":[]},{"given":"Takaaki","family":"Hori","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6855089"},{"key":"ref30","article-title":"An investigation of deep neural networks for multilingual speech recognition training and adaptation","author":"tong","year":"2017","journal-title":"Tech Rep"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6855129"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2016.7846330"},{"key":"ref12","article-title":"Multilingual training and cross-lingual adaptation on CTC-based acoustic model","author":"tong","year":"2017","journal-title":"arXiv preprint arXiv 1711 11585"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2014.7078569"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-66429-3_47"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461802"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2017.8268945"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461972"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2017.2763455"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1910"},{"key":"ref28","first-page":"196","article-title":"RNNLM-recurrent neural network language modeling toolkit","author":"mikolov","year":"2011","journal-title":"Proc of the 2011 ASRU Workshop"},{"key":"ref4","first-page":"577","article-title":"Attention-based models for speech recognition","author":"chorowski","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-24797-2_2"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1456"},{"key":"ref5","first-page":"1764","article-title":"Towards end-to-end speech recognition with recurrent neural networks","volume":"14","author":"graves","year":"2014","journal-title":"ICML"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953164"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"ref2","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"2014","journal-title":"arXiv preprint arXiv 1409 0473"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2013.07.008"},{"key":"ref1","first-page":"3104","article-title":"Sequence to sequence learning with neural networks","author":"sutskever","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref20","article-title":"Monotonic chunkwise attention","author":"chiu","year":"2017","journal-title":"CoRR"},{"key":"ref22","author":"zhang","year":"2016","journal-title":"Towards End-to-End Speech Recognition with Deep Convolutional Neural Networks"},{"key":"ref21","author":"simonyan","year":"2014","journal-title":"Very Deep Convolutional Networks for Large-scale Image Recognition"},{"key":"ref24","article-title":"Advances in joint CTC-attention based end-to-end speech recognition with a deep cnn encoder and RNN-LM","author":"hori","year":"2017","journal-title":"arXiv preprint arXiv 1706 02737"},{"key":"ref23","first-page":"577","article-title":"Attention-based models for speech recognition","volume":"2015 january","author":"chorowski","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/78.650093"},{"key":"ref25","first-page":"1","article-title":"The kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding"}],"event":{"name":"2018 IEEE Spoken Language Technology Workshop (SLT)","location":"Athens, Greece","start":{"date-parts":[[2018,12,18]]},"end":{"date-parts":[[2018,12,21]]}},"container-title":["2018 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8632666\/8639030\/08639655.pdf?arnumber=8639655","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,27]],"date-time":"2022-01-27T07:52:56Z","timestamp":1643269976000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8639655\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,12]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/slt.2018.8639655","relation":{},"subject":[],"published":{"date-parts":[[2018,12]]}}}