{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T05:40:28Z","timestamp":1775281228738,"version":"3.50.1"},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013,5]]},"DOI":"10.1109\/icassp.2013.6639201","type":"proceedings-article","created":{"date-parts":[[2013,10,29]],"date-time":"2013-10-29T19:19:46Z","timestamp":1383074386000},"page":"7893-7897","source":"Crossref","is-referenced-by-count":235,"title":["KL-divergence regularized deep neural network adaptation for improved large vocabulary speech recognition"],"prefix":"10.1109","author":[{"given":"Dong","family":"Yu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kaisheng","family":"Yao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hang","family":"Su","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gang","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Frank","family":"Seide","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15760-8_54"},{"key":"17","doi-asserted-by":"crossref","first-page":"2857","DOI":"10.21437\/Interspeech.2011-715","article-title":"Improving lvcsr system combination using neural network language model cross adaptation","author":"liu","year":"2011","journal-title":"Proc Interspeech'11"},{"key":"18","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2012-9","article-title":"A initial attempt on task-specific adaptation for deep neural networkbased large vocabulary continuous speech recognition","author":"xiao","year":"2012","journal-title":"Proc Interspeech'10"},{"key":"15","doi-asserted-by":"crossref","first-page":"526","DOI":"10.21437\/Interspeech.2010-214","article-title":"Comparison of discriminative input and output transformations for speaker adaptation in the Hybrid NN\/HMM systems","author":"li","year":"2010","journal-title":"Proc Interspeech'10"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2006.11.005"},{"key":"13","doi-asserted-by":"crossref","first-page":"2171","DOI":"10.21437\/Eurospeech.1995-411","article-title":"Speaker-adaptation for hybrid HMM-ANN continuous speech recognition system","author":"neto","year":"1995","journal-title":"Proc EuroSpeech'95"},{"key":"14","first-page":"1112","article-title":"Hybrid HMM-NN modeling of stationary-transitional units for continuous speech recognition","author":"albesano","year":"1997","journal-title":"Proc NIPS 97"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"12","doi-asserted-by":"crossref","first-page":"2183","DOI":"10.21437\/Eurospeech.1995-414","article-title":"Connectionist speaker normalization and adaptation","author":"abrash","year":"1995","journal-title":"Proc EuroSpeech'95"},{"key":"21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2005.1415279"},{"key":"20","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2012.6424251"},{"key":"22","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2006.1716291"},{"key":"23","article-title":"Regularized adaptation of discriminative classifiers","author":"li","year":"2006","journal-title":"Proc ICASSP'06"},{"key":"24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2000.862102"},{"key":"25","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2011.6163899"},{"key":"26","article-title":"Factorized deep neural networks for adaptive speech recognition","author":"yu","year":"2012","journal-title":"International Workshop on Statistical Machine Learning for Speech Processing"},{"key":"27","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2012.2227738"},{"key":"28","author":"snoek","year":"2012","journal-title":"Practical Bayesian Optimization of Machine Learning Algorithms"},{"key":"29","doi-asserted-by":"crossref","first-page":"1348","DOI":"10.1109\/TASL.2009.2020890","article-title":"A novel framework and training algorithm for variable-parameter hidden markov models","volume":"17","author":"yu","year":"2009","journal-title":"IEEE Trans on Audio Speech and Language Processing"},{"key":"3","doi-asserted-by":"crossref","first-page":"437","DOI":"10.21437\/Interspeech.2011-169","article-title":"Conversational speech transcription using context-dependent deep neural networks","author":"seide","year":"2011","journal-title":"Proc Interspeech'11"},{"key":"2","article-title":"Roles of pretraining and finetuning in context-dependent DNN-HMMs for real-world speech recognition","author":"yu","year":"2010","journal-title":"Proc NIPS Workshop on Deep Learning and Unsupervised Feature Learning"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639100"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2134090"},{"key":"30","doi-asserted-by":"crossref","first-page":"554","DOI":"10.21437\/Interspeech.2010-221","article-title":"On speaker adaptive training of artificial neural networks","author":"trmal","year":"2010","journal-title":"Proc Interspeech'10"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2011.6163900"},{"key":"6","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2012-10","article-title":"Application of pretrained deep neural networks to large vocabulary speech recognition","author":"jaitly","year":"2012","journal-title":"Proc Interspeech'10"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2109382"},{"key":"4","first-page":"2709","article-title":"Automated directory assistance system-From theory to practice","author":"yu","year":"2007","journal-title":"Proc Interspeech'07"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638951"},{"key":"8","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2012-3","article-title":"Scalable minimum bayes risk training of deep neural network acoustic models using distributed hessian-free optimization","author":"kingsbury","year":"2012","journal-title":"Proc Interspeech'10"}],"event":{"name":"ICASSP 2013 - 2013 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Vancouver, BC, Canada","start":{"date-parts":[[2013,5,26]]},"end":{"date-parts":[[2013,5,31]]}},"container-title":["2013 IEEE International Conference on Acoustics, Speech and Signal Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6619549\/6637585\/06639201.pdf?arnumber=6639201","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,5]],"date-time":"2023-07-05T15:23:08Z","timestamp":1688570588000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6639201\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,5]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/icassp.2013.6639201","relation":{},"subject":[],"published":{"date-parts":[[2013,5]]}}}