{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,2]],"date-time":"2025-12-02T15:03:26Z","timestamp":1764687806567,"version":"3.28.0"},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8461979","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:24:48Z","timestamp":1537568688000},"page":"6094-6098","source":"Crossref","is-referenced-by-count":4,"title":["Modeling Non-Linguistic Contextual Signals in LSTM Language Models Via Domain Adaptation"],"prefix":"10.1109","author":[{"given":"Min","family":"Ma","sequence":"first","affiliation":[]},{"given":"Shankar","family":"Kumar","sequence":"additional","affiliation":[]},{"given":"Fadi","family":"Biadsy","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Nirschl","sequence":"additional","affiliation":[]},{"given":"Tomas","family":"Vykruta","sequence":"additional","affiliation":[]},{"given":"Pedro","family":"Moreno","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2017-1310","article-title":"Approaches for neural-network language model adaptation","author":"ma","year":"2017","journal-title":"Proceedings of the Interspeech"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1016\/S0079-7421(08)60536-8","article-title":"Catastrophic interference in connectionist networks: The sequential learning problem","volume":"24","author":"mccloskey","year":"1989","journal-title":"Psychology of Learning and Motivation"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-480"},{"key":"ref13","first-page":"1","article-title":"Learning representations by back-propagating errors","volume":"5","author":"david","year":"1988","journal-title":"Cognitive Modeling"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623612"},{"key":"ref15","first-page":"2121","article-title":"Adaptive subgradient methods for online learning and stochastic optimization","volume":"12","author":"duchi","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICFHR.2014.55"},{"key":"ref17","article-title":"Long short-term memory recurrent neural network architectures for large scale acoustic modeling","author":"sak","year":"2014","journal-title":"Fifteenth Annual Conference of the International Speech Communication Association"},{"key":"ref18","article-title":"LSTM: A search space odyssey","author":"klaus","year":"2016","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298932"},{"key":"ref4","article-title":"Recurrent neural network language model adaptation for multi-genre broadcast speech recognition","author":"xie","year":"2015","journal-title":"Proceedings of Interspeech"},{"key":"ref3","first-page":"194","article-title":"LSTM neural networks for language modeling","author":"sundermeyer","year":"2012","journal-title":"INTER-SPEECH"},{"key":"ref6","article-title":"Semi-supervised adaptation of rnnlms by fine-tuning with domain-specific auxiliary features","author":"salil","year":"2017","journal-title":"Proceedings of the Interspeech"},{"journal-title":"Contextual lstm (clstm) models for large scale nlp tasks","year":"2016","author":"ghosh","key":"ref5"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"504","DOI":"10.1126\/science.1127647","article-title":"Reducing the dimensionality of data with neural networks","volume":"313","author":"e hinton","year":"2006","journal-title":"Science"},{"key":"ref7","article-title":"Effectively building tera scale maxent language models incorporating non-linguistic signals","author":"biadsy","year":"2017","journal-title":"Proc In-terspeech"},{"key":"ref2","first-page":"20","article-title":"Deep neural network language models","author":"ebru","year":"2012","journal-title":"Proceedings of the NAACL-HLT 2012 Workshop Will We Ever Really Replace the N-gram Model? On the Future of Language Modeling for HLT Association for Computational Linguistics"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2012.6424228"},{"key":"ref9","article-title":"Improved neural network based language modelling and adaptation","author":"junho","year":"2010","journal-title":"Eleventh Annual Conference of the International Speech Communication Association"},{"key":"ref20","doi-asserted-by":"crossref","DOI":"10.1109\/ASRU.2017.8268931","article-title":"Lat-tice rescoring strategies for long short-term memory language models in speech recognition","author":"kumar","year":"2017","journal-title":"Automatic Speech Recognition and Understanding (ASRU) 2017 IEEE Workshop on"},{"journal-title":"Using the output embedding to improve language models","year":"2016","author":"press","key":"ref21"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2018,4,15]]},"location":"Calgary, AB","end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08461979.pdf?arnumber=8461979","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T05:57:38Z","timestamp":1598248658000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8461979\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8461979","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}