{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T06:12:46Z","timestamp":1775283166551,"version":"3.50.1"},"reference-count":106,"publisher":"Elsevier BV","issue":"3","license":[{"start":{"date-parts":[[1996,5,1]],"date-time":"1996-05-01T00:00:00Z","timestamp":830908800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Speech Communication"],"published-print":{"date-parts":[[1996,5]]},"DOI":"10.1016\/0167-6393(96)00003-9","type":"journal-article","created":{"date-parts":[[2002,7,26]],"date-time":"2002-07-26T01:59:02Z","timestamp":1027648742000},"page":"205-231","source":"Crossref","is-referenced-by-count":73,"title":["Towards increasing speech recognition error rates"],"prefix":"10.1016","volume":"18","author":[{"given":"Herv\u00e9","family":"Bourlard","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hynek","family":"Hermansky","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nelson","family":"Morgan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB1","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech","first-page":"684","article-title":"Rapid speaker adaptation using model prediction","author":"Ahadi","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB2","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1152\/jn.1966.29.1.109","article-title":"Click-evoked response patterns of single units in the medial geniculate body of the cat","volume":"Vol. 29","author":"Aitkin","year":"1966","journal-title":"J. Neurophysiology"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB3","series-title":"Proc: IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"II.668, II.671","article-title":"A dynamic cepstrum incorporating time-frequency masking and its application to continuous speech recognition","author":"Aikawa","year":"1993"},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB4","doi-asserted-by":"crossref","first-page":"567","DOI":"10.1109\/89.326615","article-title":"How do humans process and recognize speech?","volume":"Vol. 2","author":"Allen","year":"1994","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB5","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"I.433, I.437","article-title":"Adaptation to new microphones using tied-mixture normalization","author":"Anastasakos","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB6","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"985","article-title":"Regression features for recognition of speech in quiet and in noise","author":"Applebaum","year":"1991"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB7","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"125","article-title":"Automatic detection of new words in a large vocabulary continuous speech recognition system","author":"Asadi","year":"1990"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB8","series-title":"Proc. DARPA Speech and Natural Language Workshop","first-page":"180","article-title":"Improving state-of-the-art continuous speech recognition systems using the N-best paradigm with neural networks","author":"Austin","year":"1992"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB9","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"493","article-title":"A new algorithm for the estimation of hidden Markov models","author":"Bahl","year":"1988"},{"issue":"No. 1","key":"10.1016\/0167-6393(96)00003-9_NEWBIB10","doi-asserted-by":"crossref","first-page":"24","DOI":"10.1109\/TASSP.1975.1162650","article-title":"The Dragon system \u2014 An overview","volume":"Vol. ASSP-23","author":"Baker","year":"1975","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB11","doi-asserted-by":"crossref","first-page":"252","DOI":"10.1109\/72.125866","article-title":"Global optimization of a neural-hidden Markov model hybrid","volume":"Vol. 3","author":"Bengio","year":"1992","journal-title":"IEEE Trans. Neural Networks"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB12","article-title":"An input output HMM architecture","volume":"Vol. 7","author":"Bengio","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB13","unstructured":"A. Bounds (1995), Personal communication."},{"issue":"No. 12","key":"10.1016\/0167-6393(96)00003-9_NEWBIB14","doi-asserted-by":"crossref","first-page":"1167","DOI":"10.1109\/34.62605","article-title":"Links between Markov models and multilayer perceptrons","volume":"Vol. 12","author":"Bourlard","year":"1990","journal-title":"IEEE Trans. Pattern Anal. Machine Intell."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB15","author":"Bourlard","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB16","article-title":"REMAP: Recursive estimation and maximization of a posteriori probabilities \u2014 Application to transition-based connectionist speech recognition","author":"Bourlard","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB17","series-title":"Proc. Eurospeech '95","article-title":"REMAP: recursive estimation and maximization of a posteriori probabilities in connectionist speech recognition","author":"Bourlard","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB18","article-title":"An experimental automatic word recognition system","author":"Bridle","year":"1974"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB19","unstructured":"J.S. Bridle, (1995), Personal communication."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB20","unstructured":"P. Brown, The acoustic-modelling problem in automatic speech recognition, PhD Thesis, Computer Science Department, Carnegie Mellon University."},{"issue":"No. 6","key":"10.1016\/0167-6393(96)00003-9_NEWBIB21","doi-asserted-by":"crossref","first-page":"2623","DOI":"10.1121\/1.397756","article-title":"Application of an auditory model to speech recognition","volume":"Vol. 85","author":"Cohen","year":"1989","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB22","unstructured":"J.R. Cohen (1995), Informal communication."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB23","series-title":"Proc. Internat. Conf. Speech Language Processing","first-page":"915","article-title":"Hybrid neural network\/hidden Markov model continuous speech recognition","author":"Cohen","year":"1992"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB24","doi-asserted-by":"crossref","first-page":"789","DOI":"10.1121\/1.392049","article-title":"Central auditory processing of peripheral vowel spectra","volume":"Vol. 77","author":"Chistovich","year":"1985","journal-title":"J. Acoust. Soc. Amer."},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB25","doi-asserted-by":"crossref","first-page":"357","DOI":"10.1109\/TASSP.1980.1163420","article-title":"Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences","volume":"Vol. 28","author":"Davis","year":"1980","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB26","article-title":"Incorporating the time correlation between successive observations in an acoustic-phonetic hidden Markov model for continuous speech recognition","author":"de La Noue","year":"1989","journal-title":"AT&T Technical Memorandum No. 11226"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB27","series-title":"Proc. DARPA Speech and Natural Language Workshop","first-page":"103","article-title":"Adaptive language modelling using minimum discriminant estimation","author":"Della Pietra","year":"1992"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB28","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","article-title":"Maximum likelihood from incomplete data via the EM algorithm","volume":"Vol. 39","author":"Dempster","year":"1977","journal-title":"J. Roy. Statist. Soc."},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB29","doi-asserted-by":"crossref","first-page":"507","DOI":"10.1109\/89.326610","article-title":"Speech recognition using hidden Markov models with polynomial regression functions as nonstationary states","volume":"Vol. 2","author":"Deng","year":"1994","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB30","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"556","article-title":"Phonetically sensitive discriminants for improved speech recognition","author":"Doddington","year":"1989"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB31","article-title":"A new structure for automatic speech recognition","author":"Duchnowski","year":"1993"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB32","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"535","article-title":"Effects of emphasizing transitional or stationary parts of the speech signal in a discrete utterance recognition system","author":"Elenius","year":"1982"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB33","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"I.549, I.552","article-title":"City name recognition over the telephone","author":"Fanty","year":"1993"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB34","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"425","article-title":"Connectionist Viterbi training: A new hybrid method for continuous speech recognition","author":"Franzini","year":"1990"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB35","author":"Fletcher","year":"1953"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB36","doi-asserted-by":"crossref","first-page":"254","DOI":"10.1109\/TASSP.1981.1163530","article-title":"Cepstral analysis technique for automatic speaker verification","volume":"Vol. 29","author":"Furui","year":"1981","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"No. 1","key":"10.1016\/0167-6393(96)00003-9_NEWBIB37","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1109\/TASSP.1986.1164788","article-title":"Speaker independent isolated word recognizer using dynamic features of speech spectrum","volume":"Vol. 34","author":"Furui","year":"1986","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB38","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1006\/csla.1993.1005","article-title":"Hidden Markov models with templates as non-stationary states: An application to speech recognition","volume":"Vol. 2","author":"Ghitza","year":"1993","journal-title":"Computer Speech and Language"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB39","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"1361","article-title":"A probabilistic approach to the understanding and training of neural network classifiers","author":"Gish","year":"1990"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB40","doi-asserted-by":"crossref","first-page":"911","DOI":"10.1214\/aoms\/1177704014","article-title":"Maximum entropy for hypothesis formulation, especially for multidimensional contingency tables","volume":"Vol. 34","author":"Good","year":"1963","journal-title":"Ann. Math. Statist."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB41","article-title":"Temporal aspects of audition","author":"Green","year":"1976","journal-title":"PhD Thesis"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB42","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/S0095-4470(19)30460-7","article-title":"The representation of speech in the auditory periphery","volume":"Vol. 16","author":"Greenberg","year":"1988","journal-title":"J. Phonetics"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB43","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"20","article-title":"Decoder selection based on cross-entropies","author":"Gopalakrishnan","year":"1988"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB44","doi-asserted-by":"crossref","DOI":"10.21437\/ICSLP.1994-470","article-title":"Statistical trajectory models for phonetic recognition","author":"Goldenthal","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB45","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"II.239, II.242","article-title":"Improvements in connected digit recognition using linear discriminant analysis and mixture densities","author":"Haeb-Umbach","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB46","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"425","article-title":"Methods for improved speech recognition over telephone line","author":"Hauenstein","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB47","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"18.A.5.1, 18.A.5.4","article-title":"The harmonic magnitude suppression (HMS) technique for intelligibility enhancement in the presence in interfering speech","author":"Hanson","year":"1984"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB48","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"1159","article-title":"An efficient speaker-independent automatic speech recognition by simulation of some properties of human auditory perception","author":"Hermansky","year":"1987"},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB49","doi-asserted-by":"crossref","first-page":"1738","DOI":"10.1121\/1.399423","article-title":"Perceptual linear predictive (PLP) analysis of speech","volume":"Vol. 87","author":"Hermansky","year":"1990","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB50","first-page":"61","article-title":"Exploring temporal domain for robustness in speech recognition","volume":"Vol. II","author":"Hermansky","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB51","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"777","article-title":"Analysis and synthesis of speech based on spectral transform linear predictive method","author":"Hermansky","year":"1983"},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB52","doi-asserted-by":"crossref","first-page":"578","DOI":"10.1109\/89.326616","article-title":"RASTA processing of speech","volume":"Vol. 2","author":"Hermansky","year":"1994","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB53","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"405","article-title":"Speech enhancement based on temporal processing","author":"Hermansky","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB54","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"69","article-title":"Recent improvements to the ABBOT large vocabulary CSR system","author":"Hochberg","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB55","series-title":"Internat. Conf. Acoust. Speech Signal Process.","first-page":"262","article-title":"A comparison of several acoustic representations for speech recognition with degraded and undegraded speech","author":"Hunt","year":"1989"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB56","series-title":"Internat. Conf. Acoust. Speech Signal Process.","first-page":"310","article-title":"Automatic formant extraction utilizing mel scale and equal loudness contour","author":"Itahashi","year":"1976"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB57","series-title":"Proc. Internat. Joint Conf. on Neural Networks","first-page":"II.801, II.808","article-title":"Speaker independent phonetic classification in continuous English letters","author":"Janseen","year":"1991"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB58","doi-asserted-by":"crossref","first-page":"250","DOI":"10.1109\/TIT.1975.1055384","article-title":"Design of a linguistic statistical decoder for the recognition of continuous speech","volume":"Vol. IT-21","author":"Jelinek","year":"1975","journal-title":"IEEE Trans. Information Theory"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB59","first-page":"532","article-title":"Continuous speech recognition by statistical methods","volume":"Vol. 64","author":"Jelinek","year":"1976"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB60","series-title":"Proc. DARPA Speech and Nautral Language Workshop","first-page":"293","article-title":"A dynamic language model for speech recognition","author":"Jelinek","year":"1991"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB61","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1162\/neco.1994.6.2.181","article-title":"Hierarchical mixtures of experts and the EM algorithm","volume":"Vol. 6","author":"Jordan","year":"1994","journal-title":"Neural Computation"},{"issue":"No. 6","key":"10.1016\/0167-6393(96)00003-9_NEWBIB62","doi-asserted-by":"crossref","first-page":"1404","DOI":"10.1109\/TASSP.1985.1164727","article-title":"Mixture autoregressive hidden Markov models for speech signals","volume":"Vol. 33","author":"Juang","year":"1985","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB63","series-title":"Proc. 15th Annual Speech Research Symposium","first-page":"175","article-title":"Vocal tract normalization in speech recognition: Compensation for systematic speaker variability","author":"Kamm","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB64","series-title":"Proc. IEEE Workshop on Neural Networks for Signal Process.","first-page":"299","article-title":"New discriminative training algorithms based on the generalized probabilistic descent method","author":"Katagiri","year":"1991"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB65","series-title":"The Representation of Speech in the Peripheral Auditory System","first-page":"181","article-title":"Speech processing strategies based on auditory models","author":"Klatt","year":"1982"},{"issue":"No. 4","key":"10.1016\/0167-6393(96)00003-9_NEWBIB66","doi-asserted-by":"crossref","first-page":"806","DOI":"10.1109\/78.80902","article-title":"A study on speaker adaptation of the parameters of continuous density hidden Markov models","volume":"Vol. 39","author":"Lee","year":"1991","journal-title":"IEEE Trans. Signal Process."},{"issue":"No. 1","key":"10.1016\/0167-6393(96)00003-9_NEWBIB67","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1109\/72.182700","article-title":"Hidden control neural architecture modeling of nonlinear time varying systems and its applications","volume":"Vol. 4","author":"Levin","year":"1993","journal-title":"IEEE Trans. Neural Networks"},{"issue":"No. 3","key":"10.1016\/0167-6393(96)00003-9_NEWBIB68","doi-asserted-by":"crossref","first-page":"223","DOI":"10.1109\/TASSP.1979.1163234","article-title":"Spectral root homomorphic deconvolution system","volume":"Vol. 27","author":"Lim","year":"1979","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"No. 5","key":"10.1016\/0167-6393(96)00003-9_NEWBIB69","doi-asserted-by":"crossref","first-page":"729","DOI":"10.1109\/TIT.1982.1056544","article-title":"Maximum likelihood estimation for multivariate observations of Markov sources","volume":"Vol. IT-28","author":"Liporace","year":"1982","journal-title":"IEEE Trans. Information Theory"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB70","series-title":"Proc. Internat. Conf. on Spoken Language Processing","article-title":"Connected digit recognition using connectionist probability estimators and mixture-Gaussian densities","author":"Lubensky","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB71","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"738","article-title":"Recognition of consonant based on the Perceptron model","author":"Makino","year":"1983"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB72","series-title":"Pattern Recognition and Artificial Intelligence","first-page":"374","article-title":"Distance measures for speech recognition, psychological and instrumental","author":"Mermelstein","year":"1976"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB73","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"413","article-title":"Continuous speech recognition using multilayer perceptrons with hidden Markov models","author":"Morgan","year":"1990"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB74","first-page":"741","article-title":"Neural networks for statistical recognition of continuous speech","volume":"Vol. 83","author":"Morgan","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB75","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"397","article-title":"Stochastic perceptual models of speech","author":"Morgan","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB76","series-title":"Proc. Eurospeech'95","first-page":"771","article-title":"Digit recognition with stochastic perceptual models","author":"Morgan","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB77","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"I.417, I.420","article-title":"Probabilistic optimum filtering for robust speech recognition","author":"Neumayer","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB78","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"389","article-title":"Context modeling with the stochastic segment model","author":"Ostendorf","year":"1992"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB79","series-title":"IEEE Proc. Internat. Conf. Acoust. Speech Signal Process.","first-page":"569","article-title":"On the interaction between true source, training, and testing language models","author":"Paul","year":"1991"},{"issue":"No. 5","key":"10.1016\/0167-6393(96)00003-9_NEWBIB80","doi-asserted-by":"crossref","first-page":"2876","DOI":"10.1121\/1.409409","article-title":"Temporal masking in automatic speech recognition","volume":"Vol. 95","author":"Pavel","year":"1994","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB81","doi-asserted-by":"crossref","first-page":"458","DOI":"10.1121\/1.1911711","article-title":"Perceptual and physical space of vowel sounds","volume":"Vol. 46","author":"Pols","year":"1969","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB82","doi-asserted-by":"crossref","first-page":"972","DOI":"10.1109\/T-C.1971.223391","article-title":"Real-time recognition of spoken words","volume":"Vol. 20(C)","author":"Pols","year":"1971","journal-title":"IEEE Trans. Computers"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB83","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"1291","article-title":"Linear predictive hidden Markov models and the speech signal","author":"Poritz","year":"1982"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB84","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"705","article-title":"On hidden Markov models in isolated word recognition","author":"Poritz","year":"1986"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB85","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"18.A.2.1., 18.A.2.4","article-title":"Optimal estimators for spectral restoration of noisy speech","author":"Porter","year":"1984"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB86","first-page":"257","article-title":"A tutorial on hidden Markov models and selected applications in speech recognition","volume":"Vol. 77","author":"Rabiner","year":"1989"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB87","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"596","article-title":"Efficient search using posterior phone probability estimates","author":"Renals","year":"1995"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB88","doi-asserted-by":"crossref","first-page":"461","DOI":"10.1162\/neco.1991.3.4.461","article-title":"Neural network classifiers estimate Bayesian a posteriori probabilities","volume":"Vol. 3","author":"Richard","year":"1991","journal-title":"Neural Computation"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB89","series-title":"Proc. Eurospeech'93","first-page":"1941","article-title":"A neural network based, speaker independent, large vocabulary, continuous speech recognition system: the Wernicke project","author":"Robinson","year":"1993"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB90","doi-asserted-by":"crossref","first-page":"259","DOI":"10.1016\/0885-2308(91)90010-N","article-title":"A recurrent error propagation network speech recognition system","volume":"Vol. 5","author":"Robinson","year":"1991","journal-title":"Computer Speech and Language"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB91","series-title":"Proc. Internat. Conf. on Spoken Language Processing","first-page":"1835","article-title":"Cepstral channel normalization techniques for HMM-based speaker verification","author":"Rosenberg","year":"1994"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB92","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"69","article-title":"The ARM continuous speech recognition system","author":"Russell","year":"1990"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB93","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"I.1.4, I.1.7","article-title":"New uses of the N-best sentence hypotheses within the BYBLOS speech recognition system","author":"Schwartz","year":"1992"},{"issue":"No. 1","key":"10.1016\/0167-6393(96)00003-9_NEWBIB94","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1016\/S0095-4470(19)30466-8","article-title":"A joint synchrony\/mean-rate model of auditory speech processing","volume":"Vol. 16","author":"Seneff","year":"1985","journal-title":"J. Phonetics"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB95","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"629","article-title":"A speech recognizer using radial basis function neural networks in an HMM framework","author":"Singer","year":"1992"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB96","series-title":"Proc. Eurospeech'95","first-page":"1271","article-title":"Multilingual assessment of speaker independent large vocabulary speech-recognition systems: The SQALE project (speech recognition quality assessment for language engineering)","author":"Steeneken","year":"1995"},{"issue":"No. 1","key":"10.1016\/0167-6393(96)00003-9_NEWBIB97","doi-asserted-by":"crossref","first-page":"153","DOI":"10.1037\/h0046162","article-title":"On the psychophysical law","volume":"Vol. 64","author":"Stevens","year":"1957","journal-title":"Psychol. Rev."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB98","doi-asserted-by":"crossref","first-page":"319","DOI":"10.3758\/BF03215796","article-title":"Brightness and loudness as functions of stimulus duration","author":"Stevens","year":"1966","journal-title":"Perception and Psychophysics"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB99","first-page":"678","article-title":"Blind deconvolution through digital signal processing","volume":"Vol. 63","author":"Stockham","year":"1975"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB100","doi-asserted-by":"crossref","first-page":"583","DOI":"10.1109\/TASSP.1978.1163149","article-title":"Memory and time improvements in a dynamic programming algorithm for matching speech patterns","volume":"Vol. 26","author":"Tappert","year":"1978","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB101","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"61","article-title":"Continuous speech recognition using linked predictive neural networks","author":"Tebelskis","year":"1991"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB102","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"107","article-title":"Phoneme recognition using time-delay neural networks","author":"Waibel","year":"1988"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB103","series-title":"Proc. IEEE Internat. Conf. Acoust. Speech Signal Process.","first-page":"384","article-title":"Explicit time correlation in hidden Markov models for speech recognition","author":"Wellekens","year":"1987"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB104","first-page":"401","article-title":"Scaling","volume":"Vol. 3","author":"Zwicker","year":"1975"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB105","first-page":"1602","article-title":"The use of speech knowledge in automatic speech recognition","volume":"Vol. 73","author":"Zue","year":"1985"},{"key":"10.1016\/0167-6393(96)00003-9_NEWBIB106","series-title":"Proc. ARPA Speech Recognition Workshop","article-title":"Copernicus and the ASR challenge \u2014 Waiting for Kepler","author":"Bourlard","year":"1996"}],"container-title":["Speech Communication"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:0167639396000039?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:0167639396000039?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,12,6]],"date-time":"2024-12-06T12:20:35Z","timestamp":1733487635000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/0167639396000039"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1996,5]]},"references-count":106,"journal-issue":{"issue":"3","published-print":{"date-parts":[[1996,5]]}},"alternative-id":["0167639396000039"],"URL":"https:\/\/doi.org\/10.1016\/0167-6393(96)00003-9","relation":{},"ISSN":["0167-6393"],"issn-type":[{"value":"0167-6393","type":"print"}],"subject":[],"published":{"date-parts":[[1996,5]]}}}