{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T05:36:40Z","timestamp":1775281000103,"version":"3.50.1"},"reference-count":43,"publisher":"Elsevier BV","issue":"4","license":[{"start":{"date-parts":[[1998,12,1]],"date-time":"1998-12-01T00:00:00Z","timestamp":912470400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[1998,12,1]],"date-time":"1998-12-01T00:00:00Z","timestamp":912470400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[1999,3,25]],"date-time":"1999-03-25T00:00:00Z","timestamp":922320000000},"content-version":"vor","delay-in-days":114,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Speech Communication"],"published-print":{"date-parts":[[1998,12]]},"DOI":"10.1016\/s0167-6393(98)00061-2","type":"journal-article","created":{"date-parts":[[2003,4,4]],"date-time":"2003-04-04T22:57:58Z","timestamp":1049497078000},"page":"283-297","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":212,"title":["Heteroscedastic discriminant analysis and reduced rank HMMs for improved speech recognition"],"prefix":"10.1016","volume":"26","author":[{"given":"Nagendra","family":"Kumar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andreas G.","family":"Andreou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/S0167-6393(98)00061-2_BIB1","doi-asserted-by":"crossref","first-page":"716","DOI":"10.1109\/TAC.1974.1100705","article-title":"A new look at the statistical identification model","volume":"19","author":"Akaike","year":"1974","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB2","doi-asserted-by":"crossref","unstructured":"Aubert, X., Haeb-Umbach, R., Ney, H., 1993. Continuous mixture densities and linear discriminant analysis for improved context-dependent acoustic models. In: Proc. of ICASSP, Vol. 2, pp. 648\u2013651","DOI":"10.1109\/ICASSP.1993.319393"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB3","unstructured":"Ayer, C.M., 1992. A discriminatively derived transform capable for improved speech recognition accuracy. Ph.D. Thesis, University of London"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB4","doi-asserted-by":"crossref","unstructured":"Ayer, C.M., Hunt, M.J., Brookes, D.M., 1993. A discriminately derived linear transform for improved speech recognition. In: Proc. Eurospeech 93, Vol. 1, pp. 583\u2013586","DOI":"10.21437\/Eurospeech.1993-137"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB5","doi-asserted-by":"crossref","first-page":"176","DOI":"10.2307\/2984113","article-title":"Multivariate analysis","volume":"9","author":"Bartlett","year":"1947","journal-title":"J. Roy. Statist. Soc. B"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB6","doi-asserted-by":"crossref","first-page":"164","DOI":"10.1214\/aoms\/1177697196","article-title":"A maximization technique occuring in the statistical analysis of probabilistic functions of Markov chains","volume":"41","author":"Baum","year":"1970","journal-title":"Ann. Math. Stat."},{"key":"10.1016\/S0167-6393(98)00061-2_BIB7","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1006\/csla.1993.1012","article-title":"Discriminative feature selection for speech recognition","volume":"7","author":"Bocchieri","year":"1993","journal-title":"Computer Speech and Language"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB8","doi-asserted-by":"crossref","unstructured":"Brown, P.F., 1987. The acoustic-modelling problem in automatic speech recognition. Ph.D. Thesis, Carnegie Mellon University","DOI":"10.21236\/ADA188529"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB9","doi-asserted-by":"crossref","first-page":"86","DOI":"10.1111\/j.1467-842X.1984.tb01271.x","article-title":"Canonical variate analysis \u2013 a general formulation","volume":"26","author":"Campbell","year":"1984","journal-title":"Australian Journal of Statistics"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB10","doi-asserted-by":"crossref","first-page":"2623","DOI":"10.1121\/1.397756","article-title":"Application of an auditory model to speech recognition","volume":"85","author":"Cohen","year":"1989","journal-title":"J. Acoust. Soc. Amer."},{"issue":"4","key":"10.1016\/S0167-6393(98)00061-2_BIB11","doi-asserted-by":"crossref","first-page":"357","DOI":"10.1109\/TASSP.1980.1163420","article-title":"Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentances","volume":"28","author":"Davis","year":"1980","journal-title":"IEEE Transactions on Acoustics, Speech, and Signal Processing"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB12","doi-asserted-by":"crossref","unstructured":"Dempster, A.P., Laird, N.M., Rubin, D.B., 1977. Maximum likelihood from incomplete data via EM algorithm. J. Roy. Statist. Soc. 1\u201338","DOI":"10.1111\/j.2517-6161.1977.tb01600.x"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB13","unstructured":"Dillon, W.R., Goldstein, M., 1984. Multivariate Analysis. Wiley, New York"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB14","doi-asserted-by":"crossref","unstructured":"Doddington, G., 1989. Phonetically sensitive discriminants for improved speech recognition. In: Proceedings 1989 ICASSP, no. S10 b.11, pp. 556\u2013559","DOI":"10.1109\/ICASSP.1989.266487"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB15","unstructured":"Duda, R.O., Hart, P.B., 1973. Pattern Classification and Scene Analysis. Wiley, New York"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB16","doi-asserted-by":"crossref","unstructured":"Engle, R.F., 1995. ARCH: Selected Readings. Oxford Univ. Press, Oxford","DOI":"10.1093\/oso\/9780198774310.001.0001"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB17","doi-asserted-by":"crossref","first-page":"179","DOI":"10.1111\/j.1469-1809.1936.tb02137.x","article-title":"The use of multiple measurements in taxonomic problems","volume":"7","author":"Fisher","year":"1936","journal-title":"Ann. Eugen."},{"key":"10.1016\/S0167-6393(98)00061-2_BIB18","doi-asserted-by":"crossref","first-page":"376","DOI":"10.1111\/j.1469-1809.1938.tb02189.x","article-title":"The statistical utilization of multiple measurements","volume":"8","author":"Fisher","year":"1938","journal-title":"Ann. Eugen."},{"key":"10.1016\/S0167-6393(98)00061-2_BIB19","doi-asserted-by":"crossref","unstructured":"Fukunaga, K., 1990. Introduction to Statistical Pattern Recognition. Academic Press, New York","DOI":"10.1016\/B978-0-08-047865-4.50007-7"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB20","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1109\/TASSP.1986.1164788","article-title":"Speaker-independent isolated word recognition using dynamic features of speech spectrum","volume":"34","author":"Furui","year":"1986","journal-title":"IEEE Transactions on Acoustics, Speech, and Signal Processing"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB21","doi-asserted-by":"crossref","unstructured":"Haeb-Umbach R., Ney H., 1992. Linear discriminant analysis for improved large vocabulary continuous speech recognition. In: Proc. ICASSP, Vol. 1, pp. 13-16","DOI":"10.1109\/ICASSP.1992.225984"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB22","doi-asserted-by":"crossref","unstructured":"Haeb-Umbach, R., Geller, D., Ney, H., 1993. Improvement in connected digit recognition using linear discriminant analysis and mixture densities. In: Proceedings of ICASSP, pp. 239\u2013242","DOI":"10.1109\/ICASSP.1993.319279"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB23","unstructured":"Hastie, T., Tibshirani, R., 1994. Discriminant analysis by gaussian mixtures. Tech. Rep., AT&T Bell Laboratories"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB24","doi-asserted-by":"crossref","first-page":"1738","DOI":"10.1121\/1.399423","article-title":"Perceptual linear predictive (plp) analysis of speech","volume":"87","author":"Hermansky","year":"1990","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/S0167-6393(98)00061-2_BIB25","doi-asserted-by":"crossref","unstructured":"Hunt, M., 1979. A statistical approach to metrics for word and syllable recognition. In: 98th Meeting of the Acoustical Society of America, November","DOI":"10.1121\/1.2017735"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB26","doi-asserted-by":"crossref","unstructured":"Hunt M.J., Lefebvre C., 1989. A comparison of several acoustic representations for speech recognition with degraded and undegraded speech. In: Proc. ICASSP, Vol. 1, pp. 262-265","DOI":"10.1109\/ICASSP.1989.266415"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB27","doi-asserted-by":"crossref","unstructured":"Jankowski Jr., C.R., 1992. A comparison of auditory models for automatic speech recognition. Master's Thesis, MIT","DOI":"10.3115\/1075527.1075637"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB28","unstructured":"Kumar, N., 1997. Investigation of silicon auditory models and generalization of linear discriminant analysis for improved speech recognition. Ph.D. Thesis, Johns Hopkins University, http:\/\/olympus.ece.jhu.edu\/archives\/phd\/nkumar97\/index.html"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB29","unstructured":"Kumar, N., Andreou, A., 1996a. On generalizations of linear discriminant analysis. Tech. Rep., Electrical and Computer Engineering Technical Report-96-07, April"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB30","unstructured":"Kumar, N., Andreou, A., 1996b. Generalization of linear discriminant analysis in maximum likelihood framework. In: Proceedings of Joint Meeting of American Statistical Association, Chicago, IL, August"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB31","unstructured":"Kumar, N., Andreou, A., submitted. Heteroscedastic discriminant analysis: maximum likelihood feature extraction for heteroscedastic models. IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB32","unstructured":"Kumar, N., Neti, C., Andreou, A., 1995. Application of discriminant analysis to speech recognition with auditory features. In: Proceedings of the 15th Annual Speech Research Symposium, Johns Hopkins University, Baltimore, MD, pp. 153\u2013160, June"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB33","doi-asserted-by":"crossref","first-page":"297","DOI":"10.1002\/j.1538-7305.1975.tb02840.x","article-title":"An algorithm for determining the endpoints of isolated utterances","volume":"54","author":"Rabiner","year":"1975","journal-title":"Bell Syst. Tech. J."},{"key":"10.1016\/S0167-6393(98)00061-2_BIB34","unstructured":"Rao, C.R., 1965. Linear Statistical Inference and its Applications. Wiley, New York"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB35","unstructured":"Rissanen, J., 1989. Stochastic Complexity in Statistical Inquiry. Series in Computer Science, Vol. 15. World Scientific, Singapore"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB36","doi-asserted-by":"crossref","unstructured":"Roth R., Baker J.K., Baker J.M., Gillick L., Hunt M.J., Ito Y., Loewe S., Orloff J., Peskin B., Scattone F., 1993. Large vocabulary continuous speech recognition of wall street journal data. In: Proc. ICASSP, Vol. 2, pp. 640\u2013643","DOI":"10.1109\/ICASSP.1993.319391"},{"issue":"2","key":"10.1016\/S0167-6393(98)00061-2_BIB37","doi-asserted-by":"crossref","first-page":"461","DOI":"10.1214\/aos\/1176344136","article-title":"Estimating the dimension of a model","volume":"6","author":"Schwarz","year":"1978","journal-title":"Annals of Statistics"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB38","doi-asserted-by":"crossref","unstructured":"Siohan O., 1995. On the robustness of linear discriminant analysis as a preprocessing step for noisy speech recognition. In: Proc. ICASSP, Vol. 1, pp. 125\u2013128","DOI":"10.1109\/ICASSP.1995.479289"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB39","doi-asserted-by":"crossref","unstructured":"Sun, D., 1997. \u201cFeature dimensionality reduction using reduced-rank maximum likelihood estimation for hidden Markov models.\u201d In: International Conference on Language and Speech, pp. 244\u2013247","DOI":"10.21437\/ICSLP.1996-80"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB40","doi-asserted-by":"crossref","unstructured":"Wood L., Pearce D., Novello F., 1991. Improved vocabulary-independent sub-word HMM modelling. In: Proc. ICASSP, Vol. 1, pp. 181\u2013184","DOI":"10.1109\/ICASSP.1991.150307"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB41","doi-asserted-by":"crossref","unstructured":"Woodland P.C., Cole D.R., 1991. Optimising hidden markov models using discriminative output distribution. In: Proc. ICASSP, Vol. 1, pp. 545\u2013548","DOI":"10.1109\/ICASSP.1991.150397"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB42","doi-asserted-by":"crossref","unstructured":"Yu, G., Russell, W., Schwartz, R., Makhoul, J., 1990. Discriminant analysis and supervised vector quantization for continuous speech recognition. In: Proceedings of ICASSP, pp. 685\u2013688, April","DOI":"10.1109\/ICASSP.1990.115850"},{"key":"10.1016\/S0167-6393(98)00061-2_BIB43","doi-asserted-by":"crossref","unstructured":"Zahorian S.A., Qian D., Jagharghi A.J., 1991. Acoustic-phonetic transformations for improved speaker-independent isolated word recognition. In: Proc. ICASSP, Vol. 1, pp. 561\u2013564","DOI":"10.1109\/ICASSP.1991.150401"}],"container-title":["Speech Communication"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639398000612?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639398000612?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,9,28]],"date-time":"2025-09-28T22:37:57Z","timestamp":1759099077000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167639398000612"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998,12]]},"references-count":43,"journal-issue":{"issue":"4","published-print":{"date-parts":[[1998,12]]}},"alternative-id":["S0167639398000612"],"URL":"https:\/\/doi.org\/10.1016\/s0167-6393(98)00061-2","relation":{},"ISSN":["0167-6393"],"issn-type":[{"value":"0167-6393","type":"print"}],"subject":[],"published":{"date-parts":[[1998,12]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Heteroscedastic discriminant analysis and reduced rank HMMs for improved speech recognition","name":"articletitle","label":"Article Title"},{"value":"Speech Communication","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/S0167-6393(98)00061-2","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"converted-article","name":"content_type","label":"Content Type"},{"value":"Copyright \u00a9 1998 Elsevier Science B.V. All rights reserved.","name":"copyright","label":"Copyright"}]}}