{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T18:19:50Z","timestamp":1770747590170,"version":"3.49.0"},"reference-count":41,"publisher":"Elsevier BV","issue":"9","license":[{"start":{"date-parts":[[1999,11,1]],"date-time":"1999-11-01T00:00:00Z","timestamp":941414400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Neural Networks"],"published-print":{"date-parts":[[1999,11]]},"DOI":"10.1016\/s0893-6080(99)00043-x","type":"journal-article","created":{"date-parts":[[2002,7,25]],"date-time":"2002-07-25T22:54:47Z","timestamp":1027637687000},"page":"1229-1252","source":"Crossref","is-referenced-by-count":95,"title":["Improved learning algorithms for mixture of experts in multiclass classification"],"prefix":"10.1016","volume":"12","author":[{"given":"K.","family":"Chen","sequence":"first","affiliation":[]},{"given":"L.","family":"Xu","sequence":"additional","affiliation":[]},{"given":"H.","family":"Chi","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S0893-6080(99)00043-X_BIB2","unstructured":"Bennani, Y., & Gallinari, P. (1994). Connectionist approaches for automatic speaker recognition. Proceeding of ESCA Workshop on Automatic Speaker Recognition, Identification and Verification, Martigny, Switzerland, pp. 95-102."},{"issue":"3","key":"10.1016\/S0893-6080(99)00043-X_BIB3","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1142\/S0129065791000212","article-title":"A fast procedure for re-training the multilayer perception","volume":"2","author":"Bishop","year":"1991","journal-title":"International Journal of Neural Systems"},{"issue":"4","key":"10.1016\/S0893-6080(99)00043-X_BIB4","doi-asserted-by":"crossref","first-page":"494","DOI":"10.1162\/neco.1992.4.4.494","article-title":"Exact calculation of the Hessian matrix for the multilayer perceptron","volume":"4","author":"Bishop","year":"1992","journal-title":"Neural Computation"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB5","series-title":"Computational statistics","first-page":"409","article-title":"Construction of reliable maximum likelihood algorithms with applications to logistic and Cox regression","author":"B\u00f6ning","year":"1993"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB6","series-title":"Classification and regression trees","author":"Breiman","year":"1984"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB7","series-title":"Neurocomputing: algorithm, architectures, and applications","first-page":"227","article-title":"Probabilistic interpretation of feedforward classification network outputs, with relationships to statistical pattern recognition","author":"Bridle","year":"1989"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB8","doi-asserted-by":"crossref","first-page":"76","DOI":"10.1093\/imamat\/6.1.76","article-title":"The convergence of a class of double rank minimization algorithms","volume":"6","author":"Broyden","year":"1970","journal-title":"Journal of the Institute of Mathematics and Its Applications"},{"issue":"9","key":"10.1016\/S0893-6080(99)00043-X_BIB9","doi-asserted-by":"crossref","first-page":"1437","DOI":"10.1109\/5.628714","article-title":"Speaker recognition: a tutorial","volume":"85","author":"Campbell","year":"1997","journal-title":"Proceedings of the IEEE"},{"issue":"7","key":"10.1016\/S0893-6080(99)00043-X_BIB15","doi-asserted-by":"crossref","first-page":"545","DOI":"10.1016\/S0167-8655(98)00055-5","article-title":"A connectionist method for pattern classification with diverse features","volume":"19","author":"Chen","year":"1998","journal-title":"Pattern Recognition Letters"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB11","first-page":"1493","article-title":"Speaker identification based on hierarchical mixture of experts","author":"Chen","year":"1995","journal-title":"Proceedings of World Congress on Neural Networks, Washington, DC"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB12","unstructured":"Chen, K., Xie, D., & Chi, H. (1996). A modified HME architecture for text-dependent speaker identification. IEEE Transactions on Neural Networks, 7(5): 1309\u20131313 (for errata see IEEE Transactions on Neural Networks, 8(2): 455, 1997)."},{"issue":"1","key":"10.1016\/S0893-6080(99)00043-X_BIB13","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1142\/S012906579600004X","article-title":"Speaker identification using time-delay HMEs","volume":"7","author":"Chen","year":"1996","journal-title":"International Journal of Neural Systems"},{"issue":"1","key":"10.1016\/S0893-6080(99)00043-X_BIB16","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","article-title":"Maximum-likelihood from incomplete data via the EM algorithm","volume":"39","author":"Dempster","year":"1977","journal-title":"Journal of the Royal Statistical Society B"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB17","series-title":"Pattern classification and scene analysis","author":"Duda","year":"1973"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB18","doi-asserted-by":"crossref","first-page":"179","DOI":"10.1111\/j.1469-1809.1936.tb02137.x","article-title":"The use of multiple measurements in taxonomic problem","volume":"7","author":"Fisher","year":"1936","journal-title":"Annals of Eugenices"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB19","doi-asserted-by":"crossref","first-page":"317","DOI":"10.1093\/comjnl\/13.3.317","article-title":"A general quadratic programming algorithm","volume":"13","author":"Fletcher","year":"1970","journal-title":"Computer Journal"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB20","series-title":"Practical methods of optimization","author":"Fletcher","year":"1987"},{"issue":"9","key":"10.1016\/S0893-6080(99)00043-X_BIB21","doi-asserted-by":"crossref","first-page":"859","DOI":"10.1016\/S0167-8655(97)00073-1","article-title":"Recent advances in speaker recognition","volume":"18","author":"Furui","year":"1997","journal-title":"Pattern Recognition Letters"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB22","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1090\/S0025-5718-1970-0258249-6","article-title":"A family of variable metric methods derived by variational means","volume":"24","author":"Goldfarb","year":"1970","journal-title":"Mathematics of Computation"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB23","series-title":"Matrix computations","author":"Golub","year":"1989"},{"issue":"5","key":"10.1016\/S0893-6080(99)00043-X_BIB24","doi-asserted-by":"crossref","first-page":"923","DOI":"10.1109\/72.165594","article-title":"Classification trees with neural network decision trees","volume":"3","author":"Guo","year":"1992","journal-title":"IEEE Transactions on Neural Networks"},{"issue":"3","key":"10.1016\/S0893-6080(99)00043-X_BIB25","doi-asserted-by":"crossref","first-page":"509","DOI":"10.1016\/0893-6080(96)83696-3","article-title":"Structural learning with forgetting","volume":"9","author":"Ishikawa","year":"1996","journal-title":"Neural Networks"},{"issue":"1","key":"10.1016\/S0893-6080(99)00043-X_BIB26","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1162\/neco.1991.3.1.79","article-title":"Adaptive mixture of local experts","volume":"3","author":"Jacobs","year":"1991","journal-title":"Neural Computation"},{"issue":"2","key":"10.1016\/S0893-6080(99)00043-X_BIB27","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1162\/neco.1994.6.2.181","article-title":"Hierarchical mixture of experts and the EM algorithm","volume":"6","author":"Jordan","year":"1994","journal-title":"Neural Computation"},{"issue":"9","key":"10.1016\/S0893-6080(99)00043-X_BIB28","doi-asserted-by":"crossref","first-page":"1409","DOI":"10.1016\/0893-6080(95)00014-3","article-title":"Convergence results for the EM approach to mixtures of experts","volume":"8","author":"Jordan","year":"1995","journal-title":"Neural Networks"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB29","series-title":"Generalized linear models","author":"McCullagh","year":"1983"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB30","series-title":"Mathematical programming: theory and algorithms","author":"Minoux","year":"1986"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB31","series-title":"Applied linear statistical models","author":"Neter","year":"1985"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB32","doi-asserted-by":"crossref","unstructured":"Ramamurti, V., & Ghosh, J. (1996). Advances in using hierarchical mixture of experts for signal classification. Proceedings of International Conference on Acoustic, Speech, and Signal Processing, Atlanta, pp. 3569\u20133572.","DOI":"10.1109\/ICASSP.1996.550800"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB33","doi-asserted-by":"crossref","unstructured":"Ramamurti, V., & Ghosh, J. (1997). Regularization and error bars for the mixture of experts network. Proceedings of IEEE International Conference of Neural Networks, Houston, pp. 221\u2013225.","DOI":"10.1109\/ICNN.1997.611668"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB34","doi-asserted-by":"crossref","first-page":"647","DOI":"10.1090\/S0025-5718-1970-0274029-X","article-title":"On variable metric methods for sparse Hessians","volume":"24","author":"Shanno","year":"1970","journal-title":"Mathematics of Computation"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB35","unstructured":"Waterhouse, S.R. (1993). The application of HME with the EM algorithm to speech recognition. Master Thesis, Department of Engineering, Cambridge University."},{"key":"10.1016\/S0893-6080(99)00043-X_BIB36","unstructured":"Waterhouse, S.R. (1997). Classification and regression using mixtures of experts. Ph.D., Thesis, Department of Engineering, Cambridge University."},{"key":"10.1016\/S0893-6080(99)00043-X_BIB40","unstructured":"Xu, L. (1996). Bayesian-Kullback YING-YANG learning scheme: reviews and new results, Proceedings of International Conference on Neural Information Processing, Hong Kong, pp. 59-67."},{"issue":"1-3","key":"10.1016\/S0893-6080(99)00043-X_BIB41","first-page":"223","volume":"19","author":"Xu","year":"1998","journal-title":"RBF nets, mixture of experts, and Bayesian Ying-Yang learning, Neurocomputing"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB37","unstructured":"Xu, L., & Jordan, M.I. (1994). A modified gating network for the mixture of experts architecture. Proceedings of World Congress on Neural Networks, San Diego, pp. II405\u2013II410."},{"issue":"2","key":"10.1016\/S0893-6080(99)00043-X_BIB38","doi-asserted-by":"crossref","first-page":"129","DOI":"10.1162\/neco.1996.8.1.129","article-title":"On convergence properties of the EM algorithm for Gaussian mixtures","volume":"8","author":"Xu","year":"1996","journal-title":"Neural Computation"},{"key":"10.1016\/S0893-6080(99)00043-X_BIB39","series-title":"Advances in Neural Information Processing Systems","first-page":"633","article-title":"Advances in neural information processing systems","author":"Xu","year":"1995"},{"issue":"5","key":"10.1016\/S0893-6080(99)00043-X_NEWBIB1","doi-asserted-by":"crossref","first-page":"1231","DOI":"10.1109\/72.536317","article-title":"Input\/output HMMs for sequence processing","volume":"7","author":"Bengio","year":"1996","journal-title":"IEEE Transactions on Neural Networks"},{"issue":"1-3","key":"10.1016\/S0893-6080(99)00043-X_NEWBIB10","doi-asserted-by":"crossref","first-page":"227","DOI":"10.1016\/S0925-2312(98)00019-8","article-title":"A method of combining multiple probabilistic classifiers through soft competition on different features sets","volume":"20","author":"Chen","year":"1998","journal-title":"Neurocomputing"},{"issue":"2","key":"10.1016\/S0893-6080(99)00043-X_NEWBIB14","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1007\/BF00571681","article-title":"Text-dependent speaker identification based on input\/output HMM: an empirical study","volume":"3","author":"Chen","year":"1996","journal-title":"Neural Processing Letters"}],"container-title":["Neural Networks"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S089360809900043X?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S089360809900043X?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T20:44:46Z","timestamp":1733431486000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S089360809900043X"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1999,11]]},"references-count":41,"journal-issue":{"issue":"9","published-print":{"date-parts":[[1999,11]]}},"alternative-id":["S089360809900043X"],"URL":"https:\/\/doi.org\/10.1016\/s0893-6080(99)00043-x","relation":{},"ISSN":["0893-6080"],"issn-type":[{"value":"0893-6080","type":"print"}],"subject":[],"published":{"date-parts":[[1999,11]]}}}