{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T05:34:21Z","timestamp":1775280861220,"version":"3.50.1"},"reference-count":19,"publisher":"Elsevier BV","issue":"1","license":[{"start":{"date-parts":[[1998,4,1]],"date-time":"1998-04-01T00:00:00Z","timestamp":891388800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Speech Communication"],"published-print":{"date-parts":[[1998,4]]},"DOI":"10.1016\/s0167-6393(97)00062-9","type":"journal-article","created":{"date-parts":[[2002,7,26]],"date-time":"2002-07-26T00:58:41Z","timestamp":1027645121000},"page":"19-37","source":"Crossref","is-referenced-by-count":93,"title":["Algorithms for bigram and trigram word clustering"],"prefix":"10.1016","volume":"24","author":[{"given":"Sven","family":"Martin","sequence":"first","affiliation":[]},{"given":"J\u00f6rg","family":"Liermann","sequence":"additional","affiliation":[]},{"given":"Hermann","family":"Ney","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S0167-6393(97)00062-9_BIB1","doi-asserted-by":"crossref","first-page":"179","DOI":"10.1109\/TPAMI.1983.4767370","article-title":"A maximum likelihood approach to continuous speech recognition","volume":"5","author":"Bahl","year":"1993","journal-title":"IEEE Trans. Pattern Anal. Machine Intell."},{"key":"10.1016\/S0167-6393(97)00062-9_BIB2","doi-asserted-by":"crossref","unstructured":"Bellegarda, J.R., Butzberger, J.W., Chow, Y.-L., Coccaro, N.B., Naik, D., 1996. A novel word clustering algorithm based on latent semantic analysis. In: Proc. 1996 IEEE Internat. Conf. Acoust. Speech Signal Process., Atlanta, GA, 7\u201310 May 1996, pp. 172\u2013175.","DOI":"10.1109\/ICASSP.1996.540318"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB3","unstructured":"Brill, E., 1993. A corpus-based approach to language learning. Ph.D. Thesis, Department of Computer and Information Science, University of Pennsylvania, Philadelphia, PA."},{"issue":"4","key":"10.1016\/S0167-6393(97)00062-9_BIB4","first-page":"467","article-title":"Class-based n-gram models of natural language","volume":"18","author":"Brown","year":"1992","journal-title":"Computational Linguistics"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB5","unstructured":"Duda, R.O., Hart, P.E., 1973. Pattern Classification and Scene Analysis. Wiley, New York."},{"key":"10.1016\/S0167-6393(97)00062-9_BIB6","doi-asserted-by":"crossref","unstructured":"Jardino, M., 1996. Multilingual stochastic n-gram class language models. In: Proc. 1996 IEEE Internat. Conf. Acoust. Speech Signal Process., Atlanta, GA, 7\u201310 May 1996, pp. 161\u2013163.","DOI":"10.1109\/ICASSP.1996.540315"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB7","doi-asserted-by":"crossref","unstructured":"Jardino, M., Adda, G., 1993. Automatic word classification using simulated annealing. In: Proc. 3rd European Conf. on Speech Communication and Technology, Berlin, 21\u201323 September 1993, pp. 1191\u20131194.","DOI":"10.1109\/ICASSP.1993.319224"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB8","doi-asserted-by":"crossref","unstructured":"Jardino, M., Adda, G., 1994. Automatic determination of a stochastic bi-gram class language model. In: Carrasco, R.C., Oncina, J. (Eds.), Grammatical Inference and Applications, 2nd Internat. Coll., ICGI-94, Alicante, Spain, 21\u201323 September 1994. Lecture Notes in Artificial Intelligence, Vol. 862, Springer, Berlin, pp. 57\u201365.","DOI":"10.1007\/3-540-58473-0_137"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB9","doi-asserted-by":"crossref","unstructured":"Jelinek, F., 1991. Self-organized language modeling for speech recognition. In: Waibel, A., Lee, K.-F. (Eds.), Readings in Speech Recognition, Morgan Kaufmann, San Mateo, CA, pp. 450\u2013506.","DOI":"10.1016\/B978-0-08-051584-7.50045-0"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB10","doi-asserted-by":"crossref","unstructured":"Kneser, R., Ney, H., 1993. Improved clustering techniques for class-based statistical language modelling. In: Proc. 3rd European Conf. on Speech Communication and Technology, Berlin, 21\u201323 September 1993, pp. 973\u2013976.","DOI":"10.21437\/Eurospeech.1993-229"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB11","unstructured":"Lafferty, J.D., Mercer, R.L., 1993. Automatic classification using features of spelling. In: Proc. 9th Ann. Conf. of the University of Waterloo Centre for the new OED and Text Research, Oxford University Press, Oxford, pp. 89\u2013103."},{"key":"10.1016\/S0167-6393(97)00062-9_BIB12","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1006\/csla.1994.1001","article-title":"On structuring probabilistic dependences in stochastic language modelling","volume":"8","author":"Ney","year":"1994","journal-title":"Computer Speech and Language"},{"issue":"12","key":"10.1016\/S0167-6393(97)00062-9_BIB13","doi-asserted-by":"crossref","first-page":"1202","DOI":"10.1109\/34.476512","article-title":"On the estimation of small probabilities by leaving-one-out","volume":"17","author":"Ney","year":"1995","journal-title":"IEEE Trans. Pattern Anal. Machine Intell."},{"key":"10.1016\/S0167-6393(97)00062-9_BIB14","doi-asserted-by":"crossref","unstructured":"Ney, H., Martin, S.C., Wessel, F., 1997. Statistical language modeling using leaving-one-out. In: Young, S., Bloothooft, G. (Eds.), Corpus-Based Methods in Language and Speech Processing. Kluwer Academic Publishers, Dordrecht, The Netherlands, pp. 174\u2013207.","DOI":"10.1007\/978-94-017-1183-8_6"},{"issue":"1","key":"10.1016\/S0167-6393(97)00062-9_BIB15","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1006\/csla.1996.0022","article-title":"A word graph algorithm for large vocabulary continuous speech recognition","volume":"11","author":"Ortmanns","year":"1997","journal-title":"Computer, Speech and Language"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB16","doi-asserted-by":"crossref","unstructured":"Paul, D.B., Baker, J.M., 1992. The design for the Wall Street Journal-based CSR corpus. In: Proc. DARPA Speech and Natural Language Workshop, Harriman, NY, 23\u201326 February 1992, pp. 357\u2013362.","DOI":"10.3115\/1075527.1075614"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB17","doi-asserted-by":"crossref","unstructured":"Rosenfeld, R., 1994. Adaptive statistical language modeling: A maximum entropy approach. Ph.D. Thesis, Tech. Rept. CMU-CS-94-138, School of Computer Science, Carnegie Mellon University, Pittsburgh, PA, 114 pages.","DOI":"10.3115\/1075812.1075827"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB18","doi-asserted-by":"crossref","unstructured":"Tak\u00e1cs, L., 1984. Combinatorics. In: Krishnaiah, P.R., Sen, P.K. (Eds.), Nonparametric Methods, Handbook of Statistics, Vol. 4. North-Holland, Amsterdam, pp. 123\u2013143.","DOI":"10.1016\/S0169-7161(84)04009-8"},{"key":"10.1016\/S0167-6393(97)00062-9_BIB19","unstructured":"Wessel, F., Ortmanns, S., Ney, H., 1997. Implementation of word based statistical language models. In: Proc. 2nd SQEL Workshop, Plze\u0148 (Pilsen), 27\u201329 April 1997, pp. 55\u201359."}],"container-title":["Speech Communication"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639397000629?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639397000629?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2023,4,16]],"date-time":"2023-04-16T06:20:58Z","timestamp":1681626058000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167639397000629"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998,4]]},"references-count":19,"journal-issue":{"issue":"1","published-print":{"date-parts":[[1998,4]]}},"alternative-id":["S0167639397000629"],"URL":"https:\/\/doi.org\/10.1016\/s0167-6393(97)00062-9","relation":{},"ISSN":["0167-6393"],"issn-type":[{"value":"0167-6393","type":"print"}],"subject":[],"published":{"date-parts":[[1998,4]]}}}