{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T23:25:46Z","timestamp":1778801146862,"version":"3.51.4"},"reference-count":54,"publisher":"Elsevier BV","issue":"2-4","license":[{"start":{"date-parts":[[1999,11,1]],"date-time":"1999-11-01T00:00:00Z","timestamp":941414400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Speech Communication"],"published-print":{"date-parts":[[1999,11]]},"DOI":"10.1016\/s0167-6393(99)00050-3","type":"journal-article","created":{"date-parts":[[2003,4,5]],"date-time":"2003-04-05T03:57:58Z","timestamp":1049515078000},"page":"159-176","source":"Crossref","is-referenced-by-count":192,"title":["Speaking in shorthand \u2013 A syllable-centric perspective for understanding pronunciation variation"],"prefix":"10.1016","volume":"29","author":[{"given":"Steven","family":"Greenberg","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/S0167-6393(99)00050-3_BIB1","doi-asserted-by":"crossref","unstructured":"Arai, T., Greenberg, S., 1997. The temporal properties of spoken Japanese are similar to those of English. In: Proceedings of Eurospeech, Rhodes, Greece, pp. 1011\u20131014","DOI":"10.21437\/Eurospeech.1997-355"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB2","series-title":"Class, Codes and Control","author":"Bernstein","year":"1974"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB3","unstructured":"Bernstein, J., Baldwin, G., Cohen, M., Murveit, H., Weintraub, M., 1992. Phonological studies for speech recognition. In: Proceedings of the DARPA Speech Recognition Workshop, pp. 41\u201348"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB4","doi-asserted-by":"crossref","unstructured":"Byrne, W., Finke, M., Khudanpur, S., McDonnough, J., Nock, H., Saraclar, M., Wooters, C., Zavaliagkos, G., 1997. Pronunciation modelling for conversational speech recognition \u2013 A status report from WS97. In: Proceedings of the IEEE Workshop on Automatic Speech Recognition and Understanding, pp. 26\u201333","DOI":"10.1109\/ASRU.1997.658973"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB5","doi-asserted-by":"crossref","unstructured":"Byrne, W., Finke, M., Khudanpur, S., McDonnough, J., Nock, H., Saraclar, M., Wooters, C., Zavaliagkos, G., 1998. Pronunciation modeling using a hand-labelled corpus for conversational speech recognition. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 313\u2013316","DOI":"10.1109\/ICASSP.1998.674430"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB6","doi-asserted-by":"crossref","unstructured":"Coleman, J., 1992. The phonetic interpretation of headed phonological structures containing overlapping constituents. Phonetics Yearbook 9, 1\u201344","DOI":"10.1017\/S0952675700001482"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB7","series-title":"The Cambridge Encyclopedia of the English Language","author":"Crystal","year":"1995"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB8","series-title":"Relative Frequency of English Speech Sounds","author":"Dewey","year":"1923"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB9","series-title":"The Adventures of Sherlock Holmes","author":"Doyle","year":"1892"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB10","unstructured":"Fosler, E., Weintraub, M., Wegmann, S., Kao, Y.-H., Khudanpur, S., Galles, C., Saraclar, M., 1996. Automatic learning of word pronunciation from data. In: Proceedings of the International Conference on Spoken Language Processing, pp. S28\u201329"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB11","doi-asserted-by":"crossref","unstructured":"Fosler-Lussier, E., Morgan, N., 1998. Effects of speaking rate and word frequency on pronunciations in conversational speech. Speech Communication 29 (2\u20134), 137\u2013158","DOI":"10.1016\/S0167-6393(99)00035-7"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB12","unstructured":"Fosler-Lussier, E., Greenberg, S., Morgan, N., 1999. Incorporating contextual phonetics into automatic speech recognition. In: Proceedings of the International Congress of Phonetic Sciences, San Francisco"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB13","doi-asserted-by":"crossref","first-page":"290","DOI":"10.1002\/j.1538-7305.1930.tb00368.x","article-title":"The words and sounds of telephone conversations","volume":"9","author":"French","year":"1930","journal-title":"Bell System Tech. J."},{"key":"10.1016\/S0167-6393(99)00050-3_BIB14","doi-asserted-by":"crossref","unstructured":"Ganapathiraju, A., Goel, V., Picone, J., Corrada, A., Doddington, G., Kirchhoff, K., Ordowski, M., Wheatley, B., 1997. Syllable \u2013 A promising recognition unit for LVCSR. In: Proceedings of the IEEE Workshop on Automatic Speech Recognition and Understanding, pp. 207\u2013214","DOI":"10.1109\/ASRU.1997.659007"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB15","doi-asserted-by":"crossref","unstructured":"Gauvain, J., Lamel, L., Adda, G., Adda-Decker, M., 1994. The LIMSI continuous speech dictation system: Evaluation on the ARPA Wall Street Journal task. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 557\u2013560","DOI":"10.1109\/ICASSP.1994.389233"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB16","doi-asserted-by":"crossref","unstructured":"Godfrey, J.J., Holliman, E.C., McDaniel, J., 1992. SWITCHBOARD: Telephone speech corpus for research and development. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 517\u2013520","DOI":"10.1109\/ICASSP.1992.225858"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB17","unstructured":"Goldinger, S.D., Pisoni, D.B., Luce, P., 1996. Speech perception and spoken word recognition: Research and theory. In: Lass N. (Ed.), Principles of Experimental Phonetics, Mosby St. Louis, pp. 277\u2013327"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB18","unstructured":"Greenberg, S., 1997a. On the origins of speech intelligibility in the real world. In: Proceedings of the ESCA Workshop on Robust Speech Recognition for Unknown Communication Channels. Pont-a-Mousson, France, pp. 23\u201332"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB19","unstructured":"Greenberg, S., 1997b. The switchboard transcription project. Research Report #24, Large Vocabulary Continuous Speech Recognition Summer Research Workshop Technical Report Series. Center for Language and Speech Processing. Johns Hopkins University Press, Baltimore, MD"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB20","doi-asserted-by":"crossref","unstructured":"Greenberg, S., 1997c. Auditory function. In: Crocker, M. (Ed.), Encyclopedia of Acoustics. Wiley, New York, pp. 1301\u20131323","DOI":"10.1002\/9780470172537.ch104"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB21","unstructured":"Greenberg, S., 1998. Speaking in shorthand \u2013 A syllable-centric perspective for understanding pronunciation variation. In: Proceedings of the ESCA Workshop on Modeling Pronunciation Variation for Automatic Speech Recognition, Kerkrade, The Netherlands, pp. 47\u201356"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB22","unstructured":"Greenberg, S., Hollenback, J., Ellis, D., 1996. Insights into spoken language gleaned from phonetic transcription of the Switchboard corpus. In: Proceedings of the International Conference on Spoken Language Processing, Philadelphia, pp. S32\u201335"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB23","unstructured":"Greenberg, S., Ellis, D.A., Hollenback, J., Fosler-Lussier, E., 1999. Phonetic transcription of spontaneous American English (the Switchboard corpus). Speech Communication (submitted)"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB24","series-title":"Language; Its Nature, Development and Origin","author":"Jespersen","year":"1922"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB25","series-title":"Syllable-based Generalizations in English Phonology","author":"Kahn","year":"1980"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB26","series-title":"A Pronouncing Dictionary of American English","author":"Kenyon","year":"1953"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB27","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1016\/S0167-6393(98)00032-6","article-title":"Robust speech recognition using the modulation spectrogram","volume":"25","author":"Kingsbury","year":"1998","journal-title":"Speech Communication"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB28","unstructured":"Kirchhoff, K., 1999. Robust speech recognition using articulatory information. Ph.D. thesis, University of Bielefeld"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB29","unstructured":"Kohler, K., 1995. Articulatory reduction in different speaking styles. In: Proceedings of the International Congress of Phonetic Sciences, Stockholm, Vol. 2, pp. 12\u201319"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB30","series-title":"Prosody in Speech Understanding Systems","author":"Kompe","year":"1997"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB31","series-title":"Sociolinguistic Patterns","author":"Labov","year":"1972"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB32","unstructured":"Lehiste, I., 1996. Suprasegmental features of speech. In: Lass, N. (Ed.), Principles of Experimental Phonetics. Mosby, St. Louis, pp. 226\u2013244"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB33","series-title":"Speaking","author":"Levelt","year":"1989"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB34","doi-asserted-by":"crossref","first-page":"1773","DOI":"10.1121\/1.1918816","article-title":"A spectrographic study of vowel reduction","volume":"35","author":"Lindblom","year":"1963","journal-title":"J. Acoust. Soc. Amer."},{"key":"10.1016\/S0167-6393(99)00050-3_BIB35","doi-asserted-by":"crossref","unstructured":"Lindblom, B., 1990. Explaining phonetic variation: a sketch of the H\u2013H theory. In: Hardcastle, W., Marchal. A. (Eds.), Speech Production and Speech Modeling. Kluwer Academic Publishers, Dordrecht, pp. 403\u2013439","DOI":"10.1007\/978-94-009-2037-8_16"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB36","series-title":"An Introduction to the Languages of the World","author":"Lyovin","year":"1997"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB37","unstructured":"McAllaster, D., Gillick, L., Scattone, F., Newman, M., 1998. Explorations with fabricated data. In: Proceedings of the DARPA Workshop on Conversational Speech Recognition, Hub-5"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB38","doi-asserted-by":"crossref","unstructured":"Niemann, H., Noth, E., Kiessling, A., Kompe, R., Batliner, A., 1997. Prosodic processing and its use in Verbmobil. In: Proceedings of IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 75\u201378","DOI":"10.1109\/ICASSP.1997.599550"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB39","unstructured":"Ostendorf, M., Byrne, B., Macchiani, M., Finke, M., Gunawardana, A., Ross, K., Roweis, S., Shriberg, E., Talkin, D., Waibel, A., Wheatley, B., Zeppenfeld, T., 1997. Modeling systematic variations in pronunciation via a language-dependent hidden speaking mode. Research Report #24, Large Vocabulary Continuous Speech Recognition Workshop Technical Report Series. Center for Language and Speech Processing. Johns Hopkins University, Baltimore, MD"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB40","series-title":"Fundamentals of Speech Recognition","author":"Rabiner","year":"1993"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB41","series-title":"Automatic Speech and Speaker Recognition: Advanced Topics","article-title":"Automatic generation of detailed pronunciation lexicons","author":"Riley","year":"1995"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB42","unstructured":"Riley, M., Finke, M., Khudanpur, S., Llolje, A., McDonough, J., Nock, H., Saraclar, M., Wooters, C., Zavaliagkos, G., 1998. Stochastic pronunciation modelling and hand-labelled phonetic corpora. In: Proceedings of the ESCA Tutorial and Research Workshop on Modeling Pronunciation Variation for Automatic Speech Recognition, Kerkrade, pp. 109\u2013116"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB43","unstructured":"Schiel, F.A., Tillmann, H., 1998. Statistical modeling of pronunciation: it\u2019s not the model, it\u2019s the data. In: Proceedings of the ESCA Tutorial and Research Workshop on Modeling Pronunciation Variation for Automatic Speech Recognition, Kerkrade, pp. 131\u2013136"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB44","unstructured":"Silipo, R., Greenberg, S., 1999. Automatic transcription of prosodic stress for spontaneous English discourse. In: Proceedings of the International Congress of Phonetic Sciences, San Francisco"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB45","doi-asserted-by":"crossref","unstructured":"van Son, R.J.J.H., Koopmans-van Beinum, J., Pols, L.C.W., 1998. Efficiency as an organizing principle of natural speech. In: Proceedings of the International Conference on Spoken Language Processing, pp. 2375\u20132378","DOI":"10.21437\/ICSLP.1998-738"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB46","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1016\/S0167-6393(98)00069-7","article-title":"Acoustic correlates of lexical stress in continuous telephone speech","volume":"27","author":"van Kuik","year":"1999","journal-title":"Speech Communication"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB47","unstructured":"van Wieringen, A., 1995. Perceiving dynamic speechlike sounds. Ph.D. thesis, University of Amsterdam"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB48","series-title":"Prosody and Speech Recognition","author":"Waibel","year":"1998"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB49","unstructured":"Weintraub, M., Taussig, K., Smith, K.H., Snodgrass, A., 1996. Effect of speaking style on LVCSR performance. In: Proceedings of the International Conference on Spoken Language Processing, Philadelphia"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB50","unstructured":"Weintraub, M., Fosler, E., Galles, C., Kao, Y.-H., Khudanpur, S., Saraclar, M., Wegmann, S., 1997. WS96 project report: Automatic learning of word pronunciation from data. Research Report #24, Large Vocabulary Continuous Speech Recognition Summer Research Workshop Technical Report Series. Center for Language and Speech Processing. Johns Hopkins University, Baltimore, MD"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB51","unstructured":"Wu, S.-L., Kingsbury, B., Morgan, N., Greenberg, S., 1998a. Incorporating information from syllable-length time scales into automatic speech recognition. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing. Seattle, pp. 721\u2013724"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB52","doi-asserted-by":"crossref","unstructured":"Wu, S.-L., Kingsbury, B., Morgan, N., Greenberg, S., 1998b. Performance improvements through combining phone- and syllable-length information in automatic speech recognition. In: Proceedings of the International Conference on Spoken Language Processing, Sydney, pp. 854\u2013857","DOI":"10.21437\/ICSLP.1998-305"},{"key":"10.1016\/S0167-6393(99)00050-3_BIB53","doi-asserted-by":"crossref","first-page":"251","DOI":"10.1080\/00221309.1945.10544509","article-title":"The meaning-frequency relationship of words","volume":"33","author":"Zipf","year":"1945","journal-title":"J. Gen. Psych."},{"key":"10.1016\/S0167-6393(99)00050-3_BIB54","doi-asserted-by":"crossref","unstructured":"Zue, V.W., Seneff, S., 1996. Transcription and alignment of the TIMIT database. In: Fujisaki, H. (Ed.), Recent Research Towards Advanced Man-Machine Interface Through Spoken Language. Elsevier, Amsterdam, pp. 515\u2013525","DOI":"10.1016\/B978-044481607-8\/50088-8"}],"container-title":["Speech Communication"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639399000503?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167639399000503?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,12,3]],"date-time":"2024-12-03T23:21:49Z","timestamp":1733268109000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167639399000503"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1999,11]]},"references-count":54,"journal-issue":{"issue":"2-4","published-print":{"date-parts":[[1999,11]]}},"alternative-id":["S0167639399000503"],"URL":"https:\/\/doi.org\/10.1016\/s0167-6393(99)00050-3","relation":{},"ISSN":["0167-6393"],"issn-type":[{"value":"0167-6393","type":"print"}],"subject":[],"published":{"date-parts":[[1999,11]]}}}