{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T10:24:23Z","timestamp":1775211863236,"version":"3.50.1"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"1-2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2010,4]]},"DOI":"10.1007\/s10579-009-9095-y","type":"journal-article","created":{"date-parts":[[2009,8,3]],"date-time":"2009-08-03T11:50:52Z","timestamp":1249300252000},"page":"41-58","source":"Crossref","is-referenced-by-count":7,"title":["Analyzing and identifying multiword expressions in spoken language"],"prefix":"10.1007","volume":"44","author":[{"given":"Helmer","family":"Strik","sequence":"first","affiliation":[]},{"given":"Micha","family":"Hulsbosch","sequence":"additional","affiliation":[]},{"given":"Catia","family":"Cucchiarini","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2009,8,4]]},"reference":[{"key":"9095_CR1","doi-asserted-by":"crossref","first-page":"1001","DOI":"10.1121\/1.1534836","volume":"113","author":"A Bell","year":"2003","unstructured":"Bell, A., Jurafsky, D., Fosler-Lussier, E., Girand, C., Gregory, M. L., & Gildea, D. (2003). Effects of disfluencies, predictability, and utterance position on word form variation in English conversation. Journal of the Acoustical Society of America, 113, 1001\u20131024.","journal-title":"Journal of the Acoustical Society of America"},{"key":"9095_CR2","unstructured":"Beulen, K., Ortmanns, S., Eiden, A., Martin, S., Welling, L., & Overmann, J. (1998). Pronunciation modeling in the RWTH large vocabulary speech recognizer. 
(Paper presented at the ESCA Workshop \u201cModeling pronunciation variation for automatic speech recognition\u201d, Kerkrade)."},{"issue":"4","key":"9095_CR3","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1016\/j.csl.2004.11.003","volume":"19","author":"D Binnenpoorte","year":"2005","unstructured":"Binnenpoorte, D., Cucchiarini, C., Boves, L., & Strik, H. (2005). Multiword expressions in spoken language: An exploratory study on pronunciation variation. Computer Speech & Language, 19(4), 433\u2013449.","journal-title":"Computer Speech & Language"},{"key":"9095_CR4","volume-title":"The phonology of Dutch","author":"G Booij","year":"1995","unstructured":"Booij, G. (1995). The phonology of Dutch. Oxford: Clarendon Press."},{"key":"9095_CR44","unstructured":"CGN website (2004). http:\/\/lands.let.ru.nl\/cgn\/ehome.htm . Accessed November 1, 2007."},{"issue":"4","key":"9095_CR5","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1016\/S0346-251X(97)00046-8","volume":"25","author":"F Chambers","year":"1998","unstructured":"Chambers, F. (1998). What do we mean by fluency? System, 25(4), 535\u2013544.","journal-title":"System"},{"issue":"1","key":"9095_CR6","doi-asserted-by":"crossref","first-page":"72","DOI":"10.1093\/applin\/amm022","volume":"29","author":"K Conklin","year":"2007","unstructured":"Conklin, K., & Schmitt, N. (2007). Formulaic sequences: Are they processed more quickly than nonformulaic language by native and nonnative speakers? Applied Linguistics, 29(1), 72\u201389.","journal-title":"Applied Linguistics"},{"issue":"2","key":"9095_CR7","doi-asserted-by":"crossref","first-page":"131","DOI":"10.3109\/02699209608985167","volume":"10","author":"C Cucchiarini","year":"1996","unstructured":"Cucchiarini, C. (1996). Assessing transcription agreement: Methodological aspects. 
Clinical Linguistics & Phonetics, 10(2), 131\u2013155.","journal-title":"Clinical Linguistics & Phonetics"},{"issue":"6","key":"9095_CR8","doi-asserted-by":"crossref","first-page":"2862","DOI":"10.1121\/1.1471894","volume":"111","author":"C Cucchiarini","year":"2002","unstructured":"Cucchiarini, C., Strik, H., & Boves, L. (2002). Quantitative assessment of second language learners\u2019 fluency: Comparisons between read and spontaneous speech. Journal of the Acoustical Society of America, 111(6), 2862\u20132873.","journal-title":"Journal of the Acoustical Society of America"},{"key":"9095_CR9","doi-asserted-by":"crossref","unstructured":"Dahlmann, I., & Adolphs, S. (2007). Pauses as an indicator of psycholinguistically valid multi-word expressions (MWEs)? Proceedings of the ACL-2007 workshop on \u2018A broader perspective on multiword expressions\u2019, Prague, 49\u201356.","DOI":"10.3115\/1613704.1613711"},{"key":"9095_CR10","unstructured":"Elffers, A., Van Bael, C., & Strik, H. (2005). Adapt: Algorithm for dynamic alignment of phonetic transcriptions. (CLST internal report)."},{"issue":"1","key":"9095_CR11","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1075\/ijcl.12.1.04erm","volume":"12","author":"B Erman","year":"2007","unstructured":"Erman, B. (2007). Cognitive processes as evidence of the idiom principle. International Journal of Corpus Linguistics, 12(1), 25\u201353.","journal-title":"International Journal of Corpus Linguistics"},{"key":"9095_CR12","doi-asserted-by":"crossref","first-page":"162","DOI":"10.1006\/brln.2001.2514","volume":"81","author":"M Ernestus","year":"2002","unstructured":"Ernestus, M., Baayen, H., & Schreuder, R. (2002). The recognition of reduced word forms. Brain and Language, 81, 162\u2013173.","journal-title":"Brain and Language"},{"key":"9095_CR13","unstructured":"Evert, S. (2004). The statistics of word cooccurrences\u2014Word pairs and collocations. 
Dissertation, Universit\u00e4t Stuttgart."},{"key":"9095_CR14","doi-asserted-by":"crossref","unstructured":"Evert, S., & Krenn, B. (2001). Methods for the qualitative evaluation of lexical association measures. (Paper presented at the 39th annual meeting of the association for computational linguistics, Toulouse).","DOI":"10.3115\/1073012.1073037"},{"key":"9095_CR15","doi-asserted-by":"crossref","unstructured":"Finke, M., & Waibel, A. (1997). Speaking mode dependent pronunciation modeling in large vocabulary conversational speech recognition. (Paper presented at EuroSpeech-97, Rhodes).","DOI":"10.21437\/Eurospeech.1997-625"},{"key":"9095_CR16","first-page":"145","volume-title":"Prefabricated patterns in advanced EFL writing: Collocations and formulae. Phraseology: theory, analysis, and applications","author":"S Granger","year":"1998","unstructured":"Granger, S. (1998). Prefabricated patterns in advanced EFL writing: Collocations and formulae. Phraseology: theory, analysis, and applications (pp. 145\u2013160). Oxford: Clarendon Press."},{"key":"9095_CR17","unstructured":"Gregoire, N., Evert, S., & Kim, S. N. (Eds.). (2007). Proceedings of the ACL-2007 Workshop on \u2018A Broader Perspective on Multiword Expressions\u2019, Prague. http:\/\/www.aclweb.org\/anthology-new\/W\/W07\/W07-11.pdf ."},{"key":"9095_CR18","first-page":"151","volume":"35","author":"ML Gregory","year":"1999","unstructured":"Gregory, M. L., Raymond, W. D., Bell, A., Fosler-Lussier, E., & Jurafsky, D. (1999). The effects of collocational strength and contextual predictability in lexical production. Chicago Linguistics Society, 35, 151\u2013166.","journal-title":"Chicago Linguistics Society"},{"key":"9095_CR19","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1075\/tsl.45.13jur","volume-title":"Frequency and the emergence of linguistic structure","author":"D Jurafsky","year":"2001","unstructured":"Jurafsky, D., Bell, A., Gregory, M. L., & Raymond, W. D. (2001). 
Probabilistic relations between words: Evidence from reduction in lexical production. In J. Bybee & P. Hopper (Eds.), Frequency and the emergence of linguistic structure (pp. 229\u2013254). Amsterdam: John Benjamins."},{"key":"9095_CR20","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1016\/S0093-934X(03)00425-5","volume":"90","author":"R Kemps","year":"2004","unstructured":"Kemps, R., Ernestus, M., Schreuder, R., & Baayen, R. H. (2004). Processing reduced word forms: The suffix restoration effect. Brain and Language, 90, 117\u2013127.","journal-title":"Brain and Language"},{"key":"9095_CR21","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1016\/S0167-6393(99)00048-5","volume":"29","author":"JM Kessens","year":"1999","unstructured":"Kessens, J. M., Wester, M., & Strik, H. (1999). Improving the performance of a Dutch CSR by modeling within-word and cross-word pronunciation variation. Speech Communication, 29, 193\u2013207.","journal-title":"Speech Communication"},{"key":"9095_CR22","volume-title":"Smooth talkers. The linguistic performance of auctioneers and sportscasters","author":"K Kuiper","year":"1996","unstructured":"Kuiper, K. (1996). Smooth talkers. The linguistic performance of auctioneers and sportscasters. Mahwah, NJ: Lawrence Erlbaum Associates."},{"key":"9095_CR23","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1075\/lllt.9.04kui","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"K Kuiper","year":"2004","unstructured":"Kuiper, K. (2004). Formulaic performance in conventionalised varieties of speech. In N. Schmitt (Ed.), Formulaic sequences: Acquisition, processing and use (pp. 37\u201354). Amsterdam: John Benjamins."},{"key":"9095_CR24","volume-title":"Lexical phrases and language teaching","author":"JR Nattinger","year":"1992","unstructured":"Nattinger, J. R., & DeCarrico, J. S. (1992). Lexical phrases and language teaching. 
Oxford: Oxford University Press."},{"key":"9095_CR25","volume-title":"New Frontiers of Corpus Research. (pp 105\u2013112)","author":"NHJ Oostdijk","year":"2002","unstructured":"Oostdijk, N. H. J. (2002). The design of the Spoken Dutch Corpus. In P. Peters, P. Collins, & A. Smith (Eds.), New Frontiers of Corpus Research. (pp. 105\u2013112). Amsterdam: Rodopi."},{"key":"9095_CR26","unstructured":"Pedersen, T. (2006). Ngram Statistics Package (NSP). Retrieved November 1, 2007, from http:\/\/www.d.umn.edu\/~tpederse\/nsp.html ."},{"key":"9095_CR27","doi-asserted-by":"crossref","first-page":"378","DOI":"10.1016\/j.csl.2004.11.002","volume":"19","author":"S Piao","year":"2005","unstructured":"Piao, S., Rayson, P., Archer, D., & McEnery, T. (2005). Comparing and combining a semantic tagger and a statistical tool for MWE extraction. Computer Speech & Language, 19, 378\u2013397.","journal-title":"Computer Speech & Language"},{"key":"9095_CR28","unstructured":"Pluymaeckers, M. (2003) Prefabs in sports commentary. Master\u2019s thesis, Tilburg University."},{"key":"9095_CR29","unstructured":"Rayson, P., Sharoff, S., & Adolphs, S. (Eds.). (2006). Proceedings of the EACL-2006 workshop on \u2018multi-word-expressions in a multilingual context\u2019, Trento, Italy."},{"key":"9095_CR30","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1075\/lllt.9.03rea","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"Read and Nation","year":"2004","unstructured":"Read and Nation. (2004). Measurement of formulaic sequences. In N. Schmitt (Ed.), Formulaic sequences: Acquisition, processing and use (pp. 23\u201335). Amsterdam: John Benjamins."},{"key":"9095_CR31","doi-asserted-by":"crossref","unstructured":"Sag, I., Baldwin, T., Bond, F., Copestake, A. & Flickinger, D. (2002). Multiword expressions: A pain in the neck for NLP. 
In Proceedings of the 3rd international conferences on intelligent text processing and computational linguistics, 1\u201315.","DOI":"10.1007\/3-540-45715-1_1"},{"key":"9095_CR32","doi-asserted-by":"crossref","DOI":"10.1075\/lllt.9","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"N Schmitt","year":"2004","unstructured":"Schmitt, N. (2004). Formulaic sequences: Acquisition, processing and use. Amsterdam: John Benjamins."},{"key":"9095_CR33","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1075\/lllt.9.02sch","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"N Schmitt","year":"2004","unstructured":"Schmitt, N., & Carter, N. (2004). Formulaic sequences in action: An introduction. In N. Schmitt (Ed.), Formulaic sequences: Acquisition, processing and use (pp. 1\u201322). Amsterdam: John Benjamins."},{"key":"9095_CR34","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1075\/lllt.9.08sch","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"N Schmitt","year":"2004","unstructured":"Schmitt, N., Grandage, S., & Adolphs, S. (2004). Are Corpus-derived Recurrent Clusters Psycholinguistically Valid? In N. Schmitt (Ed.), Formulaic sequences: Acquisition, processing and use (pp. 127\u2013152). Amsterdam: John Benjamins."},{"key":"9095_CR35","doi-asserted-by":"crossref","unstructured":"Sloboda, T., & Waibel, A. (1996). Dictionary learning for spontaneous speech recognition. (Paper presented at 4th international conference on spoken language processing, Philadelphia).","DOI":"10.1109\/ICSLP.1996.607274"},{"key":"9095_CR36","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1016\/j.jml.2005.11.001","volume":"54","author":"SA Sprenger","year":"2006","unstructured":"Sprenger, S. A., Levelt, W. J. M., & Kempen, G. (2006). Lexical access during the production of idiomatic phrases. 
Journal of Memory and Language, 54, 161\u2013184.","journal-title":"Journal of Memory and Language"},{"issue":"2\u20134","key":"9095_CR37","doi-asserted-by":"crossref","first-page":"225","DOI":"10.1016\/S0167-6393(99)00038-2","volume":"29","author":"H Strik","year":"1999","unstructured":"Strik, H., & Cucchiarini, C. (1999). Modeling pronunciation variation for ASR: A survey of the literature. Speech Communication, 29(2\u20134), 225\u2013246.","journal-title":"Speech Communication"},{"issue":"1","key":"9095_CR38","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1093\/applin\/17.1.84","volume":"17","author":"R Towell","year":"1996","unstructured":"Towell, R., Hawkins, R., & Bazergui, N. (1996). The development of fluency in advanced learners of French. Applied Linguistics, 17(1), 84\u2013119.","journal-title":"Applied Linguistics"},{"key":"9095_CR39","doi-asserted-by":"crossref","first-page":"153","DOI":"10.1075\/lllt.9.09und","volume-title":"Formulaic sequences: Acquisition, processing and use","author":"G Underwood","year":"2004","unstructured":"Underwood, G., Schmitt, N., & Galpin, A. (2004). The eyes have it: An eye-movement study into the processing of formulaic sequences. In N. Schmitt (Ed.), Formulaic sequences: Acquisition, processing and use (pp. 153\u2013172). Amsterdam: John Benjamins."},{"key":"9095_CR40","doi-asserted-by":"crossref","unstructured":"Van de Cruys, T. & Villada Moir\u00f3n, B. (2007). Semantics-based multiword expression extraction. In Proceedings of the ACL workshop \u2018A broader perspective on multiword expressions\u2019, 25\u201332.","DOI":"10.3115\/1613704.1613708"},{"key":"9095_CR41","doi-asserted-by":"crossref","first-page":"207","DOI":"10.1016\/j.langcom.2004.02.003","volume":"24","author":"D Lancker Sidtis Van","year":"2004","unstructured":"Van Lancker Sidtis, D., & Rallon, G. (2004). Tracking the incidence of formulaic expressions in everyday speech: Methods for classification and verification. 
Language & Communication, 24, 207\u2013240.","journal-title":"Language & Communication"},{"key":"9095_CR42","unstructured":"Villada Moir\u00f3n, B. (2005). Data-driven Identification of fixed expressions and their modifiability. Dissertation, University of Groningen, The Netherlands."},{"key":"9095_CR43","unstructured":"Villada Moir\u00f3n, B., Villavicencio, A., McCarthy, D., Evert, S., & Stevenson, S. (Eds.). (2006). Proceedings of the COLING\/ACL 2006 workshop on \u2018Multiword expressions: Identifying and exploiting underlying properties\u2019, Sydney. http:\/\/acl.ldc.upenn.edu\/W\/W06\/W06-1200.pdf ."},{"key":"9095_CR45","unstructured":"Wells, J. C. (1996). SAMPA for Dutch. http:\/\/www.phon.ucl.ac.uk\/home\/sampa\/dutch.htm Accessed November 1, 2007."},{"issue":"1","key":"9095_CR46","first-page":"27","volume":"2","author":"D Wood","year":"2004","unstructured":"Wood, D. (2004). An empirical investigation into the facilitating role of automatized lexical phrases in second language fluency development. Journal of language and learning, 2(1), 27\u201350.","journal-title":"Journal of language and learning"},{"key":"9095_CR47","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/S0271-5309(99)00015-4","volume":"20","author":"A Wray","year":"2000","unstructured":"Wray, A., & Perkins, M. R. (2000). The functions of formulaic language: An integrated model. 
Language & Communication, 20, 1\u201328.","journal-title":"Language & Communication"}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-009-9095-y.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,26]],"date-time":"2023-05-26T06:22:56Z","timestamp":1685082176000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-009-9095-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,8,4]]},"references-count":47,"journal-issue":{"issue":"1-2","published-print":{"date-parts":[[2010,4]]}},"alternative-id":["9095"],"URL":"https:\/\/doi.org\/10.1007\/s10579-009-9095-y","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2009,8,4]]}}}