{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T08:58:54Z","timestamp":1773478734241,"version":"3.50.1"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T00:00:00Z","timestamp":1773446400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T00:00:00Z","timestamp":1773446400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100014826","name":"ADAPT research centre","doi-asserted-by":"crossref","award":["13\/RC\/2106"],"award-info":[{"award-number":["13\/RC\/2106"]}],"id":[{"id":"10.13039\/501100014826","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001602","name":"science fundation ireland","doi-asserted-by":"crossref","award":["SFI\/12\/RC\/2289"],"award-info":[{"award-number":["SFI\/12\/RC\/2289"]}],"id":[{"id":"10.13039\/501100001602","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100008530","name":"European Regional Development Fund","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100008530","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100014013","name":"UK Research and Innovation","doi-asserted-by":"crossref","award":["EP\/V047949\/1"],"award-info":[{"award-number":["EP\/V047949\/1"]}],"id":[{"id":"10.13039\/100014013","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s10579-025-09876-7","type":"journal-article","created":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T08:26:09Z","timestamp":1773476769000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Towards a resource for multilingual lexicons: an MT assisted and human-in-the-loop multilingual parallel corpus with multi-word expression annotation"],"prefix":"10.1007","volume":"60","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3221-2185","authenticated-orcid":false,"given":"Lifeng","family":"Han","sequence":"first","affiliation":[]},{"given":"Najet Hadj","family":"Mohamed","sequence":"additional","affiliation":[]},{"given":"Malak","family":"Rassem","sequence":"additional","affiliation":[]},{"given":"Gareth J. F.","family":"Jones","sequence":"additional","affiliation":[]},{"given":"Alan F.","family":"Smeaton","sequence":"additional","affiliation":[]},{"given":"Goran","family":"Nenadic","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,3,14]]},"reference":[{"key":"9876_CR1","first-page":"267","volume-title":"Handbook of natural language processing","author":"T Baldwin","year":"2010","unstructured":"Baldwin, T., & Kim, S. N. (2010). Multiword expressions. Handbook of natural language processing (2nd ed., pp. 267\u2013292). Chapman and Hall.","edition":"2"},{"key":"9876_CR2","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-020-09514-4","author":"R Bawden","year":"2020","unstructured":"Bawden, R., Bilinski, E., Lavergne, T., & Rosset, S. (2020). Diabla: a corpus of bilingual spontaneous written dialogues for machine translation. Language Resources and Evaluation. https:\/\/doi.org\/10.1007\/s10579-020-09514-4","journal-title":"Language Resources and Evaluation"},{"key":"9876_CR3","unstructured":"Bouamor, D., Semmar, N., & Zweigenbaum, P. (2012). Identifying bilingual multi-word expressions for statistical machine translation. In: Conference on language resources and evaluation."},{"key":"9876_CR4","doi-asserted-by":"crossref","unstructured":"Chowdhary, V., & Greenwood, S. (2017). Emt: End to end model training for msr machine translation. In: Proceedings of the 1st workshop on data management for end-to-end machine learning, https:\/\/www.microsoft.com\/en-us\/research\/publication\/emt-end-end-model-training-msr-machine-translation\/.","DOI":"10.1145\/3076246.3076247"},{"issue":"4","key":"9876_CR5","doi-asserted-by":"publisher","first-page":"837","DOI":"10.1162\/COLI_a_00302","volume":"43","author":"M Constant","year":"2017","unstructured":"Constant, M., Eryi\u01e7it, G., Monti, J., van der Plas, L., Ramisch, C., Rosner, M., & Todirascu, A. (2017). Survey: Multiword expression processing: A Survey. Computational Linguistics, 43(4), 837\u2013892. https:\/\/doi.org\/10.1162\/COLI_a_00302https:\/\/www.aclweb.org\/anthology\/J17-4005.","journal-title":"Computational Linguistics"},{"key":"9876_CR6","unstructured":"Gladkoff, S., & Han, L. (2021). HOPE: A task-oriented and human-centric evaluation framework using professional post-editing towards more effective MT evaluation. CoRR abs\/2112.13833, https:\/\/arxiv.org\/abs\/2112.13833, arXiv:2112.13833."},{"key":"9876_CR7","unstructured":"Gladkoff, S., Sorokina, I., Han, L., & Alekseeva, A. (2022). Measuring uncertainty in translation quality evaluation (TQE). In: Calzolari, N., B\u00e9chet, F., Blache, P., Choukri, K., Cieri, C., Declerck, T., Goggi, S., Isahara, H., Maegaard, B., Mariani, J., Mazo, H., Odijk, J., Piperidis, S. (eds) Proceedings of the thirteenth language resources and evaluation conference, European language resources association, Marseille, France, pp 1454\u20131461, https:\/\/aclanthology.org\/2022.lrec-1.156\/."},{"key":"9876_CR8","unstructured":"Han, L., Jones, G., & Smeaton, A. (2020a). AlphaMWE: Construction of multilingual parallel corpora with MWE annotations. In: Proceedings of the joint workshop on multiword expressions and electronic lexicons, Association for Computational Linguistics, online, pp 44\u201357, https:\/\/www.aclweb.org\/anthology\/2020.mwe-1.6."},{"key":"9876_CR9","unstructured":"Han, L., Jones, G. J. F., & Smeaton, A. (2020b). MultiMWE: Building a multi-lingual multi-word expression (MWE) parallel corpora. In: Proceedings of The 12th language resources and evaluation conference, European Language Resources Association, Marseille, France, pp 2970\u20132979, https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.363."},{"key":"9876_CR10","unstructured":"Hassan, H., Aue, A., Chen, C., Chowdhary, V., Clark, J., Federmann, C., Huang, X., Junczys-Dowmunt, M., Lewis, W., Li, M., Liu, S., Liu, T., Luo, R., Menezes, A., Qin, T., Seide, F., Tan, X., Tian, F., Wu, L., Wu, S., Xia, Y., Zhang, D., Zhang, Z., & Zhou, M. (2018). Achieving human parity on automatic Chinese to English news translation. ArXiv abs\/1803.05567."},{"key":"9876_CR11","doi-asserted-by":"publisher","first-page":"339","DOI":"10.1162\/tacl_a_00065","volume":"5","author":"M Johnson","year":"2017","unstructured":"Johnson, M., Schuster, M., Le, Q. V., Krikun, M., Wu, Y., Chen, Z., Thorat, N., Vi\u00e9gas, F., Wattenberg, M., Corrado, G., Hughes, M., & Dean, J. (2017). Google\u2019s multilingual neural machine translation system: Enabling zero-shot translation. Transactions of the Association for Computational Linguistics, 5, 339\u2013351. https:\/\/doi.org\/10.1162\/tacl_a_00065https:\/\/www.aclweb.org\/anthology\/Q17-1024.","journal-title":"Transactions of the Association for Computational Linguistics"},{"key":"9876_CR12","unstructured":"Kato, A., Shindo, H., & Matsumoto, Y. (2016). Construction of an English dependency corpus incorporating compound function words. In: Proceedings of the tenth international conference on language resources and evaluation (LREC\u201916), European Language Resources Association (ELRA), Portoro\u017e, Slovenia, pp 1667\u20131671, https:\/\/aclanthology.org\/L16-1263."},{"key":"9876_CR13","unstructured":"Kato, A., Shindo, H., & Matsumoto, Y. (2018). Construction of Large-scale English verbal multiword expression annotated corpus. In: Proceedings of the eleventh international conference on language resources and evaluation (LREC 2018), Miyazaki, Japan."},{"key":"9876_CR14","unstructured":"Lambert, P., & Banchs, R. E. (2005). Data inferred multi-word expressions for statistical machine translation. In: Proceedings of machine translation Summit X, Thailand, pp 396\u2013403, https:\/\/hal.archives-ouvertes.fr\/hal-00705007."},{"key":"9876_CR15","doi-asserted-by":"crossref","unstructured":"L\u00e4ubli, S., Castilho, S., Neubig, G., Sennrich, R., Shen, Q., & Toral, A. (2020). A set of recommendations for assessing human-machine parity in language translation. arXiv e-prints arXiv:2004.01694.","DOI":"10.1613\/jair.1.11371"},{"key":"9876_CR16","first-page":"93","volume-title":"Machine translation","author":"X Li","year":"2019","unstructured":"Li, X., Yan, J., Zhang, J., & Zong, C. (2019). Neural name translation improves neural machine translation. In J. Chen & J. Zhang (Eds.), Machine translation (pp. 93\u2013100). Springer."},{"key":"9876_CR17","unstructured":"Macketanz, V., Avramidis, E., Manakhimova, S., & M\u00f6ller, S. (2021). Linguistic evaluation for the 2021 state-of-the-art machine translation systems for German to English and English to German. In: Proceedings of the sixth conference on machine translation, Association for Computational Linguistics, Online, pp 1059\u20131073, https:\/\/aclanthology.org\/2021.wmt-1.115."},{"key":"9876_CR18","doi-asserted-by":"crossref","unstructured":"Maldonado, A., Han, L., Moreau, E., Alsulaimani, A., Chowdhury, K. D., Vogel, C., & Liu, Q. (2017). Detection of verbal multi-word expressions via conditional random fields with syntactic dependency features and semantic re-ranking. In: The 13th workshop on multiword expressions @ EACL 2017, ACL.","DOI":"10.18653\/v1\/W17-1715"},{"key":"9876_CR19","unstructured":"Markantonatou, S., McCrae, J., Mitrovi\u0107, J., Tiberius, C., Ramisch, C., Vaidya, A., Osenova, P., & Savary, A. (eds) (2020). Proceedings of the joint workshop on multiword expressions and electronic lexicons, Association for Computational Linguistics, online, https:\/\/aclanthology.org\/2020.mwe-1.0."},{"key":"9876_CR20","doi-asserted-by":"crossref","unstructured":"Markantonatou, S., Ramisch, C., Savary, A., & Vincze, V. (eds) (2017). Proceedings of the 13th workshop on multiword expressions (MWE 2017), Association for Computational Linguistics, Valencia, Spainhttps:\/\/doi.org\/10.18653\/v1\/W17-17, https:\/\/www.aclweb.org\/anthology\/W17-1700.","DOI":"10.18653\/v1\/W17-17"},{"key":"9876_CR21","unstructured":"Mohamed, N. H., Rassem, M., Han, L., & Nenadic, G. (2023). Alphamwe-Arabic: Arabic edition of multilingual parallel corpora with multiword expression annotations."},{"key":"9876_CR22","volume-title":"Semantic reranking of crf label sequences for verbal multiword expression identification","author":"E Moreau","year":"2018","unstructured":"Moreau, E., Alsulaimani, A., Dublin, T. C., Maldonado, A., Han, L., Vogel, C., & Chowdhury, K. D. (2018). Semantic reranking of crf label sequences for verbal multiword expression identification. Language Science Press."},{"key":"9876_CR23","doi-asserted-by":"publisher","unstructured":"Pulcini, V. (2020). English-derived multi-word and phraseological units across languages in the global anglicism database. Textus, English Studies in Italy (1\/2020):127\u2013143, https:\/\/doi.org\/10.7370\/97355, https:\/\/www.rivisteweb.it\/doi\/10.7370\/97355.","DOI":"10.7370\/97355"},{"key":"9876_CR24","unstructured":"Radford, A., Wu, J., Child, R., Luan, D., Amodei, D., & Sutskever, I. (2019). Language models are unsupervised multitask learners."},{"issue":"1","key":"9876_CR25","first-page":"5485","volume":"21","author":"C Raffel","year":"2020","unstructured":"Raffel, C., Shazeer, N., Roberts, A., Lee, K., Narang, S., Matena, M., Zhou, Y., Li, W., & Liu, P. J. (2020). Exploring the limits of transfer learning with a unified text-to-text transformer. The Journal of Machine Learning Research, 21(1), 5485\u20135551.","journal-title":"The Journal of Machine Learning Research"},{"key":"9876_CR26","unstructured":"Ramisch, C., Cordeiro, S. R., Savary, A., Vincze, V., Barbu\u00a0Mititelu, V., Bhatia, A., Buljan, M., Candito, M., Gantar, P., Giouli, V., G\u00fcng\u00f6r, T., Hawwari, A., I\u00f1urrieta, U., Kovalevskaite, J., Krek, S., Lichte, T., Liebeskind, C., Monti, J., Parra\u00a0Escart\u00edn, C., QasemiZadeh, B., Ramisch, R., Schneider, N., Stoyanova, I., Vaidya, A., & Walsh, A. (2018). Edition 1.1 of the PARSEME shared task on automatic identification of verbal multiword expressions. In: Proceedings of the joint workshop on linguistic annotation, multiword expressions and constructions (LAW-MWE-CxG-2018), Association for Computational Linguistics, Santa Fe, New Mexico, USA, pp 222\u2013240, https:\/\/www.aclweb.org\/anthology\/W18-4925."},{"key":"9876_CR27","unstructured":"Rikters, M., & Bojar, O. (2017). Paying attention to multi-word expressions in neural machine translation. In: Proceedings of the 16th machine translation summit, Nagoya, Japan."},{"key":"9876_CR28","first-page":"1","volume-title":"Computational Linguistics and Intelligent Text Processing","author":"IA Sag","year":"2002","unstructured":"Sag, I. A., Baldwin, T., Bond, F., Copestake, A., & Flickinger, D. (2002). Multiword expressions: A pain in the neck for nlp. In A. Gelbukh (Ed.), Computational Linguistics and Intelligent Text Processing (pp. 1\u201315). Springer."},{"key":"9876_CR29","doi-asserted-by":"crossref","unstructured":"Savary, A., Ramisch, C., Cordeiro, S., Sangati, F., Vincze, V., QasemiZadeh, B., Candito, M., Cap, F., Giouli, V., Stoyanova, I., & Doucet, A. (2017). The PARSEME shared task on automatic identification of verbal multiword expressions. In: Proceedings of the 13th workshop on multiword expressions (MWE 2017), Valencia, Spain, pp 31\u201347, https:\/\/doi.org\/10.18653\/v1\/W17-1704, https:\/\/www.aclweb.org\/anthology\/W17-1704.","DOI":"10.18653\/v1\/W17-1704"},{"key":"9876_CR30","unstructured":"Schneider, N., Onuffer, S., Kazour, N., Danchik, E., Mordowanec, M. T., Conrad, H., & Smith, N. A. (2014). Comprehensive annotation of multiword expressions in a social web corpus. In: Proceedings of the ninth international conference on language resources and evaluation (LREC-2014), European Languages Resources Association, Reykjavik, Iceland, pp 455\u2013461, http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/pdf\/521_Paper.pdf."},{"key":"9876_CR31","doi-asserted-by":"publisher","first-page":"811","DOI":"10.22364\/bjmc.2016.4.4.14","volume":"4","author":"I Skadina","year":"2016","unstructured":"Skadina, I. (2016). Multi-word expressions in English-Latvian machine translation. Baltic Journal Modern Computing, 4, 811\u2013825.","journal-title":"Baltic Journal Modern Computing"},{"key":"9876_CR32","doi-asserted-by":"crossref","unstructured":"Sun, M., Jiang, B., Xiong, H., He, Z., Wu, H., & Wang, H. (2019). Baidu neural machine translation systems for WMT19. In: Proceedings of the fourth conference on machine translation (Volume 2: Shared Task Papers, Day 1), Association for Computational Linguistics, Florence, Italy, pp 374\u2013381, https:\/\/doi.org\/10.18653\/v1\/W19-5341, https:\/\/www.aclweb.org\/anthology\/W19-5341.","DOI":"10.18653\/v1\/W19-5341"},{"key":"9876_CR33","doi-asserted-by":"crossref","unstructured":"Tan, L., & Pal, S. (2014). Manawi: Using multi-word expressions and named entities to improve machine translation. In: Proceedings of the ninth workshop on statistical machine translation, Association for Computational Linguistics, Baltimore, Maryland, USA, pp 201\u2013206, https:\/\/doi.org\/10.3115\/v1\/W14-3323, https:\/\/www.aclweb.org\/anthology\/W14-3323.","DOI":"10.3115\/v1\/W14-3323"},{"key":"9876_CR34","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A. N., Kaiser, L., & Polosukhin, I. (2017). Attention is all you need. In: Conference on neural information processing system, pp 6000\u20136010."},{"key":"9876_CR35","unstructured":"Vincze, V. (2012). Light verb constructions in the SzegedParalellFX English\u2013Hungarian parallel corpus. In: Proceedings of the eighth international conference on language resources and evaluation (LREC\u201912), European Language Resources Association, Istanbul, Turkey, pp 2381\u20132388, http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/pdf\/177_Paper.pdf."},{"key":"9876_CR36","unstructured":"Vincze, V., & Csirik, J. (2010). Hungarian corpus of light verb constructions. In: Proceedings of the 23rd international conference on computational linguistics (Coling 2010), Coling 2010 Organizing Committee, Beijing, China, pp 1110\u20131118, https:\/\/www.aclweb.org\/anthology\/C10-1125."},{"key":"9876_CR37","unstructured":"Vincze, V., Nagy\u00a0T, I., & Berend, G. (2011). Multiword expressions and named entities in the wiki50 corpus. In: Proceedings of the international conference recent advances in natural language processing 2011, Association for Computational Linguistics, Hissar, Bulgaria, pp 289\u2013295, https:\/\/www.aclweb.org\/anthology\/R11-1040."},{"key":"9876_CR38","unstructured":"Walsh, A., Bonial, C., Geeraert, K., McCrae, J. P., Schneider, N., & Somers, C. (2018). Constructing an annotated corpus of verbal MWEs for English. In: Proceedings of the joint workshop on linguistic annotation, multiword expressions and constructions (LAW-MWE-CxG-2018), Association for Computational Linguistics, Santa Fe, New Mexico, USA, pp 193\u2013200, https:\/\/www.aclweb.org\/anthology\/W18-4921."},{"key":"9876_CR39","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q. V., Norouzi, M., Macherey, W., Krikun, M., Cao, Y., Gao, Q., Macherey, K., Klingner, J., Shah, A., Johnson, M., Liu, X., Kaiser, L., Gouws, S., Kato, Y., Kudo, T., Kazawa, H., Stevens, K., Kurian, G., Patil, N., Wang, W., Young, C., Smith, J., Riesa, J., Rudnick, A., Vinyals, O., Corrado, G., Hughes, M., & Dean, J. (2016). Google\u2019s neural machine translation system: Bridging the gap between human and machine translation. CoRR abs\/1609.08144, http:\/\/arxiv.org\/abs\/1609.08144."},{"key":"9876_CR40","unstructured":"Zaninello, A., & Birch, A. (2020). Multiword expression aware neural machine translation. In: Proceedings of the 12th language resources and evaluation conference, European Language Resources Association, Marseille, France, pp 3816\u20133825, https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.471."}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-025-09876-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10579-025-09876-7","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-025-09876-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T08:26:17Z","timestamp":1773476777000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10579-025-09876-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,14]]},"references-count":40,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["9876"],"URL":"https:\/\/doi.org\/10.1007\/s10579-025-09876-7","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3,14]]},"assertion":[{"value":"12 August 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 March 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"33"}}