{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T12:02:48Z","timestamp":1780315368203,"version":"3.54.1"},"reference-count":511,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T00:00:00Z","timestamp":1774569600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,5,22]],"date-time":"2026-05-22T00:00:00Z","timestamp":1779408000000},"content-version":"vor","delay-in-days":56,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"the Talent Fund of Beijing Jiaotong University"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"DOI":"10.1007\/s10462-026-11534-5","type":"journal-article","created":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T13:55:20Z","timestamp":1774619720000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A survey on large language models with multilingualism: recent advances and new 
frontiers"],"prefix":"10.1007","volume":"59","author":[{"given":"Kaiyu","family":"Huang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Fengran","family":"Mo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xinyu","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Hongliang","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"You","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuanchi","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Weijian","family":"Yi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yulong","family":"Mao","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jinchen","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuzhuang","family":"Xu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jinan","family":"Xu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jian-Yun","family":"Nie","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yang","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,3,27]]},"reference":[{"key":"11534_CR1","unstructured":"AI@Meta: Llama 3 Model Card (2024). 
https:\/\/github.com\/meta-llama\/llama3\/blob\/main\/MODEL_CARD.md"},{"key":"11534_CR2","doi-asserted-by":"crossref","unstructured":"Abadji J, Ortiz Suarez P, Romary L, Sagot B (2022) Towards a Cleaner Document-Oriented Multilingual Crawled Corpus. arXiv e-prints, 2201\u201306642 arXiv:2201.06642 [cs.CL]","DOI":"10.63317\/579or68a4ybs"},{"key":"11534_CR3","unstructured":"Abdin M, Aneja J, Behl H, Bubeck S, Eldan R, Gunasekar S, Harrison M, Hewett RJ, Javaheripi M, Kauffmann P et al (2024) Phi-4 technical report. arXiv preprint arXiv:2412.08905"},{"key":"11534_CR4","unstructured":"Abdin M, Jacobs SA, Awan AA, Aneja J, Awadallah A, Awadalla H, Bach N, Bahree A, Bakhtiari A, Behl H et al (2024) Phi-3 technical report: A highly capable language model locally on your phone. arXiv preprint arXiv:2404.14219"},{"key":"11534_CR5","unstructured":"Abonizio H, Bonifacio L, Jeronymo V, Lotufo R, Zavrel J, Nogueira R (2023) InPars Toolkit: A Unified and Reproducible Synthetic Data Generation Pipeline for Neural Information Retrieval"},{"key":"11534_CR6","unstructured":"Acharya A, Murthy R, Kumar V, Sen J (2024) NLLB-E5: A Scalable Multilingual Retrieval Model . https:\/\/arxiv.org\/abs\/2409.05401"},{"key":"11534_CR7","unstructured":"Achiam J, Adler S, Agarwal S, Ahmad L, Akkaya I, Aleman FL, Almeida D, Altenschmidt J, Altman S, Anadkat S et al (2023) Gpt-4 technical report. 
arXiv preprint arXiv:2303.08774"},{"key":"11534_CR8","doi-asserted-by":"crossref","unstructured":"Adelani DI, Abbott J, Neubig G, D\u2019souza D, Kreutzer J, Lignos C, Palen-Michel C, Buzaaba H, Rijhwani S, Ruder S, Mayhew S, Azime IA, Muhammad S, Emezue CC, Nakatumba-Nabende J, Ogayo P, Aremu A, Gitau C, Mbaye D, Alabi J, Yimam SM, Gwadabe T, Ezeani I, Niyongabo RA, Mukiibi J, Otiende V, Orife I, David D, Ngom S, Adewumi T, Rayson P, Adeyemi M, Muriuki G, Anebi E, Chukwuneke C, Odu N, Wairagala EP, Oyerinde S, Siro C, Bateesa TS, Oloyede T, Wambui Y, Akinode V, Nabagereka D, Katusiime M, Awokoya A, MBOUP M, Gebreyohannes D, Tilaye H, Nwaike K, Wolde D, Faye A, Sibanda B, Ahia O, Dossou BFP, Ogueji K, DIOP TI, Diallo A, Akinfaderin A, Marengereke T, Osei S (2021) MasakhaNER: Named Entity Recognition for African Languages","DOI":"10.1162\/tacl_a_00416"},{"key":"11534_CR9","doi-asserted-by":"crossref","unstructured":"Adelani DI, Masiak M, Azime IA, Alabi J, Tonja AL, Mwase C, Ogundepo O, Dossou BFP, Oladipo A, Nixdorf D, Emezue CC, al-azzawi Sibanda B, David D, Ndolela L, Mukiibi J, Ajayi T, Moteu T, Odhiambo B, Owodunni A, Obiefuna N, Mohamed M, Muhammad SH, Ababu TM, Salahudeen SA, Yigezu MG, Gwadabe T, Abdulmumin I, Taye M, Awoyomi O, Shode I, Adelani T, Abdulganiyu H, Omotayo A-H, Adeeko A, Afolabi A, Aremu A, Samuel O, Siro C, Kimotho W, Ogbu O, Mbonu C, Chukwuneke C, Fanijo S, Ojo J, Awosan O, Kebede T, Sakayo TS, Nyatsine P, Sidume F, Yousuf O, Oduwole M, Tshinu T, Kimanuka U, Diko T, Nxakama S, Nigusse S, Johar A, Mohamed S, Hassan FM, Mehamed MA, Ngabire E, Jules J, Ssenkungu I, Stenetorp P (2023) MasakhaNEWS: News Topic Classification for African languages","DOI":"10.18653\/v1\/2023.ijcnlp-main.10"},{"key":"11534_CR10","doi-asserted-by":"crossref","unstructured":"Adelani DI, Liu H, Shen X, Vassilyev N, Alabi JO, Mao Y, Gao H, Lee AE-S (2023) SIB-200: A Simple, Inclusive, and Big Evaluation Dataset for Topic Classification in 200+ Languages and 
Dialects","DOI":"10.18653\/v1\/2024.eacl-long.14"},{"key":"11534_CR11","unstructured":"Adeyemi M, Oladipo A, Pradeep R, Lin J (2023) Zero-Shot Cross-Lingual Reranking with Large Language Models for Low-Resource Languages . https:\/\/arxiv.org\/abs\/2312.16159"},{"key":"11534_CR12","doi-asserted-by":"publisher","unstructured":"Adeyemi M, Oladipo A, Zhang X, Alfonso-Hermelo D, Rezagholizadeh M, Chen B, Omotayo A-H, Abdulmumin I, Etori NA, Musa TB, Fanijo S, Awoyomi OO, Salahudeen SA, Mohammed LA, Abolade DO, Lawan FI, Sabo\u00a0Abubakar M, Nasir\u00a0Iro R, Imam\u00a0Abubakar A, Mohamed SA, Mohamed HM, Ajayi TO, Lin J (2024) Ciral: A test collection for clir evaluations in african languages. In: Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201924, pp. 293\u2013302. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3626772.3657884","DOI":"10.1145\/3626772.3657884"},{"key":"11534_CR13","unstructured":"Aghajanyan A, Yu L, Conneau A, Hsu W-N, Hambardzumyan K, Zhang S, Roller S, Goyal N, Levy O, Zettlemoyer L (2023) Scaling laws for generative mixed-modal language models. In: International Conference on Machine Learning, pp. 265\u2013279 . PMLR"},{"key":"11534_CR14","doi-asserted-by":"crossref","unstructured":"Agrawal S, Zhou C, Lewis M, Zettlemoyer L, Ghazvininejad M (2023) In-context examples selection for machine translation. In: Rogers, A., Boyd-Graber, J., Okazaki, N. (eds.) Findings of the Association for Computational Linguistics: ACL 2023, pp. 8857\u20138873. Association for Computational Linguistics, Toronto, Canada . https:\/\/doi.org\/10.18653\/v1\/2023.findings-acl.564 . https:\/\/aclanthology.org\/2023.findings-acl.564","DOI":"10.18653\/v1\/2023.findings-acl.564"},{"key":"11534_CR15","unstructured":"Aguilar G, Kar S, Solorio T (2020) Lince: A centralized benchmark for linguistic code-switching evaluation. 
In: Proceedings of the Twelfth Language Resources and Evaluation Conference, pp. 1803\u20131813"},{"key":"11534_CR16","doi-asserted-by":"crossref","unstructured":"Aharoni R, Johnson M, Firat O (2019) Massively multilingual neural machine translation. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 3874\u20133884","DOI":"10.18653\/v1\/N19-1388"},{"key":"11534_CR17","doi-asserted-by":"crossref","unstructured":"Ahuja K, Diddee H, Hada R, Ochieng M, Ramesh K, Jain P, Nambi A, Ganu T, Segal S, Axmed M, Bali K, Sitaram S (2023) MEGA: Multilingual Evaluation of Generative AI","DOI":"10.18653\/v1\/2023.emnlp-main.258"},{"key":"11534_CR18","doi-asserted-by":"crossref","unstructured":"Ahuja S, Aggarwal D, Gumma V, Watts I, Sathe A, Ochieng M, Hada R, Jain P, Axmed M, Bali K, Sitaram S (2024) MEGAVERSE: Benchmarking Large Language Models Across Languages, Modalities, Models and Tasks","DOI":"10.18653\/v1\/2024.naacl-long.143"},{"key":"11534_CR19","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1016\/j.aiopen.2023.08.001","volume":"4","author":"Q Ai","year":"2023","unstructured":"Ai Q, Bai T, Cao Z, Chang Y, Chen J, Chen Z, Cheng Z, Dong S, Dou Z, Feng F, Gao S, Guo J, He X, Lan Y, Li C, Liu Y, Lyu Z, Ma W, Ma J, Ren Z, Ren P, Wang Z, Wang M, Wen J-R, Wu L, Xin X, Xu J, Yin D, Zhang P, Zhang F, Zhang W, Zhang M, Zhu X (2023) Information retrieval meets large language models: a strategic report from chinese ir community. AI Open 4:80\u201390. https:\/\/doi.org\/10.1016\/j.aiopen.2023.08.001","journal-title":"AI Open"},{"key":"11534_CR20","unstructured":"Alabi JO, Adelani DI, Mosbach M, Klakow D (2022) Adapting pre-trained language models to african languages via multilingual adaptive fine-tuning. arXiv preprint arXiv:2204.06487"},{"key":"11534_CR21","unstructured":"Albert A (2023) Jailbreak Chat. https:\/\/www.jailbreakchat.com. 
Accessed: 2024-02-20"},{"key":"11534_CR22","unstructured":"Anil R, Dai AM, Firat O, Johnson M, Lepikhin D, Passos A, Shakeri S, Taropa E, Bailey P, Chen Z et al (2023) Palm 2 technical report. arXiv preprint arXiv:2305.10403"},{"key":"11534_CR23","unstructured":"Anthropic A (2024) The claude 3 model family: Opus, sonnet, haiku. Claude-3 Model Card"},{"key":"11534_CR24","unstructured":"Arivazhagan N, Bapna A, Firat O, Lepikhin D, Johnson M, Krikun M, Chen MX, Cao Y, Foster G, Cherry C et al (2019) Massively multilingual neural machine translation in the wild: Findings and challenges. arXiv preprint arXiv:1907.05019"},{"key":"11534_CR25","doi-asserted-by":"crossref","unstructured":"Artetxe M, Ruder S, Yogatama D (2020) On the cross-lingual transferability of monolingual representations. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 4623\u20134637","DOI":"10.18653\/v1\/2020.acl-main.421"},{"key":"11534_CR26","doi-asserted-by":"crossref","unstructured":"Asai A, Kasai J, Clark J, Lee K, Choi E, Hajishirzi H (2021) XOR QA: Cross-lingual open-retrieval question answering. In: Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 547\u2013564. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.46 . https:\/\/aclanthology.org\/2021.naacl-main.46","DOI":"10.18653\/v1\/2021.naacl-main.46"},{"key":"11534_CR27","unstructured":"Bai Y, Kadavath S, Kundu S, Askell A, Kernion J, Jones A, Chen A, Goldie A, Mirhoseini A, McKinnon C et al (2022) Constitutional ai: Harmlessness from ai feedback. arXiv preprint arXiv:2212.08073"},{"key":"11534_CR28","unstructured":"Bai J, Bai S, Chu Y, Cui Z, Dang K, Deng X, Fan Y, Ge W, Han Y, Huang F, et al (2023) Qwen technical report. 
arXiv preprint arXiv:2309.16609"},{"key":"11534_CR29","doi-asserted-by":"crossref","unstructured":"Bandarkar L, Liang D, Muller B, Artetxe M, Shukla SN, Husa D, Goyal N, Krishnan A, Zettlemoyer L, Khabsa M (2023) The belebele benchmark: a parallel reading comprehension dataset in 122 language variants. arXiv preprint arXiv:2308.16884","DOI":"10.18653\/v1\/2024.acl-long.44"},{"key":"11534_CR30","doi-asserted-by":"crossref","unstructured":"Bang Y, Cahyawijaya S, Lee N, Dai W, Su D, Wilie B, Lovenia H, Ji Z, Yu T, Chung W et al (2023) A multitask, multilingual, multimodal evaluation of chatgpt on reasoning, hallucination, and interactivity. In: Proceedings of the 13th International Joint Conference on Natural Language Processing and the 3rd Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 675\u2013718","DOI":"10.18653\/v1\/2023.ijcnlp-main.45"},{"key":"11534_CR31","doi-asserted-by":"crossref","unstructured":"Bansal N, Sharma A, Singh R (2019) A review on the application of deep learning in legal domain. In: Artificial Intelligence Applications and Innovations: 15th IFIP WG 12.5 International Conference, AIAI 2019, Hersonissos, Crete, Greece, May 24\u201326, 2019, Proceedings 15, pp. 374\u2013381 . Springer","DOI":"10.1007\/978-3-030-19823-7_31"},{"key":"11534_CR32","doi-asserted-by":"crossref","unstructured":"Bapna A, Firat O (2019) Simple, scalable adaptation for neural machine translation. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 1538\u20131548","DOI":"10.18653\/v1\/D19-1165"},{"key":"11534_CR33","unstructured":"Basile P, Musacchio E, Polignano M, Siciliani L, Fiameni G, Semeraro G (2023) Llamantino: Llama 2 models for effective text generation in italian language. 
arXiv preprint arXiv:2312.09993"},{"key":"11534_CR34","unstructured":"Baumgartner N, St\u00fcrmer M, Grabmair M, Niklaus J et al (2024) Towards explainability and fairness in swiss judgement prediction: Benchmarking on a multilingual dataset. arXiv preprint arXiv:2402.17013"},{"key":"11534_CR35","unstructured":"BehnamGhader P, Adlakha V, Mosbach M, Bahdanau D, Chapados N, Reddy S (2024) LLM2Vec: Large Language Models Are Secretly Powerful Text Encoders . https:\/\/arxiv.org\/abs\/2404.05961"},{"key":"11534_CR36","unstructured":"Beltagy I, Peters ME, Cohan A (2020) Longformer: The long-document transformer. arXiv preprint arXiv:2004.05150"},{"key":"11534_CR37","unstructured":"Bhardwaj R, Poria S (2023) Red-teaming large language models using chain of utterances for safety-alignment. arXiv preprint arXiv:2308.09662"},{"key":"11534_CR38","doi-asserted-by":"crossref","unstructured":"Bhattacharjee A, Hasan T, Ahmad WU, Li Y-F, Kang Y-B, Shahriyar R (2023) CrossSum: Beyond English-Centric Cross-Lingual Summarization for 1,500+ Language Pairs","DOI":"10.18653\/v1\/2023.acl-long.143"},{"key":"11534_CR39","unstructured":"Bi X, Chen D, Chen G, Chen S, Dai D, Deng C, Ding H, Dong K, Du Q, Fu Z et al (2024) Deepseek llm: Scaling open-source language models with longtermism. arXiv preprint arXiv:2401.02954"},{"key":"11534_CR40","unstructured":"Biderman S, Schoelkopf H, Anthony QG, Bradley H, O\u2019Brien K, Hallahan E, Khan MA, Purohit S, Prashanth US, Raff E et al (2023) Pythia: A suite for analyzing large language models across training and scaling. In: International Conference on Machine Learning, pp. 2397\u20132430 . PMLR"},{"key":"11534_CR41","unstructured":"BioMistral: BioInstructQA. https:\/\/huggingface.co\/datasets\/BioMistral\/BioInstructQA"},{"key":"11534_CR42","unstructured":"Bonifacio L, Jeronymo V, Abonizio HQ, Campiotti I, Fadaee M, Lotufo R, Nogueira R (2022) mMARCO: A Multilingual Version of the MS MARCO Passage Ranking Dataset . 
https:\/\/arxiv.org\/abs\/2108.13897"},{"key":"11534_CR43","doi-asserted-by":"publisher","unstructured":"Bonifacio L, Abonizio H, Fadaee M, Nogueira R (2022) Inpars: Unsupervised dataset generation for information retrieval. In: Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201922, pp. 2387\u20132392. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3477495.3531863","DOI":"10.1145\/3477495.3531863"},{"key":"11534_CR44","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1177\/135910457000100301","volume":"1","author":"RW Brislin","year":"1970","unstructured":"Brislin RW (1970) Back-translation for cross-cultural research. J Cross Cult Psychol 1:185\u2013216","journal-title":"J Cross Cult Psychol"},{"key":"11534_CR45","first-page":"1877","volume":"33","author":"T Brown","year":"2020","unstructured":"Brown T, Mann B, Ryder N, Subbiah M, Kaplan JD, Dhariwal P, Neelakantan A, Shyam P, Sastry G, Askell A et al (2020) Language models are few-shot learners. Adv Neural Inf Process Syst 33:1877\u20131901","journal-title":"Adv Neural Inf Process Syst"},{"key":"11534_CR46","doi-asserted-by":"crossref","unstructured":"Brugger T, St\u00fcrmer M, Niklaus J (2023) Multilegalsbd: A multilingual legal sentence boundary detection dataset. In: Proceedings of the Nineteenth International Conference on Artificial Intelligence and Law, pp. 42\u201351","DOI":"10.1145\/3594536.3595132"},{"key":"11534_CR47","unstructured":"Cai Z, Cao M, Chen H, Chen K, Chen K, Chen X, Chen X, Chen Z, Chen Z, Chu P et al (2024) Internlm2 technical report. arXiv preprint arXiv:2403.17297"},{"issue":"10","key":"11534_CR48","doi-asserted-by":"publisher","first-page":"1899","DOI":"10.1002\/asi.21577","volume":"62","author":"ES Callahan","year":"2011","unstructured":"Callahan ES, Herring SC (2011) Cultural bias in wikipedia content on famous persons. 
J Am Soc Inform Sci Technol 62(10):1899\u20131915","journal-title":"J Am Soc Inform Sci Technol"},{"key":"11534_CR49","doi-asserted-by":"crossref","unstructured":"Cao B, Cao Y, Lin L, Chen J (2024) Defending against alignment-breaking attacks via robustly aligned llm. In: Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 10542\u201310560","DOI":"10.18653\/v1\/2024.acl-long.568"},{"key":"11534_CR50","doi-asserted-by":"crossref","unstructured":"Caswell I, Breiner T, Esch D, Bapna A (2020) Language ID in the wild: Unexpected challenges on the path to a thousand-language web text corpus. In: Scott, D., Bel, N., Zong, C. (eds.) Proceedings of the 28th International Conference on Computational Linguistics, pp. 6588\u20136608. International Committee on Computational Linguistics, Barcelona, Spain (Online) . https:\/\/doi.org\/10.18653\/v1\/2020.coling-main.579 . https:\/\/aclanthology.org\/2020.coling-main.579","DOI":"10.18653\/v1\/2020.coling-main.579"},{"key":"11534_CR51","unstructured":"Cettolo M, Federico M, Bentivogli L, Niehues J, St\u00fcker S, Sudoh K, Yoshino K, Federmann C (2017) Overview of the IWSLT 2017 evaluation campaign. In: Proceedings of the 14th International Conference on Spoken Language Translation, pp. 2\u201314. International Workshop on Spoken Language Translation, Tokyo, Japan . https:\/\/aclanthology.org\/2017.iwslt-1.1"},{"key":"11534_CR52","unstructured":"Cettolo M, Girardi C, Federico M (2012) WIT3: Web inventory of transcribed and translated talks. In: Proceedings of the 16th Annual Conference of the European Association for Machine Translation, pp. 261\u2013268. European Association for Machine Translation, Trento, Italy . 
https:\/\/www.aclweb.org\/anthology\/2012.eamt-1.60"},{"key":"11534_CR53","doi-asserted-by":"crossref","unstructured":"Chai L, Yang J, Sun T, Guo H, Liu J, Wang B, Liang X, Bai J, Li T, Peng Q, et al (2024) xcot: Cross-lingual instruction tuning for cross-lingual chain-of-thought reasoning. arXiv preprint arXiv:2401.07037","DOI":"10.1609\/aaai.v39i22.34524"},{"key":"11534_CR54","first-page":"2898","volume":"2020","author":"I Chalkidis","year":"2020","unstructured":"Chalkidis I, Fergadiotis M, Malakasiotis P, Aletras N, Androutsopoulos I (2020) Legal-bert: the muppets straight out of law school. Find Assoc Comput Ling EMNLP 2020:2898\u20132904","journal-title":"Find Assoc Comput Ling EMNLP"},{"key":"11534_CR55","doi-asserted-by":"crossref","unstructured":"Chalkidis I, Garneau N, Goan\u0163\u0103 C, Katz D, S\u00f8gaard A (2023) Lexfiles and legallama: Facilitating english multinational legal language model development. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 15513\u201315535","DOI":"10.18653\/v1\/2023.acl-long.865"},{"key":"11534_CR56","doi-asserted-by":"crossref","unstructured":"Chalkidis I, Pasini T, Zhang S, Tomada L, Schwemer S, S\u00f8gaard A (2022) Fairlex: A multilingual benchmark for evaluating fairness in legal text processing. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 4389\u20134406","DOI":"10.18653\/v1\/2022.acl-long.301"},{"key":"11534_CR57","doi-asserted-by":"crossref","unstructured":"Chalkidis I, Fergadiotis M, Androutsopoulos I (2021) MultiEURLEX - a multi-lingual and multi-label legal document classification dataset for zero-shot cross-lingual transfer. In: Moens, M.-F., Huang, X., Specia, L., Yih, S.W.-t. (eds.) Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 6974\u20136996. 
Association for Computational Linguistics, Online and Punta Cana, Dominican Republic . https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.559 . https:\/\/aclanthology.org\/2021.emnlp-main.559","DOI":"10.18653\/v1\/2021.emnlp-main.559"},{"key":"11534_CR58","doi-asserted-by":"crossref","unstructured":"Chalkidis I, Jana A, Hartung D, Bommarito M, Androutsopoulos I, Katz D, Aletras N (2022) Lexglue: A benchmark dataset for legal language understanding in english. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 4310\u20134330","DOI":"10.18653\/v1\/2022.acl-long.297"},{"issue":"3","key":"11534_CR59","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3641289","volume":"15","author":"Y Chang","year":"2024","unstructured":"Chang Y, Wang X, Wang J, Wu Y, Yang L, Zhu K, Chen H, Yi X, Wang C, Wang Y et al (2024) A survey on evaluation of large language models. ACM Trans Intell Syst Technol 15(3):1\u201345","journal-title":"ACM Trans Intell Syst Technol"},{"key":"11534_CR60","doi-asserted-by":"crossref","unstructured":"Chang TA, Arnett C, Tu Z, Bergen BK (2023) When is multilinguality a curse? language modeling for 250 high-and low-resource languages. arXiv preprint arXiv:2311.09205","DOI":"10.18653\/v1\/2024.emnlp-main.236"},{"key":"11534_CR61","doi-asserted-by":"crossref","unstructured":"Changpinyo S, Xue L, Yarom M, Thapliyal AV, Szpektor I, Amelot J, Chen X, Soricut R (2023) MaXM: Towards Multilingual Visual Question Answering","DOI":"10.18653\/v1\/2023.findings-emnlp.176"},{"key":"11534_CR62","unstructured":"Chao P, Robey A, Dobriban E, Hassani H, Pappas GJ, Wong E (2023) Jailbreaking black box large language models in twenty queries. 
In: R0-FoMo: Robustness of Few-shot and Zero-shot Learning in Large Foundation Models"},{"key":"11534_CR63","doi-asserted-by":"crossref","unstructured":"Chao P, Debenedetti E, Robey A, Andriushchenko M, Croce F, Sehwag V, Dobriban E, Flammarion N, Pappas GJ, Tramer F, Hassani H, Wong E (2024) JailbreakBench: An Open Robustness Benchmark for Jailbreaking Large Language Models","DOI":"10.52202\/079017-1745"},{"key":"11534_CR64","doi-asserted-by":"crossref","unstructured":"Chen J, Xiao S, Zhang P, Luo K, Lian D, Liu Z (2024) BGE M3-Embedding: Multi-Lingual, Multi-Functionality, Multi-Granularity Text Embeddings Through Self-Knowledge Distillation . https:\/\/arxiv.org\/abs\/2402.03216","DOI":"10.18653\/v1\/2024.findings-acl.137"},{"key":"11534_CR65","doi-asserted-by":"crossref","unstructured":"Chen J, Xiao S, Zhang P, Luo K, Lian D, Liu Z (2024) M3-embedding: Multi-linguality, multi-functionality, multi-granularity text embeddings through self-knowledge distillation. In: Ku, L.-W., Martins, A., Srikumar, V. (eds.) Findings of the Association for Computational Linguistics ACL 2024, pp. 2318\u20132335. Association for Computational Linguistics, Bangkok, Thailand and virtual meeting . https:\/\/doi.org\/10.18653\/v1\/2024.findings-acl.137 . https:\/\/aclanthology.org\/2024.findings-acl.137","DOI":"10.18653\/v1\/2024.findings-acl.137"},{"key":"11534_CR66","unstructured":"Chen Y, Liu Q, Zhang Y, Sun W, Shi D, Mao J, Yin D (2024) TourRank: Utilizing Large Language Models for Documents Ranking with a Tournament-Inspired Strategy . https:\/\/arxiv.org\/abs\/2406.11678"},{"key":"11534_CR67","doi-asserted-by":"crossref","unstructured":"Chen J, Xiao S, Zhang P, Luo K, Lian D, Liu Z (2024) BGE M3-Embedding: Multi-Lingual, 
Multi-Functionality, Multi-Granularity Text Embeddings Through Self-Knowledge Distillation","DOI":"10.18653\/v1\/2024.findings-acl.137"},{"key":"11534_CR68","unstructured":"Chen W, Wang Q, Long Z, Zhang X, Lu Z, Li B, Wang S, Xu J, Bai X, Huang X, Wei Z (2023) Disc-finllm: A chinese financial large language model based on multiple experts fine-tuning. arXiv preprint arXiv:2310.15205"},{"key":"11534_CR69","unstructured":"Chen Z, Cano AH, Romanou A, Bonnet A, Matoba K, Salvi F, Pagliardini M, Fan S, K\u00f6pf A, Mohtashami A et al (2023) Meditron-70b: Scaling medical pretraining for large language models. arXiv preprint arXiv:2311.16079"},{"key":"11534_CR70","unstructured":"Chen J, Wang X, Gao A, Jiang F, Chen S, Zhang H, Song D, Xie W, Kong C, Li J et al (2023) Huatuogpt-ii, one-stage training for medical adaption of llms. arXiv preprint arXiv:2311.09774"},{"key":"11534_CR71","unstructured":"Chen Y, Cai W, Wu L, Li X, Xin Z, Fu C (2023) Tigerbot: An open multilingual multitask llm. arXiv preprint arXiv:2312.08688"},{"key":"11534_CR72","unstructured":"Chen D, Huang Y, Li X, Li Y, Liu Y, Pan H, Xu L, Zhang D, Zhang Z, Han K (2024) Orion-14b: Open-source multilingual large language models. arXiv preprint arXiv:2401.12246"},{"key":"11534_CR73","doi-asserted-by":"crossref","unstructured":"Cheng Y, Bapna A, Firat O, Cao Y, Wang P, Macherey W (2022) Multilingual mix: Example interpolation improves multilingual neural machine translation. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 4092\u20134102","DOI":"10.18653\/v1\/2022.acl-long.282"},{"key":"11534_CR74","unstructured":"Chiang W-L, Li Z, Lin Z, Sheng Y, Wu Z, Zhang H, Zheng L, Zhuang S, Zhuang Y, Gonzalez JE et al (2023) Vicuna: An open-source chatbot impressing gpt-4 with 90%* chatgpt quality. 
See https:\/\/vicuna.lmsys.org (accessed 14 April 2023) 2(3), 6"},{"issue":"240","key":"11534_CR75","first-page":"1","volume":"24","author":"A Chowdhery","year":"2023","unstructured":"Chowdhery A, Narang S, Devlin J, Bosma M, Mishra G, Roberts A, Barham P, Chung HW, Sutton C, Gehrmann S et al (2023) Palm: Scaling language modeling with pathways. J Mach Learn Res 24(240):1\u2013113","journal-title":"J Mach Learn Res"},{"key":"11534_CR76","doi-asserted-by":"crossref","unstructured":"Christen R, Shaitarova A, St\u00fcrmer M, Niklaus J (2023) Resolving legalese: A multilingual exploration of negation scope resolution in legal documents. arXiv preprint arXiv:2309.08695","DOI":"10.63317\/4g9pkcwo8ev8"},{"issue":"70","key":"11534_CR77","first-page":"1","volume":"25","author":"HW Chung","year":"2024","unstructured":"Chung HW, Hou L, Longpre S, Zoph B, Tay Y, Fedus W, Li Y, Wang X, Dehghani M, Brahma S et al (2024) Scaling instruction-finetuned language models. J Mach Learn Res 25(70):1\u201353","journal-title":"J Mach Learn Res"},{"key":"11534_CR78","unstructured":"Chung HW, Constant N, Garcia X, Roberts A, Tay Y, Narang S, Firat O (2023) Unimax: Fairer and more effective language sampling for large-scale multilingual pretraining. arXiv preprint arXiv:2304.09151"},{"key":"11534_CR79","first-page":"454","volume":"8","author":"JH Clark","year":"2020","unstructured":"Clark JH, Choi E, Collins M, Garrette D, Kwiatkowski T, Nikolaev V, Palomaki J (2020) Tydi qa: a benchmark for information-seeking question answering in typologically diverse languages. 
Trans Assoc Comput Ling 8:454\u2013470","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR80","doi-asserted-by":"crossref","unstructured":"Clark E, Rijhwani S, Gehrmann S, Maynez J, Aharoni R, Nikolaev V, Sellam T, Siddhant A, Das D, Parikh AP (2023) SEAHORSE: A Multilingual, Multifaceted Dataset for Summarization Evaluation","DOI":"10.18653\/v1\/2023.emnlp-main.584"},{"key":"11534_CR81","unstructured":"Colombo P, Pires TP, Boudiaf M, Culver D, Melo R, Corro C, Martins AF, Esposito F, Raposo VL, Morgado S et al (2024) Saullm-7b: A pioneering large language model for law. arXiv preprint arXiv:2403.03883"},{"key":"11534_CR82","doi-asserted-by":"crossref","unstructured":"Conia S, Li M, Lee D, Minhas U, Ilyas I, Li Y (2023) Increasing coverage and precision of textual information in multilingual knowledge graphs. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 1612\u20131634. Association for Computational Linguistics, Singapore . https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.100 . https:\/\/aclanthology.org\/2023.emnlp-main.100","DOI":"10.18653\/v1\/2023.emnlp-main.100"},{"key":"11534_CR83","first-page":"125","volume":"32","author":"A Conneau","year":"2019","unstructured":"Conneau A, Lample G (2019) Cross-lingual language model pretraining. Adv Neural Inf Process Syst 32:125","journal-title":"Adv Neural Inf Process Syst"},{"key":"11534_CR84","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, Chaudhary V, Wenzek G, Guzm\u00e1n F, Grave E, Ott M, Zettlemoyer L, Stoyanov V (2020) Unsupervised cross-lingual representation learning at scale. In: Jurafsky, D., Chai, J., Schluter, N., Tetreault, J. (eds.) Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 8440\u20138451. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.747 . 
https:\/\/aclanthology.org\/2020.acl-main.747","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"11534_CR85","doi-asserted-by":"crossref","unstructured":"Conneau A, Rinott R, Lample G, Williams A, Bowman S, Schwenk H, Stoyanov V (2018) Xnli: Evaluating cross-lingual sentence representations. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pp. 2475\u20132485","DOI":"10.18653\/v1\/D18-1269"},{"key":"11534_CR86","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, Chaudhary V, Wenzek G, Guzm\u00e1n F, Grave E, Ott M, Zettlemoyer L, Stoyanov V (2019) Unsupervised cross-lingual representation learning at scale. arXiv preprint arXiv:1911.02116","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"11534_CR87","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, Chaudhary V, Wenzek G, Guzm\u00e1n F, Grave E, Ott M, Zettlemoyer L, Stoyanov V (2020) Unsupervised Cross-lingual Representation Learning at Scale . https:\/\/arxiv.org\/abs\/1911.02116","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"11534_CR88","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, Chaudhary V, Wenzek G, Guzm\u00e1n F, Grave E, Ott M, Zettlemoyer L, Stoyanov V (2020) Unsupervised cross-lingual representation learning at scale. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics . Association for Computational Linguistics","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"11534_CR89","unstructured":"Cui Y, Yang Z, Yao X (2023) Efficient and effective text encoding for chinese llama and alpaca. arXiv preprint arXiv:2304.08177"},{"key":"11534_CR90","unstructured":"Cui J, Li Z, Yan Y, Chen B, Yuan L (2023) Chatlaw: Open-source legal large language model with integrated external knowledge bases. 
arXiv preprint arXiv:2306.16092"},{"issue":"5","key":"11534_CR91","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3406095","volume":"53","author":"R Dabre","year":"2020","unstructured":"Dabre R, Chu C, Kunchukuttan A (2020) A survey of multilingual neural machine translation. ACM Comput Surv (CSUR) 53(5):1\u201338","journal-title":"ACM Comput Surv (CSUR)"},{"key":"11534_CR92","doi-asserted-by":"crossref","unstructured":"Dabre R, Fujita A, Chu C (2019) Exploiting multilingualism through multistage fine-tuning for low-resource neural machine translation. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 1410\u20131416","DOI":"10.18653\/v1\/D19-1146"},{"key":"11534_CR93","doi-asserted-by":"crossref","unstructured":"Dac\u00a0Lai V, Van\u00a0Nguyen C, Ngo NT, Nguyen T, Dernoncourt F, Rossi RA, Nguyen TH (2023) Okapi: Instruction-tuned large language models in multiple languages with reinforcement learning from human feedback. arXiv e-prints, 2307","DOI":"10.18653\/v1\/2023.emnlp-demo.28"},{"key":"11534_CR94","unstructured":"Dai Z, Callan J (2019) Context-Aware Sentence\/Passage Term Importance Estimation For First Stage Retrieval . https:\/\/arxiv.org\/abs\/1910.10687"},{"key":"11534_CR95","unstructured":"Dai Z, Zhao VY, Ma J, Luan Y, Ni J, Lu J, Bakalov A, Guu K, Hall K, Chang M-W (2023) Promptagator: Few-shot dense retrieval from 8 examples. In: The Eleventh International Conference on Learning Representations . https:\/\/openreview.net\/forum?id=gmL46YMpu2J"},{"key":"11534_CR96","unstructured":"Dan Y, Lei Z, Gu Y, Li Y, Yin J, Lin J, Ye L, Tie Z, Zhou Y, Wang Y et al (2023) Educhat: A large-scale language model-based chatbot system for intelligent education. 
arXiv preprint arXiv:2308.02773"},{"key":"11534_CR97","doi-asserted-by":"crossref","unstructured":"Das R, Ranjan S, Pathak S, Jyothi P (2023) Improving pretraining techniques for code-switched NLP. In: Rogers, A., Boyd-Graber, J., Okazaki, N. (eds.) Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 1176\u20131191. Association for Computational Linguistics, Toronto, Canada . https:\/\/doi.org\/10.18653\/v1\/2023.acl-long.66 . https:\/\/aclanthology.org\/2023.acl-long.66","DOI":"10.18653\/v1\/2023.acl-long.66"},{"key":"11534_CR98","doi-asserted-by":"crossref","unstructured":"Deng G, Liu Y, Li Y, Wang K, Zhang Y, Li Z, Wang H, Zhang T, Liu Y (2024) Masterkey: Automated jailbreaking of large language model chatbots. In: Proc. ISOC NDSS","DOI":"10.14722\/ndss.2024.24188"},{"key":"11534_CR99","unstructured":"Deng Y, Zhang W, Pan SJ, Bing L (2023) Multilingual jailbreak challenges in large language models. arXiv preprint arXiv:2310.06474"},{"key":"11534_CR100","doi-asserted-by":"crossref","unstructured":"Dettmers T, Pagnoni A, Holtzman A, Zettlemoyer L (2023) QLoRA: Efficient Finetuning of Quantized LLMs","DOI":"10.52202\/075280-0441"},{"key":"11534_CR101","unstructured":"Devlin J, Chang M-W, Lee K, Toutanova K (2018) Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805"},{"key":"11534_CR102","doi-asserted-by":"crossref","unstructured":"De\u00a0Bruyn M, Lotfi E, Buhmann J, Daelemans W (2021) MFAQ: a multilingual FAQ dataset. In: Proceedings of the 3rd Workshop on Machine Reading for Question Answering, pp. 1\u201313. Association for Computational Linguistics, Punta Cana, Dominican Republic . 
https:\/\/aclanthology.org\/2021.mrqa-1.1","DOI":"10.18653\/v1\/2021.mrqa-1.1"},{"key":"11534_CR103","doi-asserted-by":"crossref","unstructured":"Ding B, Qin C, Zhao R, Luo T, Li X, Chen G, Xia W, Hu J, Luu AT, Joty S (2024) Data augmentation using llms: Data perspectives, learning paradigms and challenges. arXiv preprint arXiv:2403.02990","DOI":"10.18653\/v1\/2024.findings-acl.97"},{"key":"11534_CR104","doi-asserted-by":"crossref","unstructured":"Ding P, Kuang J, Ma D, Cao X, Xian Y, Chen J, Huang S (2023) A wolf in sheep\u2019s clothing: Generalized nested jailbreak prompts can fool large language models easily. arXiv preprint arXiv:2311.08268","DOI":"10.18653\/v1\/2024.naacl-long.118"},{"key":"11534_CR105","doi-asserted-by":"crossref","unstructured":"Dodge J, Sap M, Marasovi\u0107 A, Agnew W, Ilharco G, Groeneveld D, Mitchell M, Gardner M (2021) Documenting large webtext corpora: A case study on the colossal clean crawled corpus. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 1286\u20131305","DOI":"10.18653\/v1\/2021.emnlp-main.98"},{"key":"11534_CR106","doi-asserted-by":"crossref","unstructured":"Do\u011fru\u00f6z AS, Sitaram S, Bullock B, Toribio AJ (2021) A survey of code-switching: Linguistic and social perspectives for language technologies. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 1654\u20131666","DOI":"10.18653\/v1\/2021.acl-long.131"},{"key":"11534_CR107","doi-asserted-by":"crossref","unstructured":"Ebrahimi A, Kann K (2021) How to adapt your pretrained multilingual model to 1600 languages. arXiv preprint arXiv:2106.02124","DOI":"10.18653\/v1\/2021.acl-long.351"},{"key":"11534_CR108","doi-asserted-by":"crossref","unstructured":"El-Kishky A, Chaudhary V, Guzm\u00e1n F, Koehn P (2020) CCAligned: A massive collection of cross-lingual web-document pairs. 
In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 5960\u20135969. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.480 . https:\/\/aclanthology.org\/2020.emnlp-main.480","DOI":"10.18653\/v1\/2020.emnlp-main.480"},{"key":"11534_CR505","unstructured":"eBible.org: eBible. https:\/\/github.com\/BibleNLP"},{"key":"11534_CR506","unstructured":"erfanzar: Multi-Turn Conversational Prompts from ChatGPT-4. https:\/\/huggingface.co\/datasets\/erfanzar\/GPT-4-Prompts"},{"issue":"2","key":"11534_CR109","first-page":"190","volume":"72","author":"C Escolano","year":"2021","unstructured":"Escolano C, Costa-Juss\u00e0 MR, Fonollosa JA (2021) From bilingual to multilingual neural-based machine translation by incremental training. J Am Soc Inf Sci 72(2):190\u2013203","journal-title":"J Am Soc Inf Sci"},{"key":"11534_CR110","doi-asserted-by":"crossref","unstructured":"Etxaniz J, Azkune G, Soroa A, Lacalle OL, Artetxe M (2023) Do multilingual language models think better in english? arXiv preprint arXiv:2308.01223","DOI":"10.18653\/v1\/2024.naacl-short.46"},{"key":"11534_CR111","first-page":"1","volume":"22","author":"A Fan","year":"2021","unstructured":"Fan A, Bhosale S, Schwenk H, Ma Z, El-Kishky A, Goyal S, Baines M, Celebi O, Wenzek G, Chaudhary V et al (2021) Beyond english-centric multilingual machine translation. J Mach Learn Res 22:1\u201348","journal-title":"J Mach Learn Res"},{"key":"11534_CR112","unstructured":"Fan T, Kang Y, Ma G, Chen W, Wei W, Fan L, Yang Q (2023) Fate-llm: A industrial grade federated learning framework for large language models. 
arXiv preprint arXiv:2310.10049"},{"key":"11534_CR113","doi-asserted-by":"publisher","first-page":"3237","DOI":"10.18653\/v1\/2022.findings-acl.255","volume":"2022","author":"Y Fang","year":"2022","unstructured":"Fang Y, Wang S, Xu Y, Xu R, Sun S, Zhu C, Zeng M (2022) Leveraging knowledge in multilingual commonsense reasoning. Find Assoc Comput Ling ACL 2022:3237\u20133246","journal-title":"Find Assoc Comput Ling ACL"},{"key":"11534_CR114","first-page":"100508","volume":"14","author":"G Fatouros","year":"2023","unstructured":"Fatouros G, Soldatos J, Kouroumali K, Makridis G, Kyriazis D (2023) Transforming sentiment analysis in the financial domain with chatgpt. Mach Learn Appl 14:100508","journal-title":"Mach Learn Appl"},{"issue":"120","key":"11534_CR115","first-page":"1","volume":"23","author":"W Fedus","year":"2022","unstructured":"Fedus W, Zoph B, Shazeer N (2022) Switch transformers: scaling to trillion parameter models with simple and efficient sparsity. J Mach Learn Res 23(120):1\u201339","journal-title":"J Mach Learn Res"},{"key":"11534_CR116","doi-asserted-by":"crossref","unstructured":"Ferrara E (2023) Should chatgpt be biased? challenges and risks of bias in large language models. arXiv preprint arXiv:2304.03738","DOI":"10.2139\/ssrn.4627814"},{"key":"11534_CR117","doi-asserted-by":"crossref","unstructured":"Fetahu B, Chen Z, Kar S, Rokhlenko O, Malmasi S (2023) Multiconer v2: a large multilingual dataset for fine-grained and noisy named entity recognition. arXiv preprint arXiv:2310.13213","DOI":"10.18653\/v1\/2023.findings-emnlp.134"},{"key":"11534_CR118","doi-asserted-by":"crossref","unstructured":"Fetahu B, Kar S, Chen Z, Rokhlenko O, Malmasi S (2023) SemEval-2023 Task 2: Fine-grained Multilingual Named Entity Recognition (MultiCoNER 2). In: Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023). 
Association for Computational Linguistics, ???","DOI":"10.18653\/v1\/2023.semeval-1.310"},{"key":"11534_CR119","doi-asserted-by":"crossref","unstructured":"Firat O, Cho K, Sankaran B, Yarman\u00a0Vural FT, Bengio Y (2017) Multi-way, multilingual neural machine translation. Computer Speech and Language 45(C), 236\u2013252","DOI":"10.1016\/j.csl.2016.10.006"},{"key":"11534_CR120","doi-asserted-by":"crossref","unstructured":"FitzGerald J, Hench C, Peris C, Mackie S, Rottmann K, Sanchez A, Nash A, Urbach L, Kakarala V, Singh R, Ranganath S, Crist L, Britan M, Leeuwis W, Tur G, Natarajan P (2022) MASSIVE: A 1M-Example Multilingual Natural Language Understanding Dataset with 51 Typologically-Diverse Languages","DOI":"10.18653\/v1\/2023.acl-long.235"},{"key":"11534_CR121","unstructured":"Fluhr C, Frederking RE, Oard D, Okumura A, Ishikawa K, Satoh K (1995) 2.1 multilingual information retrieval"},{"key":"11534_CR122","doi-asserted-by":"crossref","unstructured":"Formal T, Piwowarski B, Clinchant S (2021) SPLADE: Sparse Lexical and Expansion Model for First Stage Ranking, pp. 2288\u20132292. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3404835.3463098","DOI":"10.1145\/3404835.3463098"},{"key":"11534_CR123","unstructured":"Formal T, Lassance C, Piwowarski B, Clinchant S (2021) SPLADE v2: Sparse Lexical and Expansion Model for Information Retrieval. arXiv . https:\/\/doi.org\/10.48550\/ARXIV.2109.10086 . https:\/\/arxiv.org\/abs\/2109.10086"},{"key":"11534_CR124","doi-asserted-by":"publisher","unstructured":"Formal T, Lassance C, Piwowarski B, Clinchant S (2022) From distillation to hard negative sampling: Making sparse neural ir models more effective. In: Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201922, pp. 2353\u20132359. Association for Computing Machinery, New York, NY, USA . 
https:\/\/doi.org\/10.1145\/3477495.3531857","DOI":"10.1145\/3477495.3531857"},{"key":"11534_CR125","unstructured":"Foundation W. Wikimedia Downloads. https:\/\/dumps.wikimedia.org"},{"key":"11534_CR126","unstructured":"FredZhang: toxi-text-3M. https:\/\/huggingface.co\/datasets\/FredZhang7\/toxi-text-3M"},{"key":"11534_CR127","unstructured":"Fu C, Feng X, Huang Y, Huo W, Li B, Wang H, Qin B, Liu T (2024) Relay decoding: Concatenating large language models for machine translation. arXiv preprint arXiv:2405.02933"},{"key":"11534_CR128","unstructured":"Gangavarapu A (2024) Introducing l2m3, a multilingual medical large language model to advance health equity in low-resource regions. arXiv preprint arXiv:2404.08705"},{"key":"11534_CR129","unstructured":"Gao Y, Xiong Y, Gao X, Jia K, Pan J, Bi Y, Dai Y, Sun J, Wang H (2023) Retrieval-augmented generation for large language models: A survey. arXiv preprint arXiv:2312.10997"},{"key":"11534_CR130","doi-asserted-by":"crossref","unstructured":"Gao W, Niu C, Nie J-Y, Zhou M, Hu J, Wong K-F, Hon H-W (2007) Cross-lingual query suggestion using query logs of different languages. In: Proceedings of the 30th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 463\u2013470","DOI":"10.1145\/1277741.1277821"},{"key":"11534_CR131","doi-asserted-by":"crossref","unstructured":"Gao L, Dai Z, Callan J (2021) COIL: Revisit exact lexical match in information retrieval with contextualized inverted list. In: Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 3030\u20133042. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.241 . 
https:\/\/aclanthology.org\/2021.naacl-main.241","DOI":"10.18653\/v1\/2021.naacl-main.241"},{"key":"11534_CR132","unstructured":"Gao L, Biderman S, Black S, Golding L, Hoppe T, Foster C, Phang J, He H, Thite A, Nabeshima N et al (2020) The pile: An 800gb dataset of diverse text for language modeling. arXiv preprint arXiv:2101.00027"},{"key":"11534_CR133","doi-asserted-by":"crossref","unstructured":"Garcia X, Constant N, Parikh A, Firat O (2021) Towards continual learning for multilingual machine translation via vocabulary substitution. In: Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 1184\u20131192","DOI":"10.18653\/v1\/2021.naacl-main.93"},{"key":"11534_CR134","unstructured":"Garcia GL, Paiola PH, Morelli LH, Candido G, J\u00fanior AC, Jodas DS, Afonso L, Guilherme IR, Penteado BE, Papa JP (2024) Introducing bode: A fine-tuned large language model for portuguese prompt-based task. arXiv preprint arXiv:2401.02909"},{"key":"11534_CR135","unstructured":"Garcia X, Bansal Y, Cherry C, Foster G, Krikun M, Feng F, Johnson M, Firat O (2023) The unreasonable effectiveness of few-shot learning for machine translation"},{"key":"11534_CR136","doi-asserted-by":"crossref","unstructured":"Garc\u00eda-Ferrero I, Agerri R, Salazar AA, Cabrio E, Iglesia I, Lavelli A, Magnini B, Molinet B, Ramirez-Romero J, Rigau G et al (2024) Medical mt5: An open-source multilingual text-to-text llm for the medical domain. arXiv preprint arXiv:2404.07613","DOI":"10.63317\/2kopd98p2rcz"},{"key":"11534_CR137","doi-asserted-by":"crossref","unstructured":"Geng L, Yan X, Cao Z, Li J, Li W, Li S, Zhou X, Yang Y, Zhang J (2023) Kbioxlm: A knowledge-anchored biomedical multilingual pretrained language model. 
arXiv preprint arXiv:2311.11564","DOI":"10.18653\/v1\/2023.findings-emnlp.751"},{"key":"11534_CR138","doi-asserted-by":"crossref","unstructured":"Gerz D, Su P, Kusztos R, Mondal A, Lis M, Singhal E, Mrksic N, Wen T, Vulic I (2021) Multilingual and cross-lingual intent detection from spoken data. CoRR abs\/2104.08524 arxiv:2104.08524","DOI":"10.18653\/v1\/2021.emnlp-main.591"},{"key":"11534_CR139","unstructured":"Gibert O, Nail G, Arefyev N, Ba\u00f1\u00f3n M, Linde J, Ji S, Zaragoza-Bernabeu J, Aulamo M, Ram\u00edrez-S\u00e1nchez G, Kutuzov A, Pyysalo S, Oepen S, Tiedemann J (2024) A New Massive Multilingual Dataset for High-Performance Language Technologies"},{"key":"11534_CR140","doi-asserted-by":"crossref","unstructured":"Goel R, Ammar W, Gupta A, Vashishtha S, Sano M, Surani F, Chang M, Choe H, Greene D, He K, Nitisaroj R, Trukhina A, Paul S, Shah P, Shah R, Yu Z (2023) PRESTO: A Multilingual Dataset for Parsing Realistic Task-Oriented Dialogs","DOI":"10.18653\/v1\/2023.emnlp-main.667"},{"key":"11534_CR141","doi-asserted-by":"crossref","unstructured":"Gordon TF, Governatori G, Rotolo A (2009) Rules and norms: Requirements for rule interchange languages in the legal domain. In: International Workshop on Rules and Rule Markup Languages for the Semantic Web, pp. 282\u2013296 . Springer","DOI":"10.1007\/978-3-642-04985-9_26"},{"key":"11534_CR142","first-page":"522","volume":"10","author":"N Goyal","year":"2022","unstructured":"Goyal N, Gao C, Chaudhary V, Chen P-J, Wenzek G, Ju D, Krishnan S, Ranzato M, Guzm\u00e1n F, Fan A (2022) The flores-101 evaluation benchmark for low-resource and multilingual machine translation. Trans Assoc Comput Ling 10:522\u2013538","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR143","doi-asserted-by":"crossref","unstructured":"Goyal S, Rastogi E, Rajagopal SP, Yuan D, Zhao F, Chintagunta J, Naik G, Ward J (2024) Healai: A healthcare llm for effective medical documentation. 
In: Proceedings of the 17th ACM International Conference on Web Search and Data Mining, pp. 1167\u20131168","DOI":"10.1145\/3616855.3635739"},{"key":"11534_CR144","unstructured":"Grattafiori A, Dubey A, Jauhri A, Pandey A, Kadian A, Al-Dahle A, Letman A et al (2024) The Llama 3 Herd of Models . https:\/\/arxiv.org\/abs\/2407.21783"},{"key":"11534_CR145","volume-title":"Cross-language information retrieval","author":"G Grefenstette","year":"2012","unstructured":"Grefenstette G (2012) Cross-language information retrieval, vol 2. Springer, Cham"},{"key":"11534_CR146","unstructured":"Gu A, Dao T (2023) Mamba: Linear-time sequence modeling with selective state spaces. arXiv preprint arXiv:2312.00752"},{"key":"11534_CR147","unstructured":"Guo D, Yang D, Zhang H, Song J, Zhang R, Xu R, Zhu Q, Ma S, Wang P, Bi X et al (2025) Deepseek-r1: Incentivizing reasoning capability in llms via reinforcement learning. arXiv preprint arXiv:2501.12948"},{"key":"11534_CR148","unstructured":"Gutenberg P. Project Gutenberg. https:\/\/www.gutenberg.org\/"},{"key":"11534_CR149","doi-asserted-by":"crossref","unstructured":"Guzm\u00e1n F, Chen P-J, Ott M, Pino J, Lample G, Koehn P, Chaudhary V, Ranzato M (2019) Two new evaluation datasets for low-resource machine translation: Nepali-english and sinhala-english. arXiv preprint arXiv:1902.01382","DOI":"10.18653\/v1\/D19-1632"},{"key":"11534_CR150","unstructured":"HIT-SCIR: Chinese-Mixtral-8x7B: An Open-Source Mixture-of-Experts LLM. GitHub (2024)"},{"key":"11534_CR151","unstructured":"Han T, Adams LC, Papaioannou J-M, Grundmann P, Oberhauser T, L\u00f6ser A, Truhn D, Bressem KK (2023) Medalpaca\u2013an open-source collection of medical conversational ai models and training data. arXiv preprint arXiv:2304.08247"},{"key":"11534_CR152","doi-asserted-by":"crossref","unstructured":"Haq S, Sharma A, Khattab O, Chhaya N, Bhattacharyya P (2024) IndicIRSuite: Multilingual dataset and neural information models for Indian languages. 
In: Ku, L.-W., Martins, A., Srikumar, V. (eds.) Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pp. 501\u2013509. Association for Computational Linguistics, Bangkok, Thailand . https:\/\/doi.org\/10.18653\/v1\/2024.acl-short.46 . https:\/\/aclanthology.org\/2024.acl-short.46","DOI":"10.18653\/v1\/2024.acl-short.46"},{"key":"11534_CR153","doi-asserted-by":"crossref","unstructured":"Hardalov M, Mihaylov T, Zlatkova D, Dinkov Y, Koychev I, Nakov P (2020) EXAMS: A Multi-Subject High School Examinations Dataset for Cross-Lingual and Multilingual Question Answering","DOI":"10.18653\/v1\/2020.emnlp-main.438"},{"key":"11534_CR154","doi-asserted-by":"crossref","unstructured":"Hasan T, Bhattacharjee A, Islam MS, Samin K, Li Y-F, Kang Y-B, Rahman MS, Shahriyar R (2021) XL-Sum: Large-Scale Multilingual Abstractive Summarization for 44 Languages","DOI":"10.18653\/v1\/2021.findings-acl.413"},{"key":"11534_CR155","unstructured":"Hasan MM, Rahman Z, Mostafiz R, Hossain MA (2025) Sentra-guard: A multilingual human-ai framework for real-time defense against adversarial llm jailbreaks. arXiv preprint arXiv:2510.22628"},{"key":"11534_CR156","first-page":"229","volume":"12","author":"Z He","year":"2024","unstructured":"He Z, Liang T, Jiao W, Zhang Z, Yang Y, Wang R, Tu Z, Shi S, Wang X (2024) Exploring human-like translation strategy with large language models. Trans Assoc Comput Ling 12:229\u2013246","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR157","doi-asserted-by":"crossref","unstructured":"He Z, Liang T, Jiao W, Zhang Z, Yang Y, Wang R, Tu Z, Shi S, Wang X (2023) Exploring Human-Like Translation Strategy with Large Language Models","DOI":"10.1162\/tacl_a_00642"},{"key":"11534_CR158","unstructured":"He W, Wen J, Zhang L, Cheng H, Qin B, Li Y, Jiang F, Chen J, Wang B, Yang M (2023) HanFei-1.0. 
GitHub"},{"key":"11534_CR159","unstructured":"Hendy A, Abdelrehim M, Sharaf A, Raunak V, Gabr M, Matsushita H, Kim YJ, Afify M, Awadalla HH (2023) How good are gpt models at machine translation? a comprehensive evaluation. arXiv preprint arXiv:2302.09210"},{"key":"11534_CR160","doi-asserted-by":"crossref","unstructured":"Hoang VCD, Koehn P, Haffari G, Cohn T (2018) Iterative back-translation for neural machine translation. In: Proceedings of the 2nd Workshop on Neural Machine Translation and Generation, pp. 18\u201324","DOI":"10.18653\/v1\/W18-2703"},{"key":"11534_CR161","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1023\/B:INRT.0000009439.19151.4c","volume":"7","author":"V Hollink","year":"2004","unstructured":"Hollink V, Kamps J, Monz C, De Rijke M (2004) Monolingual document retrieval for european languages. Inf Retri 7:33\u201352","journal-title":"Inf Retri"},{"key":"11534_CR162","unstructured":"Hu J, Ruder S, Siddhant A, Neubig G, Firat O, Johnson M (2020) XTREME: A Massively Multilingual Multi-task Benchmark for Evaluating Cross-lingual Generalization"},{"key":"11534_CR163","doi-asserted-by":"crossref","unstructured":"Hu L, Liu Z, Zhao Z, Hou L, Nie L, Li J (2023) A survey of knowledge enhanced pre-trained language models. IEEE Transactions on Knowledge and Data Engineering","DOI":"10.1109\/TKDE.2023.3310002"},{"key":"11534_CR164","unstructured":"Hu Z, Wu G, Mitra S, Zhang R, Sun T, Huang H, Swaminathan V. Token-level adversarial prompt detection based on perplexity measures and contextual information. In: ICLR 2025 Workshop on Building Trust in Language Models and Applications"},{"key":"11534_CR165","first-page":"12365","volume":"2023","author":"H Huang","year":"2023","unstructured":"Huang H, Tang T, Zhang D, Zhao WX, Song T, Xia Y, Wei F (2023) Not all languages are created equal in llms: Improving multilingual capability by cross-lingual-thought prompting. 
Find Assoc Comput Ling EMNLP 2023:12365\u201312394","journal-title":"Find Assoc Comput Ling EMNLP"},{"key":"11534_CR166","doi-asserted-by":"publisher","unstructured":"Huang Z, Yu P, Allan J (2023) Improving cross-lingual information retrieval on low-resource languages via optimal transport distillation. In: Proceedings of the Sixteenth ACM International Conference on Web Search and Data Mining. WSDM \u201923, pp. 1048\u20131056. Association for Computing Machinery, New York, NY, USA https:\/\/doi.org\/10.1145\/3539597.3570468","DOI":"10.1145\/3539597.3570468"},{"key":"11534_CR167","unstructured":"Huang Y, Gupta S, Xia M, Li K, Chen D (2023) Catastrophic jailbreak of open-source llms via exploiting generation. arXiv preprint arXiv:2310.06987"},{"key":"11534_CR168","doi-asserted-by":"crossref","unstructured":"Huang K, Li P, Liu J, Sun M, Liu Y (2023) Learn and consolidate: Continual adaptation for zero-shot and multilingual neural machine translation. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 13938\u201313951","DOI":"10.18653\/v1\/2023.emnlp-main.860"},{"key":"11534_CR169","doi-asserted-by":"crossref","unstructured":"Huang K, Li P, Ma J, Yao T, Liu Y (2023) Knowledge transfer in incremental learning for multilingual neural machine translation. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 15286\u201315304","DOI":"10.18653\/v1\/2023.acl-long.852"},{"key":"11534_CR170","doi-asserted-by":"crossref","unstructured":"Huang K, Li P, Ma J, Liu Y (2022) Entropy-based vocabulary substitution for incremental learning in multilingual neural machine translation. In: Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pp. 
10537\u201310550","DOI":"10.18653\/v1\/2022.emnlp-main.720"},{"key":"11534_CR171","doi-asserted-by":"crossref","unstructured":"Huang K-P, Yang C-K, Fu Y-K, Dunbar E, Lee H-y (2024) Zero resource code-switched speech benchmark using speech utterance pairs for multiple spoken languages. In: ICASSP 2024-2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 10006\u201310010 . IEEE","DOI":"10.1109\/ICASSP48485.2024.10446737"},{"key":"11534_CR172","unstructured":"Huang Q, Tao M, Zhang C, An Z, Jiang C, Chen Z, Wu Z, Feng Y (2023) Lawyer llama technical report. ArXiv abs\/2305.15062"},{"key":"11534_CR173","unstructured":"Huang Q, Tao M, An Z, Zhang C, Jiang C, Chen Z, Wu Z, Feng Y (2023) Lawyer llama technical report. arXiv preprint arXiv:2305.15062"},{"key":"11534_CR174","doi-asserted-by":"crossref","unstructured":"Huguet\u00a0Cabot P-L, Tedeschi S, Ngonga\u00a0Ngomo A-C, Navigli R (2023) Red$$^{{\\rm fm}}$$: a filtered and multilingual relation extraction dataset. In: Proc. of the 61st Annual Meeting of the Association for Computational Linguistics: ACL 2023. Association for Computational Linguistics, Toronto, Canada . https:\/\/arxiv.org\/abs\/2306.09802","DOI":"10.18653\/v1\/2023.acl-long.237"},{"key":"11534_CR175","doi-asserted-by":"crossref","unstructured":"Hull DA, Grefenstette G (1996) Querying across languages: A dictionary-based approach to multilingual information retrieval. In: Proceedings of the 19th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 49\u201357","DOI":"10.1145\/243199.243212"},{"key":"11534_CR176","doi-asserted-by":"crossref","unstructured":"Hutchinson B, Prabhakaran V, Denton E, Webster K, Zhong Y, Denuyl S (2020) Social biases in nlp models as barriers for persons with disabilities. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 
5491\u20135501","DOI":"10.18653\/v1\/2020.acl-main.487"},{"key":"11534_CR177","doi-asserted-by":"crossref","unstructured":"ImaniGooghari A, Lin P, Kargaran AH, Severini S, Sabet MJ, Kassner N, Ma C, Schmid H, Martins AF, Yvon F et al (2023) Glot500: Scaling multilingual corpora and language models to 500 languages. arXiv preprint arXiv:2305.12182","DOI":"10.18653\/v1\/2023.acl-long.61"},{"key":"11534_CR178","unstructured":"Inan H, Upasani K, Chi J, Rungta R, Iyer K, Mao Y, Tontchev M, Hu Q, Fuller B, Testuggine D et al (2023) Llama guard: Llm-based input-output safeguard for human-ai conversations. arXiv preprint arXiv:2312.06674"},{"key":"11534_CR179","doi-asserted-by":"crossref","unstructured":"Intrator Y, Halfon M, Goldenberg R, Tsarfaty R, Eyal M, Rivlin E, Matias Y, Aizenberg N (2024) Breaking the language barrier: Can direct inference outperform pre-translation in multilingual llm applications? arXiv preprint arXiv:2403.04792","DOI":"10.18653\/v1\/2024.naacl-short.75"},{"key":"11534_CR180","unstructured":"Introducing Embed v3. https:\/\/cohere.com\/blog\/introducing-embed-v3. Accessed: 2023-11-02"},{"key":"11534_CR181","unstructured":"Izacard G, Caron M, Hosseini L, Riedel S, Bojanowski P, Joulin A, Grave E (2021) Unsupervised Dense Information Retrieval with Contrastive Learning . https:\/\/doi.org\/10.48550\/ARXIV.2112.09118 . https:\/\/arxiv.org\/abs\/2112.09118"},{"key":"11534_CR182","unstructured":"Jain N, Schwarzschild A, Wen Y, Somepalli G, Kirchenbauer J, Chiang P-y, Goldblum M, Saha A, Geiping J, Goldstein T (2023) Baseline defenses for adversarial attacks against aligned language models. arXiv preprint arXiv:2309.00614"},{"key":"11534_CR183","doi-asserted-by":"crossref","unstructured":"Jeronymo V, Lotufo R, Nogueira R (2023) NeuralMind-UNICAMP at 2022 TREC NeuCLIR: Large Boring Rerankers for Cross-lingual Retrieval . 
https:\/\/arxiv.org\/abs\/2303.16145","DOI":"10.6028\/NIST.SP.500-338.neuclir-NM.unicamp"},{"key":"11534_CR184","unstructured":"Jeronymo V, Bonifacio L, Abonizio H, Fadaee M, Lotufo R, Zavrel J, Nogueira R (2023) InPars-v2: Large Language Models as Efficient Dataset Generators for Information Retrieval. arXiv . https:\/\/doi.org\/10.48550\/ARXIV.2301.01820 . https:\/\/arxiv.org\/abs\/2301.01820"},{"key":"11534_CR185","unstructured":"Jiang AQ, Sablayrolles A, Mensch A, Bamford C, Chaplot DS, Casas Ddl, Bressand F, Lengyel G, Lample G, Saulnier L et al (2023) Mistral 7b. arXiv preprint arXiv:2310.06825"},{"key":"11534_CR186","first-page":"15009","volume":"2023","author":"W Jiao","year":"2023","unstructured":"Jiao W, Huang J, Wang W, He Z, Liang T, Wang X, Shi S, Tu Z (2023) Parrot: translating during chat using large language models tuned with human translation and feedback. Find Assoc Comput Ling EMNLP 2023:15009\u201315020","journal-title":"Find Assoc Comput Ling EMNLP"},{"key":"11534_CR187","unstructured":"Jin H, Chen R, Zhou A, Chen J, Zhang Y, Wang H (2024) Guard: Role-playing to generate natural-language jailbreakings to test guideline adherence of large language models. arXiv preprint arXiv:2402.03299"},{"key":"11534_CR188","first-page":"339","volume":"5","author":"M Johnson","year":"2017","unstructured":"Johnson M, Schuster M, Le QV, Krikun M, Wu Y, Chen Z, Thorat N, Vi\u00e9gas F, Wattenberg M, Corrado G et al (2017) Google\u2019s multilingual neural machine translation system: enabling zero-shot translation. Trans Assoc Comput Ling 5:339\u2013351","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR189","doi-asserted-by":"crossref","unstructured":"Joshi P, Santy S, Budhiraja A, Bali K, Choudhury M (2020) The state and fate of linguistic diversity and inclusion in the NLP world. In: Jurafsky, D., Chai, J., Schluter, N., Tetreault, J. (eds.) Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 6282\u20136293. 
Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.560 . https:\/\/aclanthology.org\/2020.acl-main.560","DOI":"10.18653\/v1\/2020.acl-main.560"},{"key":"11534_CR190","doi-asserted-by":"crossref","unstructured":"Kabra A, Liu E, Khanuja S, Aji AF, Winata G, Cahyawijaya S, Aremu A, Ogayo P, Neubig G (2023) Multi-lingual and multi-cultural figurative language understanding. In: Rogers, A., Boyd-Graber, J., Okazaki, N. (eds.) Findings of the Association for Computational Linguistics: ACL 2023, pp. 8269\u20138284. Association for Computational Linguistics, Toronto, Canada . https:\/\/doi.org\/10.18653\/v1\/2023.findings-acl.525 . https:\/\/aclanthology.org\/2023.findings-acl.525","DOI":"10.18653\/v1\/2023.findings-acl.525"},{"key":"11534_CR191","unstructured":"Kandpal N, Wallace E, Raffel C (2022) Deduplicating training data mitigates privacy risks in language models. In: International Conference on Machine Learning, pp. 10697\u201310707 . PMLR"},{"key":"11534_CR192","unstructured":"Kaplan J, McCandlish S, Henighan T, Brown TB, Chess B, Child R, Gray S, Radford A, Wu J, Amodei D (2020) Scaling laws for neural language models. arXiv preprint arXiv:2001.08361"},{"key":"11534_CR193","doi-asserted-by":"crossref","unstructured":"Keung P, Lu Y, Szarvas G, Smith NA (2020) The multilingual amazon reviews corpus. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing","DOI":"10.18653\/v1\/2020.emnlp-main.369"},{"key":"11534_CR194","doi-asserted-by":"crossref","unstructured":"Keung P, Lu Y, Szarvas G, Smith NA (2020) The Multilingual Amazon Reviews Corpus","DOI":"10.18653\/v1\/2020.emnlp-main.369"},{"key":"11534_CR195","doi-asserted-by":"crossref","unstructured":"Khatri J, Srivastava V, Vig L (2023) Can you translate for me? code-switched machine translation with large language models. 
In: Proceedings of the 13th International Joint Conference on Natural Language Processing and the 3rd Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics (Volume 2: Short Papers), pp. 83\u201392","DOI":"10.18653\/v1\/2023.ijcnlp-short.10"},{"key":"11534_CR196","doi-asserted-by":"publisher","unstructured":"Khattab O, Zaharia M (2020) Colbert: Efficient and effective passage search via contextualized late interaction over bert. In: Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201920, pp. 39\u201348. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3397271.3401075","DOI":"10.1145\/3397271.3401075"},{"key":"11534_CR197","doi-asserted-by":"crossref","unstructured":"Kim S, Joo S, Kim D, Jang J, Ye S, Shin J, Seo M (2023) The cot collection: Improving zero-shot and few-shot learning of language models via chain-of-thought fine-tuning. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 12685\u201312708","DOI":"10.18653\/v1\/2023.emnlp-main.782"},{"key":"11534_CR198","unstructured":"Kim S, Ki D, Kim Y, Lee J (2023) Boosting Cross-lingual Transferability in Multilingual Models via In-Context Learning"},{"issue":"13","key":"11534_CR199","doi-asserted-by":"publisher","first-page":"3521","DOI":"10.1073\/pnas.1611835114","volume":"114","author":"J Kirkpatrick","year":"2017","unstructured":"Kirkpatrick J, Pascanu R, Rabinowitz N, Veness J, Desjardins G, Rusu AA, Milan K, Quan J, Ramalho T, Grabska-Barwinska A et al (2017) Overcoming catastrophic forgetting in neural networks. Proc Natl Acad Sci 114(13):3521\u20133526","journal-title":"Proc Natl Acad Sci"},{"key":"11534_CR200","doi-asserted-by":"crossref","unstructured":"Koto F, Beck T, Talat Z, Gurevych I, Baldwin T (2024) Zero-shot sentiment analysis in low-resource languages using a multilingual sentiment lexicon. 
arXiv preprint arXiv:2402.02113","DOI":"10.18653\/v1\/2024.eacl-long.18"},{"key":"11534_CR201","first-page":"50","volume":"10","author":"J Kreutzer","year":"2022","unstructured":"Kreutzer J, Caswell I, Wang L, Wahab A, Esch D, Ulzii-Orshikh N, Tapo A, Subramani N, Sokolov A, Sikasote C et al (2022) Quality at a glance: an audit of web-crawled multilingual datasets. Trans Assoc Comput Ling 10:50\u201372","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR202","unstructured":"Kumar A, Agarwal C, Srinivas S, Li AJ, Feizi S, Lakkaraju H. Certifying llm safety against adversarial prompting. In: First Conference on Language Modeling"},{"key":"11534_CR203","unstructured":"Kusupati A, Bhatt G, Rege A, Wallingford M, Sinha A, Ramanujan V, Howard-Snyder W, Chen K, Kakade S, Jain P, Farhadi A (2024) Matryoshka Representation Learning . https:\/\/arxiv.org\/abs\/2205.13147"},{"key":"11534_CR204","doi-asserted-by":"crossref","unstructured":"Labrak Y, Bazoge A, Morin E, Gourraud P-A, Rouvier M, Dufour R (2024) Biomistral: A collection of open-source pretrained large language models for medical domains. arXiv preprint arXiv:2402.10373","DOI":"10.18653\/v1\/2024.findings-acl.348"},{"key":"11534_CR205","first-page":"13171","volume":"2023","author":"V Lai","year":"2023","unstructured":"Lai V, Ngo N, Veyseh APB, Man H, Dernoncourt F, Bui T, Nguyen T (2023) Chatgpt beyond english: towards a comprehensive evaluation of large language models in multilingual learning. Find Assoc Comput Ling EMNLP 2023:13171\u201313189","journal-title":"Find Assoc Comput Ling EMNLP"},{"key":"11534_CR206","doi-asserted-by":"publisher","unstructured":"Lassance C, Clinchant S (2022) An efficiency study for splade models. In: Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201922, pp. 2220\u20132226. Association for Computing Machinery, New York, NY, USA . 
https:\/\/doi.org\/10.1145\/3477495.3531833","DOI":"10.1145\/3477495.3531833"},{"key":"11534_CR207","unstructured":"Lassance C (2023) Extending English IR methods to multi-lingual IR . https:\/\/arxiv.org\/abs\/2302.14723"},{"key":"11534_CR208","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1007\/978-3-030-99736-6_24","volume-title":"Advances in information retrieval","author":"D Lawrie","year":"2022","unstructured":"Lawrie D, Mayfield J, Oard DW, Yang E (2022) Hc4: a new suite of test collections for ad hoc clir. In: Hagen M, Verberne S, Macdonald C, Seifert C, Balog K, N\u00f8rv\u00e5g K, Setty V (eds) Advances in information retrieval. Springer, Cham, pp 351\u2013366"},{"key":"11534_CR209","doi-asserted-by":"crossref","unstructured":"Lawrie D, Yang E, Oard DW, Mayfield J (2023) Neural approaches to multilingual information retrieval. Advances in Information Retrieval: 45th European Conference on Information Retrieval. ECIR 2023, Dublin, Ireland, April 2\u20136, 2023, Proceedings, Part I. Springer, Berlin, Heidelberg, pp 521\u2013536","DOI":"10.1007\/978-3-031-28244-7_33"},{"key":"11534_CR210","unstructured":"Lee C, Roy R, Xu M, Raiman J, Shoeybi M, Catanzaro B, Ping W (2024) NV-Embed: Improved Techniques for Training LLMs as Generalist Embedding Models . https:\/\/arxiv.org\/abs\/2405.17428"},{"key":"11534_CR211","unstructured":"Lee S, Shakir A, Koenig D, Lipp J (2024) Open Source Strikes Bread - New Fluffy Embeddings Model . https:\/\/www.mixedbread.ai\/blog\/mxbai-embed-large-v1"},{"key":"11534_CR212","unstructured":"Lee J, Chen A, Dai Z, Dua D, Sachan DS, Boratko M, Luan Y, Arnold SMR, Perot V, Dalmia S, Hu H, Lin X, Pasupat P, Amini A, Cole JR, Riedel S, Naim I, Chang M-W, Guu K (2024) Can Long-Context Language Models Subsume Retrieval, RAG, SQL, and More? . 
https:\/\/arxiv.org\/abs\/2406.13121"},{"key":"11534_CR213","doi-asserted-by":"crossref","unstructured":"Lee D, Xie S, Rahman S, Pat K, Lee D, Chen QA (2023) prompter says: A linguistic approach to understanding and detecting jailbreak attacks against large-language models. In: Proceedings of the 1st ACM Workshop on Large AI Systems and Models with Privacy and Safety Analysis, pp. 77\u201387","DOI":"10.1145\/3689217.3690618"},{"key":"11534_CR214","unstructured":"Lee J, Dai Z, Ren X, Chen B, Cer D, Cole JR, Hui K, Boratko M, Kapadia R, Ding W, Luan Y, Duddu SMK, Abrego GH, Shi W, Gupta N, Kusupati A, Jain P, Jonnalagadda SR, Chang M-W, Naim I (2024) Gecko: Versatile Text Embeddings Distilled from Large Language Models . https:\/\/arxiv.org\/abs\/2403.20327"},{"key":"11534_CR215","doi-asserted-by":"crossref","unstructured":"Levy S, John N, Liu L, Vyas Y, Ma J, Fujinuma Y, Ballesteros M, Castelli V, Roth D (2023) Comparing biases and the impact of multilingual training across multiple languages. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 10260\u201310280","DOI":"10.18653\/v1\/2023.emnlp-main.634"},{"key":"11534_CR216","doi-asserted-by":"crossref","unstructured":"Lewis P, O\u011fuz B, Rinott R, Riedel S, Schwenk H (2020) MLQA: Evaluating Cross-lingual Extractive Question Answering","DOI":"10.18653\/v1\/2020.acl-main.653"},{"key":"11534_CR217","doi-asserted-by":"crossref","unstructured":"Lewis M, Liu Y, Goyal N, Ghazvininejad M, Mohamed A, Levy O, Stoyanov V, Zettlemoyer L (2020) Bart: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 
7871\u20137880","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"11534_CR218","unstructured":"Le\u00a0Scao T, Fan A, Akiki C, Pavlick E, Ili\u0107 S, Hesslow D, Castagn\u00e9 R, Luccioni AS, Yvon F, Gall\u00e9 M et al (2022) Bloom: A 176b-parameter open-access multilingual language model"},{"key":"11534_CR219","doi-asserted-by":"crossref","unstructured":"Li L, Dong B, Wang R, Hu X, Zuo W, Lin D, Qiao Y, Shao J (2024) Salad-bench: A hierarchical and comprehensive safety benchmark for large language models. arXiv preprint arXiv:2402.05044","DOI":"10.18653\/v1\/2024.findings-acl.235"},{"key":"11534_CR220","unstructured":"Li J, Liu Y, Liu C, Shi L, Ren X, Zheng Y, Liu Y, Xue Y (2024) A cross-language investigation into jailbreak attacks in large language models. arXiv preprint arXiv:2401.16765"},{"key":"11534_CR221","unstructured":"Li Y, Wei F, Zhao J, Zhang C, Zhang H (2023) Rain: Your language models can align themselves without finetuning. In: The Twelfth International Conference on Learning Representations"},{"key":"11534_CR222","unstructured":"Li H, Koto F, Wu M, Aji AF, Baldwin T (2023) Bactrian-X: Multilingual Replicable Instruction-Following Models with Low-Rank Adaptation"},{"key":"11534_CR223","unstructured":"Li Z, Shi Y, Liu Z, Yang F, Liu N, Du M (2024) Quantifying multilingual performance of large language models across languages. arXiv preprint arXiv:2404.11553"},{"key":"11534_CR224","doi-asserted-by":"crossref","unstructured":"Li B, Zhou H, He J, Wang M, Yang Y, Li L (2020) On the sentence embeddings from pre-trained language models. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 9119\u20139130","DOI":"10.18653\/v1\/2020.emnlp-main.733"},{"key":"11534_CR225","doi-asserted-by":"crossref","unstructured":"Li J, Tang T, Zhao WX, Nie J-Y, Wen J-R (2022) Pretrained language models for text generation: A survey. 
arXiv preprint arXiv:2201.05273","DOI":"10.24963\/ijcai.2021\/612"},{"key":"11534_CR226","doi-asserted-by":"crossref","unstructured":"Li Y, Franz M, Sultan MA, Iyer B, Lee Y-S, Sil A (2022) Learning cross-lingual IR from an English retriever. In: Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 4428\u20134436. Association for Computational Linguistics, Seattle, United States . https:\/\/doi.org\/10.18653\/v1\/2022.naacl-main.329 . https:\/\/aclanthology.org\/2022.naacl-main.329","DOI":"10.18653\/v1\/2022.naacl-main.329"},{"key":"11534_CR227","unstructured":"Li X, Jin J, Zhou Y, Zhang Y, Zhang P, Zhu Y, Dou Z (2024) From matching to generation: a survey on generative information retrieval . https:\/\/arxiv.org\/abs\/2404.14851"},{"key":"11534_CR228","unstructured":"Li X, Zhou Z, Zhu J, Yao J, Liu T, Han B (2023) Deepinception: Hypnotize large language model to be jailbreaker. arXiv preprint arXiv:2311.03191"},{"key":"11534_CR229","doi-asserted-by":"crossref","unstructured":"Li H, Xu J, Cui G, Guan C, Mo F, Huang K (2025) Multilingual collaborative defense for large language models. arXiv preprint arXiv:2505.11835","DOI":"10.18653\/v1\/2025.findings-emnlp.200"},{"key":"11534_CR230","doi-asserted-by":"crossref","unstructured":"Li H, Ai Q, Chen J, Dong Q, Wu Y, Liu Y, Chen C, Tian Q (2023) SAILER: Structure-aware Pre-trained Language Model for Legal Case Retrieval","DOI":"10.1145\/3539618.3591761"},{"key":"11534_CR231","unstructured":"Li X, Nie E, Liang S (2023) From Classification to Generation: Insights into Crosslingual Retrieval Augmented ICL"},{"key":"11534_CR232","doi-asserted-by":"crossref","unstructured":"Li X, Nie E, Liang S (2023) Crosslingual retrieval augmented in-context learning for Bangla. In: Alam, F., Kar, S., Chowdhury, S.A., Sadeque, F., Amin, R. (eds.) Proceedings of the First Workshop on Bangla Language Processing (BLP-2023), pp. 136\u2013151. 
Association for Computational Linguistics, Singapore . https:\/\/doi.org\/10.18653\/v1\/2023.banglalp-1.15 . https:\/\/aclanthology.org\/2023.banglalp-1.15","DOI":"10.18653\/v1\/2023.banglalp-1.15"},{"key":"11534_CR233","doi-asserted-by":"crossref","unstructured":"Liang Y, Duan N, Gong Y, Wu N, Guo F, Qi W, Gong M, Shou L, Jiang D, Cao G, Fan X, Zhang R, Agrawal R, Cui E, Wei S, Bharti T, Qiao Y, Chen J-H, Wu W, Liu S, Yang F, Campos D, Majumder R, Zhou M (2020) XGLUE: A New Benchmark Dataset for Cross-lingual Pre-training, Understanding and Generation","DOI":"10.18653\/v1\/2020.emnlp-main.484"},{"key":"11534_CR234","doi-asserted-by":"crossref","unstructured":"Liang D, Gonen H, Mao Y, Hou R, Goyal N, Ghazvininejad M, Zettlemoyer L, Khabsa M (2023) Xlm-v: Overcoming the vocabulary bottleneck in multilingual masked language models. arXiv preprint arXiv:2301.10472","DOI":"10.18653\/v1\/2023.emnlp-main.813"},{"key":"11534_CR235","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-02181-7","volume-title":"Pretrained transformers for text ranking: bert and beyond","author":"J Lin","year":"2022","unstructured":"Lin J, Nogueira R, Yates A (2022) Pretrained transformers for text ranking: bert and beyond. Springer, Cham"},{"key":"11534_CR236","doi-asserted-by":"crossref","unstructured":"Lin BY, Lee S, Qiao X, Ren X (2021) Common sense beyond english: Evaluating and improving multilingual language models for commonsense reasoning. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 1274\u20131287","DOI":"10.18653\/v1\/2021.acl-long.102"},{"key":"11534_CR237","doi-asserted-by":"crossref","unstructured":"Lin BY, Lee S, Qiao X, Ren X (2021) Common sense beyond English: Evaluating and improving multilingual language models for commonsense reasoning. 
In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 1274\u20131287. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.102 . https:\/\/aclanthology.org\/2021.acl-long.102","DOI":"10.18653\/v1\/2021.acl-long.102"},{"key":"11534_CR238","doi-asserted-by":"crossref","unstructured":"Lin Z, Wu L, Wang M, Li L (2021) Learning language specific sub-network for multilingual machine translation. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 293\u2013305","DOI":"10.18653\/v1\/2021.acl-long.25"},{"key":"11534_CR239","unstructured":"Lin J, Ma X (2021) A few brief notes on deepimpact, coil, and a conceptual framework for information retrieval techniques. arXiv preprint arXiv:2106.14807"},{"key":"11534_CR240","doi-asserted-by":"crossref","unstructured":"Lin J, Alfonso-Hermelo D, Jeronymo V, Kamalloo E, Lassance C, Nogueira R, Ogundepo O, Rezagholizadeh M, Thakur N, Yang J-H, Zhang X (2023) Simple Yet Effective Neural Ranking and Reranking Baselines for Cross-Lingual Information Retrieval . https:\/\/arxiv.org\/abs\/2304.01019","DOI":"10.6028\/NIST.SP.500-338.neuclir-h2oloo"},{"key":"11534_CR241","doi-asserted-by":"crossref","unstructured":"Lin XV, Mihaylov T, Artetxe M, Wang T, Chen S, Simig D, Ott M, Goyal N, Bhosale S, Du J et al (2022) Few-shot learning with multilingual generative language models. In: Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pp. 9019\u20139052","DOI":"10.18653\/v1\/2022.emnlp-main.616"},{"key":"11534_CR242","doi-asserted-by":"crossref","unstructured":"Lison, P., Tiedemann, J.: Opensubtitles2016: Extracting large parallel corpora from movie and tv subtitles. 
European Language Resources Association (2016)","DOI":"10.63317\/3fi26b3nobqg"},{"issue":"9","key":"11534_CR243","first-page":"1","volume":"55","author":"P Liu","year":"2023","unstructured":"Liu P, Yuan W, Fu J, Jiang Z, Hayashi H, Neubig G (2023) Pre-train, prompt, and predict: A systematic survey of prompting methods in natural language processing. ACM Comput Surv 55(9):1\u201335","journal-title":"ACM Comput Surv"},{"key":"11534_CR244","doi-asserted-by":"crossref","unstructured":"Liu Y, Deng G, Xu Z, Li Y, Zheng Y, Zhang Y, Zhao L, Zhang T, Liu Y (2023) Jailbreaking chatgpt via prompt engineering: An empirical study. arXiv preprint arXiv:2305.13860","DOI":"10.1145\/3663530.3665021"},{"key":"11534_CR245","unstructured":"Liu X, Xu N, Chen M, Xiao C (2023) Autodan: Generating stealthy jailbreak prompts on aligned large language models. arXiv preprint arXiv:2310.04451"},{"key":"11534_CR246","doi-asserted-by":"crossref","unstructured":"Liu Z, Huang D, Huang K, Li Z, Zhao J (2021) Finbert: A pre-trained financial language representation model for financial text mining. In: Proceedings of the Twenty-ninth International Conference on International Joint Conferences on Artificial Intelligence, pp. 4513\u20134519","DOI":"10.24963\/ijcai.2020\/622"},{"key":"11534_CR247","unstructured":"Liu H, Li C, Wu Q, Lee YJ (2024) Visual instruction tuning. Advances in neural information processing systems 36"},{"key":"11534_CR248","doi-asserted-by":"crossref","unstructured":"Liu H, Liu J, Cui L, Teng Z, Duan N, Zhou M, Zhang Y (2023) Logiqa 2.0\u2013an improved dataset for logical reasoning in natural language understanding. IEEE\/ACM Transactions on Audio, Speech, and Language Processing","DOI":"10.1109\/TASLP.2023.3293046"},{"key":"11534_CR249","doi-asserted-by":"publisher","unstructured":"Liu Z, Zhou Y, Zhu Y, Lian J, Li C, Dou Z, Lian D, Nie J-Y (2024) Information retrieval meets large language models. In: Companion Proceedings of the ACM Web Conference 2024. WWW \u201924, pp. 
1586\u20131589. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3589335.3641299","DOI":"10.1145\/3589335.3641299"},{"key":"11534_CR250","unstructured":"Liu X-Y, Wang G, Zha D (2023) Fingpt: Democratizing internet-scale data for financial large language models. arXiv preprint arXiv:2307.10485"},{"key":"11534_CR251","unstructured":"Liu JM, Li D, Cao H, Ren T, Liao Z, Wu J (2023) ChatCounselor: A Large Language Models for Mental Health Support"},{"key":"11534_CR252","doi-asserted-by":"crossref","unstructured":"Liu C, Zhang W, Zhao Y, Luu AT, Bing L (2024) Is translation all you need? a study on solving multilingual tasks with large language models. arXiv preprint arXiv:2403.10258","DOI":"10.18653\/v1\/2025.naacl-long.485"},{"issue":"1","key":"11534_CR253","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1007\/s10796-020-09996-1","volume":"23","author":"E Loginova","year":"2021","unstructured":"Loginova E, Varanasi S, Neumann G (2021) Towards end-to-end multilingual question answering. Inf Syst Front 23(1):227\u2013241","journal-title":"Inf Syst Front"},{"key":"11534_CR254","doi-asserted-by":"crossref","unstructured":"Loginova E, Varanasi S, Neumann G (2018) Towards multilingual neural question answering. In: New Trends in Databases and Information Systems: ADBIS 2018 Short Papers and Workshops, AI* QA, BIGPMED, CSACDB, M2U, BigDataMAPS, ISTREND, DC, Budapest, Hungary, September, 2-5, 2018, Proceedings 22, pp. 274\u2013285 . Springer","DOI":"10.1007\/978-3-030-00063-9_26"},{"key":"11534_CR255","unstructured":"Louis A, Saxena V, Dijck G, Spanakis G (2024) ColBERT-XM: A Modular Multi-Vector Representation Model for Zero-Shot Multilingual Information Retrieval . 
https:\/\/arxiv.org\/abs\/2402.15059"},{"issue":"6","key":"11534_CR256","doi-asserted-by":"publisher","first-page":"409","DOI":"10.1093\/bib\/bbac409","volume":"23","author":"R Luo","year":"2022","unstructured":"Luo R, Sun L, Xia Y, Qin T, Zhang S, Poon H, Liu T-Y (2022) Biogpt: generative pre-trained transformer for biomedical text generation and mining. Brief Bioinform 23(6):409","journal-title":"Brief Bioinform"},{"key":"11534_CR257","doi-asserted-by":"crossref","unstructured":"Luo L, Ning J, Zhao Y, Wang Z, Ding Z, Chen P, Fu W, Han Q, Xu G, Qiu Y et al (2024) Taiyi: a bilingual fine-tuned large language model for diverse biomedical tasks. Journal of the American Medical Informatics Association, 037","DOI":"10.1093\/jamia\/ocae037"},{"key":"11534_CR258","unstructured":"Luo Y, Kong Q, Xu N, Cao J, Hao B, Qu B, Chen B, Zhu C, Zhao C, Zhang D et al (2023) Yayi 2: Multilingual open-source large language models. arXiv preprint arXiv:2312.14862"},{"key":"11534_CR259","unstructured":"Luo Z, Xie Q, Ananiadou S (2023) Chatgpt as a factual inconsistency evaluator for abstractive text summarization. arXiv preprint arXiv:2303.15621"},{"key":"11534_CR260","doi-asserted-by":"crossref","unstructured":"Luukkonen R, Komulainen V, Luoma J, Eskelinen A, Kanerva J, Kupari H-MK, Ginter F, Laippala V, Muennighoff N, Piktus A et al (2023) Fingpt: Large generative models for a small language. In: The 2023 Conference on Empirical Methods in Natural Language Processing","DOI":"10.18653\/v1\/2023.emnlp-main.164"},{"key":"11534_CR261","unstructured":"Lv H, Wang X, Zhang Y, Huang C, Dou S, Ye J, Gui T, Zhang Q, Huang X (2024) Codechameleon: Personalized encryption framework for jailbreaking large language models. arXiv preprint arXiv:2402.16717"},{"key":"11534_CR262","doi-asserted-by":"crossref","unstructured":"Lyu Q, Havaldar S, Stein A, Zhang L, Rao D, Wong E, Apidianaki M, Callison-Burch C (2023) Faithful chain-of-thought reasoning. 
In: Proceedings of the 13th International Joint Conference on Natural Language Processing and the 3rd Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 305\u2013329","DOI":"10.18653\/v1\/2023.ijcnlp-main.20"},{"key":"11534_CR263","doi-asserted-by":"publisher","unstructured":"Ma X, Wang L, Yang N, Wei F, Lin J (2024) Fine-tuning llama for multi-stage text retrieval. In: Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201924, pp. 2421\u20132425. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3626772.3657951","DOI":"10.1145\/3626772.3657951"},{"key":"11534_CR264","unstructured":"Ma X, Zhang X, Pradeep R, Lin J (2023) Zero-Shot Listwise Document Reranking with a Large Language Model . https:\/\/arxiv.org\/abs\/2305.02156"},{"key":"11534_CR265","doi-asserted-by":"crossref","unstructured":"MacAvaney S, Soldaini L, Goharian N (2020) Teaching a new dog old tricks: Resurrecting multilingual retrieval using zero-shot learning. Advances in Information Retrieval: 42nd European Conference on IR Research. ECIR 2020, Lisbon, Portugal, April 14\u201317, 2020, Proceedings, Part II. Springer, Berlin, Heidelberg, pp 246\u2013254","DOI":"10.1007\/978-3-030-45442-5_31"},{"key":"11534_CR266","unstructured":"Magueresse A, Carles V, Heetderks E (2020) Low-resource languages: A review of past work and future challenges. arXiv preprint arXiv:2006.07264"},{"key":"11534_CR267","unstructured":"Malmasi S, Fang A, Fetahu B, Kar S, Rokhlenko O (2022) MultiCoNER: A Large-scale Multilingual dataset for Complex Named Entity Recognition"},{"key":"11534_CR268","doi-asserted-by":"crossref","unstructured":"Manakhimova S, Avramidis E, Macketanz V, Lapshinova-Koltunski E, Bagdasarov S, M\u00f6ller S (2023) Linguistically motivated evaluation of the 2023 state-of-the-art machine translation: Can chatgpt outperform nmt? 
In: Proceedings of the Eighth Conference on Machine Translation, pp. 224\u2013245","DOI":"10.18653\/v1\/2023.wmt-1.23"},{"key":"11534_CR269","doi-asserted-by":"crossref","unstructured":"Manning CD, Raghavan P, Sch\u00fctze H (2008) Introduction to Information Retrieval. Cambridge University Press, ???","DOI":"10.1017\/CBO9780511809071"},{"key":"11534_CR270","first-page":"15009","volume":"37","author":"T Markov","year":"2023","unstructured":"Markov T, Zhang C, Agarwal S, Nekoul FE, Lee T, Adler S, Jiang A, Weng L (2023) A holistic approach to undesired content detection in the real world. Proceed AAAI Conf Artif Intell 37:15009\u201315018","journal-title":"Proceed AAAI Conf Artif Intell"},{"key":"11534_CR271","unstructured":"May P (2021) Machine translated multilingual STS benchmark dataset. https:\/\/github.com\/PhilipMay\/stsb-multi-mt"},{"key":"11534_CR272","unstructured":"Mayfield J, Yang E, Lawrie D, Barham S, Weller O, Mason M, Nair S, Miller S (2023) Synthetic Cross-language Information Retrieval Training Data . https:\/\/arxiv.org\/abs\/2305.00331"},{"key":"11534_CR273","unstructured":"Mazeika M, Phan L, Yin X, Zou A, Wang Z, Mu N, Sakhaee E, Li N, Basart S, Li B et al (2024) Harmbench: A standardized evaluation framework for automated red teaming and robust refusal. arXiv preprint arXiv:2402.04249"},{"key":"11534_CR274","doi-asserted-by":"crossref","unstructured":"Mehnaz L, Mahata D, Gosangi R, Gunturi US, Jain R, Gupta G, Kumar A, Lee IG, Acharya A, Shah R (2021) Gupshup: Summarizing open-domain code-switched conversations. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 6177\u20136192","DOI":"10.18653\/v1\/2021.emnlp-main.499"},{"key":"11534_CR275","unstructured":"Mehrotra A, Zampetakis M, Kassianik P, Nelson B, Anderson H, Singer Y, Karbasi A (2023) Tree of attacks: Jailbreaking black-box llms automatically. 
arXiv preprint arXiv:2312.02119"},{"key":"11534_CR276","unstructured":"Merrick L, Xu D, Nuti G, Campos D (2024) Arctic-Embed: Scalable, Efficient, and Accurate Text Embedding Models . https:\/\/arxiv.org\/abs\/2405.05374"},{"key":"11534_CR277","doi-asserted-by":"crossref","unstructured":"Miceli-Barone AV, Haddow B, Germann U, Sennrich R (2017) Regularization techniques for fine-tuning in neural machine translation. In: Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, pp. 1489\u20131494","DOI":"10.18653\/v1\/D17-1156"},{"issue":"2","key":"11534_CR278","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3605943","volume":"56","author":"B Min","year":"2023","unstructured":"Min B, Ross H, Sulem E, Veyseh APB, Nguyen TH, Sainz O, Agirre E, Heintz I, Roth D (2023) Recent advances in natural language processing via large pre-trained language models: A survey. ACM Comput Surv 56(2):1\u201340","journal-title":"ACM Comput Surv"},{"key":"11534_CR279","doi-asserted-by":"publisher","first-page":"1098","DOI":"10.1109\/TC.2008.42","volume":"57","author":"J Mirkovic","year":"2008","unstructured":"Mirkovic J, Reiher P, Papadopoulos C, Hussain A, Shepard M, Berg M, Jung R (2008) Testing a collaborative ddos defense in a red team\/blue team exercise. IEEE Trans Comput 57:1098\u20131112","journal-title":"IEEE Trans Comput"},{"key":"11534_CR280","doi-asserted-by":"crossref","unstructured":"Mittal S, Sundriyal M, Nakov P (2023) Lost in translation, found in spans: Identifying claims in multilingual social media. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 3887\u20133902. Association for Computational Linguistics, Singapore . https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.236 . 
https:\/\/aclanthology.org\/2023.emnlp-main.236","DOI":"10.18653\/v1\/2023.emnlp-main.236"},{"key":"11534_CR281","doi-asserted-by":"crossref","unstructured":"Moradshahi M, Shen T, Bali K, Choudhury M, Chalendar G, Goel A, Kim S, Kodali P, Kumaraguru P, Semmar N, Semnani SJ, Seo J, Seshadri V, Shrivastava M, Sun M, Yadavalli A, You C, Xiong D, Lam MS (2023) X-RiSAWOZ: High-Quality End-to-End Multilingual Dialogue Datasets and Few-shot Agents","DOI":"10.18653\/v1\/2023.findings-acl.174"},{"key":"11534_CR507","unstructured":"mteb: Amazon Massive Intent. https:\/\/huggingface.co\/datasets\/mteb\/amazon_massive_intent"},{"key":"11534_CR508","unstructured":"mteb: MTEB Benchmark. https:\/\/huggingface.co\/datasets\/mteb\/bucc-bitext-mining"},{"key":"11534_CR282","doi-asserted-by":"publisher","unstructured":"Muennighoff N, Tazi N, Magne L, Reimers N (2022) Mteb: Massive text embedding benchmark. arXiv preprint arXiv:2210.07316https:\/\/doi.org\/10.48550\/ARXIV.2210.07316","DOI":"10.48550\/ARXIV.2210.07316"},{"key":"11534_CR283","unstructured":"Muennighoff N, Su H, Wang L, Yang N, Wei F, Yu T, Singh A, Kiela D (2024) Generative Representational Instruction Tuning . https:\/\/arxiv.org\/abs\/2402.09906"},{"key":"11534_CR284","doi-asserted-by":"crossref","unstructured":"Muennighoff N, Wang T, Sutawika L, Roberts A, Biderman S, Scao TL, Bari MS, Shen S, Yong Z-X, Schoelkopf H et al (2022) Crosslingual generalization through multitask finetuning. arXiv preprint arXiv:2211.01786","DOI":"10.18653\/v1\/2023.acl-long.891"},{"key":"11534_CR285","unstructured":"Muennighoff N, Rush A, Barak B, Le\u00a0Scao T, Tazi N, Piktus A, Pyysalo S, Wolf T, Raffel CA (2024) Scaling data-constrained language models. 
Advances in Neural Information Processing Systems 36"},{"key":"11534_CR286","doi-asserted-by":"crossref","unstructured":"Muennighoff N, Wang T, Sutawika L, Roberts A, Biderman S, Scao TL, Bari MS, Shen S, Yong Z-X, Schoelkopf H et al (2022) Crosslingual generalization through multitask finetuning. arXiv preprint arXiv:2211.01786","DOI":"10.18653\/v1\/2023.acl-long.891"},{"key":"11534_CR287","doi-asserted-by":"crossref","unstructured":"Muhammad SH, Abdulmumin I, Ayele AA, Ousidhoum N, Adelani DI, Yimam SM, Ahmad IS, Beloucif M, Mohammad SM, Ruder S, Hourrane O, Brazdil P, Ali FDMA, David D, Osei S, Bello BS, Ibrahim F, Gwadabe T, Rutunda S, Belay T, Messelle WB, Balcha HB, Chala SA, Gebremichael HT, Opoku B, Arthur S (2023) AfriSenti: A Twitter Sentiment Analysis Benchmark for African Languages","DOI":"10.18653\/v1\/2023.emnlp-main.862"},{"key":"11534_CR288","doi-asserted-by":"crossref","unstructured":"Nadeem M, Bethke A, Reddy S (2021) Stereoset: Measuring stereotypical bias in pretrained language models. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 5356\u20135371","DOI":"10.18653\/v1\/2021.acl-long.416"},{"key":"11534_CR289","doi-asserted-by":"crossref","unstructured":"Nair S, Yang E, Lawrie D, Duh K, McNamee P, Murray K, Mayfield J, Oard DW (2022) Transfer learning approaches for building cross-language dense retrieval models. Advances in Information Retrieval: 44th European Conference on IR Research. ECIR 2022, Stavanger, Norway, April 10\u201314, 2022, Proceedings, Part I. Springer, Berlin, Heidelberg, pp 382\u2013396","DOI":"10.1007\/978-3-030-99736-6_26"},{"key":"11534_CR290","doi-asserted-by":"publisher","unstructured":"Nair S, Yang E, Lawrie D, Mayfield J, Oard DW (2023) Blade: Combining vocabulary pruning and intermediate pretraining for scaleable neural clir. 
In: Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201923, pp. 1219\u20131229. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3539618.3591644","DOI":"10.1145\/3539618.3591644"},{"key":"11534_CR291","doi-asserted-by":"crossref","unstructured":"Nekoto W, Marivate V, Matsila T, Fasubaa T, Fagbohungbe T, Akinola SO, Muhammad S, Kabongo\u00a0Kabenamualu S, Osei S, Sackey F, Niyongabo RA, Macharm R, Ogayo P, Ahia O, Berhe MM, Adeyemi M, Mokgesi-Selinga M, Okegbemi L, Martinus L, Tajudeen K, Degila K, Ogueji K, Siminyu K, Kreutzer J, Webster J, Ali JT, Abbott J, Orife I, Ezeani I, Dangana IA, Kamper H, Elsahar H, Duru G, Kioko G, Espoir M, Biljon E, Whitenack D, Onyefuluchi C, Emezue CC, Dossou BFP, Sibanda B, Bassey B, Olabiyi A, Ramkilowan A, \u00d6ktem A, Akinfaderin A, Bashir A (2020) Participatory research for low-resourced machine translation: A case study in African languages. In: Cohn, T., He, Y., Liu, Y. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2020, pp. 2144\u20132160. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.195 . https:\/\/aclanthology.org\/2020.findings-emnlp.195","DOI":"10.18653\/v1\/2020.findings-emnlp.195"},{"key":"11534_CR292","doi-asserted-by":"crossref","unstructured":"Neural machine translation for low-resource languages (2023) Ranathunga, S., Lee, E.-S.A., Prifti Skenduli, M., Shekhar, R., Alam, M., Kaur. R A survey ACM Computing Surveys 55:1\u201337","DOI":"10.1145\/3567592"},{"key":"11534_CR293","unstructured":"New embedding models and API updates. https:\/\/openai.com\/index\/new-embedding-models-and-api-updates\/. 
Accessed: 2024-01-25"},{"key":"11534_CR294","doi-asserted-by":"crossref","unstructured":"Nguyen T, Nguyen CV, Lai VD, Man H, Ngo NT, Dernoncourt F, Rossi RA, Nguyen TH (2023) CulturaX: A Cleaned, Enormous, and Multilingual Dataset for Large Language Models in 167 Languages","DOI":"10.63317\/5iz6z5g7eit3"},{"key":"11534_CR295","unstructured":"Nguyen H-T, Yamada H, Satoh K (2024) Gpts and language barrier: A cross-lingual legal qa examination. arXiv preprint arXiv:2403.18098"},{"key":"11534_CR296","unstructured":"Nicholas G, Bhatia A (2023) Lost in translation: Large language models in non-english content analysis. arXiv preprint arXiv:2306.07377"},{"key":"11534_CR297","volume-title":"Cross-language Information Retrieval","author":"J-Y Nie","year":"2022","unstructured":"Nie J-Y (2022) Cross-language Information Retrieval. Springer, Cham"},{"key":"11534_CR298","doi-asserted-by":"crossref","unstructured":"Nie J-Y, Simard M, Isabelle P, Durand R (1999) Cross-language information retrieval based on parallel texts and automatic mining of parallel texts from the web. In: Proceedings of the 22nd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 74\u201381","DOI":"10.1145\/312624.312656"},{"key":"11534_CR299","doi-asserted-by":"crossref","unstructured":"Niklaus J, Matoshi V, Rani P, Galassi A, St\u00fcrmer M, Chalkidis I et al (2023) Lextreme: A multi-lingual and multi-task benchmark for the legal domain. In: Findings of the Association for Computational Linguistics: EMNLP 2023, pp. 3016\u20133054. Association for Computational Linguistics, ???","DOI":"10.18653\/v1\/2023.findings-emnlp.200"},{"key":"11534_CR300","doi-asserted-by":"crossref","unstructured":"Niklaus J, Matoshi V, St\u00fcrmer M, Chalkidis I, Ho DE (2023) Multilegalpile: A 689gb multilingual legal corpus. 
arXiv preprint arXiv:2306.02069","DOI":"10.18653\/v1\/2024.acl-long.805"},{"key":"11534_CR301","unstructured":"Nivre J, Marneffe M-C, Ginter F, Haji\u010d J, Manning CD, Pyysalo S, Schuster S, Tyers F, Zeman D (2020) Universal Dependencies v2: An evergrowing multilingual treebank collection. In: Calzolari, N., B\u00e9chet, F., Blache, P., Choukri, K., Cieri, C., Declerck, T., Goggi, S., Isahara, H., Maegaard, B., Mariani, J., Mazo, H., Moreno, A., Odijk, J., Piperidis, S. (eds.) Proceedings of the Twelfth Language Resources and Evaluation Conference, pp. 4034\u20134043. European Language Resources Association, Marseille, France . https:\/\/aclanthology.org\/2020.lrec-1.497"},{"key":"11534_CR302","first-page":"223","volume":"33","author":"DW Oard","year":"1998","unstructured":"Oard DW, Diekema AR (1998) Cross-language information retrieval. Ann Rev Inf Sci Technol (ARIST) 33:223\u201356","journal-title":"Ann Rev Inf Sci Technol (ARIST)"},{"key":"11534_CR303","doi-asserted-by":"crossref","unstructured":"Oncevay A, Haddow B, Birch A (2020) Bridging linguistic typology and multilingual machine translation with multi-view language representations. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 2391\u20132406","DOI":"10.18653\/v1\/2020.emnlp-main.187"},{"key":"11534_CR304","first-page":"27730","volume":"35","author":"L Ouyang","year":"2022","unstructured":"Ouyang L, Wu J, Jiang X, Almeida D, Wainwright C, Mishkin P, Zhang C, Agarwal S, Slama K, Ray A et al (2022) Training language models to follow instructions with human feedback. Adv Neural Inf Process Syst 35:27730\u201327744","journal-title":"Adv Neural Inf Process Syst"},{"key":"11534_CR305","doi-asserted-by":"crossref","unstructured":"Ouyang X, Wang S, Pang C, Sun Y, Tian H, Wu H, Wang H (2020) Ernie-m: Enhanced multilingual representation by aligning cross-lingual semantics with monolingual corpora. 
arXiv preprint arXiv:2012.15674","DOI":"10.18653\/v1\/2021.emnlp-main.3"},{"key":"11534_CR306","doi-asserted-by":"crossref","unstructured":"Pan X, Zhang B, May J, Nothman J, Knight K, Ji H (2017) Cross-lingual name tagging and linking for 282 languages. In: Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 1946\u20131958. Association for Computational Linguistics, Vancouver, Canada . https:\/\/doi.org\/10.18653\/v1\/P17-1178 . https:\/\/www.aclweb.org\/anthology\/P17-1178","DOI":"10.18653\/v1\/P17-1178"},{"key":"11534_CR307","doi-asserted-by":"crossref","unstructured":"Pan X, Wang M, Wu L, Li L (2021) Contrastive learning for many-to-many multilingual neural machine translation. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 244\u2013258","DOI":"10.18653\/v1\/2021.acl-long.21"},{"key":"11534_CR308","unstructured":"Penedo G, Kydl\u00ed\u010dek H, Werra L, Wolf T (2024) FineWeb . https:\/\/doi.org\/10.57967\/hf\/2092 . https:\/\/huggingface.co\/datasets\/HuggingFaceFW\/fineweb"},{"key":"11534_CR309","doi-asserted-by":"crossref","unstructured":"Peng Q, Chai Y, Li X (2024) Humaneval-xl: A multilingual code generation benchmark for cross-lingual natural language generalization. arXiv preprint arXiv:2402.16694","DOI":"10.63317\/2zjsm6sdd5yo"},{"key":"11534_CR310","unstructured":"Peng Z, Wang W, Dong L, Hao Y, Huang S, Ma S, Wei F (2023) Kosmos-2: Grounding multimodal large language models to the world. arXiv preprint arXiv:2306.14824"},{"key":"11534_CR311","doi-asserted-by":"crossref","unstructured":"Peng P, Yan B, Watanabe S, Harwath D (2023) Prompting the hidden talent of web-scale speech models for zero-shot task generalization. 
Proceedings of the Annual Conference of the International Speech Communication Association INTERSPEECH 2023:396\u2013400","DOI":"10.21437\/Interspeech.2023-2032"},{"key":"11534_CR312","doi-asserted-by":"publisher","DOI":"10.4324\/9780203006344","volume-title":"English and the discourses of colonialism","author":"A Pennycook","year":"2002","unstructured":"Pennycook A (2002) English and the discourses of colonialism. Routledge, Abingdon"},{"key":"11534_CR313","doi-asserted-by":"publisher","DOI":"10.1017\/9781108783071","volume-title":"Languages of the world","author":"A Pereltsvaig","year":"2020","unstructured":"Pereltsvaig A (2020) Languages of the world. Cambridge University Press, Cambridge"},{"key":"11534_CR314","doi-asserted-by":"crossref","unstructured":"Peris C, Dupuy C, Majmudar J, Parikh R, Smaili S, Zemel R, Gupta R (2023) Privacy in the time of language models. In: Proceedings of the Sixteenth ACM International Conference on Web Search and Data Mining, pp. 1291\u20131292","DOI":"10.1145\/3539597.3575792"},{"key":"11534_CR315","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-23008-0","volume-title":"Multilingual information retrieval: from research to practice","author":"C Peters","year":"2012","unstructured":"Peters C, Braschler M, Clough P (2012) Multilingual information retrieval: from research to practice. Springer, Cham"},{"key":"11534_CR316","unstructured":"Piqueras LC, S\u00f8gaard A (2022) Are pretrained multilingual models equally fair across languages? In: Proceedings of the 29th International Conference on Computational Linguistics, pp. 3597\u20133605"},{"key":"11534_CR317","doi-asserted-by":"crossref","unstructured":"Pires R, Abonizio H, Almeida TS, Nogueira R (2023) Sabi\u00e1: Portuguese large language models. In: Brazilian Conference on Intelligent Systems, pp. 226\u2013240 . 
Springer","DOI":"10.1007\/978-3-031-45392-2_15"},{"key":"11534_CR318","doi-asserted-by":"crossref","unstructured":"Ponti EM, Glava\u0161 G, Majewska O, Liu Q, Vuli\u0107 I, Korhonen A (2020) XCOPA: A multilingual dataset for causal commonsense reasoning. In: Webber, B., Cohn, T., He, Y., Liu, Y. (eds.) Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 2362\u20132376. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.185 . https:\/\/aclanthology.org\/2020.emnlp-main.185","DOI":"10.18653\/v1\/2020.emnlp-main.185"},{"key":"11534_CR319","doi-asserted-by":"crossref","unstructured":"Prabhumoye S, Tsvetkov Y, Salakhutdinov R, Black AW (2018) Style transfer through back-translation. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 866\u2013876","DOI":"10.18653\/v1\/P18-1080"},{"key":"11534_CR320","unstructured":"Pradeep R, Sharifymoghaddam S, Lin J (2023) RankVicuna: Zero-Shot Listwise Document Reranking with Open-Source Large Language Models . https:\/\/arxiv.org\/abs\/2309.15088"},{"key":"11534_CR321","unstructured":"Pradeep R, Sharifymoghaddam S, Lin J (2023) RankZephyr: Effective and Robust Zero-Shot Listwise Reranking is a Breeze! . https:\/\/arxiv.org\/abs\/2312.02724"},{"key":"11534_CR322","unstructured":"Puttaparthi PCR, Deo SS, Gul H, Tang Y, Shang W, Yu Z (2023) Comprehensive Evaluation of ChatGPT Reliability Through Multilingual Inquiries"},{"key":"11534_CR323","doi-asserted-by":"crossref","unstructured":"Qi Y, Sachan D, Felix M, Padmanabhan S, Neubig G (2018) When and why are pre-trained word embeddings useful for neural machine translation? In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 2 (Short Papers), pp. 529\u2013535. 
Association for Computational Linguistics, New Orleans, Louisiana . https:\/\/doi.org\/10.18653\/v1\/N18-2084 . https:\/\/aclanthology.org\/N18-2084","DOI":"10.18653\/v1\/N18-2084"},{"key":"11534_CR324","doi-asserted-by":"crossref","unstructured":"Qin L, Chen Q, Zhou Y, Chen Z, Li Y, Liao L, Li M, Che W, Yu PS (2024) Multilingual large language model: A survey of resources, taxonomy and frontiers. arXiv preprint arXiv:2404.04925","DOI":"10.1016\/j.patter.2024.101118"},{"key":"11534_CR325","doi-asserted-by":"crossref","unstructured":"Qin L, Chen Q, Wei F, Huang S, Che W (2023) Cross-lingual prompting: Improving zero-shot chain-of-thought reasoning across languages. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 2695\u20132709","DOI":"10.18653\/v1\/2023.emnlp-main.163"},{"key":"11534_CR326","doi-asserted-by":"crossref","unstructured":"Qiu P, Wu C, Zhang X, Lin W, Wang H, Zhang Y, Wang Y, Xie W (2024) Towards building multilingual language model for medicine. arXiv preprint arXiv:2402.13963","DOI":"10.1038\/s41467-024-52417-z"},{"key":"11534_CR327","doi-asserted-by":"crossref","unstructured":"Qiu P, Wu C, Zhang X, Lin W, Wang H, Zhang Y, Wang Y, Xie W (2024) Towards Building Multilingual Language Model for Medicine","DOI":"10.1038\/s41467-024-52417-z"},{"key":"11534_CR328","doi-asserted-by":"crossref","unstructured":"Qiu P, Wu C, Zhang X, Lin W, Wang H, Zhang Y, Wang Y, Xie W (2024) Towards Building Multilingual Language Model for Medicine","DOI":"10.1038\/s41467-024-52417-z"},{"issue":"1","key":"11534_CR329","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1007\/s12626-022-00105-z","volume":"16","author":"J Rabelo","year":"2022","unstructured":"Rabelo J, Goebel R, Kim M-Y, Kano Y, Yoshioka M, Satoh K (2022) Overview and discussion of the competition on legal information extraction\/entailment (coliee) 2021. 
Rev Socionetw Strat 16(1):111\u2013133","journal-title":"Rev Socionetw Strat"},{"key":"11534_CR330","doi-asserted-by":"crossref","unstructured":"Rabelo J, Kim M-Y, Goebel R, Yoshioka M, Kano Y, Satoh K (2020) A summary of the coliee 2019 competition. In: New Frontiers in Artificial Intelligence: JSAI-isAI International Workshops, JURISIN, AI-Biz, LENLS, Kansei-AI, Yokohama, Japan, November 10\u201312, 2019, Revised Selected Papers 10, pp. 34\u201349 . Springer","DOI":"10.1007\/978-3-030-58790-1_3"},{"issue":"8","key":"11534_CR331","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford A, Wu J, Child R, Luan D, Amodei D, Sutskever I et al (2019) Language models are unsupervised multitask learners. OpenAI blog 1(8):9","journal-title":"OpenAI blog"},{"key":"11534_CR332","unstructured":"Radford A, Narasimhan K, Salimans T, Sutskever I et al (2018) Improving language understanding by generative pre-training. OpenAI"},{"key":"11534_CR333","unstructured":"Rae JW, Borgeaud S, Cai T, Millican K, Hoffmann J, Song F, Aslanides J, Henderson S, Ring R, Young S et al (2021) Scaling language models: Methods, analysis & insights from training gopher. arXiv preprint arXiv:2112.11446"},{"key":"11534_CR334","unstructured":"Raffel C, Shazeer N, Roberts A, Lee K, Narang S, Matena M, Zhou Y, Li W, Liu PJ (2019) Exploring the limits of transfer learning with a unified text-to-text transformer. arXiv e-prints arXiv:1910.10683"},{"key":"11534_CR335","doi-asserted-by":"crossref","unstructured":"Rahimi A, Li Y, Cohn T (2019) Massively multilingual transfer for NER. In: Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 151\u2013164. Association for Computational Linguistics, Florence, Italy . 
https:\/\/www.aclweb.org\/anthology\/P19-1015","DOI":"10.18653\/v1\/P19-1015"},{"key":"11534_CR336","doi-asserted-by":"crossref","unstructured":"Rajpurkar P, Zhang J, Lopyrev K, Liang P (2016) Squad: 100,000+ questions for machine comprehension of text. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 2383\u20132392","DOI":"10.18653\/v1\/D16-1264"},{"key":"11534_CR337","doi-asserted-by":"crossref","unstructured":"Ramos R, Martins B, Elliott D (2023) LMCap: Few-shot multilingual image captioning by retrieval augmented language model prompting. In: Rogers, A., Boyd-Graber, J., Okazaki, N. (eds.) Findings of the Association for Computational Linguistics: ACL 2023, pp. 1635\u20131651. Association for Computational Linguistics, Toronto, Canada . https:\/\/doi.org\/10.18653\/v1\/2023.findings-acl.104 . https:\/\/aclanthology.org\/2023.findings-acl.104","DOI":"10.18653\/v1\/2023.findings-acl.104"},{"key":"11534_CR338","unstructured":"Rando J, Tram\u00e8r F (2023) Universal jailbreak backdoors from poisoned human feedback. In: The Twelfth International Conference on Learning Representations"},{"key":"11534_CR339","doi-asserted-by":"crossref","unstructured":"Razumovskaia E, Maynez J, Louis A, Lapata M, Narayan S (2024) Little Red Riding Hood Goes Around the Globe:Crosslingual Story Planning and Generation with Large Language Models","DOI":"10.63317\/3owr5gb5kmfa"},{"key":"11534_CR340","doi-asserted-by":"crossref","unstructured":"Rebedea T, Dinu R, Sreedhar MN, Parisien C, Cohen J (2023) Nemo guardrails: A toolkit for controllable and safe llm applications with programmable rails. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing: System Demonstrations, pp. 
431\u2013445","DOI":"10.18653\/v1\/2023.emnlp-demo.40"},{"key":"11534_CR341","unstructured":"Ren X, Zhou P, Meng X, Huang X, Wang Y, Wang W, Li P, Zhang X, Podolskiy A, Arshinov G et al (2023) Pangu: Towards trillion parameter language model with sparse heterogeneous computing. arXiv preprint arXiv:2303.10845 10, 11\u201315"},{"key":"11534_CR342","doi-asserted-by":"crossref","unstructured":"Reusens M, Borchert P, Mieskes M, De\u00a0Weerdt J, Baesens B (2023) Investigating bias in multilingual language models: Cross-lingual transfer of debiasing techniques. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 2887\u20132896","DOI":"10.18653\/v1\/2023.emnlp-main.175"},{"issue":"4","key":"11534_CR343","first-page":"333","volume":"3","author":"S Robertson","year":"2009","unstructured":"Robertson S, Zaragoza H (2009) The probabilistic relevance framework: BM25 and beyond. Found Trends Inf Retr 3(4):333\u2013389","journal-title":"Found Trends Inf Retr"},{"key":"11534_CR344","unstructured":"Robey A, Wong E, Hassani H, Pappas GJ (2023) Smoothllm: Defending large language models against jailbreaking attacks. arXiv preprint arXiv:2310.03684"},{"key":"11534_CR345","doi-asserted-by":"crossref","unstructured":"Roy U, Constant N, Al-Rfou R, Barua A, Phillips A, Yang Y (2020) LAReQA: Language-agnostic answer retrieval from a multilingual pool. In: Webber, B., Cohn, T., He, Y., Liu, Y. (eds.) Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 5919\u20135930. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.477 . 
https:\/\/aclanthology.org\/2020.emnlp-main.477","DOI":"10.18653\/v1\/2020.emnlp-main.477"},{"key":"11534_CR346","doi-asserted-by":"crossref","unstructured":"Ruder S, Constant N, Botha J, Siddhant A, Firat O, Fu J, Liu P, Hu J, Garrette D, Neubig G, Johnson M (2021) XTREME-R: Towards more challenging and nuanced multilingual evaluation. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 10215\u201310245. Association for Computational Linguistics, Online and Punta Cana, Dominican Republic . https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.802 . https:\/\/aclanthology.org\/2021.emnlp-main.802","DOI":"10.18653\/v1\/2021.emnlp-main.802"},{"key":"11534_CR347","doi-asserted-by":"crossref","unstructured":"Ruder S, Constant N, Botha J, Siddhant A, Firat O, Fu J, Liu P, Hu J, Garrette D, Neubig G, Johnson M (2021) XTREME-R: Towards more challenging and nuanced multilingual evaluation. In: Moens, M.-F., Huang, X., Specia, L., Yih, S.W.-t. (eds.) Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 10215\u201310245. Association for Computational Linguistics, Online and Punta Cana, Dominican Republic . https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.802 . https:\/\/aclanthology.org\/2021.emnlp-main.802","DOI":"10.18653\/v1\/2021.emnlp-main.802"},{"key":"11534_CR348","doi-asserted-by":"crossref","unstructured":"Ruder S, Sil A (2021) Multi-domain multilingual question answering. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing: Tutorial Abstracts, pp. 17\u201321","DOI":"10.18653\/v1\/2021.emnlp-tutorials.4"},{"key":"11534_CR349","unstructured":"RyokoAI: ShareGPT52K. https:\/\/huggingface.co\/datasets\/RyokoAI\/ShareGPT52K"},{"key":"11534_CR350","doi-asserted-by":"crossref","unstructured":"Sap M, Shwartz V, Bosselut A, Choi Y, Roth D (2020) Commonsense reasoning for natural language processing. 
In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics: Tutorial Abstracts, pp. 27\u201333","DOI":"10.18653\/v1\/2020.acl-tutorials.7"},{"key":"11534_CR351","doi-asserted-by":"publisher","first-page":"42","DOI":"10.4324\/9781351001724-4","volume-title":"The Routledge Handbook of English Language Studies","author":"EW Schneider","year":"2018","unstructured":"Schneider EW (2018) English and colonialism. The Routledge Handbook of English Language Studies. Routledge, Abingdon, pp 42\u201358"},{"key":"11534_CR352","doi-asserted-by":"crossref","unstructured":"Schwenk H, Wenzek G, Edunov S, Grave E, Joulin A, Fan A (2021) CCMatrix: Mining billions of high-quality parallel sentences on the web. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 6490\u20136500. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.507 . https:\/\/aclanthology.org\/2021.acl-long.507","DOI":"10.18653\/v1\/2021.acl-long.507"},{"key":"11534_CR353","doi-asserted-by":"crossref","unstructured":"Seganti A, Firl\u0105g K, Skowronska H, Sat\u0142awa M, Andruszkiewicz P (2021) Multilingual entity and relation extraction dataset and model. In: Merlo, P., Tiedemann, J., Tsarfaty, R. (eds.) Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume, pp. 1946\u20131955. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.eacl-main.166 . https:\/\/aclanthology.org\/2021.eacl-main.166","DOI":"10.18653\/v1\/2021.eacl-main.166"},{"key":"11534_CR354","doi-asserted-by":"crossref","unstructured":"Sennrich R, Vamvas J, Mohammadshahi A (2023) Mitigating hallucinations and off-target machine translation with source-contrastive and language-contrastive decoding. 
arXiv preprint arXiv:2309.07098","DOI":"10.18653\/v1\/2024.eacl-short.4"},{"key":"11534_CR355","doi-asserted-by":"crossref","unstructured":"Shen X, Chen Z, Backes M, Shen Y, Zhang Y (2023) Do Anything Now: Characterizing and Evaluating In-The-Wild Jailbreak Prompts on Large Language Models","DOI":"10.1145\/3658644.3670388"},{"key":"11534_CR356","doi-asserted-by":"crossref","unstructured":"Shen L, Tan W, Chen S, Chen Y, Zhang J, Xu H, Zheng B, Koehn P, Khashabi D (2024) The Language Barrier: Dissecting Safety Challenges of LLMs in Multilingual Contexts","DOI":"10.18653\/v1\/2024.findings-acl.156"},{"key":"11534_CR357","unstructured":"Shi P, Lin J (2019) Cross-Lingual Relevance Transfer for Document Retrieval . https:\/\/arxiv.org\/abs\/1911.02989"},{"key":"11534_CR358","doi-asserted-by":"crossref","unstructured":"Shi P, Bai H, Lin J (2020) Cross-lingual training of neural models for document ranking. In: Findings of the Association for Computational Linguistics: EMNLP 2020, pp. 2768\u20132773. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.249 . https:\/\/aclanthology.org\/2020.findings-emnlp.249","DOI":"10.18653\/v1\/2020.findings-emnlp.249"},{"key":"11534_CR359","unstructured":"Shi D, Shen T, Huang Y, Li Z, Leng Y, Jin R, Liu C, Wu X, Guo Z, Yu L, Shi L, Jiang B, Xiong D (2024) Large Language Model Safety: A Holistic Survey . https:\/\/arxiv.org\/abs\/2412.17686"},{"key":"11534_CR360","unstructured":"Shi F, Suzgun M, Freitag M, Wang X, Srivats S, Vosoughi S, Chung HW, Tay Y, Ruder S, Zhou D et al (2022) Language models are multilingual chain-of-thought reasoners. arXiv preprint arXiv:2210.03057"},{"key":"11534_CR361","doi-asserted-by":"crossref","unstructured":"Shi P, Zhang R, Bai H, Lin J (2022) XRICL: Cross-lingual retrieval-augmented in-context learning for cross-lingual text-to-SQL semantic parsing. In: Goldberg, Y., Kozareva, Z., Zhang, Y. (eds.) 
Findings of the Association for Computational Linguistics: EMNLP 2022, pp. 5248\u20135259. Association for Computational Linguistics, Abu Dhabi, United Arab Emirates . https:\/\/doi.org\/10.18653\/v1\/2022.findings-emnlp.384 . https:\/\/aclanthology.org\/2022.findings-emnlp.384","DOI":"10.18653\/v1\/2022.findings-emnlp.384"},{"key":"11534_CR362","unstructured":"Shliazhko O, Fenogenova A, Tikhonova M, Mikhailov V, Kozlova A, Shavrina T (2022) mgpt: Few-shot learners go multilingual. arXiv preprint arXiv:2204.07580"},{"key":"11534_CR363","doi-asserted-by":"crossref","unstructured":"Singh S, Vargus F, D\u2019souza D, Karlsson B, Mahendiran A, Ko W-Y, Shandilya H, Patel J, Mataciunas D, O\u2019Mahony L, Zhang M, Hettiarachchi R, Wilson J, Machado M, Moura L, Krzemi\u0144ski D, Fadaei H, Ergun I, Okoh I, Alaagib A, Mudannayake O, Alyafeai Z, Chien V, Ruder S, Guthikonda S, Alghamdi E, Gehrmann S, Muennighoff N, Bartolo M, Kreutzer J, \u00dcst\u00fcn A, Fadaee M, Hooker S (2024) Aya dataset: An open-access collection for multilingual instruction tuning. In: Ku, L.-W., Martins, A., Srikumar, V. (eds.) Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 11521\u201311567. Association for Computational Linguistics, Bangkok, Thailand . https:\/\/doi.org\/10.18653\/v1\/2024.acl-long.620 . https:\/\/aclanthology.org\/2024.acl-long.620","DOI":"10.18653\/v1\/2024.acl-long.620"},{"issue":"7972","key":"11534_CR364","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1038\/s41586-023-06291-2","volume":"620","author":"K Singhal","year":"2023","unstructured":"Singhal K, Azizi S, Tu T, Mahdavi SS, Wei J, Chung HW, Scales N, Tanwani A, Cole-Lewis H, Pfohl S et al (2023) Large language models encode clinical knowledge. 
Nature 620(7972):172\u2013180","journal-title":"Nature"},{"key":"11534_CR365","unstructured":"Sitawarin C, Mu N, Wagner D, Araujo A (2024) PAL: Proxy-Guided Black-Box Attack on Large Language Models"},{"key":"11534_CR366","unstructured":"Soares F, Stevenson M, Bartolome D, Zaretskaya A (2020) ParaPat: The multi-million sentences parallel corpus of patents abstracts. In: Proceedings of The 12th Language Resources and Evaluation Conference, pp. 3769\u20133774. European Language Resources Association, Marseille, France . https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.465"},{"key":"11534_CR367","doi-asserted-by":"crossref","unstructured":"Soldaini L, Kinney R, Bhagia A, Schwenk D, Atkinson D, Authur R, Bogin B, Chandu K, Dumas J, Elazar Y et al (2024) Dolma: An open corpus of three trillion tokens for language model pretraining research. arXiv preprint arXiv:2402.00159","DOI":"10.18653\/v1\/2024.acl-long.840"},{"key":"11534_CR368","unstructured":"Springer JM, Kotha S, Fried D, Neubig G, Raghunathan A (2024) Repetition Improves Language Model Embeddings . https:\/\/arxiv.org\/abs\/2402.15449"},{"key":"11534_CR369","doi-asserted-by":"crossref","unstructured":"Srinivasan K, Raman K, Chen J, Bendersky M, Najork M (2021) Wit: Wikipedia-based image text dataset for multimodal multilingual machine learning. arXiv preprint arXiv:2103.01913","DOI":"10.1145\/3404835.3463257"},{"key":"11534_CR370","doi-asserted-by":"crossref","unstructured":"Srinivasan A, Choi E (2022) TyDiP: A dataset for politeness classification in nine typologically diverse languages. In: Goldberg, Y., Kozareva, Z., Zhang, Y. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2022, pp. 5723\u20135738. Association for Computational Linguistics, Abu Dhabi, United Arab Emirates . https:\/\/doi.org\/10.18653\/v1\/2022.findings-emnlp.420 . 
https:\/\/aclanthology.org\/2022.findings-emnlp.420","DOI":"10.18653\/v1\/2022.findings-emnlp.420"},{"key":"11534_CR371","doi-asserted-by":"crossref","unstructured":"Srivastava V, Singh M (2022) Overview and results of mixmt shared-task at wmt 2022. In: Proceedings of the Seventh Conference on Machine Translation (WMT), pp. 806\u2013811","DOI":"10.18653\/v1\/2022.wmt-1.74"},{"key":"11534_CR372","first-page":"14973","volume":"2023","author":"D Stap","year":"2023","unstructured":"Stap D, Niculae V, Monz C (2023) Viewing knowledge transfer in multilingual machine translation through a representational lens. Find Assoc Comput Ling EMNLP 2023:14973\u201314987","journal-title":"Find Assoc Comput Ling EMNLP"},{"key":"11534_CR373","doi-asserted-by":"publisher","first-page":"127063","DOI":"10.1016\/j.neucom.2023.127063","volume":"568","author":"J Su","year":"2024","unstructured":"Su J, Ahmed M, Lu Y, Pan S, Bo W, Liu Y (2024) Roformer: enhanced transformer with rotary position embedding. Neurocomputing 568:127063","journal-title":"Neurocomputing"},{"issue":"3","key":"11534_CR374","doi-asserted-by":"publisher","first-page":"283","DOI":"10.47233\/jteksis.v5i3.871","volume":"5","author":"F Sudirjo","year":"2023","unstructured":"Sudirjo F, Diantoro K, Al-Gasawneh JA, Azzaakiyyah HK, Ausat AMA (2023) Application of chatgpt in improving customer sentiment analysis for businesses. Jurnal Teknologi Dan Sistem Informasi Bisnis 5(3):283\u2013288","journal-title":"Jurnal Teknologi Dan Sistem Informasi Bisnis"},{"key":"11534_CR375","doi-asserted-by":"crossref","unstructured":"Sun W, Yan L, Ma X, Wang S, Ren P, Chen Z, Yin D, Ren Z (2023) Is ChatGPT good at search? investigating large language models as re-ranking agents. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 14918\u201314937. Association for Computational Linguistics, Singapore . https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.923 . 
https:\/\/aclanthology.org\/2023.emnlp-main.923","DOI":"10.18653\/v1\/2023.emnlp-main.923"},{"key":"11534_CR376","first-page":"13003","volume":"2023","author":"M Suzgun","year":"2023","unstructured":"Suzgun M, Scales N, Sch\u00e4rli N, Gehrmann S, Tay Y, Chung HW, Chowdhery A, Le Q, Chi E, Zhou D et al (2023) Challenging big-bench tasks and whether chain-of-thought can solve them. Find Assoc Comput Ling ACL 2023:13003\u201313051","journal-title":"Find Assoc Comput Ling ACL"},{"key":"11534_CR377","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1207\/s15516709cog1202_4","volume":"12","author":"J Sweller","year":"1988","unstructured":"Sweller J (1988) Cognitive load during problem solving: effects on learning. Cogn Sci 12:257\u2013285","journal-title":"Cogn Sci"},{"key":"11534_CR378","first-page":"37","volume-title":"Psychology of learning and motivation","author":"J Sweller","year":"2011","unstructured":"Sweller J (2011) Cognitive load theory. Psychology of learning and motivation. Elsevier, Amsterdam, pp 37\u201376"},{"key":"11534_CR379","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1097\/ACM.0000000000003524","volume":"96","author":"A Szulewski","year":"2021","unstructured":"Szulewski A, Howes D, Merri\u00ebnboer JJ, Sweller J (2021) From theory to practice: the application of cognitive load theory to the practice of medicine. Acad Med 96:24\u201330","journal-title":"Acad Med"},{"key":"11534_CR380","unstructured":"Tamber MS, Pradeep R, Lin J (2023) Scaling Down, LiTting Up: Efficient Zero-Shot Listwise Reranking with Seq2seq Encoder-Decoder Models . https:\/\/arxiv.org\/abs\/2312.16098"},{"key":"11534_CR381","unstructured":"Taori R, Gulrajani I, Zhang T, Dubois Y, Li X, Guestrin C, Liang P, Hashimoto TB (2023) Stanford alpaca: An instruction-following llama model"},{"key":"11534_CR382","unstructured":"Team N (2022) No language left behind: Scaling human-centered machine translation. 
arXiv preprint arXiv:2207.04672"},{"key":"11534_CR383","unstructured":"Team I (2023) Internlm: A multilingual language model with progressively enhanced capabilities"},{"key":"11534_CR384","unstructured":"Team G, Anil R, Borgeaud S, Wu Y, Alayrac J-B, Yu J, Soricut R, Schalkwyk J, Dai AM, Hauth A et al (2023) Gemini: a family of highly capable multimodal models. arXiv preprint arXiv:2312.11805"},{"key":"11534_CR385","unstructured":"Team G, Mesnard T, Hardin C, Dadashi R, Bhupatiraju S, Pathak S, Sifre L, Rivi\u00e8re M, Kale MS, Love J et al (2024) Gemma: Open models based on gemini research and technology. arXiv preprint arXiv:2403.08295"},{"key":"11534_CR386","unstructured":"Thakur N, Bonifacio L, Zhang X, Ogundepo O, Kamalloo E, Alfonso-Hermelo D, Li X, Liu Q, Chen B, Rezagholizadeh M, Lin J (2023) Nomiracl: Knowing when you don\u2019t know for robust multilingual retrieval-augmented generation. ArXiv abs\/2312.11361"},{"key":"11534_CR387","unstructured":"Thakur N, Kazi S, Luo G, Lin J, Ahmad A (2024) MIRAGE-Bench: Automatic Multilingual Benchmark Arena for Retrieval-Augmented Generation Systems . https:\/\/arxiv.org\/abs\/2410.13716"},{"key":"11534_CR388","unstructured":"Thakur N, Bonifacio L, Zhang X, Ogundepo O, Kamalloo E, Alfonso-Hermelo D, Li X, Liu Q, Chen B, Rezagholizadeh M, Lin J (2024) NoMIRACL: Knowing When You Don\u2019t Know for Robust Multilingual Retrieval-Augmented Generation"},{"key":"11534_CR389","doi-asserted-by":"crossref","unstructured":"Thakur N, Ni J, Hernandez\u00a0Abrego G, Wieting J, Lin J, Cer D (2024) Leveraging LLMs for synthesizing training data across many languages in multilingual dense retrieval. In: Duh, K., Gomez, H., Bethard, S. (eds.) Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers), pp. 7699\u20137724. Association for Computational Linguistics, Mexico City, Mexico . 
https:\/\/doi.org\/10.18653\/v1\/2024.naacl-long.426 . https:\/\/aclanthology.org\/2024.naacl-long.426","DOI":"10.18653\/v1\/2024.naacl-long.426"},{"key":"11534_CR390","doi-asserted-by":"crossref","unstructured":"Thapliyal AV, Pont-Tuset J, Chen X, Soricut R (2022) Crossmodal-3600: A Massively Multilingual Multimodal Evaluation Dataset","DOI":"10.18653\/v1\/2022.emnlp-main.45"},{"key":"11534_CR391","unstructured":"Thoppilan R, De\u00a0Freitas D, Hall J, Shazeer N, Kulshreshtha A, Cheng H-T, Jin A, Bos T, Baker L, Du Y, et al (2022) Lamda: Language models for dialog applications. arXiv preprint arXiv:2201.08239"},{"key":"11534_CR392","doi-asserted-by":"crossref","unstructured":"Tian Y, Gan R, Song Y, Zhang J, Zhang Y (2023) Chimed-gpt: A chinese medical large language model with full training regime and better alignment to human preferences. arXiv preprint arXiv:2311.06025","DOI":"10.18653\/v1\/2024.acl-long.386"},{"key":"11534_CR393","doi-asserted-by":"crossref","unstructured":"Tiedemann J (2020) The tatoeba translation challenge \u2013 realistic data sets for low resource and multilingual MT. In: Proceedings of the Fifth Conference on Machine Translation, pp. 1174\u20131182. Association for Computational Linguistics, Online . https:\/\/aclanthology.org\/2020.wmt-1.139","DOI":"10.18653\/v1\/2020.wmt-1.139"},{"key":"11534_CR394","doi-asserted-by":"crossref","unstructured":"Tikhonov A, Ryabinin M (2021) It\u2019s All in the Heads: Using Attention Heads as a Baseline for Cross-Lingual Transfer in Commonsense Reasoning. In: Zong, C., Xia, F., Li, W., Navigli, R. (eds.) Findings of the Association for Computational Linguistics: ACL-IJCNLP 2021, pp. 3534\u20133546. Association for Computational Linguistics, Online . https:\/\/doi.org\/10.18653\/v1\/2021.findings-acl.310 . 
https:\/\/aclanthology.org\/2021.findings-acl.310","DOI":"10.18653\/v1\/2021.findings-acl.310"},{"key":"11534_CR395","unstructured":"Touvron H, Lavril T, Izacard G, Martinet X, Lachaux M-A, Lacroix T, Rozi\u00e8re B, Goyal N, Hambro E, Azhar F et al (2023) Llama: Open and efficient foundation language models. arXiv preprint arXiv:2302.13971"},{"key":"11534_CR396","unstructured":"Trautmann D, Petrova A, Schilder F (2022) Legal prompt engineering for multilingual legal judgement prediction. arXiv preprint arXiv:2212.02199"},{"key":"11534_CR509","unstructured":"Tyqiangz: Multilingual Sentiment Datasets. https:\/\/github.com\/tyqiangz\/multilingual-sentiment-datasets"},{"key":"11534_CR397","doi-asserted-by":"crossref","unstructured":"Urlana A, Chen P, Zhao Z, Cohen SB, Shrivastava M, Haddow B (2023) PMIndiaSum: Multilingual and Cross-lingual Headline Summarization for Languages in India","DOI":"10.18653\/v1\/2023.findings-emnlp.777"},{"key":"11534_CR398","doi-asserted-by":"crossref","unstructured":"Uthus D, Onta\u00f1\u00f3n S, Ainslie J, Guo M (2023) mlongt5: A multilingual and efficient text-to-text transformer for longer sequences. arXiv preprint arXiv:2305.11129","DOI":"10.18653\/v1\/2023.findings-emnlp.628"},{"key":"11534_CR511","doi-asserted-by":"crossref","unstructured":"\u00dcst\u00fcn A, Aryabumi V, Yong Z, Ko W-Y, D\u2019souza D, Onilude G, Bhandari N, Singh S, Ooi H-L, Kayid A, Vargus F, Blunsom P, Longpre S, Muennighoff N, Fadaee M, Kreutzer J, Hooker S (2024) Aya model: An instruction finetuned open-access multilingual language model. In: Ku, L.-W., Martins, A., Srikumar, V. (eds.) Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 15894\u201315939. Association for Computational Linguistics, Bangkok, Thailand . https:\/\/doi.org\/10.18653\/v1\/2024.acl-long.845 . 
https:\/\/aclanthology.org\/2024.acl-long.845","DOI":"10.18653\/v1\/2024.acl-long.845"},{"key":"11534_CR399","doi-asserted-by":"crossref","unstructured":"Vashishtha A, Ahuja K, Sitaram S (2023) On evaluating and mitigating gender biases in multilingual settings. arXiv preprint arXiv:2307.01503","DOI":"10.18653\/v1\/2023.findings-acl.21"},{"key":"11534_CR400","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017 Attention is all you need. Advances in neural information processing systems 30 )"},{"key":"11534_CR401","doi-asserted-by":"crossref","unstructured":"Verma Y, Jangra A, Verma R, Saha S (2023) Large scale multi-lingual multi-modal summarization dataset. In: Vlachos, A., Augenstein, I. (eds.) Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics, pp. 3620\u20133632. Association for Computational Linguistics, Dubrovnik, Croatia . https:\/\/doi.org\/10.18653\/v1\/2023.eacl-main.263 . https:\/\/aclanthology.org\/2023.eacl-main.263","DOI":"10.18653\/v1\/2023.eacl-main.263"},{"key":"11534_CR402","doi-asserted-by":"crossref","unstructured":"Vernikos G, Popescu-Belis A (2024) Don\u2019t rank, combine! combining machine translation hypotheses using quality estimation. arXiv preprint arXiv:2401.06688","DOI":"10.18653\/v1\/2024.acl-long.653"},{"key":"11534_CR510","unstructured":"Voyage-multilingual-2: Multilingual Embedding Model. https:\/\/blog.voyageai.com\/2024\/06\/10\/voyage-multilingual-2-multilingual-embedding-model\/. Accessed: 2024-06-10"},{"key":"11534_CR403","doi-asserted-by":"crossref","unstructured":"Wan Y, Pu G, Sun J, Garimella A, Chang K-W, Peng N (2023) kelly is a warm person, joseph is a role model: Gender biases in llm-generated reference letters. In: Findings of the Association for Computational Linguistics: EMNLP , pp. 
3730\u20133748 (2023)","DOI":"10.18653\/v1\/2023.findings-emnlp.243"},{"key":"11534_CR404","first-page":"16031","volume":"2024","author":"Y Wang","year":"2024","unstructured":"Wang Y, Shi Z, Bai A, Hsieh C-J (2024) Defending llms against jailbreaking attacks via backtranslation. Find Assoc Comput Ling ACL 2024:16031\u201316046","journal-title":"Find Assoc Comput Ling ACL"},{"key":"11534_CR405","first-page":"11440","volume":"36","author":"Q Wang","year":"2022","unstructured":"Wang Q, Zhang J (2022) Parameter differentiation based multilingual neural machine translation. Proceed AAAI Conf Artif Intell 36:11440\u201311448","journal-title":"Proceed AAAI Conf Artif Intell"},{"key":"11534_CR406","unstructured":"Wang X, Chen N, Chen J, Hu Y, Wang Y, Wu X, Gao A, Wan X, Li H, Wang B (2024) Apollo: Lightweight multilingual medical llms towards democratizing medical ai to 6b people. arXiv preprint arXiv:2403.03640"},{"key":"11534_CR407","doi-asserted-by":"crossref","unstructured":"Wang W, Tu Z, Chen C, Yuan Y, Huang J-t, Jiao W, Lyu MR (2023) All languages matter: On the multilingual safety of large language models. arXiv preprint arXiv:2310.00905","DOI":"10.18653\/v1\/2024.findings-acl.349"},{"key":"11534_CR408","unstructured":"Wang G, Cheng S, Zhan X, Li X, Song S, Liu Y (2023) Openchat: Advancing open-source language models with mixed-quality data. In: The Twelfth International Conference on Learning Representations"},{"key":"11534_CR409","doi-asserted-by":"crossref","unstructured":"Wang Z, Zhou S, Fried D, Neubig G (2023) Execution-Based Evaluation for Open-Domain Code Generation","DOI":"10.18653\/v1\/2023.findings-emnlp.89"},{"key":"11534_CR410","doi-asserted-by":"crossref","unstructured":"Wang X, Ruder S, Neubig G (2022) Expanding pretrained models to thousands more languages via lexicon-based adaptation. 
arXiv preprint arXiv:2203.09435","DOI":"10.18653\/v1\/2022.acl-long.61"},{"key":"11534_CR411","doi-asserted-by":"crossref","unstructured":"Wang X, Tsvetkov Y, Neubig G (2020) Balancing training for multilingual neural machine translation. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 8526\u20138537","DOI":"10.18653\/v1\/2020.acl-main.754"},{"key":"11534_CR412","unstructured":"Wang X, Wei J, Schuurmans D, Le QV, Chi EH, Narang S, Chowdhery A, Zhou D (2022) Self-consistency improves chain of thought reasoning in language models. In: The Eleventh International Conference on Learning Representations"},{"key":"11534_CR413","unstructured":"Wang L, Yang N, Huang X, Jiao B, Yang L, Jiang D, Majumder R, Wei F (2024) Text Embeddings by Weakly-Supervised Contrastive Pre-training . https:\/\/arxiv.org\/abs\/2212.03533"},{"key":"11534_CR414","doi-asserted-by":"crossref","unstructured":"Wang P, Wei X, Hu F, Han W (2024) Transgpt: Multi-modal generative pre-trained transformer for transportation. arXiv preprint arXiv:2402.07233","DOI":"10.1109\/CLNLP64123.2024.00026"},{"key":"11534_CR415","unstructured":"Wang G, Yang G, Du Z, Fan L, Li X (2023) Clinicalgpt: large language models finetuned with diverse medical data and comprehensive evaluation. arXiv preprint arXiv:2306.09968"},{"key":"11534_CR416","doi-asserted-by":"crossref","unstructured":"Wang J, Liu Y, Wang XE (2022) Assessing multilingual fairness in pre-trained multimodal representations. In: Proceedings of Annual Meeting of Association for Computational Linguistics","DOI":"10.18653\/v1\/2022.findings-acl.211"},{"key":"11534_CR417","doi-asserted-by":"crossref","unstructured":"Wang J, Liang Y, Meng F, Sun Z, Shi H, Li Z, Xu J, Qu J, Zhou J (2023) Is chatgpt a good nlg evaluator? a preliminary study. In: Proceedings of EMNLP Workshop, p. 
1","DOI":"10.18653\/v1\/2023.newsum-1.1"},{"key":"11534_CR418","doi-asserted-by":"crossref","unstructured":"Wang L, Yang N, Huang X, Yang L, Majumder R, Wei F (2024) Improving Text Embeddings with Large Language Models . https:\/\/arxiv.org\/abs\/2401.00368","DOI":"10.18653\/v1\/2024.acl-long.642"},{"key":"11534_CR419","unstructured":"Wang L, Yang N, Huang X, Yang L, Majumder R, Wei F (2024) Multilingual E5 Text Embeddings: A Technical Report . https:\/\/arxiv.org\/abs\/2402.05672"},{"key":"11534_CR420","first-page":"24824","volume":"35","author":"J Wei","year":"2022","unstructured":"Wei J, Wang X, Schuurmans D, Bosma M, Xia F, Chi E, Le QV, Zhou D et al (2022) Chain-of-thought prompting elicits reasoning in large language models. Adv Neural Inf Process Syst 35:24824\u201324837","journal-title":"Adv Neural Inf Process Syst"},{"key":"11534_CR421","doi-asserted-by":"crossref","unstructured":"Wei A, Haghtalab N, Steinhardt J (2024) Jailbroken: How does llm safety training fail? Advances in Neural Information Processing Systems 36","DOI":"10.52202\/075280-3508"},{"key":"11534_CR422","unstructured":"Wei J, Tay Y, Bommasani R, Raffel C, Zoph B, Borgeaud S, Yogatama D, Bosma M, Zhou D, Metzler D et al (2022) Emergent abilities of large language models. arXiv preprint arXiv:2206.07682"},{"key":"11534_CR423","unstructured":"Wei Z, Wang Y, Wang Y (2023) Jailbreak and guard aligned language models with only few in-context demonstrations. arXiv preprint arXiv:2310.06387"},{"key":"11534_CR424","unstructured":"Wei X, Wei H, Lin H, Li T, Zhang P, Ren X, Li M, Wan Y, Cao Z, Xie B et al (2023) Polylm: An open source polyglot large language model. arXiv preprint arXiv:2307.06018"},{"key":"11534_CR425","unstructured":"Wenzek G, Lachaux M-A, Conneau A, Chaudhary V, Guzm\u00e1n F, Joulin A, Grave E (2020) CCNet: Extracting high quality monolingual datasets from web crawl data. 
In: Calzolari, N., B\u00e9chet, F., Blache, P., Choukri, K., Cieri, C., Declerck, T., Goggi, S., Isahara, H., Maegaard, B., Mariani, J., Mazo, H., Moreno, A., Odijk, J., Piperidis, S. (eds.) Proceedings of the Twelfth Language Resources and Evaluation Conference, pp. 4003\u20134012. European Language Resources Association, Marseille, France . https:\/\/aclanthology.org\/2020.lrec-1.494"},{"key":"11534_CR426","doi-asserted-by":"crossref","unstructured":"Winata GI, Aji AF, Cahyawijaya S, Mahendra R, Koto F, Romadhony A, Kurniawan K, Moeljadi D, Prasojo RE, Fung P, Baldwin T, Lau JH, Sennrich R, Ruder S (2023) NusaX: Multilingual Parallel Sentiment Dataset for 10 Indonesian Local Languages","DOI":"10.18653\/v1\/2023.eacl-main.57"},{"key":"11534_CR427","doi-asserted-by":"crossref","unstructured":"Winata GI, Cahyawijaya S, Liu Z, Lin Z, Madotto A, Fung P (2021) Are multilingual models effective in code-switching? In: Proceedings of the Fifth Workshop on Computational Approaches to Linguistic Code-Switching, pp. 142\u2013153","DOI":"10.18653\/v1\/2021.calcs-1.20"},{"key":"11534_CR428","unstructured":"Winata GI, Huang L-K, Vadlamannati S, Chandarana Y (2023) Multilingual Few-Shot Learning via Language Model Retrieval"},{"key":"11534_CR429","unstructured":"Wu D, Wang S, Liu Y, Liu N (2024) LLMs Can Defend Themselves Against Jailbreaking in a Practical Manner: A Vision Paper"},{"key":"11534_CR430","doi-asserted-by":"crossref","unstructured":"Wu M, Li Y, Zhang M, Li L, Haffari G, Liu Q (2021) Uncertainty-aware balancing for multilingual and multi-domain neural machine translation training. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 7291\u20137305","DOI":"10.18653\/v1\/2021.emnlp-main.580"},{"key":"11534_CR431","unstructured":"Wu S, Irsoy O, Lu S, Dabravolski V, Dredze M, Gehrmann S, Kambadur P, Rosenberg D, Mann G (2023) Bloomberggpt: A large language model for finance. 
arXiv preprint arXiv:2303.17564"},{"key":"11534_CR432","unstructured":"Wu C, Zhang X, Zhang Y, Wang Y, Xie W (2023) Pmc-llama: Further finetuning llama on medical papers. arXiv preprint arXiv:2304.14454"},{"key":"11534_CR433","unstructured":"Wynter A, Watts I, Alt\u0131ntoprak NE, Wongsangaroonsri T, Zhang M, Farra N, Baur L, Claudet S, Gajdusek P, G\u00f6ren C et\u00a0al (2024) Rtp-lx: Can llms evaluate toxicity in multilingual scenarios? arXiv preprint arXiv:2404.14397"},{"key":"11534_CR434","doi-asserted-by":"crossref","unstructured":"Xiao S, Liu Z, Zhang P, Xing X (2024) LM-cocktail: Resilient tuning of language models via model merging. In: Ku, L.-W., Martins, A., Srikumar, V. (eds.) Findings of the Association for Computational Linguistics ACL 2024, pp. 2474\u20132488. Association for Computational Linguistics, Bangkok, Thailand and virtual meeting . https:\/\/doi.org\/10.18653\/v1\/2024.findings-acl.145 . https:\/\/aclanthology.org\/2024.findings-acl.145","DOI":"10.18653\/v1\/2024.findings-acl.145"},{"issue":"12","key":"11534_CR435","doi-asserted-by":"publisher","first-page":"1486","DOI":"10.1038\/s42256-023-00765-8","volume":"5","author":"Y Xie","year":"2023","unstructured":"Xie Y, Yi J, Shao J, Curl J, Lyu L, Chen Q, Xie X, Wu F (2023) Defending chatgpt against jailbreak attack via self-reminders. Nat Mach Intell 5(12):1486\u20131496","journal-title":"Nat Mach Intell"},{"key":"11534_CR436","doi-asserted-by":"crossref","unstructured":"Xie Y, Fang M, Pi R, Gong N (2024) Gradsafe: detecting unsafe prompts for llms via safety-critical gradient analysis","DOI":"10.18653\/v1\/2024.acl-long.30"},{"key":"11534_CR437","doi-asserted-by":"crossref","unstructured":"Xiong C, Qi X, Chen P-Y, Ho T-Y (2024) Defensive prompt patch: A robust and interpretable defense of llms against jailbreak attacks. 
arXiv preprint arXiv:2405.20099","DOI":"10.18653\/v1\/2025.findings-acl.23"},{"key":"11534_CR438","unstructured":"Xiong H, Wang S, Zhu Y, Zhao Z, Liu Y, Wang Q, Shen D (2023) Doctorglm: Fine-tuning your chinese doctor is not a herculean task. arXiv preprint arXiv:2304.01097"},{"key":"11534_CR439","doi-asserted-by":"crossref","unstructured":"Xu N, Wang F, Zhou B, Li BZ, Xiao C, Chen M (2023) Cognitive overload: Jailbreaking large language models with overloaded logical thinking. arXiv preprint arXiv:2311.09827","DOI":"10.18653\/v1\/2024.findings-naacl.224"},{"key":"11534_CR440","doi-asserted-by":"crossref","unstructured":"Xu Y, Hu L, Zhao J, Qiu Z, Ye Y, Gu H (2024) A survey on multilingual large language models: Corpora, alignment, and bias. arXiv preprint arXiv:2404.00929","DOI":"10.1007\/s11704-024-40579-4"},{"key":"11534_CR441","doi-asserted-by":"crossref","unstructured":"Xu S, Dong W, Guo Z, Wu X, Xiong D (2024) Exploring Multilingual Human Value Concepts in Large Language Models: Is Value Alignment Consistent, Transferable and Controllable across Languages?","DOI":"10.18653\/v1\/2024.findings-emnlp.96"},{"key":"11534_CR442","first-page":"291","volume":"10","author":"L Xue","year":"2022","unstructured":"Xue L, Barua A, Constant N, Al-Rfou R, Narang S, Kale M, Roberts A, Raffel C (2022) Byt5: towards a token-free future with pre-trained byte-to-byte models. Trans Assoc Comput Ling 10:291\u2013306","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR443","doi-asserted-by":"crossref","unstructured":"Xue L, Constant N, Roberts A, Kale M, Al-Rfou R, Siddhant A, Barua A, Raffel C (2020) mt5: A massively multilingual pre-trained text-to-text transformer. arXiv preprint arXiv:2010.11934","DOI":"10.18653\/v1\/2021.naacl-main.41"},{"key":"11534_CR444","doi-asserted-by":"crossref","unstructured":"Yan B, Li K, Xu M, Dong Y, Zhang Y, Ren Z, Cheng X (2024) On protecting the data privacy of large language models (llms): A survey. 
arXiv preprint arXiv:2403.05156","DOI":"10.1109\/ICMC60390.2024.00008"},{"key":"11534_CR445","doi-asserted-by":"crossref","unstructured":"Yang E, Lawrie D, Mayfield J, Oard DW, Miller S (2024) Translate-distill: Learning cross-language dense retrieval by translation and distillation. Advances in Information Retrieval: 46th European Conference on Information Retrieval. ECIR 2024, Glasgow, UK, March 24\u201328, 2024, Proceedings, Part II. Springer, Berlin, Heidelberg, pp 50\u201365","DOI":"10.1007\/978-3-031-56060-6_4"},{"key":"11534_CR446","doi-asserted-by":"publisher","unstructured":"Yang E, Lawrie D, Mayfield J (2024) Distillation for multilingual information retrieval. In: Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201924, pp. 2368\u20132373. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3626772.3657955","DOI":"10.1145\/3626772.3657955"},{"key":"11534_CR447","unstructured":"Yang W, Li C, Zhang J, Zong C (2023) Bigtrans: Augmenting large language models with multilingual translation capability over 100 languages. arXiv preprint arXiv:2305.18098"},{"key":"11534_CR448","doi-asserted-by":"crossref","unstructured":"Yang Y, Zhang Y, Tar C, Baldridge J (2019) PAWS-X: A cross-lingual adversarial dataset for paraphrase identification. In: Inui, K., Jiang, J., Ng, V., Wan, X. (eds.) Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 3687\u20133692. Association for Computational Linguistics, Hong Kong, China . https:\/\/doi.org\/10.18653\/v1\/D19-1382 . https:\/\/aclanthology.org\/D19-1382","DOI":"10.18653\/v1\/D19-1382"},{"key":"11534_CR449","unstructured":"Yang Z, Li L, Lin K, Wang J, Lin C-C, Liu Z, Wang L (2023) The dawn of lmms: Preliminary explorations with gpt-4v (ision). 
arXiv preprint arXiv:2309.17421 9(1), 1"},{"key":"11534_CR450","unstructured":"Yang A, Li A, Yang B, Zhang B, Hui B, Zheng B, Yu B, Gao C, Huang C, Lv C et al (2025) Qwen3 technical report. arXiv preprint arXiv:2505.09388"},{"key":"11534_CR451","doi-asserted-by":"crossref","unstructured":"Yang J, Yin Y, Ma S, Huang H, Zhang D, Li Z, Wei F (2021) Multilingual agreement for multilingual neural machine translation. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 2: Short Papers), pp. 233\u2013239","DOI":"10.18653\/v1\/2021.acl-short.31"},{"key":"11534_CR452","doi-asserted-by":"crossref","unstructured":"Yang Y, Duan H, Abbasi A, Lalor JP, Tam KY (2025) Bias a-head? analyzing bias in transformer-based language model attention heads. In: Proceedings of the 5th Workshop on Trustworthy NLP (TrustNLP 2025), pp. 276\u2013290","DOI":"10.18653\/v1\/2025.trustnlp-main.18"},{"key":"11534_CR453","doi-asserted-by":"crossref","unstructured":"Yang H, Liu X-Y, Wang CD (2023) Fingpt: Open-source financial large language models. arXiv preprint arXiv:2306.06031","DOI":"10.2139\/ssrn.4489826"},{"key":"11534_CR454","unstructured":"Yang A, Xiao B, Wang B, Zhang B, Bian C, Yin C, Lv C, Pan D, Wang D, Yan D et al (2023) Baichuan 2: Open large-scale language models. arXiv preprint arXiv:2309.10305"},{"key":"11534_CR455","unstructured":"Yang Y, Tang Y, Tam KY (2023) Investlm: A large language model for investment using financial domain instruction tuning. arXiv preprint arXiv:2309.13064"},{"key":"11534_CR456","doi-asserted-by":"crossref","unstructured":"Yang K, Zhang T, Kuang Z, Xie Q, Ananiadou S (2023) Mentalllama: Interpretable mental health analysis on social media with large language models. 
arXiv preprint arXiv:2309.13567","DOI":"10.18653\/v1\/2023.emnlp-main.370"},{"key":"11534_CR457","doi-asserted-by":"crossref","unstructured":"Yao Y, Duan J, Xu K, Cai Y, Sun Z, Zhang Y (2024) A survey on large language model (llm) security and privacy: The good, the bad, and the ugly. High-Confidence Computing, 100211","DOI":"10.1016\/j.hcc.2024.100211"},{"key":"11534_CR458","unstructured":"Yeh K-C, Chi J-A, Lian D-C, Hsieh S-K (2023) Evaluating interfaced llm bias. In: Proceedings of the 35th Conference on Computational Linguistics and Speech Processing (ROCLING 2023), pp. 292\u2013299"},{"key":"11534_CR459","doi-asserted-by":"publisher","first-page":"4913","DOI":"10.18653\/v1\/2021.findings-acl.435","volume":"2021","author":"W Yin","year":"2021","unstructured":"Yin W, Radev D, Xiong C (2021) Docnli: a large-scale dataset for document-level natural language inference. Find Assoc Comput Ling ACL-IJCNLP 2021:4913\u20134922","journal-title":"Find Assoc Comput Ling ACL-IJCNLP"},{"key":"11534_CR460","doi-asserted-by":"crossref","unstructured":"Yin D, Bansal H, Monajatipoor M, Li LH, Chang K-W (2022) GeoMLAMA: Geo-Diverse Commonsense Probing on Multilingual Pre-Trained Language Models","DOI":"10.18653\/v1\/2022.emnlp-main.132"},{"key":"11534_CR461","unstructured":"Yong Z-X, Menghini C, Bach SH (2023) Low-resource languages jailbreak gpt-4. arXiv preprint arXiv:2310.02446"},{"key":"11534_CR462","unstructured":"Yu F, Zhang H, Wang B (2023) Nature language reasoning, a survey. arXiv preprint arXiv:2303.14725"},{"key":"11534_CR463","unstructured":"Yu J, Lin X, Yu Z, Xing X (2023) GPTFUZZER: Red Teaming Large Language Models with Auto-Generated Jailbreak Prompts"},{"key":"11534_CR464","unstructured":"Yu J, Zhu J, Wang Y, Liu Y, Chang H, Nie J, Kong C, Chong R, XinLiu An J, Lu L, Fang M, Zhu L (2023) Taoli Llama. GitHub"},{"key":"11534_CR465","doi-asserted-by":"crossref","unstructured":"Yu J, Kim SU, Choi J, Choi JD (2024) What is your favorite gender, mlm? 
gender bias evaluation in multilingual masked language models. arXiv preprint arXiv:2404.06621","DOI":"10.3390\/info15090549"},{"key":"11534_CR466","unstructured":"Yuan Y, Jiao W, Wang W, Huang J-t, He P, Shi S, Tu Z (2024) GPT-4 Is Too Smart To Be Safe: Stealthy Chat with LLMs via Cipher"},{"key":"11534_CR467","unstructured":"Yue S, Chen W, Wang S, Li B, Shen C, Liu S, Zhou Y, Xiao Y, Yun S, Huang X, Wei Z (2023) DISC-LawLLM: Fine-tuning Large Language Models for Intelligent Legal Services"},{"key":"11534_CR468","unstructured":"Yunxiang L, Zihan L, Kai Z, Ruilong D, You Z (2023) Chatdoctor: A medical chat model fine-tuned on llama model using medical domain knowledge. arXiv preprint arXiv:2303.14070"},{"key":"11534_CR469","unstructured":"ZHIPU: Zhipu ai devday glm-4 (2024)"},{"key":"11534_CR470","first-page":"19488","volume":"38","author":"J Zeng","year":"2024","unstructured":"Zeng J, Meng F, Yin Y, Zhou J (2024) Teaching large language models to translate with comparison. Proceed AAAI Conf Artif Intell 38:19488\u201319496","journal-title":"Proceed AAAI Conf Artif Intell"},{"key":"11534_CR471","doi-asserted-by":"crossref","unstructured":"Zeng Y, Lin H, Zhang J, Yang D, Jia R, Shi W (2024) How johnny can persuade llms to jailbreak them: Rethinking persuasion to challenge ai safety by humanizing llms. In: Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 14322\u201314350","DOI":"10.18653\/v1\/2024.acl-long.773"},{"key":"11534_CR472","unstructured":"Zeng A, Liu X, Du Z, Wang Z, Lai H, Ding M, Yang Z, Xu Y, Zheng W, Xia X et al (2022) Glm-130b: An open bilingual pre-trained model. 
arXiv preprint arXiv:2210.02414"},{"key":"11534_CR473","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1016\/j.aiopen.2021.12.003","volume":"2","author":"Z Zhang","year":"2021","unstructured":"Zhang Z, Gu Y, Han X, Chen S, Xiao C, Sun Z, Yao Y, Qi F, Guan J, Ke P et al (2021) Cpm-2: large-scale cost-effective pre-trained language models. AI Open 2:216\u2013224","journal-title":"AI Open"},{"key":"11534_CR474","doi-asserted-by":"publisher","first-page":"1114","DOI":"10.1162\/tacl_a_00595","volume":"11","author":"X Zhang","year":"2023","unstructured":"Zhang X, Thakur N, Ogundepo O, Kamalloo E, Alfonso-Hermelo D, Li X, Liu Q, Rezagholizadeh M, Lin J (2023) MIRACL: a multilingual retrieval dataset covering 18 diverse languages. Trans Assoc Comput Ling 11:1114\u20131131. https:\/\/doi.org\/10.1162\/tacl_a_00595","journal-title":"Trans Assoc Comput Ling"},{"key":"11534_CR475","unstructured":"Zhang X, Hofst\u00e4tter S, Lewis P, Tang R, Lin J (2023) Rank-without-GPT: Building GPT-Independent Listwise Rerankers on Open-Source Large Language Models . https:\/\/arxiv.org\/abs\/2312.02969"},{"key":"11534_CR476","unstructured":"Zhang X, Thakur N, Ogundepo O, Kamalloo E, Alfonso-Hermelo D, Li X, Liu Q, Rezagholizadeh M, Lin J (2022) Making a MIRACL: Multilingual Information Retrieval Across a Continuum of Languages"},{"key":"11534_CR477","unstructured":"Zhang S, Fang Q, Zhang Z, Ma Z, Zhou Y, Huang L, Bu M, Gui S, Chen Y, Chen X et al (2023) Bayling: Bridging cross-lingual alignment and instruction following through interactive translation for large language models. arXiv preprint arXiv:2306.10968"},{"key":"11534_CR478","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wang Y, Liu Z, Wang S, Wang X, Li P, Sun M, Liu Y (2024) Enhancing multilingual capabilities of large language models through self-distillation from resource-rich languages. 
arXiv preprint arXiv:2402.12204","DOI":"10.18653\/v1\/2024.acl-long.603"},{"key":"11534_CR479","doi-asserted-by":"crossref","unstructured":"Zhang W, Aljunied SM, Gao C, Chia YK, Bing L (2023) M3Exam: A Multilingual. Multimodal, Multilevel Benchmark for Examining Large Language Models","DOI":"10.52202\/075280-0240"},{"key":"11534_CR480","doi-asserted-by":"crossref","unstructured":"Zhang Z, Liu Y, Huang W, Mao J, Wang R, Hu H (2024) MELA: Multilingual Evaluation of Linguistic Acceptability","DOI":"10.18653\/v1\/2024.acl-long.146"},{"key":"11534_CR481","doi-asserted-by":"crossref","unstructured":"Zhang B, Williams P, Titov I, Sennrich R (2020) Improving massively multilingual neural machine translation and zero-shot translation. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 1628\u20131639","DOI":"10.18653\/v1\/2020.acl-main.148"},{"key":"11534_CR482","doi-asserted-by":"crossref","unstructured":"Zhang C, D\u2019Haro L, Tang C, Shi K, Tang G, Li H (2023) xDial-eval: A multilingual open-domain dialogue evaluation benchmark. In: Bouamor, H., Pino, J., Bali, K. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2023, pp. 5579\u20135601. Association for Computational Linguistics, Singapore . https:\/\/doi.org\/10.18653\/v1\/2023.findings-emnlp.371 . https:\/\/aclanthology.org\/2023.findings-emnlp.371","DOI":"10.18653\/v1\/2023.findings-emnlp.371"},{"key":"11534_CR483","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wang J, Wang Z, Zhang R (2023) XSemPLR: Cross-Lingual Semantic Parsing in Multiple Natural Languages and Meaning Representations","DOI":"10.18653\/v1\/2023.acl-long.887"},{"key":"11534_CR484","unstructured":"Zhang S, Chaudhary V, Goyal N, Cross J, Wenzek G, Bansal M, Guzman F (2022) How robust is neural machine translation to language imbalance in multilingual tokenizer training? 
arXiv preprint arXiv:2204.14268"},{"key":"11534_CR485","unstructured":"Zhang Z, Zhou L, Wang C, Chen S, Wu Y, Liu S, Chen Z, Liu Y, Wang H, Li J, et al (2023) Speak foreign languages with your own voice: Cross-lingual neural codec language modeling. arXiv preprint arXiv:2303.03926"},{"key":"11534_CR486","unstructured":"Zhang S, Roller S, Goyal N, Artetxe M, Chen M, Chen S, Dewan C, Diab M, Li X, Lin XV et al (2022) Opt: Open pre-trained transformer language models. arXiv preprint arXiv:2205.01068"},{"key":"11534_CR487","doi-asserted-by":"crossref","unstructured":"Zhang X, Ma X, Shi P, Lin J (2021) Mr. TyDi: A multi-lingual benchmark for dense retrieval. In: Proceedings of the 1st Workshop on Multilingual Representation Learning, pp. 127\u2013137. Association for Computational Linguistics, Punta Cana, Dominican Republic . https:\/\/doi.org\/10.18653\/v1\/2021.mrl-1.12 . https:\/\/aclanthology.org\/2021.mrl-1.12","DOI":"10.18653\/v1\/2021.mrl-1.12"},{"key":"11534_CR488","doi-asserted-by":"publisher","unstructured":"Zhang X, Ogueji K, Ma X, Lin J (2023) Toward best practices for training multilingual dense retrieval models. ACM Trans. Inf. Syst. 42(2) https:\/\/doi.org\/10.1145\/3613447","DOI":"10.1145\/3613447"},{"key":"11534_CR489","unstructured":"Zhang X, Tian C, Yang X, Chen L, Li Z, Petzold LR (2023) AlpaCare:Instruction-tuned Large Language Models for Medical Application"},{"key":"11534_CR490","doi-asserted-by":"crossref","unstructured":"Zhang H, Chen J, Jiang F, Yu F, Chen Z, Li J, Chen G, Wu X, Zhang Z, Xiao Q, Wan X, Wang B, Li H (2023) Huatuogpt, towards taming language models to be a doctor. arXiv preprint arXiv:2305.15075","DOI":"10.18653\/v1\/2023.findings-emnlp.725"},{"key":"11534_CR491","doi-asserted-by":"crossref","unstructured":"Zhang X, Li S, Hauer B, Shi N, Kondrak G (2023) Don\u2019t trust chatgpt when your question is not in english: A study of multilingual abilities and types of llms. 
In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 7915\u20137927","DOI":"10.18653\/v1\/2023.emnlp-main.491"},{"key":"11534_CR492","doi-asserted-by":"crossref","unstructured":"Zhang W, Aljunied M, Gao C, Chia YK, Bing L (2024) M3exam: A multilingual, multimodal, multilevel benchmark for examining large language models. Advances in Neural Information Processing Systems 36","DOI":"10.52202\/075280-0240"},{"key":"11534_CR493","doi-asserted-by":"crossref","unstructured":"Zhang R, Cahyawijaya S, Cruz JCB, Winata G, Aji A (2023) Multilingual large language models are not (yet) code-switchers. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 12567\u201312582","DOI":"10.18653\/v1\/2023.emnlp-main.774"},{"key":"11534_CR494","unstructured":"Zhang M, Liu L, Yanqing Z, Qiao X, Chang S, Zhao X, Zhu J, Zhu M, Peng S, Li Y, Liu Y, Ma W, Piao M, Tao S, Yang H, Jiang Y (2023) Leveraging multilingual knowledge graph to boost domain-specific entity translation of ChatGPT. In: Yamada, M., Carmo, F. (eds.) Proceedings of Machine Translation Summit XIX, Vol. 2: Users Track, pp. 77\u201387. Asia-Pacific Association for Machine Translation, Macau SAR, China . https:\/\/aclanthology.org\/2023.mtsummit-users.7"},{"key":"11534_CR495","doi-asserted-by":"crossref","unstructured":"Zhang X, Zhang Y, Long D, Xie W, Dai Z, Tang J, Lin H, Yang B, Xie P, Huang F, Zhang M, Li W, Zhang M (2024) mGTE: Generalized Long-Context Text Representation and Reranking Models for Multilingual Text Retrieval . https:\/\/arxiv.org\/abs\/2407.19669","DOI":"10.18653\/v1\/2024.emnlp-industry.103"},{"key":"11534_CR496","unstructured":"Zhao WX, Zhou K, Li J, Tang T, Wang X, Hou Y, Min Y, Zhang B, Zhang J, Dong Z et al (2023) A survey of large language models. 
arXiv preprint arXiv:2303.18223"},{"key":"11534_CR497","doi-asserted-by":"crossref","unstructured":"Zhao J, Mukherjee S, Hosseini S, Chang K-W, Awadallah AH (2020) Gender bias in multilingual embeddings and cross-lingual transfer. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 2896\u20132907","DOI":"10.18653\/v1\/2020.acl-main.260"},{"issue":"1","key":"11534_CR498","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2379776.2379777","volume":"45","author":"D Zhou","year":"2012","unstructured":"Zhou D, Truran M, Brailsford T, Wade V, Ashman H (2012) Translation techniques in cross-language information retrieval. ACM Comput Surv (CSUR) 45(1):1\u201344","journal-title":"ACM Comput Surv (CSUR)"},{"key":"11534_CR499","unstructured":"Zhou A, Li B, Wang H (2024) Robust prompt optimization for defending language models against jailbreaking attacks. arXiv preprint arXiv:2401.17263"},{"key":"11534_CR500","unstructured":"Zhou W, Wang X, Xiong L, Xia H, Gu Y, Chai M, Zhu F, Huang C, Dou S, Xi Z et al (2024) Easyjailbreak: A unified framework for jailbreaking large language models. arXiv preprint arXiv:2403.12171"},{"key":"11534_CR501","unstructured":"Zhu Y, Yuan H, Wang S, Liu J, Liu W, Deng C, Chen H, Liu Z, Dou Z, Wen J-R (2024) Large Language Models for Information Retrieval: A Survey . https:\/\/arxiv.org\/abs\/2308.07107"},{"key":"11534_CR502","doi-asserted-by":"crossref","unstructured":"Zhuang S, Ma X, Koopman B, Lin J, Zuccon G (2024) PromptReps: Prompting Large Language Models to Generate Dense and Sparse Representations for Zero-Shot Document Retrieval . https:\/\/arxiv.org\/abs\/2404.18424","DOI":"10.18653\/v1\/2024.emnlp-main.250"},{"key":"11534_CR503","doi-asserted-by":"publisher","unstructured":"Zhuang S, Zhuang H, Koopman B, Zuccon G (2024) A setwise approach for effective and highly efficient zero-shot ranking with large language models. 
In: Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval. SIGIR \u201924, pp. 38\u201347. Association for Computing Machinery, New York, NY, USA . https:\/\/doi.org\/10.1145\/3626772.3657813","DOI":"10.1145\/3626772.3657813"},{"key":"11534_CR504","unstructured":"Zou A, Wang Z, Kolter JZ, Fredrikson M (2023) Universal and transferable adversarial attacks on aligned language models. arXiv preprint arXiv:2307.15043"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-026-11534-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-026-11534-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-026-11534-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T11:05:29Z","timestamp":1780311929000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-026-11534-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,27]]},"references-count":511,"journal-issue":{"issue":"6","published-online":{"date-parts":[[2026,6]]}},"alternative-id":["11534"],"URL":"https:\/\/doi.org\/10.1007\/s10462-026-11534-5","relation":{},"ISSN":["1573-7462"],"issn-type":[{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3,27]]},"assertion":[{"value":"11 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 February 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 
March 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no Conflict of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"146"}}