{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T03:31:06Z","timestamp":1777951866812,"version":"3.51.4"},"reference-count":54,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":31,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Procedia Computer Science"],"published-print":{"date-parts":[[2026]]},"DOI":"10.1016\/j.procs.2026.01.114","type":"journal-article","created":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T19:30:19Z","timestamp":1774035019000},"page":"464-473","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["Saudi Dialects to MSA Machine Translation: A Systematic Evaluation of LLMs"],"prefix":"10.1016","volume":"275","author":[{"given":"Ghada","family":"Alharbi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.procs.2026.01.114_bib1","article-title":"\"Dial2MSA-Verified: A Multi-Dialect Arabic Social Media Dataset for Neural Machine Translation to Modern Standard Arabic,\" in","author":"Khered","year":"2025","journal-title":"the 4th Workshop on Arabic Corpus Linguistics (WACL-4)"},{"key":"10.1016\/j.procs.2026.01.114_bib2","doi-asserted-by":"crossref","DOI":"10.63317\/2sqhrzmrh67i","article-title":"\"LLM-based MT data creation: Dialectal to MSA translation shared task,\" in","author":"Abdelaziz","year":"2024","journal-title":"The 6th Workshop on Open-Source Arabic Corpora and Processing Tools (OSACT) @ LREC-COLING"},{"key":"10.1016\/j.procs.2026.01.114_bib3","doi-asserted-by":"crossref","unstructured":"Alanazi et al., \"The Saudi Arabic dialects game localization dataset,\" Data in Brief, 2025.","DOI":"10.1016\/j.dib.2025.111906"},{"key":"10.1016\/j.procs.2026.01.114_bib4","unstructured":"Bouamor et al., \"The MADAR Arabic Dialect Corpus and Lexicon,\" in 11th Int. Conf. on Language Resources and Evaluation (LREC), Miyazaki, Japan, 2018."},{"key":"10.1016\/j.procs.2026.01.114_bib5","doi-asserted-by":"crossref","unstructured":"Alabdullah, et al., \"Advancing dialectal Arabic to modern standard Arabic machine translation.,\" arXiv preprint, 2025.","DOI":"10.21203\/rs.3.rs-7510599\/v1"},{"issue":"2","key":"10.1016\/j.procs.2026.01.114_bib6","doi-asserted-by":"crossref","first-page":"325","DOI":"10.1080\/00437956.1959.11659702","article-title":"\"Diglossia\u201c\"","volume":"15","author":"Ferguson","year":"1959","journal-title":"Word"},{"key":"10.1016\/j.procs.2026.01.114_bib7","article-title":"\"A Reference Grammar of Modern Standard Arabic,\"","author":"Ryding","year":"2005","journal-title":"Cambridge: Cambridge University Press"},{"key":"10.1016\/j.procs.2026.01.114_bib8","article-title":"\u201cIntroduction to Arabic Natural Language Processing, Synthesis Lectures on Human Language Technologies,\u201d","author":"Habash","year":"2010","journal-title":"San Rafael, CA; Morgan & Claypool"},{"key":"10.1016\/j.procs.2026.01.114_bib9","unstructured":"Bouamor, et al. \"A Multidialectal Parallel Corpus of Arabic,\" in 9th Int. Conf. on Language Resources and Evaluation (LREC), Reykjavik, Iceland, 2014."},{"issue":"3","key":"10.1016\/j.procs.2026.01.114_bib10","first-page":"215","article-title":"\"Regional Variation in Saudi Arabian Arabic: A Sociolinguistic Perspective,\"","volume":"31","author":"Alghamdi","year":"2019","journal-title":"Journal of King Saud University\u2013Languages and Translation"},{"key":"10.1016\/j.procs.2026.01.114_bib11","unstructured":"Alameri et al., \"Natural Language Processing for Dialectical Arabic: A Survey,\" Journal of King Saud University\u2013Computer and Information Sciences, vol. 33, no. 4, p. 401\u2013414, 2021."},{"key":"10.1016\/j.procs.2026.01.114_bib12","unstructured":"A. Pasha, \"MADAMIRA: A fast, comprehensive tool for morphological analysis and disambiguation of Arabic,\" in 9th Int. Conf. on Language Resources and Evaluation (LREC), Reykjavik, Iceland\u201c 2014."},{"key":"10.1016\/j.procs.2026.01.114_bib13","unstructured":"Obeid et al., \"CAMeL Tools: An Open Source Python Toolkit for Arabic Natural Language Processing,\" in the 12th Language Resources and Evaluation Conference (LREC), Marseille, France, 2020."},{"key":"10.1016\/j.procs.2026.01.114_bib14","doi-asserted-by":"crossref","unstructured":"Abdelali et al., \"Farasa: A fast and furious segmenter for Arabic.,\" in the North American Chapter of the Association for Computational Linguis- tics (NAACL), San Diego, California, 2016.","DOI":"10.18653\/v1\/N16-3003"},{"key":"10.1016\/j.procs.2026.01.114_bib15","article-title":"\"AraT5: Text-to-text transformers for Arabic language generation,\"","author":"Nagoudi","year":"2021","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib16","article-title":"\"mT5: A Massively Multilingual Pre-trained Text-to-Text Transformer,\" in","author":"Xue","year":"2021","journal-title":"EMNLP"},{"key":"10.1016\/j.procs.2026.01.114_bib17","article-title":"\"Exploring GPT-4 for Arabic Dialect Machine Translation,\"","author":"Alhoshan","year":"2025","journal-title":"Frontiers in AI"},{"key":"10.1016\/j.procs.2026.01.114_bib18","article-title":"\"Allam: Large language models for arabic and english,\"","author":"Bari","year":"2024","journal-title":"arXiv preprint arXiv:"},{"key":"10.1016\/j.procs.2026.01.114_bib19","article-title":"\"The interplay of variant, size, and task type in Arabic pre-trained language models,\"","author":"Inoue","year":"2021","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib20","first-page":"Online","article-title":"\"ARBERT & MARBERT: Deep Bidirectional Transformers for Arabic,\" in","author":"Abdul-Mageed","year":"2021","journal-title":"the 11th International Joint Conference on Natural Language Processing (ACL-IJCNLP)"},{"key":"10.1016\/j.procs.2026.01.114_bib21","article-title":"\"SaudiBERT: A Large Language Model Pretrained on Saudi Dialect Corpora,\"","author":"Qarah","year":"2024","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib22","article-title":"\"Egybert: A large language model pretrained on egyptian dialect corpora,\"","author":"Qarah","year":"2024","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib23","article-title":"\"AraT5-MSAizer: Dialectal Arabic to MSA Machine Translation Using Pre-trained T5 Models,\" in","author":"S. A.","year":"2024","journal-title":"the WANLP"},{"key":"10.1016\/j.procs.2026.01.114_bib24","doi-asserted-by":"crossref","unstructured":"M. Fares, \"AraT5-MSAizer: Translating Dialectal Arabic to MSA,\" in he 6th Workshop on Open-Source Arabic Corpora and Processing Tools (OSACT), Torino, Italia., 2024.","DOI":"10.63317\/26nxp6cqn8q2"},{"key":"10.1016\/j.procs.2026.01.114_bib25","unstructured":"C. e. a. Raffel, \"Exploring the limits of transfer learning with a unified text-to-text transforme,\"Journal of machine learning research,2020."},{"key":"10.1016\/j.procs.2026.01.114_bib26","article-title":"\"Gpt-4 technical report,\"","author":"Achiam","year":"2023","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib27","article-title":"\"\u201cPrompting Multilingual Large Language Models for Low-Resource Arabic NLP,\u201d,\"","author":"S. L.","year":"2023","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib28","article-title":"\"\u201cAdapting Arabic Large Language Models with Prompt-Tuning and Few-Shot Learning,\u201d,\" in","author":"B. A.","year":"2023","journal-title":"WANLP"},{"key":"10.1016\/j.procs.2026.01.114_bib29","article-title":"\"\u201cParameter-Efficient Fine-Tuning for Arabic Dialectal NLP: A Comparative Study of LoRA and Full Fine-Tuning,\u201d,\"","volume":"78","author":"HAlSalman","year":"2024","journal-title":"Journal of Artificial Intelligence Research\u201c"},{"issue":"1","key":"10.1016\/j.procs.2026.01.114_bib30","first-page":"39-49","article-title":"\"A method to convert Sana\u2019ani accent to Modern Standard Arabic.,\"","volume":"8","author":"Al-Gaphari","year":"2010","journal-title":"IJISM"},{"key":"10.1016\/j.procs.2026.01.114_bib31","article-title":"\"Elissa: A dialectal to standard Arabic machine translation system,\" in","author":"Salloum","year":"2012","journal-title":"Proceedings of COLING"},{"key":"10.1016\/j.procs.2026.01.114_bib32","article-title":"\"Transforming standard Arabic to colloquial Arabic\"","author":"Mohamed","year":"2012","journal-title":"The 50th ACL"},{"key":"10.1016\/j.procs.2026.01.114_bib33","article-title":"\"Dialectal to standard Arabic paraphrasing to improve Arabic-English statistical machine translation,\"","author":"Salloum","year":"2011","journal-title":"the first workshop on algorithms and resources for modelling of dialects and language varieties"},{"key":"10.1016\/j.procs.2026.01.114_bib34","article-title":"\"PADIC: extension and new experiments,\" in","author":"Meftouh","year":"2018","journal-title":"7th International Conference on Advanced Technologies (ICAT)"},{"key":"10.1016\/j.procs.2026.01.114_bib35","article-title":"\"A hybrid approach to translate Moroccan Arabic dialect.,\" in","author":"Tachicart","year":"2014","journal-title":"The 9th International Conference on Intelligent Systems: Theories and Applications (SITA-14)"},{"key":"10.1016\/j.procs.2026.01.114_bib36","doi-asserted-by":"crossref","DOI":"10.63317\/2jsust5deuro","article-title":"\"Osact6 dialect to msa translation shared task overview.,\" in","author":"Elneima","year":"2024","journal-title":"The 6th Workshop on Open-Source Arabic Corpora and Processing Tools (OSACT). LREC-COLING"},{"key":"10.1016\/j.procs.2026.01.114_bib37","doi-asserted-by":"crossref","unstructured":"S. Alahmari, \"Sirius_Translators at OSACT6 2024 Shared Task: Fine tuning Ara-T5 Models for Translating Arabic Dialectal Text to Modern Standard Arabic,\" in The 6th OSACT workshop @ LREC-COLING, Torino, Italia., 2024.","DOI":"10.63317\/59fi88he3h8x"},{"key":"10.1016\/j.procs.2026.01.114_bib38","article-title":"\"Attention is all you need.,\"","volume":"30","author":"Vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"10.1016\/j.procs.2026.01.114_bib39","article-title":"\"NADI 2023: The fourth nuanced Arabic dialect identification shared task,\"","author":"Abdul-Mageed","year":"2023","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib40","article-title":"\"Sada: Saudi audio dataset for arabic,\" in","author":"Alharbi","year":"2024","journal-title":"ICASSP"},{"key":"10.1016\/j.procs.2026.01.114_bib41","doi-asserted-by":"crossref","first-page":"726","DOI":"10.1162\/tacl_a_00343","article-title":"\"Multilingual denoising pre-training for neural machine translation,\"","volume":"8","author":"Liu","year":"2020","journal-title":"Transactions of the Association for Computational Linguistics"},{"key":"10.1016\/j.procs.2026.01.114_bib42","first-page":"27730","article-title":"\"Training language models to follow instructions with human feedback,\"","volume":"35","author":"Ouyang","year":"2022","journal-title":"Advances in neural information processing system"},{"key":"10.1016\/j.procs.2026.01.114_bib43","article-title":"\"Osact 2024 task 2: Arabic dialect to msa translation.,\" in","author":"H. A.","year":"2024","journal-title":"the 6th Workshop on Open- Source Arabic Corpora and Processing Tools, LREC"},{"key":"10.1016\/j.procs.2026.01.114_bib44","unstructured":"Touvron et al., \"Llama: Open and efficient foundation language models,\" arXiv preprint, 2023."},{"key":"10.1016\/j.procs.2026.01.114_bib45","article-title":"\"Deepseek-v3 technical report,\"","author":"Liu","year":"2024","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib46","article-title":"\"Saudi-Dialect-ALLaM: LoRA Fine-Tuning for Dialectal Arabic Generation,\"","author":"Barmandah","year":"2025","journal-title":"arXiv preprint"},{"key":"10.1016\/j.procs.2026.01.114_bib47","article-title":"\"Lora: Low-rank adaptation of large language models,\" in","author":"Hu","year":"2022","journal-title":"ICLR"},{"key":"10.1016\/j.procs.2026.01.114_bib48","unstructured":"Ohalete et al., \"COSTAR-A: A prompting framework for enhancing Large Language Model performance on Point-of-View questions.,\" 2025."},{"key":"10.1016\/j.procs.2026.01.114_bib49","article-title":"\"Rolellm: Benchmarking, eliciting, and enhancing role-playing abilities of large language models,\"","author":"Wang","year":"2023","journal-title":"preprint arXiv"},{"key":"10.1016\/j.procs.2026.01.114_bib50","article-title":"\"BLEU: A Method for Automatic Evaluation of Machine Translation,\" in","author":"ePapineni","year":"2002","journal-title":"The 40th Annual Meeting Association of Computational Linguistics (ACL)"},{"key":"10.1016\/j.procs.2026.01.114_bib51","article-title":"\"A Study of Translation Edit Rate with Targeted Human Annotation,\" in","author":"M. S.","year":"2006","journal-title":"The 7th Conference Association Machchine Translatiion Americas (AMTA)"},{"key":"10.1016\/j.procs.2026.01.114_bib52","article-title":"\"The METEOR metric for automatic evaluation of machine translation.\",\" in","author":"Lavie","year":"2009","journal-title":"Machine translation"},{"key":"10.1016\/j.procs.2026.01.114_bib53","article-title":"\"COMET: A neural framework for MT evaluation.,\" in","author":"Rei","year":"2020","journal-title":"arXiv preprint arXiv"},{"key":"10.1016\/j.procs.2026.01.114_bib54","article-title":"\"A Human Judgement Corpus and a Metric for Arabic MT Evaluation,\" in","author":"Salloum","year":"2014","journal-title":"the 52nd ACL"}],"container-title":["Procedia Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1877050926001158?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1877050926001158?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T11:14:15Z","timestamp":1777893255000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1877050926001158"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":54,"alternative-id":["S1877050926001158"],"URL":"https:\/\/doi.org\/10.1016\/j.procs.2026.01.114","relation":{},"ISSN":["1877-0509"],"issn-type":[{"value":"1877-0509","type":"print"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Saudi Dialects to MSA Machine Translation: A Systematic Evaluation of LLMs","name":"articletitle","label":"Article Title"},{"value":"Procedia Computer Science","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.procs.2026.01.114","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 The Author(s). Published by Elsevier B.V.","name":"copyright","label":"Copyright"}]}}