{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T17:50:20Z","timestamp":1776275420924,"version":"3.50.1"},"reference-count":95,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"Defense Research and Development Organization (DRDO), New Delhi, through the Extramural Research and Intellectual Property Rights (ER&IPR) Project Fund","award":["ERIP\/ER\/202308002\/M\/01\/1834"],"award-info":[{"award-number":["ERIP\/ER\/202308002\/M\/01\/1834"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2025]]},"DOI":"10.1109\/access.2025.3570699","type":"journal-article","created":{"date-parts":[[2025,5,16]],"date-time":"2025-05-16T17:46:01Z","timestamp":1747417561000},"page":"89775-89810","source":"Crossref","is-referenced-by-count":4,"title":["A Novel Approach to Continual Knowledge Transfer in Multilingual Neural Machine Translation Using Autoregressive and Non-Autoregressive Models for Indic Languages"],"prefix":"10.1109","volume":"13","author":[{"given":"Shailashree K.","family":"Sheshadri","sequence":"first","affiliation":[{"name":"Department of Computer Science and Engineering, Amrita School of Computing, Bengaluru, Amrita Vishwa Vidyapeetham, India"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1041-5125","authenticated-orcid":false,"given":"Deepa","family":"Gupta","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, Amrita School of Computing, Bengaluru, Amrita Vishwa Vidyapeetham, India"}]},{"given":"Biswajit","family":"Paul","sequence":"additional","affiliation":[{"name":"Centre for Artificial Intelligence and Robotics, DRDO, CV Raman Nagar, Bangalore, India"}]},{"given":"J. Siva","family":"Bhavani","sequence":"additional","affiliation":[{"name":"Centre for Artificial Intelligence and Robotics, DRDO, CV Raman Nagar, Bangalore, India"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1101"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1388"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.304"},{"issue":"1","key":"ref4","first-page":"4839","article-title":"Beyond english-centric multilingual machine translation","volume":"22","author":"Fan","year":"2020","journal-title":"J. Mach. Learn. Res."},{"key":"ref5","article-title":"No language left behind: Scaling human-centered machine translation","author":"Team","year":"2022","journal-title":"arXiv:2207.04672"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.616"},{"key":"ref7","article-title":"GPT-4 technical report","volume-title":"arXiv:2303.08774","author":"Achiam","year":"2023"},{"key":"ref8","article-title":"The llama 3 herd of models","author":"Grattafiori","year":"2024","journal-title":"arXiv:2407.21783"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.852"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.720"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-emnlp.953"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-emnlp.826"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.339"},{"issue":"1","key":"ref14","first-page":"11324","article-title":"PaLM: Scaling language modeling with pathways","volume":"24","author":"Chowdhery","year":"2023","journal-title":"J. Mach. Learn. Res."},{"key":"ref15","article-title":"Bloom: A 176B-parameter open-access multilingual language model","author":"Workshop","year":"2022","journal-title":"arXiv:2211.05100"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.656"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.448"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1209"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.111"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.736"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.860"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3430984.3431026"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.loresmt-1.4"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.693"},{"key":"ref25","article-title":"MuRIL: Multilingual representations for Indian languages","author":"Khanuja","year":"2021","journal-title":"arXiv:2103.10730"},{"key":"ref26","article-title":"IndicTrans2: Towards high-quality and accessible machine translation models for all 22 scheduled Indian languages","author":"Bharat","year":"2023","journal-title":"Trans. Mach. Learn. Res."},{"key":"ref27","article-title":"Understanding the role of FFNs in driving multilingual behaviour in LLMs","author":"Bhattacharya","year":"2024","journal-title":"arXiv:2404.13855"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2024.3451977"},{"key":"ref29","article-title":"Non-autoregressive neural machine translation","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Gu"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i05.6413"},{"key":"ref31","article-title":"Switch-GLAT: Multilingual parallel machine translation via code-switch decoder","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Song"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.12007"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3567592"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.13566"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2023.01.242"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3716629"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3735633"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.wmt-1.74"},{"key":"ref39","first-page":"91","article-title":"Multilingual continual learning using attention distillation","volume-title":"Proc. 31st Int. Conf. Comput. Linguistics, Ind. Track","author":"Agrawal"},{"key":"ref40","article-title":"How do LLMs acquire new knowledge? A knowledge circuits perspective on continual pre-training","author":"Ou","year":"2025","journal-title":"arXiv:2502.11196"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.75"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.250"},{"key":"ref43","first-page":"177","article-title":"Exploring the benefits and limitations of multilinguality for non-autoregressive machine translation","volume-title":"Proc. 7th Conf. Mach. Transl. (WMT)","author":"Agrawal"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-ijcnlp.14"},{"key":"ref45","author":"Alessandro","year":"2024","journal-title":"Continualnat: Continual Learning for Nonautoregressive Translation"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1162\/coli_a_00446"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.766"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.43"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/ijcnn52387.2021.9534401"},{"key":"ref50","article-title":"Continual pre-training mitigates forgetting in language and vision","volume":"179","author":"Cossu","year":"2024","journal-title":"Proc. Neural Netw."},{"key":"ref51","article-title":"Massively multilingual text translation for low-resource languages","author":"Zhou","year":"2024","journal-title":"arXiv:2401.16582"},{"key":"ref52","first-page":"96","article-title":"Zero-shot neural machine translation with self-learning cycle","volume-title":"Proc. 4th Workshop Technol. MT Low Resource Lang. (LoResMT)","author":"Lakew"},{"issue":"1","key":"ref53","first-page":"10185","article-title":"An empirical investigation of the role of pre-training in lifelong learning","volume":"24","author":"Mehta","year":"2023","journal-title":"J. Mach. Learn. Res."},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.310"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.143"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.77"},{"key":"ref57","first-page":"188","article-title":"Few-shot regularization to tackle catastrophic forgetting in multilingual machine translation","volume-title":"Proc. 15th Biennial Conf. Assoc. Mach. Transl. Americas","author":"Carri\u00f3n"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.93"},{"key":"ref59","first-page":"542","article-title":"Continual learning in multilingual NMT via languagespecific embeddings","volume-title":"Proc. 6th Conf. Mach. Transl.","author":"B\u00e9rard"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-2033"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.10"},{"key":"ref62","first-page":"287","article-title":"Adapting large multilingual machine translation models to unseen low resource languages via vocabulary substitution and neuron selection","volume-title":"Proc. 15th biennial Conf. Assoc. Mach. Transl. Americas","author":"Abdelghaffar"},{"key":"ref63","article-title":"Extending multilingual machine translation through imitation learning","author":"Lai","year":"2023","journal-title":"arXiv:2311.08538"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1145\/3652026"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.127115"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1145\/3587932"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-acl.145"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.26615\/978-954-452-072-4_083"},{"key":"ref69","article-title":"Exploiting multilingualism in low-resource neural machine translation via adversarial learning","author":"Kumar","year":"2023","journal-title":"arXiv:2303.18011"},{"key":"ref70","article-title":"Milpac: A novel benchmark for evaluating translation of legal text to Indian languages","author":"Mahapatra","year":"2023","journal-title":"arXiv:2310.09765"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.618"},{"key":"ref72","first-page":"103","article-title":"An empirical study of leveraging knowledge distillation for compressing multilingual neural machine translation models","volume-title":"Proc. 24th Annu. Conf. Eur. Assoc. Mach. Transl.","author":"Gumma"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.loresmt-1.7"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.wmt-1.65"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.55"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-naacl.176"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.1177"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.wmt-1.128"},{"key":"ref79","first-page":"207","article-title":"Assessing translation capabilities of large language models involving English and Indian languages","volume-title":"Proc. 25th Annu. Conf. Eur. Assoc. Mach. Transl.","author":"Mujadia"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-024-74617-9"},{"key":"ref81","article-title":"EMMA-500: Enhancing massively multilingual adaptation of large language models","author":"Ji","year":"2024","journal-title":"arXiv:2409.17892"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.920"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00452"},{"key":"ref84","article-title":"Paramanu: A family of novel efficient generative foundation language models for Indian languages","author":"Niyogi","year":"2024","journal-title":"arXiv:2401.18034"},{"key":"ref85","article-title":"Airavata: Introducing Hindi instruction-tuned LLM","author":"Gala","year":"2024","journal-title":"arXiv:2401.15006"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.843"},{"key":"ref87","article-title":"Krutrim LLM: Multilingual foundational model for over a billion people","author":"Kallappa","year":"2025","journal-title":"arXiv:2502.09642"},{"key":"ref88","first-page":"50","article-title":"Adapting multilingual LLMs to low-resource languages using continued pre-training and synthetic corpus: A case study for Hindi LLMs","volume-title":"Proc. 1st Workshop Natural Lang. Process. Indo-Aryan Dravidian Lang.","author":"Joshi"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.676"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-6319"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W15-3049"},{"key":"ref93","first-page":"65","article-title":"METEOR: An automatic metric for MT evaluation with improved correlation with human judgments","volume-title":"Proc. ACL Workshop Intrinsic Extrinsic Eval. Measures Mach. Transl. Summarization","author":"Banerjee"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00288"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.143"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10820123\/11005970.pdf?arnumber=11005970","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,27]],"date-time":"2025-05-27T04:35:47Z","timestamp":1748320547000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11005970\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":95,"URL":"https:\/\/doi.org\/10.1109\/access.2025.3570699","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]}}}