{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T06:32:51Z","timestamp":1773297171218,"version":"3.50.1"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T00:00:00Z","timestamp":1773187200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T00:00:00Z","timestamp":1773187200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SN COMPUT. SCI."],"DOI":"10.1007\/s42979-026-04789-w","type":"journal-article","created":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T13:00:41Z","timestamp":1773234041000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Evaluating Large Language Models in Retrieval-Augmented Tutoring Systems: Methods and Emerging Tools"],"prefix":"10.1007","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2604-8291","authenticated-orcid":false,"given":"Owais","family":"Bhat","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zubair","family":"Jeelani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Syed Tanzeel","family":"Rabani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Syed Mohsin","family":"Saif","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nawaz A.","family":"Lone","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,3,11]]},"reference":[{"key":"4789_CR1","doi-asserted-by":"publisher","unstructured":"Cai D, Wang Y, Liu L. Recent advances in retrieval-augmented text generation. Dl.Acm.OrgD. In: Proceedings of the 45th international ACM SIGIR conference on research and, 2022 dl.Acm.Org. 2022. pp. 3417\u20133419. https:\/\/doi.org\/10.1145\/3477495.3532682.","DOI":"10.1145\/3477495.3532682"},{"key":"4789_CR2","unstructured":"Nye B, Mee D, Core MG. Generative large language models for dialog-based tutoring: an early consideration of opportunities and concerns. 2023. https:\/\/ceur-ws.org\/Vol-3487\/paper4.pdf."},{"key":"4789_CR3","first-page":"4171","volume":"1","author":"J Devlin","year":"2019","unstructured":"Devlin J, Chang MW, Lee K, Toutanova K. BERT: Pre-training of deep bidirectional transformers for language understanding. NAACL HLT 2019\u20132019 Conf North Am Chapter Association Comput Linguistics: Hum Lang Technol - Proc Conf. 2019;1:4171\u201386.","journal-title":"NAACL HLT 2019\u20132019 Conf North Am Chapter Association Comput Linguistics: Hum Lang Technol - Proc Conf"},{"key":"4789_CR4","doi-asserted-by":"publisher","first-page":"238","DOI":"10.1007\/978-3-319-67349-3_22","volume":"658","author":"VI Gromyko","year":"2018","unstructured":"Gromyko VI, Kazaryan VP, Vasilyev NS, Simakin AG, Anosov SS. Artificial intelligence as tutoring partner for human intellect. Adv Intell Syst Comput. 2018;658:238\u201347. https:\/\/doi.org\/10.1007\/978-3-319-67349-3_22.","journal-title":"Adv Intell Syst Comput"},{"key":"4789_CR5","doi-asserted-by":"crossref","unstructured":"Gan W, Sun Y, Ye S, Fan Y, Sun Y. AI-tutor: generating tailored remedial questions and answers based on cognitive diagnostic assessment. In: 2019 6th international conference on behavioral, economic. 2019. https:\/\/ieeexplore.ieee.org\/abstract\/document\/8963236\/. Accessed 8 Jan 2025.","DOI":"10.1109\/BESC48373.2019.8963236"},{"key":"4789_CR6","first-page":"1","volume":"21","author":"C Raffel","year":"2020","unstructured":"Raffel C, Shazeer N, Roberts A, Lee K, Narang S, Matena M, et al. Exploring the limits of transfer learning with a unified text-to-text transformer. J Mach Learn Res. 2020;21:1\u201367.","journal-title":"J Mach Learn Res"},{"key":"4789_CR7","unstructured":"Li Y, Bubeck S, Eldan R, Del Giorno A, Gunasekar S, Lee YT. Textbooks are all you need II: phi-1.5 technical report. 2023. Available from: http:\/\/arxiv.org\/abs\/2309.05463."},{"key":"4789_CR8","unstructured":"Review JM-G-CS. A survey on legal question\u2013answering systems. Elsevier; 2021. https:\/\/www.sciencedirect.com\/science\/article\/pii\/S1574013723000199."},{"key":"4789_CR9","doi-asserted-by":"publisher","unstructured":"Lewis M, Liu Y, Goyal N, Ghazvininejad M, Mohamed A, Levy O, Stoyanov V, Zettlemoyer L. BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. In: Proceedings of the annual meeting of the association for computational linguistics. 2020. pp. 7871\u20137880. https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.703.","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"4789_CR10","unstructured":"Brown TB, Mann B, Ryder N, Subbiah M, Kaplan J, Dhariwal P, Neelakantan A, Shyam P, Sastry G, Askell A, Agarwal S, Herbert-Voss A, Krueger G, Henighan T, Child R, Ramesh A, Ziegler DM, Wu J, Winter C, Amodei D. Language models are few-shot learners. In: Proceedings.Neurips.Cc. 2025. https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/1457c0d6bfcb4967418bfb8ac142f64a-Abstract.html. Accessed 11 Jan 2025."},{"key":"4789_CR11","doi-asserted-by":"publisher","unstructured":"Karpukhin V, O\u011fuz B, Min S, Lewis P, Wu L, Edunov S, Chen D, Yih WT. Dense passage retrieval for open-domain question answering. In: EMNLP 2020\u20132020 conference on empirical methods in natural language processing, proceedings of the conference. 2020. pp. 6769\u20136781. https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.550.","DOI":"10.18653\/v1\/2020.emnlp-main.550"},{"key":"4789_CR12","unstructured":"Singh Sachan D, Reddy S, Hamilton W, Dyer C, Yogatama D. End-to-end training of multi-document reader and retriever for open-domain question answering. Proceedings.Neurips.Cc. 2021. https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/da3fde159d754a2555eaa198d2d105b2-Abstract.html."},{"key":"4789_CR13","unstructured":"Liu J, Li L, Xiang T, Wang B. Tcra-llm: token compression retrieval augmented large language model for inference cost reduction. 2025. Available from: https:\/\/arxiv.org\/abs\/2310.15556."},{"key":"4789_CR14","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00605","author":"O Ram","year":"2023","unstructured":"Ram O, Levine Y, Dalmedigos I. In-context retrieval-augmented language models. Trans Assoc Comput Linguist. 2023. https:\/\/doi.org\/10.1162\/tacl_a_00605.","journal-title":"Trans Assoc Comput Linguist"},{"key":"4789_CR15","unstructured":"Sun Z, Wang X, Tay Y, Yang Y, Zhou D. Recitation-augmented language models. 11th international conference on learning representations, ICLR 2023."},{"key":"4789_CR16","unstructured":"Yu W, Iter D, Wang S, Xu Y, Ju M, Sanyal S, Zhu C, Zeng M, Jiang M. Generate rather than retrieve: large language models are strong context generators. In: 11th international conference on learning representations, ICLR 2023."},{"key":"4789_CR17","unstructured":"Zhu Y, Yuan H, Wang S, Liu J, Liu W, Deng C, Chen H, Liu Z, Dou Z, Wen J-R. Large language models for information retrieval: a survey. 2023. Available from: http:\/\/arxiv.org\/abs\/2308.07107."},{"key":"4789_CR18","doi-asserted-by":"publisher","unstructured":"Begoli E, Srinivasan S, Mahbub M. Improving efficiency and robustness of transformer-based information retrieval systems. In: SIGIR 2022\u2014proceedings of the 45th international ACM SIGIR conference on research and development in information retrieval. 2022. pp. 3433\u20133435. https:\/\/doi.org\/10.1145\/3477495.3532681.","DOI":"10.1145\/3477495.3532681"},{"key":"4789_CR19","unstructured":"Gao Y, Xiong Y, Gao X, Jia K, Pan J, Bi Y, Dai Y, Sun J, Wang M, Wang H. Retrieval-augmented generation for large language models: a survey. 2023. Available from: http:\/\/arxiv.org\/abs\/2312.10997."},{"key":"4789_CR20","unstructured":"Siriwardhana S, Weerasekera R, Wen E, Nanayakkara S. Fine-tune the entire RAG architecture (including DPR retriever) for question-answering. 2021. Available from: http:\/\/arxiv.org\/abs\/2106.11517."},{"key":"4789_CR21","unstructured":"Hicke Y, Agarwal A, Ma Q, Denny P. AI-TA: towards an intelligent question-answer teaching assistant using open-source LLMs. 2023. http:\/\/arxiv.org\/abs\/2311.02775."},{"key":"4789_CR22","unstructured":"Lewis P, Perez E, Piktus A, Petroni F, Karpukhin V, Goyal N, K\u00fcttler H, Lewis M, Yih WT, Rockt\u00e4schel T, Riedel S, Kiela D. Retrieval-augmented generation for knowledge-intensive NLP tasks. In: Advances in neural information processing systems. 2020. https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/6b493230205f780e1bc26945df7481e5-Abstract.html."},{"key":"4789_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.lindif.2023.102274","volume":"103","author":"E Kasneci","year":"2023","unstructured":"Kasneci E, Sessler K, K\u00fcchemann S, Bannert M, Dementieva D, Fischer F, et al. ChatGPT for good? On opportunities and challenges of large language models for education. Learn Individ Differ. 2023;103. https:\/\/doi.org\/10.1016\/j.lindif.2023.102274.","journal-title":"Learn Individ Differ"},{"key":"4789_CR24","unstructured":"Guu K, Lee K, Tung Z, Pasupat P, Chang M. Retrieval augmented language model pre-training. In: International conference on machine learning. 2020. http:\/\/proceedings.mlr.press\/v119\/guu20a.html?ref=https:\/\/githubhelp.com."},{"key":"4789_CR25","first-page":"1","volume":"24","author":"G Izacard","year":"2023","unstructured":"Izacard G, Lewis P, Lomeli M, Hosseini L, Petroni F, Schick T, et al. Atlas: few-shot learning with retrieval augmented language models. J Mach Learn Res. 2023;24:1\u201343.","journal-title":"J Mach Learn Res"},{"key":"4789_CR26","doi-asserted-by":"publisher","unstructured":"Scarlatos A, Liu N, Lee J, Baraniuk R, Lan A. (2025). Training llm-based tutors to improve student learning outcomes in dialogues. In: International conference on artificial intelligence in education. Springer; 2025. pp. 251\u2013266. https:\/\/doi.org\/10.1007\/978-3-031-98414-3_18.","DOI":"10.1007\/978-3-031-98414-3_18"},{"key":"4789_CR27","doi-asserted-by":"publisher","unstructured":"Piro L, Bianchi T, Alessandrelli L, Chizzola A, Casiraghi D, Sancassani S, Gatti N. Mylearningtalk: an llm-based intelligent tutoring system. In: International conference on web engineering. Springer; 2024. pp. 428\u2013431. https:\/\/doi.org\/10.1007\/978-3-031-62362-2_39.","DOI":"10.1007\/978-3-031-62362-2_39"},{"key":"4789_CR28","unstructured":"Blobstein A, Izmaylov D, Yifal T, Levy M, Segal A. Angel: a new generation tool for learning material based questions and answers. In: NeurIPS\u201923 workshop on generative AI for education (GAIED). 2023. https:\/\/gaied.org\/neurips2023\/files\/9\/9_paper.pdf."},{"key":"4789_CR29","doi-asserted-by":"publisher","unstructured":"Bhoomika BK, Brunda L, Chandan KH, Anure PS, Upadhyaya SR. CogniLearn: integrating AI-Powered insights for class 10 syllabus. In: Proceedings\u20142025 11th international conference on computing and artificial intelligence, ICCAI 2025. 2025. pp. 465\u2013472. https:\/\/doi.org\/10.1109\/ICCAI66501.2025.00077.","DOI":"10.1109\/ICCAI66501.2025.00077"},{"key":"4789_CR30","unstructured":"Harrison C. LangChain. 2022. https:\/\/github.com\/langchain-ai\/langchain."},{"key":"4789_CR31","doi-asserted-by":"crossref","unstructured":"Douze M, Guzhva A, Deng C, Johnson J, Szilvasy G, Mazar\u00e9 P-E, Lomeli M, Hosseini L, J\u00e9gou H. The Faiss library. 2024. http:\/\/arxiv.org\/abs\/2401.08281.","DOI":"10.1109\/TBDATA.2025.3618474"},{"key":"4789_CR32","doi-asserted-by":"crossref","unstructured":"Roumeliotis KI, Tselikas ND, Nasiopoulos DK. LLMs in e-commerce: A comparative analysis of GPT and LLaMA models in product review evaluation. Nat Lang Process J. 2024;6:100056.","DOI":"10.1016\/j.nlp.2024.100056"},{"key":"4789_CR33","unstructured":"Radford A, Narasimhan K, Salimans T, Sutskever I. (2018). Improving language understanding by generative pre-training."},{"key":"4789_CR34","unstructured":"Touvron H, Lavril T, Izacard G, Martinet X, Lachaux MA, Lacroix T, Lample G. (2023). Llama: Open and efficient foundation language models. arXiv preprint arXiv:230213971."},{"key":"4789_CR35","unstructured":"Chaplot DS. (2023). Albert q. jiang, alexandre sablayrolles, arthur mensch, chris bamford, devendra singh chaplot, diego de las casas, florian bressand, gianna lengyel, guillaume lample, lucile saulnier, l\u00e9lio renard lavaud, marie-anne lachaux, pierre stock, teven le scao, thibaut lavril, thomas wang, timoth\u00e9e lacroix, william el sayed. arXiv preprint arXiv:2310.06825, 3."},{"key":"4789_CR36","doi-asserted-by":"crossref","unstructured":"Chang Y, Wang X, Wang J, Wu Y, Yang L, Zhu K, Xie X. A survey on evaluation of large language models. ACM Trans Intell Syst Technol. 2024;15(3):1\u201345.","DOI":"10.1145\/3641289"},{"key":"4789_CR37","unstructured":"Brown T, Mann B, Ryder N, Subbiah M, Kaplan JD, Dhariwal P, Amodei D. Language models are few-shot learners. Adv Neural Inf Process Syst. 2020;33:1877\u2013901."},{"key":"4789_CR38","doi-asserted-by":"crossref","unstructured":"Ram O, Levine Y, Dalmedigos I, Muhlgay D, Shashua A, Leyton-Brown K, Shoham Y. In-context retrieval-augmented language models. Trans Association Comput Linguistics. 2023;11:1316\u201331.","DOI":"10.1162\/tacl_a_00605"}],"container-title":["SN Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-026-04789-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42979-026-04789-w","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-026-04789-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T13:01:02Z","timestamp":1773234062000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42979-026-04789-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,11]]},"references-count":38,"journal-issue":{"issue":"3","published-online":{"date-parts":[[2026,3]]}},"alternative-id":["4789"],"URL":"https:\/\/doi.org\/10.1007\/s42979-026-04789-w","relation":{},"ISSN":["2661-8907"],"issn-type":[{"value":"2661-8907","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3,11]]},"assertion":[{"value":"5 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 March 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This research does not involve human participants or animals.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Research Involving in Human and Animal Participants"}}],"article-number":"273"}}