{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T00:52:52Z","timestamp":1773103972214,"version":"3.50.1"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031984648","type":"print"},{"value":"9783031984655","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-98465-5_8","type":"book-chapter","created":{"date-parts":[[2025,7,19]],"date-time":"2025-07-19T01:46:46Z","timestamp":1752889606000},"page":"60-67","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Do We Need a Detailed Rubric for Automated Essay Scoring Using Large Language Models?"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2180-9231","authenticated-orcid":false,"given":"Lui","family":"Yoshida","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,20]]},"reference":[{"key":"8_CR1","unstructured":"Brown, T., et al.: Language models are few-shot learners. In: Larochelle, H., Ranzato, M., Hadsell, R., Balcan, M.F., and Lin, H. (eds.) Advances in Neural Information Processing Systems, pp. 1877\u20131901. Curran Associates, Inc. (2020)"},{"key":"8_CR2","unstructured":"Wei, J., et al.: Chain-of-thought prompting elicits reasoning in large language models. In: Koyejo, S., Mohamed, S., Agarwal, D., Belgrave, D., Cho, K., and Oh, A. (eds.) Advances in Neural Information Processing Systems, pp. 24824\u201324837. Curran Associates, Inc. (2022)"},{"key":"8_CR3","unstructured":"Kojima, T., Gu, S.S., Reid, M., Matsuo, Y., Iwasawa, Y.: Large language models are zero-shot reasoners. In: Koyejo, S., Mohamed, S., Agarwal, D., Belgrave, D., Cho, K., and Oh, A. (eds.) Advances in Neural Information Processing Systems, pp. 22199\u201422213. Curran Associates, Inc. (2022)"},{"key":"8_CR4","unstructured":"OpenAI: GPT-4 Technical Report (2023).\u00a0http:\/\/arxiv.org\/abs\/2303.08774,\u00a0"},{"key":"8_CR5","unstructured":"OpenAI: OpenAI o1 System Card.\u00a0https:\/\/openai.com\/index\/openai-o1-system-card\/,\u00a0 Accessed 19 Feb 2025"},{"key":"8_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.lindif.2023.102274","volume":"103","author":"E Kasneci","year":"2023","unstructured":"Kasneci, E., et al.: ChatGPT for good? On opportunities and challenges of large language models for education. Learn. Individ. Differ. 103, 102274 (2023)","journal-title":"Learn. Individ. Differ."},{"issue":"1","key":"8_CR7","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1111\/bjet.13370","volume":"55","author":"L Yan","year":"2024","unstructured":"Yan, L., et al.: Practical and ethical challenges of large language models in education: a systematic scoping review. Br. J. Edu. Technol. 55(1), 90\u2013112 (2024)","journal-title":"Br. J. Edu. Technol."},{"key":"8_CR8","doi-asserted-by":"publisher","first-page":"15873","DOI":"10.1007\/s10639-023-11834-1","volume":"28","author":"J Jeon","year":"2023","unstructured":"Jeon, J., Lee, S.: Large language models in education: a focus on the complementary relationship between human teachers and ChatGPT. Educ. Inf. Technol. 28, 15873\u201315892 (2023)","journal-title":"Educ. Inf. Technol."},{"key":"8_CR9","unstructured":"Page, E.B.: The imminence of... grading essays by computer. The Phi Delta Kappan. 47, 238\u2013243 (1966)"},{"key":"8_CR10","doi-asserted-by":"publisher","DOI":"10.7717\/peerj-cs.208","volume":"5","author":"MA Hussein","year":"2019","unstructured":"Hussein, M.A., Hassan, H., Nassef, M.: Automated language essay scoring systems: a literature review. PeerJ Comput. Sci. 5, e208 (2019)","journal-title":"PeerJ Comput. Sci."},{"key":"8_CR11","doi-asserted-by":"crossref","unstructured":"Ke, Z., Ng, V.: Automated essay scoring: a survey of the State of the Art. In: Kraus, S. (ed.) Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, pp. 6300\u20136308. International Joint Conferences on Artificial Intelligence (2019)","DOI":"10.24963\/ijcai.2019\/879"},{"key":"8_CR12","doi-asserted-by":"publisher","first-page":"2495","DOI":"10.1007\/s10462-021-10068-2","volume":"55","author":"D Ramesh","year":"2022","unstructured":"Ramesh, D., Sanampudi, S.K.: An automated essay scoring systems: a systematic literature review. Artif. Intell. Rev. 55, 2495\u20132527 (2022)","journal-title":"Artif. Intell. Rev."},{"issue":"2","key":"8_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.rmal.2023.100050","volume":"2","author":"A Mizumoto","year":"2023","unstructured":"Mizumoto, A., Eguchi, M.: Exploring the potential of using an AI language model for automated essay scoring. Res. Methods Appli. Linguist. 2(2), 100050 (2023)","journal-title":"Res. Methods Appli. Linguist."},{"key":"8_CR14","doi-asserted-by":"crossref","unstructured":"Yancey, K.P., Laflair, G., Verardi, A., Burstein, J.: Rating short L2 Essays on the CEFR scale with GPT-4. In: Kochmar, E., et al. (eds.) Proceedings of the 18th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2023), pp. 576\u2013584. Association for Computational Linguistics (2023)","DOI":"10.18653\/v1\/2023.bea-1.49"},{"key":"8_CR15","doi-asserted-by":"crossref","unstructured":"Naismith, B., Mulcaire, P., Burstein, J.: Automated evaluation of written discourse coherence using GPT-4. In: Kochmar, E., et al. (eds.) Proceedings of the 18th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2023), pp. 576\u2013584. Association for Computational Linguistics (2023)","DOI":"10.18653\/v1\/2023.bea-1.32"},{"key":"8_CR16","doi-asserted-by":"crossref","unstructured":"Kim, S., Jo, M.: Is GPT-4 alone sufficient for automated essay scoring?: a comparative judgment approach based on rater cognition. In: Joyner, D., Kim, K.M., Wang, X., and Xia, M. (eds.) Proceedings of the Eleventh ACM Conference on Learning @ Scale, pp. 315\u2013319. Association for Computing Machinery (2024)","DOI":"10.1145\/3657604.3664703"},{"key":"8_CR17","doi-asserted-by":"publisher","unstructured":"Yoshida, L.: The impact of example selection in few-shot prompting on automated essay scoring using GPT models. In: Olney, A.M., Chounta, I.-A., Liu, Z., Santos, O.C., Bittencourt, I.I. (eds.) Artificial Intelligence in Education. Posters and Late Breaking Results, Workshops and Tutorials, Industry and Innovation Tracks, Practitioners, Doctoral Consortium and Blue Sky. pp. 61\u201373. Springer Cham (2024).\u00a0https:\/\/doi.org\/10.1007\/978-3-031-64315-6_5","DOI":"10.1007\/978-3-031-64315-6_5"},{"key":"8_CR18","doi-asserted-by":"crossref","unstructured":"Lee, S., Cai, Y., Meng, D., Wang, Z., Wu, Y.: Unleashing large language models\u2019 proficiency in zero-shot essay scoring. In:\u00a0 Findings of the Association for Computational Linguistics: EMNLP 2024, pp. 181\u2013198. Association for Computational Linguistics (2024)","DOI":"10.18653\/v1\/2024.findings-emnlp.10"},{"key":"8_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.caeai.2024.100255","volume":"7","author":"TP Tate","year":"2024","unstructured":"Tate, T.P., et al.: Can AI provide useful holistic essay scoring? Comput. Educ. Artifi. Intell. 7, 100255 (2024)","journal-title":"Comput. Educ. Artifi. Intell."},{"issue":"2","key":"8_CR20","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1016\/j.edurev.2007.05.002","volume":"2","author":"A Jonsson","year":"2007","unstructured":"Jonsson, A., Svingby, G.: The use of scoring rubrics: reliability, validity and educational consequences. Educ. Res. Rev. 2(2), 130\u2013144 (2007)","journal-title":"Educ. Res. Rev."},{"issue":"2","key":"8_CR21","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1080\/00986280902739776","volume":"36","author":"MA Stellmack","year":"2009","unstructured":"Stellmack, M.A., Konheim-Kalkstein, Y.L., Manor, J.E., Massey, A.R., Schmitz, J.A.P.: An Assessment of reliability and validity of a rubric for grading APA-Style introductions. Teach. Psychol. 36(2), 102\u2013107 (2009)","journal-title":"Teach. Psychol."},{"issue":"4","key":"8_CR22","doi-asserted-by":"publisher","first-page":"435","DOI":"10.1080\/02602930902862859","volume":"35","author":"YM Reddy","year":"2010","unstructured":"Reddy, Y.M., Andrade, H.: A review of rubric use in higher education. Assess. Eval. High. Educ. 35(4), 435\u2013448 (2010)","journal-title":"Assess. Eval. High. Educ."},{"issue":"1","key":"8_CR23","first-page":"10","volume":"7","author":"BM Moskal","year":"2000","unstructured":"Moskal, B.M., Leydens, J.A.: Scoring rubric development: validity and reliability. Pract. Assess. Res. Eval. 7(1), 10 (2000)","journal-title":"Pract. Assess. Res. Eval."},{"key":"8_CR24","unstructured":"Moskal, B.M.: Developing classroom performance assessments and scoring rubrics - Part I. ERIC Digest. ERIC Clearinghouse on Assessment and Evaluation College Park MD. ED481714 (2003)"},{"issue":"3","key":"8_CR25","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1187\/cbe.06-06-0168","volume":"5","author":"D Allen","year":"2006","unstructured":"Allen, D., Tanner, K.: Rubrics: tools for making learning goals and evaluation criteria explicit for both teachers and learners. Life Sciences Education. 5(3), 197\u2013203 (2006)","journal-title":"Life Sciences Education."},{"issue":"9","key":"8_CR26","doi-asserted-by":"publisher","first-page":"3464","DOI":"10.1021\/acs.est.3c01106","volume":"57","author":"MC Rillig","year":"2023","unstructured":"Rillig, M.C., \u00c5gerstrand, M., Bi, M., Gould, K.A., Sauerland, U.: Risks and benefits of large language models for the environment. Environ. Sci. Technol. 57(9), 3464\u20133466 (2023)","journal-title":"Environ. Sci. Technol."},{"key":"8_CR27","doi-asserted-by":"publisher","first-page":"80194","DOI":"10.1109\/ACCESS.2024.3409745","volume":"12","author":"FM Argerich","year":"2024","unstructured":"Argerich, F.M., Pati\u00f1o-Mart\u00ednez, M.: Measuring and improving the energy efficiency of large language models inference. IEEE Access. 12, 80194\u201380207 (2024)","journal-title":"IEEE Access."},{"key":"8_CR28","doi-asserted-by":"crossref","unstructured":"Blanchard, D., Tetreault, J., Higgins, D., Cahill, A., Chodorow, M.: TOEFL11: a corpus of non-native English. ETS Res. Rep. RR-13\u201324, i\u201315 (2013)","DOI":"10.1002\/j.2333-8504.2013.tb02331.x"},{"key":"8_CR29","doi-asserted-by":"publisher","first-page":"5573","DOI":"10.1007\/s10639-021-10838-z","volume":"27","author":"V Ramnarain-Seetohul","year":"2022","unstructured":"Ramnarain-Seetohul, V., Bassoo, V., Rosunally, Y.: Similarity measures in automated essay scoring systems: a ten-year review. Educ. Inf. Technol. 27, 5573\u20135604 (2022)","journal-title":"Educ. Inf. Technol."},{"key":"8_CR30","doi-asserted-by":"crossref","unstructured":"Levy, M., Jacoby, A., Goldberg, Y.: Same task, more tokens: the impact of input length on the reasoning performance of large language models. In: Ku, L.-W., Martins, A., and Srikumar, V. (eds.) Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers). pp. 15339\u201315353. Association for Computational Linguistics (2024)","DOI":"10.18653\/v1\/2024.acl-long.818"},{"key":"8_CR31","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1162\/tacl_a_00638","volume":"12","author":"NF Liu","year":"2024","unstructured":"Liu, N.F., et al.: Lost in the middle: how language models use long contexts. Trans. Associat. Comput. Linguist. 12, 157\u2013173 (2024)","journal-title":"Trans. Associat. Comput. Linguist."},{"key":"8_CR32","doi-asserted-by":"publisher","unstructured":"Wang, Q., Gayed, J.M.: Effectiveness of large language models in automated evaluation of argumentative essays: finetuning vs. zero-shot prompting. Comput. Assisted Lang. Learn., 1\u201329. https:\/\/doi.org\/10.1080\/09588221.2024.2371395","DOI":"10.1080\/09588221.2024.2371395"},{"key":"8_CR33","doi-asserted-by":"publisher","DOI":"10.1016\/j.caeai.2024.100210","volume":"6","author":"E Latif","year":"2024","unstructured":"Latif, E., Zhai, X.: Fine-tuning ChatGPT for automatic scoring. Comput. Educ. Artifi. Intell. 6, 100210 (2024)","journal-title":"Comput. Educ. Artifi. Intell."},{"key":"8_CR34","doi-asserted-by":"publisher","unstructured":"Feng, H., et al.: Leveraging large language models for\u00a0automated Chinese essay scoring. In: Olney, A.M., Chounta, I.-A., Liu, Z., Santos, O.C., and Bittencourt, I.I. (eds.) Artificial Intelligence in Education, pp. 454\u2013467. Springer Cham (2024).\u00a0https:\/\/doi.org\/10.1007\/978-3-031-64302-6_32","DOI":"10.1007\/978-3-031-64302-6_32"},{"key":"8_CR35","unstructured":"OpenAI: o3-mini System Card.\u00a0https:\/\/openai.com\/index\/o3-mini-system-card\/,\u00a0 Accessed 19 Feb 2025"},{"key":"8_CR36","unstructured":"DeepSeek-AI: DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning.\u00a0https:\/\/github.com\/deepseek-ai\/DeepSeek-R1\/blob\/main\/DeepSeek_R1.pdf, Accessed 19 Feb 2025"},{"key":"8_CR37","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/j.asw.2013.04.001","volume":"20","author":"MD Shermis","year":"2014","unstructured":"Shermis, M.D.: State-of-the-art automated essay scoring: Competition, results, and future directions from a United States demonstration. Assess. Writ. 20, 53\u201376 (2014)","journal-title":"Assess. Writ."},{"key":"8_CR38","unstructured":"Yannakoudakis, H., Briscoe, T., Medlock, B.: A new dataset and method for automatically grading ESOL Texts. In: Lin, D., Matsumoto, Y., and Mihalcea, R. (eds.) Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, pp. 180\u2013189. Association for Computational Linguistics (2011)"}],"container-title":["Lecture Notes in Computer Science","Artificial Intelligence in Education"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-98465-5_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T14:48:14Z","timestamp":1757256494000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-98465-5_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031984648","9783031984655"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-98465-5_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"20 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AIED","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Artificial Intelligence in Education","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Palermo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aied2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/aied2025.itd.cnr.it\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}