{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,19]],"date-time":"2026-06-19T02:52:17Z","timestamp":1781837537959,"version":"3.54.5"},"publisher-location":"Cham","reference-count":20,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032293718","type":"print"},{"value":"9783032293725","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-29372-5_8","type":"book-chapter","created":{"date-parts":[[2026,6,19]],"date-time":"2026-06-19T02:47:23Z","timestamp":1781837243000},"page":"109-124","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Toward Reliable LLM-Integrated Web Architectures for\u00a0Teacher-Aligned Automatic Student Grading"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-8348-2357","authenticated-orcid":false,"given":"Jonas","family":"Gwozdz","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9177-5463","authenticated-orcid":false,"given":"Andreas","family":"Both","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,6,20]]},"reference":[{"issue":"1","key":"8_CR1","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1007\/s40593-014-0026-8","volume":"25","author":"S Burrows","year":"2014","unstructured":"Burrows, S., Gurevych, I., Stein, B.: The eras and trends of automatic short answer grading. Int. J. Artif. Intell. Educ. 25(1), 60\u2013117 (2014). https:\/\/doi.org\/10.1007\/s40593-014-0026-8","journal-title":"Int. J. Artif. Intell. Educ."},{"key":"8_CR2","doi-asserted-by":"publisher","DOI":"10.1162\/99608f92.5317da47","author":"L Chen","year":"2024","unstructured":"Chen, L., Zaharia, M., Zou, J.: How is ChatGPT\u2019s behavior changing over time? Harvard Data Sci. Rev. (2024). https:\/\/doi.org\/10.1162\/99608f92.5317da47","journal-title":"Harvard Data Sci. Rev."},{"key":"8_CR3","doi-asserted-by":"publisher","unstructured":"Chu, Y., et al.: A LLM-powered automatic grading framework with human-level guidelines optimization. In: Proceedings of EDM 2025, pp. 31\u201341 (2025). https:\/\/doi.org\/10.5281\/zenodo.15870201","DOI":"10.5281\/zenodo.15870201"},{"key":"8_CR4","doi-asserted-by":"publisher","unstructured":"Desai, S., Durrett, G.: Calibration of pre-trained transformers. In: Proceedings of EMNLP 2020, pp. 295\u2013302 (2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.21","DOI":"10.18653\/v1\/2020.emnlp-main.21"},{"key":"8_CR5","doi-asserted-by":"publisher","unstructured":"Funayama, H., Sato, T., Matsubayashi, Y., Mizumoto, T., Suzuki, J., Inui, K.: Balancing cost and quality: an exploration of human-in-the-loop frameworks for automated short answer scoring. In: Proceedings of AIED, pp. 465\u2013476 (2022). https:\/\/doi.org\/10.1007\/978-3-031-11644-5_38","DOI":"10.1007\/978-3-031-11644-5_38"},{"key":"8_CR6","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1007\/s00607-025-01540-w","volume":"107","author":"F Gomes","year":"2025","unstructured":"Gomes, F., Rego, P., Trinta, F.: A systematic mapping study on observability of microservices-based applications: fundamentals, classifications, and challenges. Computing 107, 183 (2025). https:\/\/doi.org\/10.1007\/s00607-025-01540-w","journal-title":"Computing"},{"issue":"1","key":"8_CR7","doi-asserted-by":"publisher","first-page":"1060","DOI":"10.1186\/s12909-024-06026-5","volume":"24","author":"C Gr\u00e9visse","year":"2024","unstructured":"Gr\u00e9visse, C.: LLM-based automatic short answer grading in undergraduate medical education. BMC Med. Educ. 24(1), 1060 (2024). https:\/\/doi.org\/10.1186\/s12909-024-06026-5","journal-title":"BMC Med. Educ."},{"key":"8_CR8","doi-asserted-by":"publisher","unstructured":"Gu, J., et al.: A survey on LLM-as-a-judge. The Innovation, art. 101253 (2026). https:\/\/doi.org\/10.1016\/j.xinn.2025.101253","DOI":"10.1016\/j.xinn.2025.101253"},{"key":"8_CR9","unstructured":"Gwozdz, J., Both, A.: Auditing LLM grading for short-answer responses: confidence gating and cross-model agreement. In: Proceedings of IEEE International Conference on Advanced Learning Technologies (ICALT) 2026 (2026)"},{"key":"8_CR10","doi-asserted-by":"publisher","unstructured":"Hori, T., Yamauchi, K.: Low cost active learning framework for short answer scoring. In: Proceedings of PKAW 2024, pp. 176\u2013189 (2025). https:\/\/doi.org\/10.1007\/978-981-96-0026-7_14","DOI":"10.1007\/978-981-96-0026-7_14"},{"issue":"4","key":"8_CR11","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1023\/A:1025779619903","volume":"37","author":"C Leacock","year":"2003","unstructured":"Leacock, C., Chodorow, M.: C-rater: automated scoring of short-answer questions. Comput. Humanit. 37(4), 389\u2013405 (2003). https:\/\/doi.org\/10.1023\/A:1025779619903","journal-title":"Comput. Humanit."},{"key":"8_CR12","doi-asserted-by":"publisher","unstructured":"Li, Z., et al.: Learning when to defer to humans for short answer grading. In: Proceedings of AIED 2023, pp. 414\u2013425 (2023). https:\/\/doi.org\/10.1007\/978-3-031-36272-9_34","DOI":"10.1007\/978-3-031-36272-9_34"},{"key":"8_CR13","doi-asserted-by":"publisher","unstructured":"Nawahdah, M., Sawalha, H., Salameh, R., Taha, M.: Evaluating the accuracy and effectiveness of AI-based grading in computer science education. In: Proceedings of IEEE SCME 2025, pp. 1\u20136 (2025). https:\/\/doi.org\/10.1109\/SCME62582.2025.11104873","DOI":"10.1109\/SCME62582.2025.11104873"},{"key":"8_CR14","doi-asserted-by":"publisher","unstructured":"Poli\u010dar, P.G., \u0160pendl, M., Curk, T., Zupan, B.: Automated assignment grading with large language models: insights from a bioinformatics course. Bioinformatics 41(Suppl.\u00a01), i21\u2013i29 (2025). https:\/\/doi.org\/10.1093\/bioinformatics\/btaf196","DOI":"10.1093\/bioinformatics\/btaf196"},{"key":"8_CR15","doi-asserted-by":"publisher","unstructured":"Raina, V., Liusie, A., Gales, M.: Is LLM-as-a-judge robust? investigating universal adversarial attacks on zero-shot LLM assessment. In: Proceedings of EMNLP 2024, pp. 7499\u20137517 (2024). https:\/\/doi.org\/10.18653\/v1\/2024.emnlp-main.427","DOI":"10.18653\/v1\/2024.emnlp-main.427"},{"key":"8_CR16","doi-asserted-by":"publisher","unstructured":"Saleh Sedghpour, M.R., Klein, C., Tordsson, J.: An empirical study of service mesh traffic management policies for microservices. In: Proceedings of ICPE 2022, pp. 17\u201327 (2022). https:\/\/doi.org\/10.1145\/3489525.3511686","DOI":"10.1145\/3489525.3511686"},{"key":"8_CR17","doi-asserted-by":"crossref","unstructured":"Shi, L., Ma, C., Liang, W., Diao, X., Ma, W., Vosoughi, S.: Judging the judges: a systematic study of position bias in LLM-as-a-judge. In: Proceedings of IJCNLP-ACLC 2025, pp. 292\u2013314 (2025)","DOI":"10.18653\/v1\/2025.ijcnlp-long.18"},{"key":"8_CR18","doi-asserted-by":"publisher","unstructured":"Williamson, D.M., Xi, X., Breyer, F.J.: A framework for evaluation and use of automated scoring. Educ. Measure. Issues Practice 31(1), 2\u201313 (2012). https:\/\/doi.org\/10.1111\/j.1745-3992.2011.00223.x","DOI":"10.1111\/j.1745-3992.2011.00223.x"},{"key":"8_CR19","doi-asserted-by":"publisher","unstructured":"Woodrow, J., Piech, C., Koyejo, S.: Improving generative AI student feedback: Direct preference optimization with teachers in the loop. In: Proceedings of EDM 2025, pp. 442\u2013449 (2025). https:\/\/doi.org\/10.5281\/zenodo.15870266","DOI":"10.5281\/zenodo.15870266"},{"key":"8_CR20","doi-asserted-by":"publisher","unstructured":"Zhao, C., Silva, M., Poulsen, S.: Language models are few-shot graders. In: Proceedings of AIED 2025, pp. 3\u201316 (2025). https:\/\/doi.org\/10.1007\/978-3-031-98459-4_1","DOI":"10.1007\/978-3-031-98459-4_1"}],"container-title":["Lecture Notes in Computer Science","Web Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-29372-5_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,19]],"date-time":"2026-06-19T02:47:26Z","timestamp":1781837246000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-29372-5_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9783032293718","9783032293725"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-29372-5_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"20 June 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICWE","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Web Engineering","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Lyon","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"France","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2026","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 June 2026","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 June 2026","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icwe2026","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/icwe2026.webengineering.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}