{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T19:53:03Z","timestamp":1766087583172,"version":"3.40.3"},"publisher-location":"Cham","reference-count":33,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030522360"},{"type":"electronic","value":"9783030522377"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-52237-7_2","type":"book-chapter","created":{"date-parts":[[2020,7,4]],"date-time":"2020-07-04T00:02:40Z","timestamp":1593820960000},"page":"16-28","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["Strategies for Deploying Unreliable AI Graders in High-Transparency High-Stakes Exams"],"prefix":"10.1007","author":[{"given":"Sushmita","family":"Azad","sequence":"first","affiliation":[]},{"given":"Binglin","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Maxwell","family":"Fowler","sequence":"additional","affiliation":[]},{"given":"Matthew","family":"West","sequence":"additional","affiliation":[]},{"given":"Craig","family":"Zilles","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,6,30]]},"reference":[{"key":"2_CR1","doi-asserted-by":"crossref","unstructured":"Alikaniotis, D., Yannakoudakis, H., Rei, M.: Automatic text scoring using neural networks. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 715\u2013725 (2016)","DOI":"10.18653\/v1\/P16-1068"},{"issue":"2","key":"2_CR2","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1145\/1272848.1272879","volume":"39","author":"J Bennedsen","year":"2007","unstructured":"Bennedsen, J., Caspersen, M.E.: Failure rates in introductory programming. SIGCSE Bull. 39(2), 32\u201336 (2007). \nhttps:\/\/doi.org\/10.1145\/1272848.1272879","journal-title":"SIGCSE Bull."},{"issue":"1","key":"2_CR3","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1007\/s40593-014-0026-8","volume":"25","author":"S Burrows","year":"2014","unstructured":"Burrows, S., Gurevych, I., Stein, B.: The eras and trends of automatic short answer grading. Int. J. Artif. Intell. Educ. 25(1), 60\u2013117 (2014). \nhttps:\/\/doi.org\/10.1007\/s40593-014-0026-8","journal-title":"Int. J. Artif. Intell. Educ."},{"key":"2_CR4","doi-asserted-by":"publisher","unstructured":"Clancy, M.J., Linn, M.C.: Patterns and pedagogy. In: The Proceedings of the Thirtieth SIGCSE Technical Symposium on Computer Science Education, SIGCSE 1999, pp. 37\u201342. ACM, New York (1999). \nhttps:\/\/doi.org\/10.1145\/299649.299673","DOI":"10.1145\/299649.299673"},{"key":"2_CR5","volume-title":"Statistical Power Analysis for the Behavioral Sciences","author":"J Cohen","year":"1988","unstructured":"Cohen, J.: Statistical Power Analysis for the Behavioral Sciences, 2nd edn. Routledge, Abingdon (1988)","edition":"2"},{"key":"2_CR6","unstructured":"Computing Research Association: Generation CS: Computer Science Undergraduate Enrollments Surge Since 2006 (2017). \nhttps:\/\/cra.org\/data\/Generation-CS"},{"key":"2_CR7","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1007\/978-3-030-23207-8_8","volume-title":"Artificial Intelligence in Education","author":"G Converse","year":"2019","unstructured":"Converse, G., Curi, M., Oliveira, S.: Autoencoders for educational assessment. In: Isotani, S., Mill\u00e1n, E., Ogan, A., Hastings, P., McLaren, B., Luckin, R. (eds.) AIED 2019. LNCS (LNAI), vol. 11626, pp. 41\u201345. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-23207-8_8"},{"key":"2_CR8","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/978-3-030-23204-7_8","volume-title":"Artificial Intelligence in Education","author":"SA Crossley","year":"2019","unstructured":"Crossley, S.A., Kim, M., Allen, L., McNamara, D.: Automated summarization evaluation (ASE) using natural language processing tools. In: Isotani, S., Mill\u00e1n, E., Ogan, A., Hastings, P., McLaren, B., Luckin, R. (eds.) AIED 2019. LNCS (LNAI), vol. 11625, pp. 84\u201395. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-23204-7_8"},{"key":"2_CR9","doi-asserted-by":"crossref","unstructured":"Dasgupta, T., Naskar, A., Dey, L., Saha, R.: Augmenting textual qualitative features in deep convolution recurrent neural network for automatic essay scoring. In: Proceedings of the 5th Workshop on Natural Language Processing Techniques for Educational Applications, pp. 93\u2013102. Association for Computational Linguistics, Melbourne (2018)","DOI":"10.18653\/v1\/W18-3713"},{"key":"2_CR10","doi-asserted-by":"crossref","unstructured":"Dong, F., Zhang, Y.: Automatic features for essay scoring - an empirical study. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 1072\u20131077. Association for Computational Linguistics, Austin (2016)","DOI":"10.18653\/v1\/D16-1115"},{"key":"2_CR11","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1007\/978-3-030-03928-8_31","volume-title":"Advances in Artificial Intelligence \u2013 IBERAMIA 2018","author":"LB Galhardi","year":"2018","unstructured":"Galhardi, L.B., Brancher, J.D.: Machine learning approach for automatic short answer grading: a systematic review. In: Simari, G.R., Ferm\u00e9, E., Guti\u00e9rrez Segura, F., Rodr\u00edguez Melquiades, J.A. (eds.) IBERAMIA 2018. LNCS (LNAI), vol. 11238, pp. 380\u2013391. Springer, Cham (2018). \nhttps:\/\/doi.org\/10.1007\/978-3-030-03928-8_31"},{"key":"2_CR12","unstructured":"Hussein, M.A., Hassan, H., Nassef, M.: Automated language essay scoring systems: a literature review. PeerJ Comput. Sci. 5, e208 (2019). \nhttps:\/\/peerj.com\/articles\/cs-208"},{"issue":"4","key":"2_CR13","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1023\/A:1025779619903","volume":"37","author":"C Leacock","year":"2003","unstructured":"Leacock, C., Chodorow, M.: C-rater: automated scoring of short-answer questions. Comput. Humanit. 37(4), 389\u2013405 (2003). \nhttps:\/\/doi.org\/10.1023\/A:1025779619903","journal-title":"Comput. Humanit."},{"key":"2_CR14","doi-asserted-by":"publisher","unstructured":"Lister, R., Fidge, C., Teague, D.: Further evidence of a relationship between explaining, tracing and writing skills in introductory programming. In: Proceedings of the 14th Annual ACM SIGCSE Conference on Innovation and Technology in Computer Science Education, ITiCSE 2009, pp. 161\u2013165. ACM, New York (2009). \nhttps:\/\/doi.org\/10.1145\/1562877.1562930","DOI":"10.1145\/1562877.1562930"},{"key":"2_CR15","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1007\/978-3-030-23204-7_19","volume-title":"Artificial Intelligence in Education","author":"M Liu","year":"2019","unstructured":"Liu, M., Shum, S.B., Mantzourani, E., Lucas, C.: Evaluating machine learning approaches to classify pharmacy students\u2019 reflective statements. In: Isotani, S., Mill\u00e1n, E., Ogan, A., Hastings, P., McLaren, B., Luckin, R. (eds.) AIED 2019. LNCS (LNAI), vol. 11625, pp. 220\u2013230. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-23204-7_19"},{"key":"2_CR16","unstructured":"Liu, T., Ding, W., Wang, Z., Tang, J., Huang, G.Y., Liu, Z.: Automatic Short Answer Grading via Multiway Attention Networks. \narXiv:1909.10166\n\n [cs] (2019). \nhttp:\/\/arxiv.org\/abs\/1909.10166"},{"key":"2_CR17","doi-asserted-by":"crossref","unstructured":"Lopez, M., Whalley, J., Robbins, P., Lister, R.: Relationships between reading, tracing and writing skills in introductory programming. In: Proceedings of the Fourth International Workshop on Computing Education Research, pp. 101\u2013112. ACM (2008)","DOI":"10.1145\/1404520.1404531"},{"key":"2_CR18","doi-asserted-by":"publisher","unstructured":"Murphy, L., McCauley, R., Fitzgerald, S.: \u2018Explain in Plain English\u2019 questions: implications for teaching. In: Proceedings of the 43rd ACM Technical Symposium on Computer Science Education, SIGCSE 2012, pp. 385\u2013390. ACM, New York (2012). \nhttps:\/\/doi.org\/10.1145\/2157136.2157249","DOI":"10.1145\/2157136.2157249"},{"key":"2_CR19","doi-asserted-by":"publisher","unstructured":"National Academies of Sciences, Engineering, and Medicine: Assessing and Responding to the Growth of Computer Science Undergraduate Enrollments. The National Academies Press, Washington, DC (2018). \nhttps:\/\/doi.org\/10.17226\/24926\n\n. \nhttps:\/\/www.nap.edu\/catalog\/24926\/assessing-and-responding-to-the-growth-of-computer-science-undergraduate-enrollments","DOI":"10.17226\/24926"},{"key":"2_CR20","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"365","DOI":"10.1007\/978-3-030-23207-8_67","volume-title":"Artificial Intelligence in Education","author":"IG Ndukwe","year":"2019","unstructured":"Ndukwe, I.G., Daniel, B.K., Amadi, C.E.: A machine learning grading system using chatbots. In: Isotani, S., Mill\u00e1n, E., Ogan, A., Hastings, P., McLaren, B., Luckin, R. (eds.) AIED 2019. LNCS (LNAI), vol. 11626, pp. 365\u2013368. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-23207-8_67"},{"key":"2_CR21","unstructured":"Ramineni, C., Williamson, D.: Understanding mean score differences between the e-rater\u00ae automated scoring engine and humans for demographically based groups in the GRE\u00ae general test. ETS Res. Report Ser. 2018(1), 1\u201331 (2018). \nhttps:\/\/onlinelibrary.wiley.com\/doi\/abs\/10.1002\/ets2.12192"},{"key":"2_CR22","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"503","DOI":"10.1007\/978-3-319-93843-1_37","volume-title":"Artificial Intelligence in Education","author":"S Saha","year":"2018","unstructured":"Saha, S., Dhamecha, T.I., Marvaniya, S., Sindhgatta, R., Sengupta, B.: Sentence level or token level features for automatic short answer grading?: Use both. In: Penstein Ros\u00e9, C., et al. (eds.) AIED 2018. LNCS (LNAI), vol. 10947, pp. 503\u2013517. Springer, Cham (2018). \nhttps:\/\/doi.org\/10.1007\/978-3-319-93843-1_37"},{"issue":"4","key":"2_CR23","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1111\/medu.13504","volume":"52","author":"AH Sam","year":"2018","unstructured":"Sam, A.H., et al.: Very-short-answer questions: reliability, discrimination and acceptability. Med. Educ. 52(4), 447\u2013455 (2018)","journal-title":"Med. Educ."},{"key":"2_CR24","unstructured":"Sukkarieh, J.Z., Blackmore, J.: C-rater: automatic content scoring for short constructed responses. In: FLAIRS Conference (2009)"},{"key":"2_CR25","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"469","DOI":"10.1007\/978-3-030-23204-7_39","volume-title":"Artificial Intelligence in Education","author":"C Sung","year":"2019","unstructured":"Sung, C., Dhamecha, T.I., Mukhi, N.: Improving short answer grading using transformer-based pre-training. In: Isotani, S., Mill\u00e1n, E., Ogan, A., Hastings, P., McLaren, B., Luckin, R. (eds.) AIED 2019. LNCS (LNAI), vol. 11625, pp. 469\u2013481. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-23204-7_39"},{"key":"2_CR26","unstructured":"Suzen, N., Gorban, A., Levesley, J., Mirkes, E.: Automatic Short Answer Grading and Feedback Using Text Mining Methods. CoRR (2019). \narXiv: 1807.10543"},{"key":"2_CR27","doi-asserted-by":"crossref","unstructured":"Taghipour, K., Ng, H.T.: A neural approach to automated essay scoring. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 1882\u20131891. Association for Computational Linguistics, Austin (2016)","DOI":"10.18653\/v1\/D16-1193"},{"issue":"5","key":"2_CR28","first-page":"360","volume":"37","author":"AJ Viera","year":"2005","unstructured":"Viera, A.J., Garrett, J.M., et al.: Understanding interobserver agreement: the Kappa statistic. Fam. Med. 37(5), 360\u2013363 (2005)","journal-title":"Fam. Med."},{"key":"2_CR29","doi-asserted-by":"publisher","unstructured":"Watson, C., Li, F.W.: Failure rates in introductory programming revisited. In: Proceedings of the 2014 Conference on Innovation & #38; Technology in Computer Science Education, ITiCSE 2014, pp. 39\u201344. ACM, New York (2014). \nhttps:\/\/doi.org\/10.1145\/2591708.2591749","DOI":"10.1145\/2591708.2591749"},{"key":"2_CR30","unstructured":"West, M., Herman, G.L., Zilles, C.: PrairieLearn: mastery-based online problem solving with adaptive scoring and recommendations driven by machine learning. In: 2015 ASEE Annual Conference & Exposition. ASEE Conferences, Seattle, Washington (2015)"},{"key":"2_CR31","unstructured":"Whalley, J., et al.: An Australasian study of reading and comprehension skills in novice programmers, using the bloom and SOLO taxonomies. In: Eighth Australasian Computing Education Conference, ACE 2006 (2006)"},{"issue":"2\u20133","key":"2_CR32","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1080\/08993408.2019.1565235","volume":"29","author":"B Xie","year":"2019","unstructured":"Xie, B., et al.: A theory of instruction for introductory programming skills. Comput. Sci. Educ. 29(2\u20133), 205\u2013253 (2019)","journal-title":"Comput. Sci. Educ."},{"key":"2_CR33","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"399","DOI":"10.1007\/978-3-319-93846-2_75","volume-title":"Artificial Intelligence in Education","author":"X Yang","year":"2018","unstructured":"Yang, X., Huang, Y., Zhuang, F., Zhang, L., Yu, S.: Automatic Chinese short answer grading with deep autoencoder. In: Penstein Ros\u00e9, C., et al. (eds.) AIED 2018. LNCS (LNAI), vol. 10948, pp. 399\u2013404. Springer, Cham (2018). \nhttps:\/\/doi.org\/10.1007\/978-3-319-93846-2_75"}],"container-title":["Lecture Notes in Computer Science","Artificial Intelligence in Education"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-52237-7_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,9]],"date-time":"2020-08-09T08:08:22Z","timestamp":1596960502000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-52237-7_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030522360","9783030522377"],"references-count":33,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-52237-7_2","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"30 June 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AIED","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Artificial Intelligence in Education","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ifrane","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Morocco","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 July 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 July 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aied2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/aied2020.nees.com.br\/#\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"214","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"49","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"66","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"23% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}