{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T01:09:54Z","timestamp":1770426594755,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":34,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,3,31]],"date-time":"2025-03-31T00:00:00Z","timestamp":1743379200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,3,31]]},"DOI":"10.1145\/3672608.3707957","type":"proceedings-article","created":{"date-parts":[[2025,5,14]],"date-time":"2025-05-14T18:26:54Z","timestamp":1747247214000},"page":"83-92","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["UKTA: Unified Korean Text Analyzer"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5715-4057","authenticated-orcid":false,"given":"Seokho","family":"Ahn","sequence":"first","affiliation":[{"name":"Department of Electrical and Computer Engineering, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-6714-9684","authenticated-orcid":false,"given":"Junhyung","family":"Park","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-1027-105X","authenticated-orcid":false,"given":"Ganghee","family":"Go","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4161-2882","authenticated-orcid":false,"given":"Chulhui","family":"Kim","sequence":"additional","affiliation":[{"name":"Department of Korean Education, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-5711-1834","authenticated-orcid":false,"given":"Jiho","family":"Jung","sequence":"additional","affiliation":[{"name":"Department of Korean Education, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-1832-8987","authenticated-orcid":false,"given":"Myung Sun","family":"Shin","sequence":"additional","affiliation":[{"name":"Department of Korean Education, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3564-7002","authenticated-orcid":false,"given":"Do-Guk","family":"Kim","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Inha university, Incheon, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8542-2058","authenticated-orcid":false,"given":"Young-Duk","family":"Seo","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Inha University, Incheon, Republic of Korea"}]}],"member":"320","published-online":{"date-parts":[[2025,5,14]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.697"},{"key":"e_1_3_2_1_2_1","first-page":"80","article-title":"Language and thought","volume":"2","author":"Carroll John B","year":"1964","unstructured":"John B Carroll. 1964. Language and thought. Reading Improvement 2, 1 (1964), 80.","journal-title":"Reading Improvement"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1037\/h0093511","article-title":"IV. A statistical and comparative analysis of individual written language samples","volume":"56","author":"Chotlos John W","year":"1944","unstructured":"John W Chotlos. 1944. IV. A statistical and comparative analysis of individual written language samples. Psychological Monographs 56, 2 (1944), 75.","journal-title":"Psychological Monographs"},{"key":"e_1_3_2_1_5_1","volume-title":"The Tool for the Automatic Analysis of Cohesion 2.0: Integrating semantic similarity and text overlap. Behavior research methods 51","author":"Crossley Scott A","year":"2019","unstructured":"Scott A Crossley, Kristopher Kyle, and Mihai Dascalu. 2019. The Tool for the Automatic Analysis of Cohesion 2.0: Integrating semantic similarity and text overlap. Behavior research methods 51 (2019), 14\u201327."},{"key":"e_1_3_2_1_6_1","volume-title":"The tool for the automatic analysis of text cohesion (TAACO): Automatic assessment of local, global, and text cohesion. Behavior research methods 48","author":"Crossley Scott A","year":"2016","unstructured":"Scott A Crossley, Kristopher Kyle, and Danielle S McNamara. 2016. The tool for the automatic analysis of text cohesion (TAACO): Automatic assessment of local, global, and text cohesion. Behavior research methods 48 (2016), 1227\u20131237."},{"key":"e_1_3_2_1_7_1","volume-title":"The Importance of Assessing Student Writing and Improving Writing Instruction. Research Notes. Educational Testing Service","author":"Deane Paul","year":"2022","unstructured":"Paul Deane. 2022. The Importance of Assessing Student Writing and Improving Writing Instruction. Research Notes. Educational Testing Service (2022)."},{"key":"e_1_3_2_1_8_1","volume-title":"Individual Fairness Evaluation for Automated Essay Scoring System","author":"Doewes Afrizal","year":"2022","unstructured":"Afrizal Doewes, Akrati Saxena, Yulong Pei, and Mykola Pechenizkiy. 2022. Individual Fairness Evaluation for Automated Essay Scoring System. International Educational Data Mining Society (2022)."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1093\/oxfordhb\/9780190917982.013.71"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.3758\/BF03195564"},{"key":"e_1_3_2_1_11_1","unstructured":"Maarten Grootendorst. [n. d.]. KeyBERT. https:\/\/github.com\/MaartenGr\/keyBERT. Last accessed on 2023-08-09."},{"key":"e_1_3_2_1_12_1","volume-title":"Probl\u00e8mes et m\u00e9thodes de la statistique linguistique. (No Title)","author":"Guiraud Pierre","year":"1959","unstructured":"Pierre Guiraud. 1959. Probl\u00e8mes et m\u00e9thodes de la statistique linguistique. (No Title) (1959)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","first-page":"3","DOI":"10.15858\/engtea.74.3.201909.3","article-title":"Lexical Richness in EFL Undergraduate Students","volume":"74","author":"Ha Hye Seung","year":"2019","unstructured":"Hye Seung Ha. 2019. Lexical Richness in EFL Undergraduate Students' Academic Writing. English Teaching 74, 3 (2019), 3\u201328.","journal-title":"Academic Writing. English Teaching"},{"key":"e_1_3_2_1_14_1","volume-title":"H. Daller, J. Milton & J","author":"Hout Roeland","year":"2007","unstructured":"Roeland Hout and Anne Vermeer. 2007. Comparing measures of lexical richness. In: H. Daller, J. Milton & J. Treffers-Daller (eds.), Modelling and assessing vocabulary knowledge (93\u2013116). Cambridge: Cambridge University Press. (01 2007)."},{"key":"e_1_3_2_1_15_1","volume-title":"Proceedings of the Second Workshop on Simple and Efficient Natural Language Processing. Association for Computational Linguistics, Virtual, 32\u201338","author":"Jeon Sungho","year":"2021","unstructured":"Sungho Jeon and Michael Strube. 2021. Countering the Influence of Essay Length in Neural Essay Scoring. In Proceedings of the Second Workshop on Simple and Efficient Natural Language Processing. Association for Computational Linguistics, Virtual, 32\u201338."},{"key":"e_1_3_2_1_17_1","first-page":"1","article-title":"Studies in language behavior: A program of research","volume":"56","author":"Johnson Wendell","year":"1944","unstructured":"Wendell Johnson. 1944. Studies in language behavior: A program of research. Psychological Monographs 56, 2 (1944), 1\u201315.","journal-title":"Psychological Monographs"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.softx.2024.101659"},{"key":"e_1_3_2_1_19_1","unstructured":"Kiyoung Kim. 2020. Pretrained Language Models For Korean. https:\/\/github.com\/kiyoungkim1\/LMkor."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.21850\/kge.2024.50..193"},{"key":"e_1_3_2_1_21_1","volume-title":"Proceedings of the the Annual Conference on Human and Cognitive Language Technology. 354\u2013359","author":"Lee Yejin","year":"2022","unstructured":"Yejin Lee, Youngjin Jang, Tae il Kim, Sung-Won Choi, and Harksoo Kim. 2022. An Automated Essay Scoring Pipeline Model based on Deep Neural Networks Reflecting Argumentation Structure Information. In Proceedings of the the Annual Conference on Human and Cognitive Language Technology. 354\u2013359."},{"key":"e_1_3_2_1_22_1","volume-title":"Proceedings of the 27th International Conference on Computational Linguistics. Association for Computational Linguistics","author":"Matteson Andrew","year":"2018","unstructured":"Andrew Matteson, Chanhee Lee, Youngbum Kim, and Heuiseok Lim. 2018. Rich Character-Level Information for Korean Morphological Analysis and Part-of-Speech Tagging. In Proceedings of the 27th International Conference on Computational Linguistics. Association for Computational Linguistics, Santa Fe, New Mexico, USA, 2482\u20132492. https:\/\/aclanthology.org\/C18-1210"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1177\/0265532207080767"},{"key":"e_1_3_2_1_25_1","volume-title":"vocd-D, and HD-D: A validation study of sophisticated approaches to lexical diversity assessment. Behavior research methods 42, 2","author":"McCarthy Philip M","year":"2010","unstructured":"Philip M McCarthy and Scott Jarvis. 2010. MTLD, vocd-D, and HD-D: A validation study of sophisticated approaches to lexical diversity assessment. Behavior research methods 42, 2 (2010), 381\u2013392."},{"key":"e_1_3_2_1_26_1","volume-title":"Linguistic features of writing quality. Written communication 27, 1","author":"McNamara Danielle S","year":"2010","unstructured":"Danielle S McNamara, Scott A Crossley, and Philip M McCarthy. 2010. Linguistic features of writing quality. Written communication 27, 1 (2010), 57\u201386."},{"key":"e_1_3_2_1_27_1","volume-title":"Contextual correlates of semantic similarity. Language and cognitive processes 6, 1","author":"Miller George A","year":"1991","unstructured":"George A Miller and Walter G Charles. 1991. Contextual correlates of semantic similarity. Language and cognitive processes 6, 1 (1991), 1\u201328."},{"key":"e_1_3_2_1_28_1","unstructured":"Sungjoon Park Jihyung Moon Sungdong Kim Won Ik Cho Jiyoon Han Jangwon Park Chisung Song Junseong Kim Yongsook Song Taehwan Oh Joohong Lee Juhyun Oh Sungwon Lyu Younghoon Jeong Inkwon Lee Sangwoo Seo Dongjun Lee Hyunwoo Kim Myeonghwa Lee Seongbo Jang Seungwon Do Sunkyoung Kim Kyungtae Lim Jongwon Lee Kyumin Park Jamin Shin Seonghyun Kim Lucy Park Alice Oh Jungwoo Ha and Kyunghyun Cho. 2021. KLUE: Korean Language Understanding Evaluation. arXiv:cs.CL\/2105.09680"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-021-10068-2"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1002\/j.2333-8504.2012.tb02284.x"},{"key":"e_1_3_2_1_31_1","volume-title":"Sentence similarity measures for fine-grained estimation of topical relevance in learner essays. arXiv preprint arXiv:1606.03144","author":"Rei Marek","year":"2016","unstructured":"Marek Rei and Ronan Cummins. 2016. Sentence similarity measures for fine-grained estimation of topical relevance in learner essays. arXiv preprint arXiv:1606.03144 (2016)."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"crossref","unstructured":"Nils Reimers and Iryna Gurevych. 2019. Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks. arXiv:cs.CL\/1908.10084","DOI":"10.18653\/v1\/D19-1410"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.sbspro.2013.10.668"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.coling-main.535"},{"key":"e_1_3_2_1_35_1","volume-title":"Comparing measures of lexical richness. Modelling and assessing vocabulary knowledge 93","author":"Hout Roeland Van","year":"2007","unstructured":"Roeland Van Hout and Anne Vermeer. 2007. Comparing measures of lexical richness. Modelling and assessing vocabulary knowledge 93 (2007), 115."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.naacl-main.249"},{"key":"e_1_3_2_1_37_1","first-page":"711","article-title":"The development study of an automated scoring program for Korean essays","volume":"36","author":"Yongsang Lee","year":"2023","unstructured":"Lee Yongsang, Yoonsek Choi, and Seung-Hyun Lee. 2023. The development study of an automated scoring program for Korean essays, PASTA-I. Journal of Educational Evaluation 36, 4 (2023), 711\u2013730.","journal-title":"Journal of Educational Evaluation"}],"event":{"name":"SAC '25: 40th ACM\/SIGAPP Symposium on Applied Computing","location":"Catania International Airport Catania Italy","acronym":"SAC '25","sponsor":["SIGAPP ACM Special Interest Group on Applied Computing"]},"container-title":["Proceedings of the 40th ACM\/SIGAPP Symposium on Applied Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3672608.3707957","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3672608.3707957","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:57:37Z","timestamp":1750298257000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3672608.3707957"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,31]]},"references-count":34,"alternative-id":["10.1145\/3672608.3707957","10.1145\/3672608"],"URL":"https:\/\/doi.org\/10.1145\/3672608.3707957","relation":{},"subject":[],"published":{"date-parts":[[2025,3,31]]},"assertion":[{"value":"2025-05-14","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}