{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:10:31Z","timestamp":1750219831912,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,6,16]],"date-time":"2023-06-16T00:00:00Z","timestamp":1686873600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,6,16]]},"DOI":"10.1145\/3608218.3608227","type":"proceedings-article","created":{"date-parts":[[2023,8,24]],"date-time":"2023-08-24T18:17:49Z","timestamp":1692901069000},"page":"118-124","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Research on Graded Chinese Text Corpus for International Chinese Language Education"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-1104-8085","authenticated-orcid":false,"given":"Xiaojun","family":"Yin","sequence":"first","affiliation":[{"name":"Research Institute of International Chinese Language Education\/ College of International Chinese Studies, Beijing Language and Culture University, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9866-9380","authenticated-orcid":false,"given":"Guolong","family":"Song","sequence":"additional","affiliation":[{"name":"ByteDance Technology, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-8339-2769","authenticated-orcid":false,"given":"Hongbin","family":"Wang","sequence":"additional","affiliation":[{"name":"Research Institute of International Chinese Language Education, Beijing Language and Culture University, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2023,8,24]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"A formula for predicting readability: Instructions. Educational research bulletin, 2 (February","author":"Dale E","year":"1948","unstructured":"Dale E , Chall J S . 1948. A formula for predicting readability: Instructions. Educational research bulletin, 2 (February 1948 ), 37-54. Dale E, Chall J S. 1948. A formula for predicting readability: Instructions. Educational research bulletin, 2 (February 1948), 37-54."},{"key":"e_1_3_2_1_2_1","article-title":"Smog grading-a new readability formula","author":"Mc Laughlin G H","year":"1969","unstructured":"Mc Laughlin G H . 1969 . Smog grading-a new readability formula . Journal of reading, 8 ( May 1969), 639-646. Mc Laughlin G H. 1969. Smog grading-a new readability formula. Journal of reading, 8 (May 1969), 639-646.","journal-title":"Journal of reading, 8"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.21236\/ADA006655"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.3115\/1219840.1219905"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.3115\/1613715.1613742"},{"key":"e_1_3_2_1_6_1","volume-title":"Proceedings of the seventh workshop on building educational applications using NLP. Association for Computational LinguisticsN. PA, United States. 163-173","author":"Vajjala S","year":"2012","unstructured":"Vajjala S , Meurers D. 2012 . On improving the accuracy of readability classification using insights from second language acquisition . In Proceedings of the seventh workshop on building educational applications using NLP. Association for Computational LinguisticsN. PA, United States. 163-173 . Vajjala S, Meurers D. 2012. On improving the accuracy of readability classification using insights from second language acquisition. In Proceedings of the seventh workshop on building educational applications using NLP. Association for Computational LinguisticsN. PA, United States. 163-173."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-0505"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.bea-1.1"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1162\/coli_a_00398"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1075\/itl.165.2.01col"},{"key":"e_1_3_2_1_12_1","volume-title":"Data-driven Applied Linguistic Research. Modern Foreign Languages, 4 (April","author":"Liu Haitao","year":"2021","unstructured":"Liu Haitao . 2021. Data-driven Applied Linguistic Research. Modern Foreign Languages, 4 (April 2021 ), 462-469. Liu Haitao. 2021. Data-driven Applied Linguistic Research. Modern Foreign Languages, 4 (April 2021), 462-469."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.16499\/j.cnki.1003-5397.2020.01.014"},{"key":"e_1_3_2_1_14_1","article-title":"Automatic grading of Chinese text reading difficulty based on multiple linguistic features and deep features","author":"Cheng Yong","year":"2020","unstructured":"Cheng Yong , Xu Dekuan, Dong Jun .b. 2020 b. Automatic grading of Chinese text reading difficulty based on multiple linguistic features and deep features . Journal of Chinese Information Processing, 4 ( April 2020), 101-110. Cheng Yong, Xu Dekuan, Dong Jun.b. 2020b. Automatic grading of Chinese text reading difficulty based on multiple linguistic features and deep features. Journal of Chinese Information Processing, 4 (April 2020), 101-110.","journal-title":"Journal of Chinese Information Processing, 4"},{"key":"e_1_3_2_1_15_1","article-title":"Research on sentence difficulty assessment of Chinese textbooks based on crowdsourcing annotation","author":"Yu Dong","year":"2020","unstructured":"Yu Dong , Wu Siyuan, Geng Chaoyang , Tang Yuling. 2020 . Research on sentence difficulty assessment of Chinese textbooks based on crowdsourcing annotation . Journal of Chinese Information Processing, 2 ( February 2020), 16-26. Yu Dong, Wu Siyuan, Geng Chaoyang, Tang Yuling. 2020. Research on sentence difficulty assessment of Chinese textbooks based on crowdsourcing annotation. Journal of Chinese Information Processing, 2 (February 2020), 16-26.","journal-title":"Journal of Chinese Information Processing, 2"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.16499\/j.cnki.1003-5397.2021.02.010"},{"volume-title":"The Commercial Press","author":"Huang Changning","key":"e_1_3_2_1_17_1","unstructured":"Huang Changning , Li Juanzi. 2002. Corpus Linguistics. The Commercial Press . Beijing, China . Huang Changning, Li Juanzi. 2002. Corpus Linguistics. The Commercial Press. Beijing, China."},{"key":"e_1_3_2_1_18_1","volume-title":"A research on the automatic readability assessment of international Chinese reading materials based on regression model.The Chinese Journal of ICT in Education, 15 (August","author":"Sun Weiwei","year":"2018","unstructured":"Sun Weiwei , Xia Jing, Zeng Zhizhong . 2018. A research on the automatic readability assessment of international Chinese reading materials based on regression model.The Chinese Journal of ICT in Education, 15 (August 2018 ), 67-74. Sun Weiwei, Xia Jing, Zeng Zhizhong. 2018. A research on the automatic readability assessment of international Chinese reading materials based on regression model.The Chinese Journal of ICT in Education, 15 (August 2018), 67-74."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.13724\/j.cnki.ctiw.20200103.007"},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of the NAACL HLT 2010 Workshop on Computational Linguistics and Writing: Writing Processes and Authoring Aids. Association for Computational LinguisticsN. PA, United States. 42-50","author":"Napoles C","year":"2010","unstructured":"Napoles C , Dredze M. 2010 . Learning simple Wikipedia: A cogitation in ascertaining abecedarian language . In Proceedings of the NAACL HLT 2010 Workshop on Computational Linguistics and Writing: Writing Processes and Authoring Aids. Association for Computational LinguisticsN. PA, United States. 42-50 . Napoles C, Dredze M. 2010. Learning simple Wikipedia: A cogitation in ascertaining abecedarian language. In Proceedings of the NAACL HLT 2010 Workshop on Computational Linguistics and Writing: Writing Processes and Authoring Aids. Association for Computational LinguisticsN. PA, United States. 42-50."},{"key":"e_1_3_2_1_21_1","first-page":"378","volume-title":"Proceedings of the Third Student Workshop on Computational Linguistics","author":"Zou Hongjian","year":"2006","unstructured":"Zou Hongjian , Yang Erhong. 2006 . Text categorization of Complexity Orienting the Press Teaching of Chinese for Foreigners . In Proceedings of the Third Student Workshop on Computational Linguistics . Shenyang, China , 378 - 182 . Zou Hongjian, Yang Erhong. 2006. Text categorization of Complexity Orienting the Press Teaching of Chinese for Foreigners. In Proceedings of the Third Student Workshop on Computational Linguistics. Shenyang, China, 378-182."},{"volume-title":"A study on the syntactic complexity of secondary school English learners' essays based on syntactic annotation corpus. Master's Thesis","author":"Bi Peng 0.","key":"e_1_3_2_1_22_1","unstructured":"Bi Peng . 202 0. A study on the syntactic complexity of secondary school English learners' essays based on syntactic annotation corpus. Master's Thesis , Chinese Proficiency Test Center , Zhejiang University , Zhejiang. Bi Peng. 2020. A study on the syntactic complexity of secondary school English learners' essays based on syntactic annotation corpus. Master's Thesis, Chinese Proficiency Test Center, Zhejiang University, Zhejiang."},{"key":"e_1_3_2_1_23_1","volume-title":"A comparative study of linguistic features in Korean students' writing in different genres. Language Teaching and Linguistic Studies, 5 (September","author":"Wu Jifeng","year":"2019","unstructured":"Wu Jifeng . 2019. A comparative study of linguistic features in Korean students' writing in different genres. Language Teaching and Linguistic Studies, 5 (September 2019 ), 1-12. Wu Jifeng. 2019. A comparative study of linguistic features in Korean students' writing in different genres. Language Teaching and Linguistic Studies, 5 (September 2019), 1-12."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.16499\/j.cnki.1003-5397.2021.01.016"},{"volume-title":"A research on the readability of texts for second language learners. Master's Thesis","author":"Cai Jianyong 0.","key":"e_1_3_2_1_25_1","unstructured":"Cai Jianyong . 202 0. A research on the readability of texts for second language learners. Master's Thesis , Chinese Proficiency Test Center, Beijing Language and Culture University , Beijing. Cai Jianyong. 2020. A research on the readability of texts for second language learners. Master's Thesis, Chinese Proficiency Test Center, Beijing Language and Culture University, Beijing."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1037\/0278-7393.16.3.417"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1162\/COLI_a_00255"},{"volume-title":"Corpus linguistics: Method, theory and practice","author":"McEnery T","key":"e_1_3_2_1_28_1","unstructured":"McEnery T , Hardie A. 2011. Corpus linguistics: Method, theory and practice . Cambridge University Press . London, British. McEnery T, Hardie A. 2011. Corpus linguistics: Method, theory and practice. Cambridge University Press. London, British."},{"key":"e_1_3_2_1_29_1","volume-title":"Web-based Fourth Generation Corpus Analysis Tools and the BFSU CQPweb Case. Technology Enhanced Foreign Language Education, 5 (September","author":"Xu Jiajin","year":"2014","unstructured":"Xu Jiajin , Wu Liangping. 2014. Web-based Fourth Generation Corpus Analysis Tools and the BFSU CQPweb Case. Technology Enhanced Foreign Language Education, 5 (September 2014 ), 10-15+56. Xu Jiajin, Wu Liangping. 2014. Web-based Fourth Generation Corpus Analysis Tools and the BFSU CQPweb Case. Technology Enhanced Foreign Language Education, 5 (September 2014), 10-15+56."},{"volume-title":"About Corpus Linguistics","author":"Liang Maocheng","key":"e_1_3_2_1_30_1","unstructured":"Liang Maocheng . 2016. About Corpus Linguistics . Shanghai Foreign Language Education Press . Shanghai, China. Liang Maocheng. 2016. About Corpus Linguistics. Shanghai Foreign Language Education Press. Shanghai, China."},{"key":"e_1_3_2_1_31_1","unstructured":"Wei Naixing Li Wenzhong 2005. Pu Jianzhong. Corpora in Use. Shanghai Foreign Language Education. Shanghai China.  Wei Naixing Li Wenzhong 2005. Pu Jianzhong. Corpora in Use. Shanghai Foreign Language Education. Shanghai China."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.16499\/j.cnki.1003-5397.2011.02.017"},{"key":"e_1_3_2_1_33_1","volume-title":"A Standard Corpus of Present-Day Edited American English, for use with Digital Computers","author":"Francis W. N. , H.","year":"1964","unstructured":"Francis , W. N. , H. Ku\u010dera . 1979. A Standard Corpus of Present-Day Edited American English, for use with Digital Computers . Brown University , Providence . 1964 . Revised 1971. Revised and amplified 1979. Francis, W. N. , H. Ku\u010dera. 1979. A Standard Corpus of Present-Day Edited American English, for use with Digital Computers. Brown University, Providence. 1964. Revised 1971. Revised and amplified 1979."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1017\/S1360674304001261"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.16499\/j.cnki.1003-5397.2015.02.017"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.plrev.2018.06.006"},{"volume-title":"Data enhancement technology for Chinese language models based on generative adversarial network. Master's Thesis","author":"Zhao Pengfei","key":"e_1_3_2_1_37_1","unstructured":"Zhao Pengfei . 2018. Data enhancement technology for Chinese language models based on generative adversarial network. Master's Thesis , Chinese Proficiency Test Center , Harbin Institute of Technology, Harbin. Zhao Pengfei. 2018. Data enhancement technology for Chinese language models based on generative adversarial network. Master's Thesis, Chinese Proficiency Test Center, Harbin Institute of Technology, Harbin."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V34I05.6233"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1670"}],"event":{"name":"ICBDE 2023: 2023 the 6th International Conference on Big Data and Education","acronym":"ICBDE 2023","location":"Jinan China"},"container-title":["Proceedings of the 2023 6th International Conference on Big Data and Education"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3608218.3608227","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3608218.3608227","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:46:33Z","timestamp":1750178793000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3608218.3608227"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,16]]},"references-count":39,"alternative-id":["10.1145\/3608218.3608227","10.1145\/3608218"],"URL":"https:\/\/doi.org\/10.1145\/3608218.3608227","relation":{},"subject":[],"published":{"date-parts":[[2023,6,16]]},"assertion":[{"value":"2023-08-24","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}