{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,27]],"date-time":"2025-07-27T07:21:15Z","timestamp":1753600875080,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":38,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819794423"},{"type":"electronic","value":"9789819794430"}],"license":[{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-97-9443-0_33","type":"book-chapter","created":{"date-parts":[[2024,10,31]],"date-time":"2024-10-31T16:31:04Z","timestamp":1730392264000},"page":"377-388","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["YoloGPT: Enhancing Chinese Character Recognition and\u00a0Correction"],"prefix":"10.1007","author":[{"given":"Sheng","family":"Yang","sequence":"first","affiliation":[]},{"given":"Zhanbiao","family":"Lian","sequence":"additional","affiliation":[]},{"given":"Kunyu","family":"Li","sequence":"additional","affiliation":[]},{"given":"Peilin","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Fengge","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Junsuo","family":"Zhao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,1]]},"reference":[{"key":"33_CR1","unstructured":"Achiam, J., et\u00a0al.: GPT-4 technical report (2023)"},{"key":"33_CR2","doi-asserted-by":"crossref","unstructured":"Wang, D., et al.: A hybrid approach to automatic corpus generation for Chinese spelling check. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing (EMNLP), Brussels, Belgium (2018)","DOI":"10.18653\/v1\/D18-1273"},{"key":"33_CR3","doi-asserted-by":"publisher","unstructured":"Dong, C., et al.: A survey of natural language generation. ACM Comput. Surv. 55(8), 173:1\u2013173:38 (2023). https:\/\/doi.org\/10.1145\/3554727","DOI":"10.1145\/3554727"},{"key":"33_CR4","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"issue":"1","key":"33_CR5","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1109\/TPAMI.2015.2437384","volume":"38","author":"R Girshick","year":"2015","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Region-based convolutional networks for accurate object detection and segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 38(1), 142\u2013158 (2015)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"33_CR6","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"33_CR7","doi-asserted-by":"publisher","unstructured":"Huang, H., et al.: A frustratingly easy plug-and-play detection-and-reasoning module for Chinese spelling check. In: Bouamor, H., Pino, J., Bali, K. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, 6\u201310 December 2023, pp. 11514\u201311525. Association for Computational Linguistics (2023). https:\/\/doi.org\/10.18653\/v1\/2023.findings-emnlp.771","DOI":"10.18653\/v1\/2023.findings-emnlp.771"},{"key":"33_CR8","unstructured":"Hussain, M.: Yolov5, yolov8 and yolov10: the go-to detectors for real-time vision (2024). https:\/\/arxiv.org\/abs\/2407.02988"},{"key":"33_CR9","unstructured":"Katinskaia, A., Yangarber, R.: GPT-3.5 for grammatical error correction. arXiv preprint arXiv:2405.08469 (2024)"},{"key":"33_CR10","doi-asserted-by":"publisher","unstructured":"Li, Y., et al.: On the (in)effectiveness of large language models for Chinese text correction. CoRR abs\/2307.09007 (2023). https:\/\/doi.org\/10.48550\/arxiv.2307.09007","DOI":"10.48550\/arxiv.2307.09007"},{"key":"33_CR11","doi-asserted-by":"publisher","unstructured":"Li, Y., et al.: Learning from the dictionary: heterogeneous knowledge guided fine-tuning for Chinese spell checking. In: Goldberg, Y., Kozareva, Z., Zhang, Y. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2022, Abu Dhabi, United Arab Emirates, 7\u201311 December 2022, pp. 238\u2013249. Association for Computational Linguistics (2022). https:\/\/doi.org\/10.18653\/v1\/2022.findings-emnlp.18","DOI":"10.18653\/v1\/2022.findings-emnlp.18"},{"key":"33_CR12","unstructured":"Li, Y., et al.: Rethinking the roles of large language models in Chinese grammatical error correction (2024). https:\/\/arxiv.org\/abs\/2402.11420"},{"key":"33_CR13","doi-asserted-by":"publisher","unstructured":"Li, Y., Shen, Y.: Towards real-world writing assistance: a Chinese character checking benchmark with faked and misspelled characters. CoRR abs\/2311.11268 (2023). https:\/\/doi.org\/10.48550\/arxiv.2311.11268","DOI":"10.48550\/arxiv.2311.11268"},{"key":"33_CR14","doi-asserted-by":"publisher","unstructured":"Li, Y., et al.: The past mistake is the future wisdom: error-driven contrastive probability optimization for Chinese spell checking. In: Muresan, S., Nakov, P., Villavicencio, A. (eds.) Findings of the Association for Computational Linguistics: ACL 2022, Dublin, Ireland, 22\u201327 May 2022, pp. 3202\u20133213. Association for Computational Linguistics (2022). https:\/\/doi.org\/10.18653\/v1\/2022.findings-acl.252","DOI":"10.18653\/v1\/2022.findings-acl.252"},{"key":"33_CR15","doi-asserted-by":"publisher","unstructured":"Li, Y., et al.: When LLMs meet cunning questions: a fallacy understanding benchmark for large language models. CoRR abs\/2402.11100 (2024). https:\/\/doi.org\/10.48550\/arxiv.2402.11100","DOI":"10.48550\/arxiv.2402.11100"},{"key":"33_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1007\/978-3-319-10602-1_48","volume-title":"Computer Vision \u2013 ECCV 2014","author":"T-Y Lin","year":"2014","unstructured":"Lin, T.-Y., et al.: Microsoft COCO: common objects in context. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 740\u2013755. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48"},{"issue":"9","key":"33_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3560815","volume":"55","author":"P Liu","year":"2023","unstructured":"Liu, P., Yuan, W., Fu, J., Jiang, Z., Hayashi, H., Neubig, G.: Pre-train, prompt, and predict: a systematic survey of prompting methods in natural language processing. ACM Comput. Surv. 55(9), 1\u201335 (2023)","journal-title":"ACM Comput. Surv."},{"key":"33_CR18","doi-asserted-by":"publisher","unstructured":"Liu, R., Li, Y., Tao, L., Liang, D., Zheng, H.: Are we ready for a new paradigm shift? A survey on visual deep MLP. Patterns 3(7), 100520 (2022). https:\/\/doi.org\/10.1016\/j.patter.2022.100520","DOI":"10.1016\/j.patter.2022.100520"},{"key":"33_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1007\/978-3-319-46448-0_2","volume-title":"Computer Vision \u2013 ECCV 2016","author":"W Liu","year":"2016","unstructured":"Liu, W., et al.: SSD: single shot MultiBox detector. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9905, pp. 21\u201337. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2"},{"key":"33_CR20","doi-asserted-by":"publisher","unstructured":"Ma, S., et al.: Linguistic rules-based corpus generation for native Chinese grammatical error correction. In: Goldberg, Y., Kozareva, Z., Zhang, Y. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2022, Abu Dhabi, United Arab Emirates, 7\u201311 December 2022, pp. 576\u2013589. Association for Computational Linguistics (2022). https:\/\/doi.org\/10.18653\/v1\/2022.findings-emnlp.40","DOI":"10.18653\/v1\/2022.findings-emnlp.40"},{"key":"33_CR21","doi-asserted-by":"crossref","unstructured":"Ma, S., et al.: Linguistic rules-based corpus generation for native Chinese grammatical error correction. In: Findings of the Association for Computational Linguistics: EMNLP 2022 (2022)","DOI":"10.18653\/v1\/2022.findings-emnlp.40"},{"issue":"1","key":"33_CR22","doi-asserted-by":"publisher","first-page":"975","DOI":"10.1007\/s11042-021-11425-7","volume":"81","author":"R Mondal","year":"2022","unstructured":"Mondal, R., Malakar, S., Barney Smith, E.H., Sarkar, R.: Handwritten english word recognition using a deep learning based object detection architecture. Multimedia Tools Appl. 81(1), 975\u20131000 (2022)","journal-title":"Multimedia Tools Appl."},{"key":"33_CR23","doi-asserted-by":"crossref","unstructured":"Pryzant, R., Iter, D., Li, J., Lee, Y.T., Zhu, C., Zeng, M.: Automatic prompt optimization with \u201cgradient descent\u201d and beam search. arXiv preprint arXiv:2305.03495 (2023)","DOI":"10.18653\/v1\/2023.emnlp-main.494"},{"key":"33_CR24","doi-asserted-by":"publisher","unstructured":"Qin, L., et al.: Multilingual large language model: a survey of resources, taxonomy and frontiers. CoRR abs\/2404.04925 (2024). https:\/\/doi.org\/10.48550\/arxiv.2404.04925","DOI":"10.48550\/arxiv.2404.04925"},{"key":"33_CR25","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"33_CR26","doi-asserted-by":"crossref","unstructured":"Sahoo, P., Singh, A.K., Saha, S., Jain, V., Mondal, S., Chadha, A.: A systematic survey of prompt engineering in large language models: techniques and applications. arXiv preprint arXiv:2402.07927 (2024)","DOI":"10.1007\/979-8-8688-0569-1_4"},{"key":"33_CR27","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1007\/978-981-99-7962-2_39","volume-title":"ICDICI 2023","author":"M Sohan","year":"2024","unstructured":"Sohan, M., Sai Ram, T., Reddy, R., Venkata, C.: A review on YOLOv8 and its advancements. In: Jacob, I.J., Piramuthu, S., Falkowski-Gilski, P. (eds.) ICDICI 2023, pp. 529\u2013545. Springer, Singapore (2024). https:\/\/doi.org\/10.1007\/978-981-99-7962-2_39"},{"key":"33_CR28","doi-asserted-by":"publisher","unstructured":"Tseng, Y.H., Lee, L.H., Chang, L.P., Chen, H.H.: Introduction to SIGHAN 2015 bake-off for Chinese spelling check. In: Yu, L.C., Sui, Z., Zhang, Y., Ng, V. (eds.) Proceedings of the Eighth SIGHAN Workshop on Chinese Language Processing, Beijing, China, pp. 32\u201337. Association for Computational Linguistics (2015). https:\/\/doi.org\/10.18653\/v1\/W15-3106. https:\/\/aclanthology.org\/W15-3106","DOI":"10.18653\/v1\/W15-3106"},{"key":"33_CR29","unstructured":"Wu, S.H., Liu, C.L., Lee, L.H.: Chinese spelling check evaluation at SIGHAN bake-off 2013. In: Yu, L.C., Tseng, Y.H., Zhu, J., Ren, F. (eds.) Proceedings of the Seventh SIGHAN Workshop on Chinese Language Processing, Nagoya, Japan, pp. 35\u201342. Asian Federation of Natural Language Processing (2013). https:\/\/aclanthology.org\/W13-4406"},{"key":"33_CR30","doi-asserted-by":"publisher","unstructured":"Ye, J., Li, Y., Ma, S., Xie, R., Wu, W., Zheng, H.: Focus is what you need for Chinese grammatical error correction. CoRR abs\/2210.12692 (2022). https:\/\/doi.org\/10.48550\/arxiv.2210.12692","DOI":"10.48550\/arxiv.2210.12692"},{"key":"33_CR31","doi-asserted-by":"publisher","unstructured":"Ye, J., et al.: CLEME: debiasing multi-reference evaluation for grammatical error correction. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, 6\u201310 December 2023, pp. 6174\u20136189. Association for Computational Linguistics (2023). https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.378","DOI":"10.18653\/v1\/2023.emnlp-main.378"},{"key":"33_CR32","doi-asserted-by":"publisher","unstructured":"Yu, L.C., Lee, L.H., Tseng, Y.H., Chen, H.H.: Overview of SIGHAN 2014 bake-off for Chinese spelling check. In: Sun, L., Zong, C., Zhang, M., Levow, G.A. (eds.) Proceedings of the Third CIPS-SIGHAN Joint Conference on Chinese Language Processing, Wuhan, China, pp. 126\u2013132. Association for Computational Linguistics (2014). https:\/\/doi.org\/10.3115\/v1\/W14-6820. https:\/\/aclanthology.org\/W14-6820","DOI":"10.3115\/v1\/W14-6820"},{"key":"33_CR33","doi-asserted-by":"publisher","unstructured":"Zhang, D., et al.: Contextual similarity is more valuable than character similarity: an empirical study for Chinese spell checking. In: IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, 4\u201310 June 2023, pp.\u00a01\u20135. IEEE (2023). https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10095675","DOI":"10.1109\/ICASSP49357.2023.10095675"},{"key":"33_CR34","doi-asserted-by":"crossref","unstructured":"Zhang, Y., et al.: MuCGEC: a multi-reference multi-source evaluation dataset for Chinese grammatical error correction. In: Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Seattle, United States, pp. 3118\u20133130. Association for Computational Linguistics (2022). https:\/\/aclanthology.org\/2022.naacl-main.227","DOI":"10.18653\/v1\/2022.naacl-main.227"},{"key":"33_CR35","doi-asserted-by":"crossref","unstructured":"Zhang, Y., et al.: NaSGEC: a multi-domain Chinese grammatical error correction dataset from native speaker texts (2023)","DOI":"10.18653\/v1\/2023.findings-acl.630"},{"key":"33_CR36","unstructured":"Zhao, H., Wang, B., Wu, D., Che, W., Chen, Z., Wang, S.: Overview of CTC 2021: Chinese text correction for native speakers (2022). https:\/\/arxiv.org\/abs\/2208.05681"},{"key":"33_CR37","unstructured":"Zhao, W.X., et al.: A survey of large language models. arXiv preprint arXiv:2303.18223 (2023)"},{"issue":"3","key":"33_CR38","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1109\/JPROC.2023.3238524","volume":"111","author":"Z Zou","year":"2023","unstructured":"Zou, Z., Chen, K., Shi, Z., Guo, Y., Ye, J.: Object detection in 20 years: a survey. Proc. IEEE 111(3), 257\u2013276 (2023)","journal-title":"Proc. IEEE"}],"container-title":["Lecture Notes in Computer Science","Natural Language Processing and Chinese Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-97-9443-0_33","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,30]],"date-time":"2024-11-30T16:09:13Z","timestamp":1732982953000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-97-9443-0_33"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,1]]},"ISBN":["9789819794423","9789819794430"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-981-97-9443-0_33","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,1]]},"assertion":[{"value":"1 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"NLPCC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"CCF International Conference on Natural Language Processing and Chinese Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hangzhou","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"nlpcc2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/tcci.ccf.org.cn\/conference\/2024\/index.php","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}