{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,23]],"date-time":"2025-11-23T15:25:18Z","timestamp":1763911518935,"version":"3.41.0"},"publisher-location":"New York, New York, USA","reference-count":23,"publisher":"ACM Press","license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1145\/3368926.3369686","type":"proceedings-article","created":{"date-parts":[[2019,12,20]],"date-time":"2019-12-20T13:30:11Z","timestamp":1576848611000},"page":"132-138","source":"Crossref","is-referenced-by-count":16,"title":["OCR Error Correction for Unconstrained Vietnamese Handwritten Text"],"prefix":"10.1145","author":[{"given":"Quoc-Dung","family":"Nguyen","sequence":"first","affiliation":[{"name":"Van Lang University, Ho Chi Minh, Vietnam, Technical University of Ostrava, Ostrava-Poruba, Czech Republic"}]},{"given":"Duc-Anh","family":"Le","sequence":"additional","affiliation":[{"name":"Center for Open Data in the Humanities, Tokyo, Japan"}]},{"given":"Ivan","family":"Zelinka","sequence":"additional","affiliation":[{"name":"Technical University of Ostrava, Ostrava-Poruba, Czech Republic"}]}],"member":"320","reference":[{"key":"key-10.1145\/3368926.3369686-1","doi-asserted-by":"crossref","unstructured":"Abdelhak Boukharouba and Abdelhak Bennia. 2017. Novel feature extraction technique for the recognition of handwritten digits. Applied Computing and Informatics 13, 1 (2017), 19--26. https:\/\/doi.org\/10.1016\/j.aci.2015.05.001","DOI":"10.1016\/j.aci.2015.05.001"},{"key":"key-10.1145\/3368926.3369686-2","doi-asserted-by":"crossref","unstructured":"Amit Choudhary, Rahul Rishi, and Savita Ahlawat. 2013. Offline Handwritten Character Recognition Using Features Extracted from Binarization Technique. In AASRI Procedia, Vol. 4. 306--312. https:\/\/doi.org\/10.1016\/j.aasri.2013.10.045","DOI":"10.1016\/j.aasri.2013.10.045"},{"key":"key-10.1145\/3368926.3369686-3","doi-asserted-by":"crossref","unstructured":"Apurva A. Desai. 2010. Gujarati Handwritten Numeral Optical Character Reorganization Through Neural Network. Pattern Recognition 43, 7 (2010), 2582--2589. https:\/\/doi.org\/10.1016\/j.patcog.2010.01.008","DOI":"10.1016\/j.patcog.2010.01.008"},{"key":"key-10.1145\/3368926.3369686-4","unstructured":"Alex Graves, Marcus Liwicki, Horst Bunke, J&#252;rgen Schmidhuber, and Santiago Fern&#225;ndez. 2008. Unconstrained On-line Handwriting Recognition with Recurrent Neural Networks. In Advances in Neural Information Processing Systems 20, J. C. Platt, D. Koller, Y. Singer, and S. T. Roweis (Eds.). Curran Associates, Inc., 577--584."},{"key":"key-10.1145\/3368926.3369686-5","doi-asserted-by":"crossref","unstructured":"A. Graves, M. Liwicki, S. Fern&#225;ndez, R. Bertolami, H. Bunke, and J. Schmidhuber. 2009. A Novel Connectionist System for Unconstrained Handwriting Recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence 31, 5 (2009), 855--868. https:\/\/doi.org\/10.1109\/TPAMI.2008.137","DOI":"10.1109\/TPAMI.2008.137"},{"key":"key-10.1145\/3368926.3369686-6","doi-asserted-by":"crossref","unstructured":"Aminul Islam and Diana Inkpen. 2008. Semantic Text Similarity Using Corpus-based Word Similarity and String Similarity. ACM Trans. Knowl. Discov. Data 2, 2, Article 10 (July 2008), 25 pages. https:\/\/doi.org\/10.1145\/1376815.1376819","DOI":"10.1145\/1376815.1376819"},{"key":"key-10.1145\/3368926.3369686-7","doi-asserted-by":"crossref","unstructured":"Aminul Islam and Diana Inkpen. 2009. Real-word Spelling Correction Using Google Web 1T n-gram Data Set. In Proceedings of the 18th ACM Conference on Information and Knowledge Management (CIKM '09). ACM, New York, NY, USA, 1689--1692. https:\/\/doi.org\/10.1145\/1645953.1646205","DOI":"10.1145\/1645953.1646205"},{"key":"key-10.1145\/3368926.3369686-8","doi-asserted-by":"crossref","unstructured":"J. Jo, J. Lee, and Y. Lee. 2009. Stroke-Based Online Hangul\/Korean Character Recognition. In 2009 Chinese Conference on Pattern Recognition. 1--5. https:\/\/doi.org\/10.1109\/CCPR.2009.5343953","DOI":"10.1109\/CCPR.2009.5343953"},{"key":"key-10.1145\/3368926.3369686-9","doi-asserted-by":"crossref","unstructured":"I. Kissos and N. Dershowitz. 2016. OCR Error Correction Using Character Correction and Feature-Based Word Classification. In 2016 12th IAPR Workshop on Document Analysis Systems (DAS). 198--203. https:\/\/doi.org\/10.1109\/DAS.2016.44","DOI":"10.1109\/DAS.2016.44"},{"key":"key-10.1145\/3368926.3369686-10","doi-asserted-by":"crossref","unstructured":"Anh Le Duc, Hung Nguyen, and Masaki Nakagawa. 2018. Recognizing Unconstrained Vietnamese Handwriting By Attention Based Encoder Decoder Model. In 2018 International Conference on Advanced Computing and Applications (ACOMP). 83--87. https:\/\/doi.org\/10.1109\/ACOMP.2018.00021","DOI":"10.1109\/ACOMP.2018.00021"},{"key":"key-10.1145\/3368926.3369686-11","doi-asserted-by":"crossref","unstructured":"Anh Le Duc, Hung Nguyen, and Masaki Nakagawa. 2020. An End-to-End Recognition System for Unconstrained Vietnamese Handwriting. SN Computer Science 1, 7 (Jan 2020). https:\/\/doi.org\/10.1007\/s42979-019-0001-4","DOI":"10.1007\/s42979-019-0001-4"},{"key":"key-10.1145\/3368926.3369686-12","doi-asserted-by":"crossref","unstructured":"Jie Mei, Aminul Islam, Abidalrahman Moh'd, Yajing Wu, and Evangelos Milios. 2018. Statistical learning for OCR error correction. Information Processing and Management 54, 6 (2018), 874--887. https:\/\/doi.org\/10.1016\/j.ipm.2018.06.001","DOI":"10.1016\/j.ipm.2018.06.001"},{"key":"key-10.1145\/3368926.3369686-13","doi-asserted-by":"crossref","unstructured":"Hung Tuan Nguyen, Cuong Tuan Nguyen, Pham The Bao, and Masaki Nakagawa. 2018. A database of unconstrained Vietnamese online handwriting and recognition experiments by recurrent neural networks. Pattern Recognition 78 (2018), 291--306. https:\/\/doi.org\/10.1016\/j.patcog.2018.01.013","DOI":"10.1016\/j.patcog.2018.01.013"},{"key":"key-10.1145\/3368926.3369686-14","doi-asserted-by":"crossref","unstructured":"Hung Tuan Nguyen, Cuong Tuan Nguyen, and Masaki Nakagawa. 2018. ICFHR 2018 - Competition on Vietnamese Online Handwritten Text Recognition using HANDS-VNOnDB (VOHTR2018). In 2018 16th International Conference on Frontiers in Handwriting Recognition (ICFHR). 494--499. https:\/\/doi.org\/10.1109\/ICFHR-2018.2018.00092","DOI":"10.1109\/ICFHR-2018.2018.00092"},{"key":"key-10.1145\/3368926.3369686-15","unstructured":"Phuong-Thai Nguyen, Xuan-Luong Vu, Thi-Minh-Huyen Nguyen, Van-Hiep Nguyen, and Hong-Phuong Le. 2009. Building a Large Syntactically-annotated Corpus of Vietnamese. In Proceedings of the Third Linguistic Annotation Workshop (ACL-IJCNLP '09). Association for Computational Linguistics, Stroudsburg, PA, USA, 182--185."},{"key":"key-10.1145\/3368926.3369686-16","doi-asserted-by":"crossref","unstructured":"T. T. H. Nguyen, M. Coustaty, A. Doucet, A. Jatowt, and N. V. Nguyen. 2018. Adaptive Edit-Distance and Regression Approach for Post-OCR Text Correction. Dobreva M., Hinze A., &#381;umer M. (eds) Maturity and Innovation in Digital Libraries. ICADL 2018. Lecture Notes in Computer Science 11279 (2018), 278--289. https:\/\/doi.org\/10.1007\/978-3-030-04257-8_29","DOI":"10.1007\/978-3-030-04257-8_29"},{"key":"key-10.1145\/3368926.3369686-17","doi-asserted-by":"crossref","unstructured":"Duy Nguyen K. and The Bui D. 2008. On the problem of classifying Vietnamese online handwritten characters. In 2008 10th International Conference on Control, Automation, Robotics and Vision. 803--808. https:\/\/doi.org\/10.1109\/ICARCV.2008.4795620","DOI":"10.1109\/ICARCV.2008.4795620"},{"key":"key-10.1145\/3368926.3369686-18","doi-asserted-by":"crossref","unstructured":"Duy Nguyen K. and The Bui D. 2008. Recognizing Vietnamese Online Handwritten Separated Characters. In 2008 International Conference on Advanced Language Processing and Web Information Technology. 279--284. https:\/\/doi.org\/10.1109\/ALPIT.2008.58","DOI":"10.1109\/ALPIT.2008.58"},{"key":"key-10.1145\/3368926.3369686-19","doi-asserted-by":"crossref","unstructured":"P. A. Phuong, N. Q. Tao, and L. C. Mai. 2008. An Efficient Model for Isolated Vietnamese Handwritten Recognition. In 2008 International Conference on Intelligent Information Hiding and Multimedia Signal Processing. 358--361. https:\/\/doi.org\/10.1109\/IIH-MSP.2008.67","DOI":"10.1109\/IIH-MSP.2008.67"},{"key":"key-10.1145\/3368926.3369686-20","doi-asserted-by":"crossref","unstructured":"L. Sun, T. Su, C. Liu, and R. Wang. 2016. Deep LSTM Networks for Online Chinese Handwriting Recognition. In 2016 15th International Conference on Frontiers in Handwriting Recognition (ICFHR). 271--276. https:\/\/doi.org\/10.1109\/ICFHR.2016.0059","DOI":"10.1109\/ICFHR.2016.0059"},{"key":"key-10.1145\/3368926.3369686-21","doi-asserted-by":"crossref","unstructured":"De Cao Tran. 2012. An Efficient Method for Online Vietnamese Handwritten Character Recognition. In Proceedings of the Third Symposium on Information and Communication Technology (SoICT '12). ACM, New York, NY, USA, 135--141. https:\/\/doi.org\/10.1145\/2350716.2350737","DOI":"10.1145\/2350716.2350737"},{"key":"key-10.1145\/3368926.3369686-22","doi-asserted-by":"crossref","unstructured":"K. Sonu Varghese, Ajay James, and Saravanan Chandran. 2016. A Novel Tri-Stage Recognition Scheme for Handwritten Malayalam Character Recognition. Procedia Technology 24 (2016), 1333--1340. https:\/\/doi.org\/10.1016\/j.protcy.2016.05.137","DOI":"10.1016\/j.protcy.2016.05.137"},{"key":"key-10.1145\/3368926.3369686-23","unstructured":"Cong Duy Vu Hoang and Ai Ti Aw. 2012. An Unsupervised and Data-driven Approach for Spell Checking in Vietnamese OCR-scanned Texts. In Proceedings of the Workshop on Innovative Hybrid Approaches to the Processing of Textual Data (HYBRID '12). Association for Computational Linguistics, Stroudsburg, PA, USA, 36--44."}],"event":{"number":"10","sponsor":["SOICT, School of Information and Communication Technology - HUST","NAFOSTED, The National Foundation for Science and Technology Development"],"acronym":"SoICT 2019","name":"the Tenth International Symposium","start":{"date-parts":[[2019,12,4]]},"location":"Hanoi, Ha Long Bay, Viet Nam","end":{"date-parts":[[2019,12,6]]}},"container-title":["Proceedings of the Tenth International Symposium on Information and Communication Technology  - SoICT 2019"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3368926.3369686","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/dl.acm.org\/ft_gateway.cfm?id=3369686&ftid=2101273&dwn=1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T23:44:51Z","timestamp":1750203891000},"score":1,"resource":{"primary":{"URL":"http:\/\/dl.acm.org\/citation.cfm?doid=3368926.3369686"}},"subtitle":[],"proceedings-subject":"Information and Communication Technology","short-title":[],"issued":{"date-parts":[[2019]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1145\/3368926.3369686","relation":{},"subject":[],"published":{"date-parts":[[2019]]}}}