{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T11:30:04Z","timestamp":1778758204633,"version":"3.51.4"},"reference-count":54,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"name":"Van Lang University, Vietnam"},{"DOI":"10.13039\/501100008530","name":"European Regional Development Fund within the Operational Program Research, Development and Education in Projects, \u201cA Research Platform focused on Industry 4.0 and Robotics in Ostrava Agglomeration\u201d","doi-asserted-by":"publisher","award":["CZ.02.1.01\/0.0\/0.0\/17_049\/0008425"],"award-info":[{"award-number":["CZ.02.1.01\/0.0\/0.0\/17_049\/0008425"]}],"id":[{"id":"10.13039\/501100008530","id-type":"DOI","asserted-by":"publisher"}]},{"name":"VSB\u2013TU Ostrava, Czech Republic, through the Student Grant System","award":["SP2023\/12"],"award-info":[{"award-number":["SP2023\/12"]}]},{"name":"VSB\u2013TU Ostrava, Czech Republic, through the Student Grant System","award":["SP2023\/76"],"award-info":[{"award-number":["SP2023\/76"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/access.2023.3283340","type":"journal-article","created":{"date-parts":[[2023,6,7]],"date-time":"2023-06-07T02:58:52Z","timestamp":1686106732000},"page":"58406-58421","source":"Crossref","is-referenced-by-count":22,"title":["An Efficient Unsupervised Approach for OCR Error Correction of Vietnamese OCR Text"],"prefix":"10.1109","volume":"11","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1580-9032","authenticated-orcid":false,"given":"Quoc-Dung","family":"Nguyen","sequence":"first","affiliation":[{"name":"Faculty of Mechanical-Electrical and Computer Engineering, School of Technology, Van Lang University, Ho Chi Minh City, Vietnam"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nguyet-Minh","family":"Phan","sequence":"additional","affiliation":[{"name":"Faculty of Information Technology, Saigon University, Chi Minh City, Vietnam"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8428-3332","authenticated-orcid":false,"given":"Pavel","family":"Kr\u00f6mer","sequence":"additional","affiliation":[{"name":"Department of Computer Science, VSB--Technical University of Ostrava, Ostrava, Czech Republic"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9359-9686","authenticated-orcid":false,"given":"Duc-Anh","family":"Le","sequence":"additional","affiliation":[{"name":"The Institute of Statistical Mathematics, Tokyo, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref13","first-page":"102","article-title":"OCR quality and NLP preprocessing","author":"mieskes","year":"2019","journal-title":"Proc Workshop Widening NLP"},{"key":"ref12","first-page":"284","article-title":"Impact of imperfect OCR on part-of-speech tagging","author":"lin","year":"2003","journal-title":"Proc 7th Int Conf Document Anal Recognit"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/NLPKE.2009.5313823"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30483-8_49"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/375360.375365"},{"key":"ref52","article-title":"Language modelling for handwriting recognition","author":"swaileh","year":"2017","journal-title":"Modeling and Simulation"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.3115\/974147.974191"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/JCDL.2019.00057"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1007\/s10732-008-9080-4"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/DAS.2016.44"},{"key":"ref16","first-page":"90","article-title":"OCR post-processing error correction algorithm using Google&#x2019;s online spelling suggestion","volume":"3","author":"bassil","year":"2012","journal-title":"J Emerg Trends Comput Inf Sci"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-04257-8_29"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2018.06.001"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-011-0160-x"},{"key":"ref50","article-title":"Statistical learning for OCR text correction","author":"mei","year":"2016","journal-title":"arXiv 1611 06950"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.3115\/1698381.1698416"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2015.7317907"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-14627-5_13"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-63924-2_26"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-84800-070-4"},{"key":"ref41","first-page":"1","article-title":"An analysis of travelling salesman problem utilizing Hill climbing algorithm for a smart city touristic search on OpenStreetMap (OSM)","author":"\u00f6zcan","year":"2018","journal-title":"Proc 2nd Int Symp Multidisciplinary Stud Innov Technol (ISMSIT)"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.1999.785522"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2010.03.006"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-19-0332-8_34"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1023\/A:1026564708926"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-45442-5_13"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.3115\/1119467.1119471"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2018.01.013"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2010.01.008"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/JCDL.2017.7991582"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s42979-019-0001-4"},{"key":"ref40","first-page":"36","article-title":"An unsupervised and data-driven approach for spell checking in Vietnamese OCR-scanned texts","author":"vu hoang","year":"2012","journal-title":"Proc Workshop Innov Hybrid Approaches to Process Textual Data"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-39930-8_7"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/2595188.2595200"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.3115\/1557769.1557821"},{"key":"ref36","first-page":"143","article-title":"Standard language variety conversion for content localisation via SMT","author":"fancellu","year":"2014","journal-title":"Proc 17th Annual Conf Eur Assoc Mach Transl"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1063\/5.0066687"},{"key":"ref30","first-page":"219","author":"segaran","year":"2009","journal-title":"Beautiful Data The Stories behind Elegant Data Solutions"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-20227-8_1"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICFHR-2018.2018.00092"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"855","DOI":"10.1109\/TPAMI.2008.137","article-title":"A novel connectionist system for unconstrained handwriting recognition","volume":"31","author":"graves","year":"2009","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2006.04.043"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1063\/5.0066679"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-4012"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1288"},{"key":"ref23","first-page":"175","article-title":"OCR error correction using statistical machine translation","volume":"7","author":"afli","year":"2016","journal-title":"Int J Computat Linguistics Appl"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3383583.3398605"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.21248\/jlcl.33.2018.218"},{"key":"ref20","first-page":"119","article-title":"OCR post-processing text correction using simulated annealing (OPTeCA)","author":"khirbat","year":"2017","journal-title":"Proc Australas Lang Technol Assoc Workshop"},{"key":"ref22","first-page":"962","article-title":"Using SMT for OCR error correction of historical texts","author":"afli","year":"2016","journal-title":"Proc 10th Int Conf Lang Resour Eval (LREC)"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/s10044-020-00936-y"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3368926.3369686"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2017.232"},{"key":"ref29","first-page":"42","article-title":"Speech and language processing: An introduction to natural language processing","author":"jurafsky","year":"2008","journal-title":"Computational Linguistics and Speech Recognition"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6287639\/10005208\/10144767.pdf?arnumber=10144767","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,3]],"date-time":"2023-07-03T18:25:46Z","timestamp":1688408746000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10144767\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":54,"URL":"https:\/\/doi.org\/10.1109\/access.2023.3283340","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}