{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T10:35:49Z","timestamp":1763202949175,"version":"3.40.3"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031766060"},{"type":"electronic","value":"9783031766077"}],"license":[{"start":{"date-parts":[[2024,11,17]],"date-time":"2024-11-17T00:00:00Z","timestamp":1731801600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,17]],"date-time":"2024-11-17T00:00:00Z","timestamp":1731801600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-76607-7_19","type":"book-chapter","created":{"date-parts":[[2024,11,16]],"date-time":"2024-11-16T05:01:16Z","timestamp":1731733276000},"page":"256-269","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["An Effective Approach to\u00a0Text Detection and\u00a0Recognition in\u00a0Degraded Historical Documents"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-6391-5370","authenticated-orcid":false,"given":"Percy","family":"Maldonado-Quispe","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0125-630X","authenticated-orcid":false,"given":"Helio","family":"Pedrini","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,17]]},"reference":[{"issue":"6","key":"19_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3355610","volume":"52","author":"GM Binmakhashen","year":"2019","unstructured":"Binmakhashen, G.M., Mahmoud, S.A.: Document layout analysis: a comprehensive survey. ACM Comput. Surv. 52(6), 1\u201336 (2019)","journal-title":"ACM Comput. Surv."},{"issue":"3","key":"19_CR2","doi-asserted-by":"publisher","first-page":"344","DOI":"10.1016\/S0734-189X(86)80047-0","volume":"34","author":"G Borgefors","year":"1986","unstructured":"Borgefors, G.: Distance transformations in digital images. Comput. Vision Graph. Image Process. 34(3), 344\u2013371 (1986)","journal-title":"Comput. Vision Graph. Image Process."},{"key":"19_CR3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-50252-6","volume-title":"Optical Character Recognition Systems for Different Languages with Soft Computing","author":"A Chaudhuri","year":"2017","unstructured":"Chaudhuri, A., et al.: Optical Character Recognition Systems for Different Languages with Soft Computing. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-50252-6"},{"key":"19_CR4","doi-asserted-by":"crossref","unstructured":"Da, C., Luo, C., Zheng, Q., Yao, C.: Vision grid transformer for document layout analysis. In: IEEE\/CVF International Conference on Computer Vision, pp. 19405\u201319415 (2023)","DOI":"10.1109\/ICCV51070.2023.01783"},{"key":"19_CR5","unstructured":"Dell, M., et al.: American stories: a large-scale structured text dataset of historical U.S. newspapers. In: 37th International Conference on Neural Information Processing Systems. Curran Associates Inc., New Orleans, LA, USA (2024)"},{"key":"19_CR6","unstructured":"Gonz\u00e1lez, R.C., Woods, R.E.: Digital Image Processing. Pearson Education, London (2008)"},{"key":"19_CR7","unstructured":"Goodfellow, I., Bengio, Y., Courville, A.: Deep Learning. MIT Press, Cambridge (2016)"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Ha, J., Haralick, R., Phillips, I.: Recursive X-Y cut using bounding boxes of connected components. In: 3rd International Conference on Document Analysis and Recognition, vol.\u00a02, pp. 952\u2013955 (1995)","DOI":"10.1109\/ICDAR.1995.602059"},{"key":"19_CR9","unstructured":"Klink, S., Dengel, A., Kieninger, T.: Document structure analysis based on layout and textual features. In: International Workshop on Document Analysis Systems, pp. 99\u2013111 (2000)"},{"issue":"7553","key":"19_CR10","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436\u2013444 (2015)","journal-title":"Nature"},{"key":"19_CR11","doi-asserted-by":"crossref","unstructured":"Ledig, C., et al.: Photo-realistic single image super-resolution using a generative adversarial network. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 105\u2013114 (2017)","DOI":"10.1109\/CVPR.2017.19"},{"key":"19_CR12","doi-asserted-by":"crossref","unstructured":"Li, M., et al.: DocBank: a benchmark dataset for document layout analysis. In: Scott, D., Bel, N., Zong, C. (eds.) 28th International Conference on Computational Linguistics, pp. 949\u2013960. International Committee on Computational Linguistics, Barcelona, Spain (Online) (2020)","DOI":"10.18653\/v1\/2020.coling-main.82"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Liang, J., Cao, J., Sun, G., Zhang, K., Van\u00a0Gool, L., Timofte, R.: SwinIR: image restoration using swin transformer. In: IEEE\/CVF International Conference on Computer Vision Workshops, pp. 1833\u20131844 (2021)","DOI":"10.1109\/ICCVW54120.2021.00210"},{"issue":"1","key":"19_CR14","first-page":"64","volume":"27","author":"H Morgan","year":"2022","unstructured":"Morgan, H.: Conducting a qualitative document analysis. Qual. Rep. 27(1), 64\u201377 (2022)","journal-title":"Qual. Rep."},{"key":"19_CR15","volume-title":"Optical Character Recognition","author":"S Mori","year":"1999","unstructured":"Mori, S., Nishida, H., Yamada, H.: Optical Character Recognition. Wiley, New York (1999)"},{"issue":"11","key":"19_CR16","doi-asserted-by":"publisher","first-page":"1162","DOI":"10.1109\/34.244677","volume":"15","author":"L O\u2019Gorman","year":"1993","unstructured":"O\u2019Gorman, L.: The document spectrum for page layout analysis. IEEE Trans. Pattern Anal. Mach. Intell. 15(11), 1162\u20131173 (1993)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"19_CR17","doi-asserted-by":"crossref","unstructured":"Okamoto, Y., et al.: CREPE: Coordinate-Aware End-to-End Document Parser (2024). https:\/\/arxiv.org\/abs\/2405.00260","DOI":"10.1007\/978-3-031-70546-5_1"},{"issue":"3","key":"19_CR18","doi-asserted-by":"publisher","first-page":"355","DOI":"10.1016\/S0734-189X(87)80186-X","volume":"39","author":"SM Pizer","year":"1987","unstructured":"Pizer, S.M., et al.: Adaptive histogram equalization and its variations. Comput. Vision Graph. Image Process. 39(3), 355\u2013368 (1987)","journal-title":"Comput. Vision Graph. Image Process."},{"key":"19_CR19","doi-asserted-by":"crossref","unstructured":"Qi, Y., et al.: A comprehensive overview of image enhancement techniques. Arch. Comput. Methods Eng. 1\u201325 (2021)","DOI":"10.1007\/s11831-021-09587-6"},{"key":"19_CR20","unstructured":"Rao, N.V., Sastry, A., Chakravarthy, A., Kalyanchakravarthi, P.: Optical character recognition technique algorithms. J. Theor. Appl. Inf. Technol. 83(2) (2016)"},{"key":"19_CR21","doi-asserted-by":"crossref","unstructured":"Smith, R.: An overview of the tesseract OCR engine. In: Ninth International Conference on Document Analysis and Recognition, vol.\u00a02, pp. 629\u2013633 (2007)","DOI":"10.1109\/ICDAR.2007.4376991"},{"key":"19_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/978-3-031-41734-4_4","volume-title":"Document Analysis and Recognition - ICDAR 2023","author":"J Wang","year":"2023","unstructured":"Wang, J., et al.: A graphical approach to document layout analysis. In: Fink, G.A., Jain, R., Kise, K., Zanibbi, R. (eds.) ICDAR 2023. LNCS, vol. 14191, pp. 53\u201369. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-41734-4_4"},{"key":"19_CR23","doi-asserted-by":"crossref","unstructured":"Xu, Y., Li, M., Cui, L., Huang, S., Wei, F., Zhou, M.: LayoutLM: pre-training of text and layout for document image understanding. In: 26th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 1192\u20131200. Association for Computing Machinery, New York, NY, USA (2020)","DOI":"10.1145\/3394486.3403172"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Zhong, X., Tang, J., Yepes, A.J.: PubLayNet: largest dataset ever for document layout analysis. arXiv preprint arXiv:1908.07836 (2019)","DOI":"10.1109\/ICDAR.2019.00166"}],"container-title":["Lecture Notes in Computer Science","Progress in Pattern Recognition, Image Analysis, Computer Vision, and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-76607-7_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,16]],"date-time":"2024-11-16T05:05:35Z","timestamp":1731733535000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-76607-7_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,17]]},"ISBN":["9783031766060","9783031766077"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-76607-7_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,17]]},"assertion":[{"value":"17 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"CIARP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Iberoamerican Congress on Pattern Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Talca","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Chile","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ciarp2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ciarp24.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}