{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,23]],"date-time":"2025-09-23T13:49:01Z","timestamp":1758635341216,"version":"3.37.3"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2020,5,20]],"date-time":"2020-05-20T00:00:00Z","timestamp":1589932800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,5,20]],"date-time":"2020-05-20T00:00:00Z","timestamp":1589932800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001823","name":"Ministerstvo \u0160kolstv\u00ed, Ml\u00e1de\u017ee a T\u011blov\u00fdchovy","doi-asserted-by":"publisher","award":["CZ.02.1.01\/0.0\/0.0\/17_048\/0007267"],"award-info":[{"award-number":["CZ.02.1.01\/0.0\/0.0\/17_048\/0007267"]}],"id":[{"id":"10.13039\/501100001823","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Evolving Systems"],"published-print":{"date-parts":[[2021,3]]},"DOI":"10.1007\/s12530-020-09343-4","type":"journal-article","created":{"date-parts":[[2020,5,20]],"date-time":"2020-05-20T16:52:18Z","timestamp":1589993538000},"page":"177-190","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["HDPA: historical document processing and analysis framework"],"prefix":"10.1007","volume":"12","author":[{"given":"Ladislav","family":"Lenc","sequence":"first","affiliation":[]},{"given":"Ji\u0159\u00ed","family":"Mart\u00ednek","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3096-675X","authenticated-orcid":false,"given":"Pavel","family":"Kr\u00e1l","sequence":"additional","affiliation":[]},{"given":"Anguelos","family":"Nicolao","sequence":"additional","affiliation":[]},{"given":"Vincent","family":"Christlein","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,5,20]]},"reference":[{"key":"9343_CR1","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1016\/j.patrec.2015.06.008","volume":"63","author":"E Ahmadi","year":"2015","unstructured":"Ahmadi E, Azimifar Z, Shams M, Famouri M, Shafiee MJ (2015) Document image binarization using a discriminative structural classifier. Pattern Recogn Lett 63:36\u201342","journal-title":"Pattern Recogn Lett"},{"key":"9343_CR2","doi-asserted-by":"publisher","unstructured":"Alberti M, Bouillon M, Ingold R, Liwicki M (2017) Open Evaluation Tool for Layout Analysis of Document Images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR), Kyoto, Japan, pp 43\u201347. https:\/\/doi.org\/10.1109\/ICDAR.2017.311","DOI":"10.1109\/ICDAR.2017.311"},{"key":"9343_CR3","unstructured":"Bahdanau D, Cho K, Bengio Y (2014) Neural machine translation by jointly learning to align and translate. arXiv:1409.0473 (arXiv preprint)"},{"key":"9343_CR4","doi-asserted-by":"crossref","unstructured":"Breuel TM (2008) The ocropus open source OCR system. In: Document recognition and retrieval XV, vol 6815. International Society for Optics and Photonics, p 68150F","DOI":"10.1117\/12.783598"},{"key":"9343_CR5","doi-asserted-by":"crossref","unstructured":"Breuel TM, Ul-Hasan A, Al-Azawi MA, Shafait F (2013) High-performance ocr for printed English and fraktur using LSTM networks. In: 2013 12th international conference on document analysis and recognition (ICDAR), IEEE, pp 683\u2013687","DOI":"10.1109\/ICDAR.2013.140"},{"key":"9343_CR6","doi-asserted-by":"crossref","unstructured":"Chernyshova YS, Gayer AV, Sheshkus AV (2018) Generation method of synthetic training data for mobile OCR system. In: Tenth international conference on machine vision (ICMV 2017), vol 10696, International Society for Optics and Photonics, p 106962G","DOI":"10.1117\/12.2310119"},{"key":"9343_CR7","doi-asserted-by":"crossref","unstructured":"Clausner C, Papadopoulos C, Pletschacher S, Antonacopoulos A (2015) The ENP image and ground truth dataset of historical newspapers. In: 2015 13th international conference on document analysis and recognition (ICDAR), IEEE, pp 931\u2013935","DOI":"10.1109\/ICDAR.2015.7333898"},{"key":"9343_CR8","unstructured":"Clausner C, Pletschacher S, Antonacopoulos A (2014) Efficient ocr training data generation with aletheia. In: Proceedings of the international association for pattern recognition (IAPR), Tours, France, pp 7\u201310"},{"key":"9343_CR9","doi-asserted-by":"crossref","unstructured":"Etter D, Rawls S, Carpenter C, Sell G (2019) A synthetic recipe for OCR. In: 2019 international conference on document analysis and recognition (ICDAR). IEEE, pp 864\u2013869","DOI":"10.1109\/ICDAR.2019.00143"},{"issue":"2","key":"9343_CR10","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1109\/THMS.2016.2634920","volume":"47","author":"A Garz","year":"2016","unstructured":"Garz A, Seuret M, Fischer A, Ingold R (2016) A user-centered segmentation method for complex historical manuscripts based on document graphs. IEEE Trans Human Mach Syst 47(2):181\u2013193","journal-title":"IEEE Trans Human Mach Syst"},{"issue":"5","key":"9343_CR11","doi-asserted-by":"publisher","first-page":"855","DOI":"10.1109\/TPAMI.2008.137","volume":"31","author":"A Graves","year":"2009","unstructured":"Graves A, Liwicki M, Fern\u00e1ndez S, Bertolami R, Bunke H, Schmidhuber J (2009) A novel connectionist system for unconstrained handwriting recognition. IEEE Trans Pattern Anal Mach Intell 31(5):855\u2013868","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9343_CR12","doi-asserted-by":"crossref","unstructured":"Graves A, Fern\u00e1ndez S, Gomez F, Schmidhuber J (2006) Connectionist temporal classification: labelling unsegmented sequence data with recurrent neural networks. In: Proceedings of the 23rd international conference on Machine learning. ACM, pp 369\u2013376","DOI":"10.1145\/1143844.1143891"},{"key":"9343_CR13","unstructured":"Graves A, Schmidhuber J (2009) Offline handwriting recognition with multidimensional recurrent neural networks. In: Advances in neural information processing systems, pp 545\u2013552"},{"issue":"3","key":"9343_CR14","doi-asserted-by":"publisher","first-page":"285","DOI":"10.1007\/s10032-019-00332-1","volume":"22","author":"T Gr\u00fcning","year":"2019","unstructured":"Gr\u00fcning T, Leifert G, Strau\u00df T, Michael J, Labahn R (2019) A two-stage method for text line detection in historical documents. Int J Doc Anal Recognit 22(3):285\u2013302","journal-title":"Int J Doc Anal Recognit"},{"issue":"8","key":"9343_CR15","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J (1997) Long short-term memory. Neural Comput 9(8):1735\u20131780","journal-title":"Neural Comput"},{"key":"9343_CR16","doi-asserted-by":"crossref","unstructured":"Kanungo T, Lee CH, Czorapinski J, Bella I (2000) Trueviz: a groundtruth\/metadata editing and visualizing toolkit for OCR. In: Document recognition and retrieval VIII, vol 4307. International Society for Optics and Photonics, pp 1\u201313","DOI":"10.1117\/12.410825"},{"issue":"8","key":"9343_CR17","first-page":"30","volume":"3","author":"V Kumar","year":"2010","unstructured":"Kumar V, Sengar PK (2010) Segmentation of printed text in devanagari script and gurmukhi script. Int J Comput Appl 3(8):30\u201333","journal-title":"Int J Comput Appl"},{"issue":"10","key":"9343_CR18","first-page":"1995","volume":"3361","author":"Y LeCun","year":"1995","unstructured":"LeCun Y, Bengio Y et al (1995) Convolutional networks for images, speech, and time series. Handb Brain Theory Neural Netw 3361(10):1995","journal-title":"Handb Brain Theory Neural Netw"},{"key":"9343_CR19","unstructured":"Leifert G, Strau\u00df T, Gr\u00fcning T, Labahn R (2016) Citlab argus for historical handwritten documents"},{"key":"9343_CR20","first-page":"12","volume":"1","author":"V Levenshtein","year":"1965","unstructured":"Levenshtein V (1965) Binary codes capable of correcting spurious insertions and deletions of ones. Russ Probl Peredachi Inf 1:12\u201325","journal-title":"Russ Probl Peredachi Inf"},{"issue":"2\u20134","key":"9343_CR21","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/s10032-006-0023-z","volume":"9","author":"L Likforman-Sulem","year":"2007","unstructured":"Likforman-Sulem L, Zahour A, Taconet B (2007) Text line segmentation of historical documents: a survey. IJDAR 9(2\u20134):123\u2013138","journal-title":"IJDAR"},{"key":"9343_CR22","doi-asserted-by":"crossref","unstructured":"Margner V, Pechwitz M (2001) Synthetic data for arabic ocr system development. In: Proceedings of sixth international conference on document analysis and recognition, 2001. IEEE, pp 1159\u20131163","DOI":"10.1109\/ICDAR.2001.953967"},{"key":"9343_CR23","doi-asserted-by":"publisher","unstructured":"Mart\u00ednek J, Lenc L, Kr\u00e1l P, Nicolaou A, Christlein V (2019) Hybrid training data for historical text OCR. In: 15th international conference on document analysis and recognition (ICDAR 2019), Sydney, Australia, pp 565\u2013570. https:\/\/doi.org\/10.1109\/ICDAR.2019.00096","DOI":"10.1109\/ICDAR.2019.00096"},{"key":"9343_CR24","doi-asserted-by":"crossref","unstructured":"Pletschacher S, Antonacopoulos A (2010) The page (page analysis and ground-truth elements) format framework. In: 2010 20th international conference on pattern recognition. IEEE, pp 257\u2013260","DOI":"10.1109\/ICPR.2010.72"},{"key":"9343_CR25","unstructured":"Postl W (1988) Method for automatic correction of character skew in the acquisition of a text original in the form of digital scan results. US Patent 4,723,297"},{"key":"9343_CR26","doi-asserted-by":"crossref","unstructured":"Rawls S, Cao H, Kumar S, Natarajan P (2017) Combining convolutional neural networks and LSTMS for segmentation-free OCR. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR), vol 1. IEEE, pp 155\u2013160","DOI":"10.1109\/ICDAR.2017.34"},{"key":"9343_CR27","doi-asserted-by":"crossref","unstructured":"Ronneberger O, Fischer P, Brox T (2015) U-net: Convolutional networks for biomedical image segmentation. In: International conference on medical image computing and computer-assisted intervention, Springer, pp 234\u2013241","DOI":"10.1007\/978-3-319-24574-4_28"},{"issue":"2","key":"9343_CR28","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1016\/S0031-3203(99)00055-2","volume":"33","author":"J Sauvola","year":"2000","unstructured":"Sauvola J, Pietik\u00e4inen M (2000) Adaptive document image binarization. Pattern Recogn 33(2):225\u2013236","journal-title":"Pattern Recogn"},{"key":"9343_CR29","unstructured":"Shang W, Sohn K, Almeida D, Lee H (2016) Understanding and improving convolutional neural networks via concatenated rectified linear units. In: International conference on machine learning, pp 2217\u20132225"},{"issue":"11","key":"9343_CR30","doi-asserted-by":"publisher","first-page":"2298","DOI":"10.1109\/TPAMI.2016.2646371","volume":"39","author":"B Shi","year":"2017","unstructured":"Shi B, Bai X, Yao C (2017) An end-to-end trainable neural network for image-based sequence recognition and its application to scene text recognition. IEEE Trans Pattern Anal Mach Intell 39(11):2298\u20132304","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9343_CR31","doi-asserted-by":"crossref","unstructured":"Smith R (2007) An overview of the tesseract OCR engine. In: Ninth international conference on document analysis and recognition (ICDAR 2007), vol 2. IEEE, pp 629\u2013633","DOI":"10.1109\/ICDAR.2007.4376991"},{"key":"9343_CR32","unstructured":"Strau\u00df T, Weidemann M, Michael J, Leifert G, Gr\u00fcning T, Labahn R (2018) System description of citlab\u2019s recognition and retrieval engine for icdar2017 competition on information extraction in historical handwritten records"},{"key":"9343_CR33","doi-asserted-by":"crossref","unstructured":"Van Beusekom J, Shafait F, Breuel TM (2008) Automated OCR ground truth generation. In: Document analysis systems, 2008. DAS\u201908. The eighth IAPR international workshop on, IEEE, pp 111\u2013117","DOI":"10.1109\/DAS.2008.59"},{"key":"9343_CR34","doi-asserted-by":"publisher","unstructured":"Zahour A, Likforman-Sulem L, Boussalaa W, Taconet B (2007) Text line segmentation of historical Arabic documents, pp 138\u2013142. https:\/\/doi.org\/10.1109\/ICDAR.2007.4378691","DOI":"10.1109\/ICDAR.2007.4378691"}],"container-title":["Evolving Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12530-020-09343-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s12530-020-09343-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12530-020-09343-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,20]],"date-time":"2021-05-20T08:32:57Z","timestamp":1621499577000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s12530-020-09343-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5,20]]},"references-count":34,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2021,3]]}},"alternative-id":["9343"],"URL":"https:\/\/doi.org\/10.1007\/s12530-020-09343-4","relation":{},"ISSN":["1868-6478","1868-6486"],"issn-type":[{"type":"print","value":"1868-6478"},{"type":"electronic","value":"1868-6486"}],"subject":[],"published":{"date-parts":[[2020,5,20]]},"assertion":[{"value":"20 December 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 April 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 May 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}