{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T22:32:56Z","timestamp":1776983576942,"version":"3.51.4"},"reference-count":66,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,5,8]],"date-time":"2025-05-08T00:00:00Z","timestamp":1746662400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,5,8]],"date-time":"2025-05-08T00:00:00Z","timestamp":1746662400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["I000921N"],"award-info":[{"award-number":["I000921N"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["I000921N"],"award-info":[{"award-number":["I000921N"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["I000921N"],"award-info":[{"award-number":["I000921N"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["FWOTM1151"],"award-info":[{"award-number":["FWOTM1151"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["FWOTM1151"],"award-info":[{"award-number":["FWOTM1151"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003130","name":"Fonds Wetenschappelijk Onderzoek","doi-asserted-by":"publisher","award":["I000921N"],"award-info":[{"award-number":["I000921N"]}],"id":[{"id":"10.13039\/501100003130","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002749","name":"Belgian Federal Science Policy Office","doi-asserted-by":"publisher","award":["BR\/175\/A3\/COBECORE"],"award-info":[{"award-number":["BR\/175\/A3\/COBECORE"]}],"id":[{"id":"10.13039\/501100002749","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002749","name":"Belgian Federal Science Policy Office","doi-asserted-by":"publisher","award":["BR\/175\/A3\/COBECORE"],"award-info":[{"award-number":["BR\/175\/A3\/COBECORE"]}],"id":[{"id":"10.13039\/501100002749","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002749","name":"Belgian Federal Science Policy Office","doi-asserted-by":"publisher","award":["BR\/175\/A3\/COBECORE"],"award-info":[{"award-number":["BR\/175\/A3\/COBECORE"]}],"id":[{"id":"10.13039\/501100002749","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["IJDAR"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s10032-025-00524-y","type":"journal-article","created":{"date-parts":[[2025,5,7]],"date-time":"2025-05-07T21:23:30Z","timestamp":1746653010000},"page":"61-75","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Human-in-the-loop tabular data extraction methods for historical climate data rescue"],"prefix":"10.1007","volume":"29","author":[{"given":"Bas","family":"Vercruysse","sequence":"first","affiliation":[]},{"given":"Julie M.","family":"Birkholz","sequence":"additional","affiliation":[]},{"given":"Krishna Kumar Thirukokaranam","family":"Chandrasekar","sequence":"additional","affiliation":[]},{"given":"Derrick","family":"Muheki","sequence":"additional","affiliation":[]},{"given":"Wim","family":"Thiery","sequence":"additional","affiliation":[]},{"given":"Hans","family":"Verbeeck","sequence":"additional","affiliation":[]},{"given":"Koen","family":"Hufkens","sequence":"additional","affiliation":[]},{"given":"Kim","family":"Jacobsen","sequence":"additional","affiliation":[]},{"given":"Christophe","family":"Verbruggen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,5,8]]},"reference":[{"issue":"6564","key":"524_CR1","doi-asserted-by":"publisher","first-page":"158","DOI":"10.1126\/science.abi7339","volume":"374","author":"W Thiery","year":"2021","unstructured":"Thiery, W., Lange, S., Rogelj, J., Schleussner, C.-F., Gudmundsson, L., Seneviratne, S.I., Andrijevic, M., Frieler, K., Emanuel, K., Geiger, T., Bresch, D.N., Zhao, F., Willner, S.N., B\u00fcchner, M., Volkholz, J., Bauer, N., Chang, J., Ciais, P., Dury, M., Fran\u00e7ois, L., Grillakis, M., Gosling, S.N., Hanasaki, N., Hickler, T., Huber, V., Ito, A., J\u00e4germeyr, J., Khabarov, N., Koutroulis, A., Liu, W., Lutz, W., Mengel, M., M\u00fcller, C., Ostberg, S., Reyer, C.P.O., Stacke, T., Wada, Y.: Intergenerational inequities in exposure to climate extremes. Science 374(6564), 158\u2013160 (2021). https:\/\/doi.org\/10.1126\/science.abi7339","journal-title":"Science"},{"key":"524_CR2","doi-asserted-by":"publisher","unstructured":"Calvin, K., Dasgupta, D., Krinner, G., Mukherji, e.a.: Ipcc, 2023: Climate Change 2023: Synthesis Report, Summary for Policymakers. Contribution of Working Groups I, II and III to the Sixth Assessment Report of the Intergovernmental Panel on Climate Change, IPCC, Geneva, Switzerland. IPCC, 1\u201334 (2023) https:\/\/doi.org\/10.59327\/ipcc\/ar6-9789291691647.001","DOI":"10.59327\/ipcc\/ar6-9789291691647.001"},{"issue":"2","key":"524_CR3","doi-asserted-by":"publisher","first-page":"429","DOI":"10.5194\/esd-15-429-2024","volume":"15","author":"D Muheki","year":"2024","unstructured":"Muheki, D., Deijns, A., Bevacqua, E., Messori, G., Zscheischler, J., Thiery, W.: The perfect storm? co-occurring climate extremes in East Africa. Earth Syst. Dyn. 15(2), 429\u2013466 (2024). https:\/\/doi.org\/10.5194\/esd-15-429-2024","journal-title":"Earth Syst. Dyn."},{"key":"524_CR4","volume-title":"Weather and Climate Extreme Events in a Changing Climate","author":"SI Seneviratne","year":"2023","unstructured":"Seneviratne, S.I., Zhang, X., Adnan, M., Badi, W., Dereczynski, C., Luca, A.D., Ghosh, S., Iskandar, I., Kossin, J., Lewis, S., Otto, F., Pinto, I., Satoh, M., Vicente-Serrano, S.M., Wehner, M., Zhou, B.: In: Masson-Delmotte, V., Zhai, P., Pirani, A., Connors, S.L., P\u00e9an, C., Berger, S., Caud, N., Chen, Y., Goldfarb, L., Gomis, M.I., Huang, M., Leitzell, K., Lonnoy, E., Matthews, J.B.R., Maycock, T.K., Waterfield, T., Yelek\u00e7i, O., Yu, R., Zhou, B. (eds.) Weather and Climate Extreme Events in a Changing Climate. Cambridge University Press, Cambridge, UK (2023)"},{"issue":"2","key":"524_CR5","doi-asserted-by":"publisher","first-page":"160","DOI":"10.1002\/gdj3.79","volume":"6","author":"E Hawkins","year":"2019","unstructured":"Hawkins, E., Burt, S., Brohan, P., Lockwood, M., Richardson, H., Roy, M., Thomas, S.: Hourly weather observations from the Scottish highlands (1883\u20131904) rescued by volunteer citizen scientists. Geosci. Data J. 6(2), 160\u2013173 (2019). https:\/\/doi.org\/10.1002\/gdj3.79","journal-title":"Geosci. Data J."},{"issue":"2","key":"524_CR6","doi-asserted-by":"publisher","first-page":"246","DOI":"10.1002\/gdj3.157","volume":"10","author":"E Hawkins","year":"2023","unstructured":"Hawkins, E., Burt, S., McCarthy, M., Murphy, C., Ross, C., Baldock, M., Brazier, J., Hersee, G., Huntley, J., Meats, R., et al.: Millions of historical monthly rainfall observations taken in the UK and Ireland rescued by citizen scientists. Geosci. Data J. 10(2), 246\u2013261 (2023). https:\/\/doi.org\/10.1002\/gdj3.157","journal-title":"Geosci. Data J."},{"key":"524_CR7","doi-asserted-by":"publisher","first-page":"364","DOI":"10.1016\/j.future.2022.05.014","volume":"135","author":"X Wu","year":"2022","unstructured":"Wu, X., Xiao, L., Sun, Y., Zhang, J., Ma, T., He, L.: A survey of human-in-the-loop for machine learning. Future Generation Comput. Syst. 135, 364\u2013381 (2022). https:\/\/doi.org\/10.1016\/j.future.2022.05.014","journal-title":"Future Generation Comput. Syst."},{"issue":"12","key":"524_CR8","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1175\/BAMS-D-19-0040.1","volume":"100","author":"S Br\u00f6nnimann","year":"2019","unstructured":"Br\u00f6nnimann, S., Allan, R., Ashcroft, L.S.B., et al.: Unlocking pre-1850 instrumental meteorological records: A global inventory. Bull. Am. Meteorol. Soc. 100(12), 389\u2013413 (2019). https:\/\/doi.org\/10.1175\/BAMS-D-19-0040.1","journal-title":"Bull. Am. Meteorol. Soc."},{"key":"524_CR9","doi-asserted-by":"crossref","unstructured":"Muheki, D., Vercruysse, B., Verbruggen, C., Ntumba, D. K., Hawkins, E., Meunier, F., Imwangana, F. M., Verbeeck, H., Birkholz, J. M., Mbifo, J., et al.: Data Rescue of Millions of Daily Precipitation and Temperature Records Collected within the Congo Basin. Technical Report, Copernicus Meetings (2024)","DOI":"10.5194\/egusphere-egu24-9889"},{"key":"524_CR10","unstructured":"Kasem, M., Abdallah, A., Berendeyev, A., Elkady, E., Abdalla, M., Mahmoud, M., Hamada, M., Nurseitov, D., Taj-Eddin, I.: Deep Learning for Table Detection and Structure Recognition: A Survey (2022). https:\/\/arxiv.org\/abs\/2211.08469"},{"key":"524_CR11","doi-asserted-by":"crossref","unstructured":"Paliwal, S., D, V., Rahul, R., Sharma, M., Vig, L.: TableNet: Deep Learning Model for End-to-End Table Detection and Tabular Data Extraction from Scanned Document Images (2020). https:\/\/arxiv.org\/abs\/2001.01469","DOI":"10.1109\/ICDAR.2019.00029"},{"key":"524_CR12","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1007\/s10032-006-0017-x","volume":"8","author":"DW Embley","year":"2006","unstructured":"Embley, D.W., Hurst, M., Lopresti, D., Nagy, G.: Table-processing paradigms: A research survey. Int. J. Document Anal. Recogn. 8, 66\u201386 (2006). https:\/\/doi.org\/10.1007\/s10032-006-0017-x","journal-title":"Int. J. Document Anal. Recogn."},{"key":"524_CR13","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2304.00685","author":"J Zhang","year":"2024","unstructured":"Zhang, J., Huang, J., Jin, S., Lu, S.: Vision-language models for vision tasks: A survey. IEEE Trans. Pattern Anal. Mach. Intell. (2024). https:\/\/doi.org\/10.48550\/arXiv.2304.00685","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"524_CR14","doi-asserted-by":"crossref","unstructured":"Hirayama, Y.: A method for table structure analysis using dp matching. In: Proceedings of 3rd International Conference on Document Analysis and Recognition, vol. 2, pp. 583\u2013586 (1995). IEEE","DOI":"10.1109\/ICDAR.1995.601964"},{"key":"524_CR15","unstructured":"Hu, J., Kashi, R. S., Lopresti, D. P., Wilfong, G.: Medium-independent table detection. In: Document Recognition and Retrieval VII, vol. 3967, pp. 291\u2013302 (1999). SPIE"},{"key":"524_CR16","first-page":"1","volume":"7","author":"R Zanibbi","year":"2004","unstructured":"Zanibbi, R., Blostein, D., Cordy, J.R.: A survey of table recognition: Models, observations, transformations, and inferences. Document Anal. Recogn. 7, 1\u201316 (2004)","journal-title":"Document Anal. Recogn."},{"key":"524_CR17","unstructured":"Goodfellow, I., Bengio, Y., Courville, A.: Deep learning mit press (2016). In: Conference on Information and Communication Systems (ICICS), pp. 151\u2013156 (2016)"},{"key":"524_CR18","doi-asserted-by":"crossref","unstructured":"Hao, L., Gao, L., Yi, X., Tang, Z.: A table detection method for pdf documents based on convolutional neural networks. In: 2016 12th IAPR Workshop on Document Analysis Systems (DAS), pp. 287\u2013292 (2016). IEEE","DOI":"10.1109\/DAS.2016.23"},{"key":"524_CR19","doi-asserted-by":"crossref","unstructured":"Augusto Borges\u00a0Oliveira, D., Palhares\u00a0Viana, M.: Fast cnn-based document layout analysis. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 1173\u20131180 (2017)","DOI":"10.1109\/ICCVW.2017.142"},{"issue":"4","key":"524_CR20","doi-asserted-by":"publisher","first-page":"419","DOI":"10.1007\/s10032-023-00428-9","volume":"26","author":"R Petitpierre","year":"2023","unstructured":"Petitpierre, R., Kramer, M., Rappo, L.: An end-to-end pipeline for historical censuses processing. Int. J. Document Anal. Recogn. 26(4), 419\u2013432 (2023)","journal-title":"Int. J. Document Anal. Recogn."},{"key":"524_CR21","doi-asserted-by":"publisher","unstructured":"Redmon, J., Farhadi, A.: Yolov3: An Incremental Improvement (2018) https:\/\/doi.org\/10.48550\/arXiv.1804.02767","DOI":"10.48550\/arXiv.1804.02767"},{"key":"524_CR22","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A. C.: Ssd: Single shot multibox detector. In: European Conference on Computer Vision, pp. 21\u201337 (2016). Springer","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"524_CR23","doi-asserted-by":"crossref","unstructured":"Huang, Y., Yan, Q., Li, Y., Chen, Y., Wang, X., Gao, L., Tang, Z.: A yolo-based table detection method. In: 2019 International Conference on Document Analysis and Recognition (ICDAR), pp. 813\u2013818 (2019). IEEE","DOI":"10.1109\/ICDAR.2019.00135"},{"key":"524_CR24","doi-asserted-by":"crossref","unstructured":"Kerwat, M., George, R., Shujaee, K.: Detecting knowledge artifacts in scientific document images-comparing deep learning architectures. In: 2018 Fifth International Conference on Social Networks Analysis, Management and Security (SNAMS), pp. 147\u2013152 (2018). IEEE","DOI":"10.1109\/SNAMS.2018.8554818"},{"key":"524_CR25","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. Adv. Neural Inf. Process. Syst. 28, 1\u201314 (2015)"},{"key":"524_CR26","unstructured":"Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: Table benchmark for image-based table detection and recognition. In: Proceedings of the Twelfth Language Resources and Evaluation Conference, pp. 1918\u20131925 (2020)"},{"key":"524_CR27","doi-asserted-by":"crossref","unstructured":"Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 1, pp. 1162\u20131167 (2017). IEEE","DOI":"10.1109\/ICDAR.2017.192"},{"key":"524_CR28","doi-asserted-by":"publisher","first-page":"74151","DOI":"10.1109\/ACCESS.2018.2880211","volume":"6","author":"SA Siddiqui","year":"2018","unstructured":"Siddiqui, S.A., Malik, M.I., Agne, S., Dengel, A., Ahmed, S.: Decnt: Deep deformable CNN for table detection. IEEE Access 6, 74151\u201374161 (2018)","journal-title":"IEEE Access"},{"key":"524_CR29","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"524_CR30","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S., et al.: An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"524_CR31","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need. Adv. Neural Inf. Process. Syst. 30, 1\u201315 (2017)"},{"key":"524_CR32","doi-asserted-by":"crossref","unstructured":"Arik, S.\u00d6., Pfister, T.: Tabnet: Attentive interpretable tabular learning. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 35, pp. 6679\u20136687 (2021)","DOI":"10.1609\/aaai.v35i8.16826"},{"key":"524_CR33","unstructured":"Huang, X., Khetan, A., Cvitkovic, M., Karnin, Z.: Tabtransformer: Tabular data modeling using contextual embeddings. arXiv preprint arXiv:2012.06678 (2020)"},{"key":"524_CR34","doi-asserted-by":"crossref","unstructured":"Song, W., Shi, C., Xiao, Z., Duan, Z., Xu, Y., Zhang, M., Tang, J.: Autoint: Automatic feature interaction learning via self-attentive neural networks. In: Proceedings of the 28th ACM International Conference on Information and Knowledge Management, pp. 1161\u20131170 (2019)","DOI":"10.1145\/3357384.3357925"},{"issue":"3","key":"524_CR35","doi-asserted-by":"publisher","first-page":"314","DOI":"10.7763\/IJMLC.2012.V2.137","volume":"2","author":"A Singh","year":"2012","unstructured":"Singh, A., Bacchuwar, K., Bhasin, A.: A survey of OCR applications. Int. J. Mach. Learn. Comput. 2(3), 314\u2013318 (2012). https:\/\/doi.org\/10.7763\/IJMLC.2012.V2.137","journal-title":"Int. J. Mach. Learn. Comput."},{"key":"524_CR36","unstructured":"Subramani, N., Matton, A., Greaves, M., Lam, A.: A Survey of Deep Learning Approaches for OCR and Document Understanding (2020). https:\/\/arxiv.org\/abs\/2011.13534"},{"key":"524_CR37","doi-asserted-by":"publisher","first-page":"142642","DOI":"10.1109\/ACCESS.2020.3012542","volume":"8","author":"J Memon","year":"2020","unstructured":"Memon, J., Sami, M., Khan, R.A., Uddin, M.: Handwritten optical character recognition (OCR): A comprehensive systematic literature review (SLR). IEEE Access 8, 142642\u2013142668 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.3012542","journal-title":"IEEE Access"},{"key":"524_CR38","unstructured":"Str\u00f6bel, P.B., Clematide, S., Volk, M., Hodel, T.: Transformer-based HTR for Historical Documents (2022). https:\/\/arxiv.org\/abs\/2203.11008"},{"key":"524_CR39","doi-asserted-by":"publisher","unstructured":"Romero, V., S\u00e1nchez, J. A.: The hisclima database: historical weather logs for automatic information extraction. In: 2021 16th International Conference on Document Analysis and Recognition (ICDAR), pp. 130\u2013135 (2021). https:\/\/doi.org\/10.1109\/ICPR48806.2021.9412210","DOI":"10.1109\/ICPR48806.2021.9412210"},{"key":"524_CR40","doi-asserted-by":"publisher","unstructured":"Lehenmeier, C., Burghardt, M., Mischka, B.: Layout detection and table recognition - recent challenges in digitizing historical documents and handwritten tabular data. In: Digital Libraries for Open Knowledge: 24th International Conference on Theory and Practice of Digital Libraries, TPDL 2020, pp. 229\u2013242. Springer, New York (2020). https:\/\/doi.org\/10.1007\/978-3-030-54956-5_17","DOI":"10.1007\/978-3-030-54956-5_17"},{"key":"524_CR41","doi-asserted-by":"crossref","unstructured":"Xin, D., Ma, L., Liu, J., Macke, S., Song, S., Parameswaran, A.: Accelerating human-in-the-loop machine learning: Challenges and opportunities. In: Proceedings of the Second Workshop on Data Management for End-to-end Machine Learning, pp. 1\u20134 (2018)","DOI":"10.1145\/3209889.3209897"},{"key":"524_CR42","unstructured":"Brutzkus, A., Globerson, A.: Why do larger models generalize better? a theoretical perspective via the xor problem. In: International Conference on Machine Learning, pp. 822\u2013830 (2019). PMLR"},{"key":"524_CR43","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805","author":"J Devlin","year":"2018","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. CoRR (2018). https:\/\/doi.org\/10.48550\/arXiv.1810.04805","journal-title":"CoRR"},{"issue":"10s","key":"524_CR44","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3505244","volume":"54","author":"S Khan","year":"2022","unstructured":"Khan, S., Naseer, M., Hayat, M., Zamir, S.W., Khan, F.S., Shah, M.: Transformers in vision: A survey. ACM Comput. Surv. 54(10s), 1\u201341 (2022)","journal-title":"ACM Comput. Surv."},{"issue":"2","key":"524_CR45","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Gool, L.V., Williams, C.K.I., Winn, J., Zisserman, A.: The pascal visual object classes (VOC) challenge. Int. J. Comput. Vis. 88(2), 303\u2013338 (2010). https:\/\/doi.org\/10.1007\/s11263-009-0275-4","journal-title":"Int. J. Comput. Vis."},{"key":"524_CR46","doi-asserted-by":"crossref","unstructured":"Muheki, D., Vercruysse, B., Chandrasekar, K. K. T., Verbruggen, C., Birkholz, J. M., Hufkens, K., Verbeeck, H., Boeckx, P., Lampe, S., Hawkins, E., Thorne, P., Ntumba, D. K., Moulasa, O. K., Thiery, W.: MeteoSaver v1.0: A Machine-Learning Based Software for the Transcription of Historical Weather Data. Manuscript under review (2024)","DOI":"10.5194\/egusphere-2024-3779"},{"key":"524_CR47","doi-asserted-by":"crossref","unstructured":"Baek, Y., Lee, B., Han, D., Yun, S., Lee, H.: Character region awareness for text detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9365\u20139374 (2019)","DOI":"10.1109\/CVPR.2019.00959"},{"key":"524_CR48","doi-asserted-by":"publisher","first-page":"12345","DOI":"10.3390\/informatics11040077","volume":"12","author":"T Ngubane","year":"2024","unstructured":"Ngubane, T., Tapamo, J.-R.: Tableextractnet: A model of automatic detection and recognition of table structures from unstructured documents. IEEE Access 12, 12345\u201312356 (2024). https:\/\/doi.org\/10.3390\/informatics11040077","journal-title":"IEEE Access"},{"key":"524_CR49","doi-asserted-by":"publisher","unstructured":"Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: TGRNet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 1295\u20131303 (2021). https:\/\/doi.org\/10.1109\/ICCV48922.2021.00132","DOI":"10.1109\/ICCV48922.2021.00132"},{"key":"524_CR50","unstructured":"Rakshit, S., Kundu, A., Maity, M., Mandal, S., Sarkar, S., Basu, S.: Recognition of handwritten Roman Numerals using Tesseract open source OCR engine (2010). https:\/\/arxiv.org\/abs\/1003.5898"},{"key":"524_CR51","doi-asserted-by":"publisher","unstructured":"Puigcerver, J.: Are multidimensional recurrent layers really necessary for handwritten text recognition? In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 01, pp. 67\u201372 (2017). https:\/\/doi.org\/10.1109\/ICDAR.2017.20","DOI":"10.1109\/ICDAR.2017.20"},{"key":"524_CR52","unstructured":"Puigcerver, J., Mochol\u00ed, C.: PyLaia. GitHub (2018)"},{"key":"524_CR53","doi-asserted-by":"publisher","unstructured":"Hassani, H., Silva, E. S.: The role of chatgpt in data science: How ai-assisted conversational interfaces are revolutionizing the field. Big Data Cogn. Comput. 7(2) (2023) https:\/\/doi.org\/10.3390\/bdcc7020062","DOI":"10.3390\/bdcc7020062"},{"key":"524_CR54","unstructured":"Shi, Y., Peng, D., Liao, W., Lin, Z., Chen, X., Liu, C., Zhang, Y., Jin, L.: Exploring OCR Capabilities of GPT-4V(ision) : A Quantitative and In-depth Evaluation (2023). https:\/\/arxiv.org\/abs\/2310.16809"},{"issue":"1","key":"524_CR55","doi-asserted-by":"publisher","first-page":"240","DOI":"10.1162\/dint_a_00235","volume":"6","author":"A Azaria","year":"2024","unstructured":"Azaria, A., Azoulay, R., Reches, S.: ChatGPT is a remarkable tool-for experts. Data Intell. 6(1), 240\u2013296 (2024). https:\/\/doi.org\/10.1162\/dint_a_00235","journal-title":"Data Intell."},{"key":"524_CR56","doi-asserted-by":"publisher","unstructured":"Wang, J., Liu, Z., Zhao, L., Wu, Z., Ma, C., Yu, S., Dai, H., Yang, Q., Liu, Y., Zhang, S., Shi, E., Pan, Y., Zhang, T., Zhu, D., Li, X., Jiang, X., Ge, B., Yuan, Y., Shen, D., Liu, T., Zhang, S.: Review of Large Vision Models and Visual Prompt Engineering. arXiv preprint arXiv:2307.00855 (2023) https:\/\/doi.org\/10.48550\/arXiv.2307.00855","DOI":"10.48550\/arXiv.2307.00855"},{"key":"524_CR57","unstructured":"Walker, J., Fujii, Y., Popat, A. C.: A web-based ocr service for documents. In: Proceedings of the 13th IAPR International Workshop on Document Analysis Systems (DAS), Vienna, Austria, vol. 1 (2018)"},{"issue":"3","key":"524_CR58","doi-asserted-by":"publisher","first-page":"19","DOI":"10.5121\/iju.2015.6303","volume":"6","author":"S Vijayarani","year":"2015","unstructured":"Vijayarani, S., Sakila, A.: Performance comparison of OCR tools. Int. J. UbiComp (IJU) 6(3), 19\u201330 (2015)","journal-title":"Int. J. UbiComp (IJU)"},{"key":"524_CR59","doi-asserted-by":"crossref","unstructured":"Tafti, A. P., Baghaie, A., Assefi, M., Arabnia, H. R., Yu, Z., Peissig, P.: Ocr as a service: an experimental evaluation of google docs ocr, tesseract, abbyy finereader, and transym. In: Advances in Visual Computing: 12th International Symposium, ISVC 2016, Las Vegas, NV, USA, December 12-14, 2016, Proceedings, Part I 12, pp. 735\u2013746 (2016). Springer","DOI":"10.1007\/978-3-319-50835-1_66"},{"key":"524_CR60","doi-asserted-by":"publisher","DOI":"10.1007\/s10502-022-09397-0","author":"J Nockels","year":"2022","unstructured":"Nockels, J., Gooding, P., Ames, S., Terras, M.: Understanding the application of handwritten text recognition technology in heritage contexts: A systematic review of transkribus in published research. Archival J. (2022). https:\/\/doi.org\/10.1007\/s10502-022-09397-0","journal-title":"Archival J."},{"key":"524_CR61","unstructured":"READ-COOP: Introducing Transkribus Super Models - get access to \u201cThe Text Titan I\u201d (2023)"},{"key":"524_CR62","doi-asserted-by":"publisher","unstructured":"Nockels, J., Gooding, P., Terras, M.: Are Digital Humanities platforms facilitating sufficient diversity in research? A study of the Transkribus Scholarship Programme. Digi. Scholar. Human., 018 (2024) https:\/\/doi.org\/10.1093\/llc\/fqae018","DOI":"10.1093\/llc\/fqae018"},{"key":"524_CR63","doi-asserted-by":"publisher","DOI":"10.1353\/mns.2024.a930877","author":"G Probor","year":"2024","unstructured":"Probor, G.: From digitization and images to text and content: Transkribus as a case study. Manuscript Stud. J. Schoenberg Inst. Manuscript Stud. (2024). https:\/\/doi.org\/10.1353\/mns.2024.a930877","journal-title":"Manuscript Stud. J. Schoenberg Inst. Manuscript Stud."},{"key":"524_CR64","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2109.10282","author":"M Li","year":"2021","unstructured":"Li, M., Lv, T., Cui, L., Lu, Y., Flor\u00eancio, D.A.F., Zhang, C., Li, Z., Wei, F.: Trocr: Transformer-based optical character recognition with pre-trained models. CoRR (2021). https:\/\/doi.org\/10.48550\/arXiv.2109.10282","journal-title":"CoRR"},{"key":"524_CR65","unstructured":"Leifert, G., Romein, C. A., Rabus, A., Str\u00f6bel, P., Hodel, T.: Transkribus and Beyond: Pioneering the Future of Transcription Technology (2024)"},{"key":"524_CR66","unstructured":"The OCR-D project (2024)"}],"container-title":["International Journal on Document Analysis and Recognition (IJDAR)"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-025-00524-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10032-025-00524-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-025-00524-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T06:50:28Z","timestamp":1775803828000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10032-025-00524-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,8]]},"references-count":66,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["524"],"URL":"https:\/\/doi.org\/10.1007\/s10032-025-00524-y","relation":{},"ISSN":["1433-2833","1433-2825"],"issn-type":[{"value":"1433-2833","type":"print"},{"value":"1433-2825","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,8]]},"assertion":[{"value":"22 July 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 February 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 March 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 May 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest"}}]}}