{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,21]],"date-time":"2025-12-21T06:34:58Z","timestamp":1766298898664,"version":"3.48.0"},"reference-count":57,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,4]],"date-time":"2025-10-04T00:00:00Z","timestamp":1759536000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,4]],"date-time":"2025-10-04T00:00:00Z","timestamp":1759536000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,4]]},"DOI":"10.1109\/cist65886.2025.11224240","type":"proceedings-article","created":{"date-parts":[[2025,11,6]],"date-time":"2025-11-06T18:48:49Z","timestamp":1762454929000},"page":"469-476","source":"Crossref","is-referenced-by-count":0,"title":["Transforming Text into Discovery: OCR Enrichment of Digital Collections in the University of Galway Library"],"prefix":"10.1109","author":[{"given":"Oksana","family":"Dereza","sequence":"first","affiliation":[{"name":"Library University of Galway,Galway,Ireland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Marie-Louise","family":"Rouget","sequence":"additional","affiliation":[{"name":"Library University of Galway,Galway,Ireland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chidi","family":"Egwu","sequence":"additional","affiliation":[{"name":"University of Galway,School of Medicine,Galway,Ireland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cillian","family":"Joy","sequence":"additional","affiliation":[{"name":"Library University of Galway,Galway,Ireland"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"article-title":"Collections as data: Part to whole. Final report","year":"2023","author":"Padilla","key":"ref1"},{"key":"ref2","article-title":"Issue 13: OCR","author":"Markus","year":"2024","journal-title":"Europeana Tech Insight"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2007.4376991"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-00155-0_21"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1117\/12.783598"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1108\/00220411211256021"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3322905.3322917"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/DAS.2016.81"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2017.58"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21248\/jlcl.33.2018.219"},{"issue":"1","key":"ref11","article-title":"Calamari - A high-performance Tensorflow-based deep learning package for optical character recognition","volume":"14","author":"Wick","year":"2020","journal-title":"Digital Humanities Quarterly"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.3390\/app9224853"},{"key":"ref13","article-title":"Human-centred open-source automatic text recognition for the humanities with ocr4all","volume-title":"CHAI@KI","author":"Reul","year":"2024"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3476887.3476910"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3352631.3352638"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/s42001-021-00149-1"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s42803-025-00100-0"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.16995\/dscn.8094"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-06555-2_27"},{"article-title":"State of the art optical character recognition of 19th century Fraktur scripts using open source engines","year":"2018","author":"Reul","key":"ref20"},{"key":"ref21","article-title":"Performance of generic HTR models on historical Cyrillic and Glagolitic: Comparison of engines","author":"Rabus","year":"2023","journal-title":"Scripta & e-Scripta: The Journal of Interdisciplinary Mediaeval Studies"},{"article-title":"A research agenda for historical and multilingual optical character recognition","year":"2018","author":"Smith","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqz024"},{"issue":"1","key":"ref24","first-page":"1","article-title":"Ground truth OCR sample data of Finnish historical newspapers and journals in data improvement validation of a re-OCRing process","volume-title":"LIBER Quarterly: The Journal of the Association of European Research Libraries","volume":"30","author":"Kettunen","year":"2020"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.9806"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1002\/eng2.12832"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3677389.3702524"},{"key":"ref28","article-title":"Does context matter? Enhancing handwritten text recognition with metadata in historical manuscripts","author":"Kiessling","year":"2024","journal-title":"Computational Humanities Research"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-70549-6_23"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.10262"},{"article-title":"Making Old Kurdish publications processable by augmenting available optical character recognition engines","year":"2024","author":"Yaseen","key":"ref31"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.53377\/lq.13330"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2017.307"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/eScience.2019.00060"},{"article-title":"PyLaia","year":"2018","author":"Puigcerver","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1108\/JD-07-2018-0114"},{"issue":"12","key":"ref37","first-page":"7482","article-title":"Experimenting with training a neural network in Transkribus to recognise text in a multilingual and multi-authored manuscript collection","volume-title":"Heritage","volume":"6","author":"Capurro","year":"2023"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CiSt56084.2023.10409998"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICDARW.2019.10032"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3476887.3476896"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.13247"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.10416"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.3390\/jimaging11020036"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.62235\/dk.3.2024.8508"},{"volume-title":"Emigrants and exiles: Ireland and the Irish exodus to North America","year":"1988","author":"Miller","key":"ref45"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1533\/9781780631387"},{"year":"2020","key":"ref47","article-title":"Guidelines for the creation of digital collections"},{"year":"2023","key":"ref48","article-title":"Technical guidelines for digitizing cultural heritage materials: Third edition"},{"key":"ref49","first-page":"65","article-title":"\u00abTo have the \u2018million\u2019 readers yet\u00bb: Building a digitally enhanced edition of the bilingual Irish-English newspaper An Gaodhal (1881-1898)","volume-title":"Proceedings of the Third Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA) @ LREC-COLING-2024","author":"Dereza"},{"key":"ref50","article-title":"An Gaodhal newspaper (1881-1898): Full-text OCR output files (version 1)","volume-title":"Dataset","author":"Chonghaile","year":"2023"},{"key":"ref51","article-title":"OCR-D & OCR4all: Two complementary approaches for improved OCR of historical sources","author":"Baierer","year":"2021","journal-title":"HistoInformatics@ JCDL"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.10252"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.46298\/jdmdh.10484"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-024-00507-5"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.ml4al-1.14"},{"article-title":"Proposing a comprehensive dataset for Arabic script OCR in the context of digital libraries and religious archives","year":"2025","author":"Vigliermo","key":"ref56"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-025-00519-9"}],"event":{"name":"2025 IEEE 8th Congress on Information Science and Technology (CiSt)","start":{"date-parts":[[2025,10,4]]},"location":"Marrakech, Morocco","end":{"date-parts":[[2025,10,10]]}},"container-title":["2025 IEEE 8th Congress on Information Science and Technology (CiSt)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11224058\/11224068\/11224240.pdf?arnumber=11224240","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,21]],"date-time":"2025-12-21T06:32:51Z","timestamp":1766298771000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11224240\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,4]]},"references-count":57,"URL":"https:\/\/doi.org\/10.1109\/cist65886.2025.11224240","relation":{},"subject":[],"published":{"date-parts":[[2025,10,4]]}}}