{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T14:10:44Z","timestamp":1766067044675,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":12,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,5,8]],"date-time":"2019-05-08T00:00:00Z","timestamp":1557273600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-sa\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,5,8]]},"DOI":"10.1145\/3322905.3322910","type":"proceedings-article","created":{"date-parts":[[2019,10,23]],"date-time":"2019-10-23T15:44:57Z","timestamp":1571845497000},"page":"33-38","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Automatic Semantic Text Tagging on Historical Lexica by Combining OCR and Typography Classification"],"prefix":"10.1145","author":[{"given":"Christian","family":"Reul","sequence":"first","affiliation":[{"name":"Centre for Philology and Digitality, University of W\u00fcrzburg"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sebastian","family":"G\u00f6ttel","sequence":"additional","affiliation":[{"name":"Berlin-Brandenburg Academy of Sciences and Humanities"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Uwe","family":"Springmann","sequence":"additional","affiliation":[{"name":"Center for Information and Language Processing; LMU Munich"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christoph","family":"Wick","sequence":"additional","affiliation":[{"name":"Chair for Artificial Intelligence, University of W\u00fcrzburg"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kay-Michael","family":"W\u00fcrzner","sequence":"additional","affiliation":[{"name":"Berlin-Brandenburg Academy of Sciences and Humanities"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Frank","family":"Puppe","sequence":"additional","affiliation":[{"name":"Chair for Artificial Intelligence, University of W\u00fcrzburg"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2019,5,8]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"High-Performance OCR for Printed English and Fraktur Using LSTM Networks. 12th International Conference on Document Analysis and Recognition","author":"Breuel T. M.","year":"2013","unstructured":"T. M. Breuel , A. Ul-Hasan , M. A. Al-Azawi , and F. Shafait . 2013 . High-Performance OCR for Printed English and Fraktur Using LSTM Networks. 12th International Conference on Document Analysis and Recognition ( 2013 ), 683--687. T. M. Breuel, A. Ul-Hasan, M. A. Al-Azawi, and F. Shafait. 2013. High-Performance OCR for Printed English and Fraktur Using LSTM Networks. 12th International Conference on Document Analysis and Recognition (2013), 683--687."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_2_1","DOI":"10.1109\/ICDAR.2017.35"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_3_1","DOI":"10.1109\/DAS.2014.71"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","first-page":"3","DOI":"10.21248\/jlcl.33.2018.216","article-title":"Improving OCR Accuracy on Early Printed Books by combining Pretraining, Voting, and Active Learning","volume":"33","author":"Reul Christian","year":"2018","unstructured":"Christian Reul , Uwe Springmann , Christoph Wick , and Frank Puppe . 2018 . Improving OCR Accuracy on Early Printed Books by combining Pretraining, Voting, and Active Learning . JLCL 33 , 1 (2018), 3 -- 24 . Christian Reul, Uwe Springmann, Christoph Wick, and Frank Puppe. 2018. Improving OCR Accuracy on Early Printed Books by combining Pretraining, Voting, and Active Learning. JLCL 33, 1 (2018), 3--24.","journal-title":"JLCL"},{"key":"e_1_3_2_1_5_1","volume-title":"ICDAR2017 Competition on Multi-Font and Multi-Size Digitally Represented Arabic Text. In Document Analysis and Recognition (ICDAR), 2017 14th IAPR International Conference on","volume":"1","author":"Slimane Fouad","year":"2017","unstructured":"Fouad Slimane , Rolf Ingold , and Jean Hennebert . 2017 . ICDAR2017 Competition on Multi-Font and Multi-Size Digitally Represented Arabic Text. In Document Analysis and Recognition (ICDAR), 2017 14th IAPR International Conference on , Vol. 1 . IEEE, 1466--1472. Fouad Slimane, Rolf Ingold, and Jean Hennebert. 2017. ICDAR2017 Competition on Multi-Font and Multi-Size Digitally Represented Arabic Text. In Document Analysis and Recognition (ICDAR), 2017 14th IAPR International Conference on, Vol. 1. IEEE, 1466--1472."},{"key":"e_1_3_2_1_6_1","volume-title":"Principal component 2-D long short-term memory for font recognition on single Chinese characters","author":"Tao Dapeng","year":"2016","unstructured":"Dapeng Tao , Xu Lin , Lianwen Jin , and Xuelong Li. 2016. Principal component 2-D long short-term memory for font recognition on single Chinese characters . IEEE transactions on cybernetics 46, 3 ( 2016 ), 756--765. Dapeng Tao, Xu Lin, Lianwen Jin, and Xuelong Li. 2016. Principal component 2-D long short-term memory for font recognition on single Chinese characters. IEEE transactions on cybernetics 46, 3 (2016), 756--765."},{"key":"e_1_3_2_1_7_1","first-page":"6546","article-title":"Script Identification of Multi-Script Documents: A Survey","volume":"5","author":"Ubul Kurban","year":"2017","unstructured":"Kurban Ubul , Gulzira Tursun , Alimjan Aysa , Donato Impedovo , Giuseppe Pirlo , and Tuergen Yibulayin . 2017 . Script Identification of Multi-Script Documents: A Survey . IEEE Access 5 (2017), 6546 -- 6559 . Kurban Ubul, Gulzira Tursun, Alimjan Aysa, Donato Impedovo, Giuseppe Pirlo, and Tuergen Yibulayin. 2017. Script Identification of Multi-Script Documents: A Survey. IEEE Access 5 (2017), 6546--6559.","journal-title":"IEEE Access"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_8_1","DOI":"10.1109\/ICDAR.2015.7333921"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","first-page":"79","DOI":"10.21248\/jlcl.33.2018.219","article-title":"Comparison of OCR Accuracy on Early Printed Books using the Open Source Engines Calamari and OCRopus","volume":"33","author":"Wick Christoph","year":"2018","unstructured":"Christoph Wick , Christian Reul , and Frank Puppe . 2018 . Comparison of OCR Accuracy on Early Printed Books using the Open Source Engines Calamari and OCRopus . JLCL 33 , 1 (2018), 79 -- 96 . Christoph Wick, Christian Reul, and Frank Puppe. 2018. Comparison of OCR Accuracy on Early Printed Books using the Open Source Engines Calamari and OCRopus. JLCL 33, 1 (2018), 79--96.","journal-title":"JLCL"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_10_1","DOI":"10.1109\/34.954608"},{"key":"e_1_3_2_1_11_1","first-page":"249","article-title":"Optical font recognition from projection profiles","volume":"6","author":"Zramdini Abdelwahab","year":"1993","unstructured":"Abdelwahab Zramdini and Rolf Ingold . 1993 . Optical font recognition from projection profiles . Electronic Publishing 6 , 3 (1993), 249 -- 260 . Abdelwahab Zramdini and Rolf Ingold. 1993. Optical font recognition from projection profiles. Electronic Publishing 6, 3 (1993), 249--260.","journal-title":"Electronic Publishing"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_12_1","DOI":"10.1109\/34.709616"}],"event":{"acronym":"DATeCH2019","name":"DATeCH2019: 3rd International Conference on Digital Access to Textual Cultural Heritage","location":"Brussels Belgium"},"container-title":["Proceedings of the 3rd International Conference on Digital Access to Textual Cultural Heritage"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3322905.3322910","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3322905.3322910","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T01:02:26Z","timestamp":1750208546000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3322905.3322910"}},"subtitle":["A Case Study on Daniel Sander's W\u00f6rterbuch der Deutschen Sprache"],"short-title":[],"issued":{"date-parts":[[2019,5,8]]},"references-count":12,"alternative-id":["10.1145\/3322905.3322910","10.1145\/3322905"],"URL":"https:\/\/doi.org\/10.1145\/3322905.3322910","relation":{},"subject":[],"published":{"date-parts":[[2019,5,8]]},"assertion":[{"value":"2019-05-08","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}