{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T14:21:38Z","timestamp":1769696498256,"version":"3.49.0"},"publisher-location":"Cham","reference-count":27,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783031065545","type":"print"},{"value":"9783031065552","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-06555-2_30","type":"book-chapter","created":{"date-parts":[[2022,5,17]],"date-time":"2022-05-17T09:10:13Z","timestamp":1652778613000},"page":"445-460","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["A Benchmark of\u00a0Named Entity Recognition Approaches in\u00a0Historical Documents Application to\u00a019$$^{th}$$ Century French Directories"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8741-2398","authenticated-orcid":false,"given":"N.","family":"Abadie","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5737-5266","authenticated-orcid":false,"given":"E.","family":"Carlinet","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3757-074X","authenticated-orcid":false,"given":"J.","family":"Chazalon","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2517-2058","authenticated-orcid":false,"given":"B.","family":"Dum\u00e9nieu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,5,18]]},"reference":[{"key":"30_CR1","unstructured":"Abadie, N., et al.: A dataset of french trade directories from the 19th century (FTD), March 2022. https:\/\/doi.org\/10.5281\/zenodo.6394464"},{"issue":"8","key":"30_CR2","first-page":"1","volume":"15","author":"S Bell","year":"2020","unstructured":"Bell, S., et al.: Automated data extraction from historical city directories: the rise and fall of mid-century gas stations in providence. RI. PLoS One 15(8), 1\u201312 (2020)","journal-title":"RI. PLoS One"},{"key":"30_CR3","unstructured":"Breuel, T.M.: The OCRopus open source OCR system. In: Document Recognition and Retrieval XV, vol. 6815, p. 68150F. International Society for Optics and Photonics (2008)"},{"key":"30_CR4","first-page":"2493","volume":"12","author":"R Collobert","year":"2011","unstructured":"Collobert, R., Weston, J., Bottou, L., Karlen, M., Kavukcuoglu, K., Kuksa, P.: Natural language processing (almost) from scratch. J. Mach. Learn. Res. 12, 2493\u20132537 (2011)","journal-title":"J. Mach. Learn. Res."},{"key":"30_CR5","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: Pre-training of deep bidirectional transformers for language understanding. In: Proceedings of NAACL-HLT, pp. 4171\u20134186 (2019)"},{"key":"30_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1007\/978-3-030-54956-5_7","volume-title":"Digital Libraries for Open Knowledge","author":"A Hamdi","year":"2020","unstructured":"Hamdi, A., Jean-Caurant, A., Sid\u00e8re, N., Coustaty, M., Doucet, A.: Assessing and minimizing the impact of OCR quality on named entity recognition. In: Hall, M., Mer\u010dun, T., Risse, T., Duchateau, F. (eds.) TPDL 2020. LNCS, vol. 12246, pp. 87\u2013101. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-54956-5_7"},{"key":"30_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/978-3-030-64452-9_3","volume-title":"Digital Libraries at Times of Massive Societal Transition","author":"V-N Huynh","year":"2020","unstructured":"Huynh, V.-N., Hamdi, A., Doucet, A.: When to use OCR post-correction for named entity recognition? In: Ishita, E., Pang, N.L.S., Zhou, L. (eds.) ICADL 2020. LNCS, vol. 12504, pp. 33\u201342. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-64452-9_3"},{"key":"30_CR8","unstructured":"Kiessling, B.: Kraken contributors. http:\/\/kraken.re"},{"key":"30_CR9","doi-asserted-by":"crossref","unstructured":"Kiessling, B., Tissot, R., Stokes, P., Stokl Ben Ezra, D.: eScriptorium: An open source platform for historical document analysis. In: International Conference on Document Analysis and Recognition Workshops, p. 19. IEEE (2019)","DOI":"10.1109\/ICDARW.2019.10032"},{"key":"30_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1007\/978-3-030-86337-1_32","volume-title":"Document Analysis and Recognition - ICDAR 2021","author":"J Koh\u00fat","year":"2021","unstructured":"Koh\u00fat, J., Hradi\u0161, M.: TS-Net: OCR trained to switch between text transcription styles. In: Llad\u00f3s, J., Lopresti, D., Uchida, S. (eds.) ICDAR 2021. LNCS, vol. 12824, pp. 478\u2013493. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-86337-1_32"},{"key":"30_CR11","unstructured":"Labusch, K., Neudecker, C.: Named entity disambiguation and linking historic newspaper OCR with bert. In: CLEF (2020)"},{"key":"30_CR12","doi-asserted-by":"crossref","unstructured":"Lample, G., Ballesteros, M., Subramanian, S., Kawakami, K., Dyer, C.: Neural architectures for named entity recognition. In: Proceedings of NAACL-HLT. pp. 260\u2013270 (2016)","DOI":"10.18653\/v1\/N16-1030"},{"issue":"1","key":"30_CR13","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/TKDE.2020.2981314","volume":"34","author":"J Li","year":"2020","unstructured":"Li, J., Sun, A., Han, J., Li, C.: A survey on deep learning for named entity recognition. IEEE Trans. Knowl. Data Eng. 34(1), 50\u201370 (2020)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"1","key":"30_CR14","first-page":"339","volume":"52","author":"A Mansouri","year":"2008","unstructured":"Mansouri, A., Affendey, L.S., Mamat, A.: Named entity recognition approaches. TAL 52(1), 339\u2013344 (2008)","journal-title":"TAL"},{"key":"30_CR15","doi-asserted-by":"crossref","unstructured":"Martin, L., et al.: CamemBERT: a tasty French language model. In: ProProceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 7203\u20137219 (2020)","DOI":"10.18653\/v1\/2020.acl-main.645"},{"key":"30_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"748","DOI":"10.1007\/978-3-030-86331-9_48","volume-title":"Document Analysis and Recognition \u2013 ICDAR 2021","author":"L M\u00e4rz","year":"2021","unstructured":"M\u00e4rz, L., Schweter, S., Poerner, N., Roth, B., Sch\u00fctze, H.: Data centric domain adaptation for historical text with OCR rrrors. In: Llad\u00f3s, J., Lopresti, D., Uchida, S. (eds.) ICDAR 2021. LNCS, vol. 12822, pp. 748\u2013761. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-86331-9_48"},{"issue":"1","key":"30_CR17","first-page":"69","volume":"52","author":"D Maurel","year":"2011","unstructured":"Maurel, D., Friburger, N., Antoine, J.Y., Eshkol-Taravella, I., Nouvel, D.: Casen: a transducer cascade to recognize french named entities. TAL 52(1), 69\u201396 (2011)","journal-title":"TAL"},{"issue":"1","key":"30_CR18","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1075\/li.30.1.03nad","volume":"30","author":"D Nadeau","year":"2007","unstructured":"Nadeau, D., Sekine, S.: A survey of named entity recognition and classification. Lingvisticae Investigationes 30(1), 3\u201326 (2007)","journal-title":"Lingvisticae Investigationes"},{"key":"30_CR19","doi-asserted-by":"crossref","unstructured":"Neudecker, C., Baierer, K., Gerber, M., Christian, C., Apostolos, A., Stefan, P.: A survey of OCR evaluation tools and metrics. In: The 6th International Workshop on Historical Document Imaging and Processing, pp. 13\u201318 (2021)","DOI":"10.1145\/3476887.3476888"},{"key":"30_CR20","unstructured":"Nouvel, D., Antoine, J.Y., Friburger, N., Soulet, A.: Recognizing named entities using automatically extracted transduction rules. In: 5th Language and Technology Conference, pp. 136\u2013140. Poznan, Poland (2011)"},{"key":"30_CR21","doi-asserted-by":"crossref","unstructured":"Santos, E.A.: Ocr evaluation tools for the 21st century. In: Proceedings of the Workshop on Computational Methods for Endangered Languages, vol. 1 (2019)","DOI":"10.33011\/computel.v1i.345"},{"key":"30_CR22","doi-asserted-by":"crossref","unstructured":"Smith, R.: An overview of the tesseract OCR engine. In: International Conference on Document Analysis and Recognition, vol. 2, pp. 629\u2013633. IEEE (2007)","DOI":"10.1109\/ICDAR.2007.4376991"},{"key":"30_CR23","unstructured":"Spacy authors. https:\/\/spacy.io\/"},{"key":"30_CR24","doi-asserted-by":"crossref","unstructured":"van Strien, D., Beelen, K., Ardanuy, M.C., Hosseini, K., McGillivray, B., Colavizza, G.: Assessing the impact of OCR quality on downstream NLP tasks (2020)","DOI":"10.5220\/0009169004840496"},{"key":"30_CR25","unstructured":"Transkribus contributors. https:\/\/readcoop.eu\/transkribus"},{"key":"30_CR26","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"30_CR27","unstructured":"Wick, C., Reul, C., Puppe, F.: Calamari-a high-performance tensorflow-based deep learning package for optical character recognition. Digit. Humanit. Q. 14(1) (2020)"}],"container-title":["Lecture Notes in Computer Science","Document Analysis Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-06555-2_30","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,12]],"date-time":"2024-03-12T16:07:24Z","timestamp":1710259644000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-06555-2_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031065545","9783031065552"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-06555-2_30","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"18 May 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"DAS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Workshop on Document Analysis Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"La Rochelle","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"France","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 May 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 May 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"das2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/das2022.univ-lr.fr\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"94","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"52","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"16","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"55% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.85","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}