{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T04:38:19Z","timestamp":1758083899928,"version":"3.44.0"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783032046260"},{"type":"electronic","value":"9783032046277"}],"license":[{"start":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T00:00:00Z","timestamp":1757980800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T00:00:00Z","timestamp":1757980800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-04627-7_36","type":"book-chapter","created":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T02:07:21Z","timestamp":1757988441000},"page":"620-637","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A Handwritten Text Recognition Dataset for\u00a0Ajami Manuscripts in\u00a0Fulfulde and\u00a0Hausa"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-3320-813X","authenticated-orcid":false,"given":"Oreen","family":"Yousuf","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3483-6725","authenticated-orcid":false,"given":"Abdulmalik","family":"Aminu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-0244-602X","authenticated-orcid":false,"given":"Musa Salih","family":"Muhammad","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-4595-2876","authenticated-orcid":false,"given":"Bashir","family":"Usman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-4589-2350","authenticated-orcid":false,"given":"Mustapha Kurfi","family":"Hashim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7873-3971","authenticated-orcid":false,"given":"Joakim","family":"Nivre","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4838-6518","authenticated-orcid":false,"given":"Be\u00e1ta","family":"Megyesi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3192-0961","authenticated-orcid":false,"given":"Christian","family":"H\u00f8gel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,9,16]]},"reference":[{"key":"36_CR1","doi-asserted-by":"publisher","first-page":"51242","DOI":"10.1109\/ACCESS.2021.3066477","volume":"9","author":"HM Al-Barhamtoshy","year":"2021","unstructured":"Al-Barhamtoshy, H.M., Jambi, K.M., Abdou, S.M., Rashwan, M.A.: Arabic documents information retrieval for printed, handwritten, and calligraphy image. IEEE Access 9, 51242\u201351257 (2021)","journal-title":"IEEE Access"},{"key":"36_CR2","doi-asserted-by":"crossref","unstructured":"Al-Ma\u2019adeed, S., Elliman, D., Higgins, C.A.: A data base for Arabic handwritten text recognition research. In: Proceedings Eighth International Workshop on Frontiers in Handwriting Recognition, pp. 485\u2013489. IEEE (2002)","DOI":"10.1109\/IWFHR.2002.1030957"},{"key":"36_CR3","unstructured":"Allen, J.P., Miller, M.T., Mullan, J., Smith, D.: Digitizing the Islamicate Written Traditions: History, State of the Field, and Best Practices for Open-source Arabic-script OCR (2022). https:\/\/openiti.org\/assets\/documents\/aocp1WhitePaper.pdf, white paper for the Open Islamicate Texts Initiative Arabic-script OCR Catalyst project, Phase I"},{"key":"36_CR4","unstructured":"Banfield, A.W., Macintyre, J.L.: A grammar of the Nupe language: together with a vocabulary. Society for promoting Christian knowledge (1915)"},{"key":"36_CR5","doi-asserted-by":"publisher","unstructured":"Bondarev, D.: Intralinear Ajami (Type 2). A-label: African Languages Between the Lines (2019). https:\/\/doi.org\/10.58079\/awu4, https:\/\/ajami.hypotheses.org\/841. retrieved March 4 2025","DOI":"10.58079\/awu4"},{"key":"36_CR6","doi-asserted-by":"crossref","unstructured":"Bondarev, D.: A Typology of West African Ajami Manuscripts: Languages, Layout and Research Perspectives. Exploring Written Artefacts: Objects, Methods, and Concepts (Studies in Manuscript Cultures, 25), Berlin: De Gruyter pp, 707\u2013728 (2021)","DOI":"10.1515\/9783110753301-035"},{"key":"36_CR7","doi-asserted-by":"crossref","unstructured":"Bondarev, D., Dobronravin, N.: Standardisation Tendencies in Kanuri and Hausa Ajami Writings. Creating Standards p.\u00a0237 (2019)","DOI":"10.1515\/9783110639063-010"},{"key":"36_CR8","unstructured":"Boston University: NEH Ajami Project. Online Resource (2025). https:\/\/sites.bu.edu\/nehajami\/, project website hosted by Boston University"},{"key":"36_CR9","unstructured":"Boston University: The Four Languages of Ajami. Online Resource (2025), https:\/\/sites.bu.edu\/nehajami\/the-four-languages\/, NEH Ajami Project, Boston University"},{"key":"36_CR10","unstructured":"Boston University Open Repository: Boston University Digital Collections. Online Resource (2025). https:\/\/open.bu.edu\/communities\/fb6a0f91-0c58-4dc8-b383-9b5880a05315, available online"},{"key":"36_CR11","doi-asserted-by":"crossref","unstructured":"Chen, D., et al.: MONSTERMASH: multidirectional, overlapping, nested, spiral text extraction for recognition models of arabic-script handwriting. In: International Conference on Document Analysis and Recognition, pp. 87\u2013101. Springer (2024)","DOI":"10.1007\/978-3-031-70642-4_6"},{"key":"36_CR12","unstructured":"Ibrahim, H.: \u201cAgapet\u201d \u2013 Advanced HTR for Christian Arabic Manuscripts (2024). https:\/\/agapet.hypotheses.org\/4, retrieved March 7, 2025"},{"key":"36_CR13","doi-asserted-by":"crossref","unstructured":"Kiessling, B., Ezra, D.S.B., Miller, M.T.: BADAM: a public dataset for baseline detection in arabic-script manuscripts. In: Proceedings of the 5th International Workshop on Historical Document Imaging and Processing, pp. 13\u201318 (2019)","DOI":"10.1145\/3352631.3352648"},{"key":"36_CR14","unstructured":"Kiessling, B., Kurin, G., Miller, M.T., Smail, K.: Advances and Limitations in Open Source Arabic-Script OCR: A Case Study. arXiv preprint arXiv:2402.10943 (2024)"},{"key":"36_CR15","doi-asserted-by":"crossref","unstructured":"Kiessling, B., Tissot, R., Stokes, P., Ezra, D.S.B.: eScriptorium: an open source platform for historical document analysis. In: 2019 International Conference on Document Analysis and Recognition Workshops (icdarw). vol.\u00a02, pp. 19\u201319. IEEE (2019)","DOI":"10.1109\/ICDARW.2019.10032"},{"key":"36_CR16","doi-asserted-by":"crossref","unstructured":"Lamsaf, A., Aitkerroum, M., Boulaknadel, S., Fakhri, Y.: Text line and word extraction of Arabic handwritten documents. In: Innovations in Smart Cities Applications Edition 2: The Proceedings of the Third International Conference on Smart City Applications, pp. 492\u2013503. Springer (2019)","DOI":"10.1007\/978-3-030-11196-0_42"},{"key":"36_CR17","doi-asserted-by":"crossref","unstructured":"Lorigo, L., Govindaraju, V.: Segmentation and pre-recognition of Arabic handwriting. In: Eighth International Conference on Document Analysis and Recognition (ICDAR\u201905), pp. 605\u2013609. IEEE (2005)","DOI":"10.1109\/ICDAR.2005.207"},{"key":"36_CR18","doi-asserted-by":"crossref","unstructured":"Lutf, M., You, X., Cheung, Y.m., Chen, C.P.: Arabic font recognition based on diacritics features. Pattern Recogn. 47(2), 672\u2013684 (2014)","DOI":"10.1016\/j.patcog.2013.07.015"},{"key":"36_CR19","doi-asserted-by":"crossref","unstructured":"Mahmoud, S.A., et al.: KHATT: Arabic offline handwritten text database. In: 2012 International Conference on Frontiers in Handwriting Recognition, pp. 449\u2013454. IEEE (2012)","DOI":"10.1109\/ICFHR.2012.224"},{"key":"36_CR20","unstructured":"Maliweb: Sauvegarde et protection des patrimoines culturels: Plus de 320.000 manuscrits num\u00e9ris\u00e9s par SAVAMA-DCI et ses partenaires (2022). https:\/\/www.maliweb.net\/art-culture\/~ sauvegarde-et-protection-des-patrimoines-culturels\/~ plus-de-320-000-manuscrits-numerises-par-savama-dci-et-ses-partenaires-2989835.html"},{"issue":"1","key":"36_CR21","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1017\/S0020743817000964","volume":"50","author":"MT Miller","year":"2018","unstructured":"Miller, M.T., Romanov, M.G., Savant, S.B.: Digitizing the Textual Heritage of the Premodern Islamicate World: Principles and Plans. Int. J. Middle East Stud. 50(1), 103\u2013109 (2018). https:\/\/doi.org\/10.1017\/S0020743817000964","journal-title":"Int. J. Middle East Stud."},{"key":"36_CR22","doi-asserted-by":"crossref","unstructured":"Mumin, M.: The Arabic script in Africa: Understudied Literacy. In: The Arabic Script in Africa, pp. 41\u201376. Brill (2014)","DOI":"10.1163\/9789004256804_004"},{"key":"36_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.dib.2024.110813","volume":"56","author":"R Najam","year":"2024","unstructured":"Najam, R., Faizullah, S.: A scarce dataset for ancient Arabic handwritten text recognition. Data Brief 56, 110813 (2024)","journal-title":"Data Brief"},{"key":"36_CR24","doi-asserted-by":"publisher","unstructured":"Ngom, F.: Muslims beyond the arab world: the odyssey of Ajami and the Muridiyya. Oxford University Press (2016). https:\/\/doi.org\/10.1093\/acprof:oso\/9780190279868.001.0001","DOI":"10.1093\/acprof:oso\/9780190279868.001.0001"},{"key":"36_CR25","doi-asserted-by":"publisher","unstructured":"Ngom, F.: West African Manuscripts in Arabic and African Languages and Digital Preservation (2017). https:\/\/doi.org\/10.1093\/acrefore\/9780190277734.013.123, https:\/\/oxfordre.com\/africanhistory\/view\/10.1093\/acrefore\/9780190277734.001.0001\/acrefore-9780190277734-e-123","DOI":"10.1093\/acrefore\/9780190277734.013.123"},{"key":"36_CR26","unstructured":"Ngom, F., Glovsky, D., Diallo, B.B., Sow, N., Rodima-Taylor, D., other contributors: Knowledge to Follow God. Online Manuscript Collection (2022). https:\/\/sites.bu.edu\/nehajami\/the-four-languages\/fula\/fula-manuscripts\/gandal-fii-rewugol-alla\/"},{"key":"36_CR27","doi-asserted-by":"crossref","unstructured":"Ngom, F., Rodima-Taylor, D., Robinson, D.: AJam\u012b Literacies of Africa: the Jausa, Fula, Mandinka, and Wolof Traditions. Islamic Africa 14(2), 119\u2013143 (2023)","DOI":"10.1163\/21540993-20230002"},{"key":"36_CR28","unstructured":"Ngom, F., et al.: The Harlot\u2019s Song. Online Resource (2022). https:\/\/sites.bu.edu\/nehajami\/the-four-languages\/hausa\/hausa-manuscripts\/falke-1486-wakar-karuwa\/"},{"key":"36_CR29","unstructured":"Open Islamicate Texts Initiative (OpenITI): ACDC Results - Gen2 Print N7M5 Union FT Model (2025). https:\/\/github.com\/OpenITI\/acdc_results\/blob\/main\/models\/gen2-print-n7m5-union-ft_best.mlmodel. Accessed 07 Mar 2025"},{"key":"36_CR30","unstructured":"Open Islamicate Texts Initiative (OpenITI): Arabic Script OCR Models (2025), https:\/\/github.com\/OpenITI\/arabic_script_ocr_models\/tree\/main, accessed: 2025-03-07"},{"key":"36_CR31","unstructured":"Pechwitz, M., Maddouri, S.S., M\u00e4rgner, V., Ellouze, N., Amiri, H., et\u00a0al.: IFN\/ENIT-database of handwritten Arabic words. In: Proceedings of CIFED. vol.\u00a02, pp. 127\u2013136. Citeseer (2002)"},{"key":"36_CR32","unstructured":"Qur\u2019an, 28:4: SOAS Digital Collections, Borno and Old Kanembu Islamic Manuscripts. Online Manuscript Collection (17th century), http:\/\/digital.soas.ac.uk\/LOAA003335\/00001\/481, MS 1YM (the \u2018Yerima Mustafa manuscript\u2019), c. late seventeenth century. SOAS, University of London. All rights reserved"},{"key":"36_CR33","unstructured":"Qur\u2019an, 28:4: SOAS Digital Collections, Borno and Old Kanembu Islamic Manuscripts, MS 4MM (the \u2018Malam Muhammadu manuscript\u2019 or \u2018Waziri of Gwandu manuscript\u2019). Online Manuscript Collection (17th century), https:\/\/digital.soas.ac.uk\/LOAA003340\/00001\/172, SOAS, University of London. All rights reserved"},{"key":"36_CR34","unstructured":"Qur\u2019an, 28:4: SOAS Digital Collections, Borno and Old Kanembu Islamic Manuscripts, MS AR33 (\u2018Arabic manuscript collections\u2019 from Kaduna National Archives). Online Manuscript Collection (18th - early 19th century), https:\/\/digital.soas.ac.uk\/LOAA003342\/00001\/742, SOAS, University of London. All rights reserved"},{"key":"36_CR35","doi-asserted-by":"crossref","unstructured":"Rambach, A.D.: The Blue Koran. A contribution to the debate on its possible origin and date. J. Islamic Manuscripts 8(2), 127\u2013143 (2017)","DOI":"10.1163\/1878464X-00801004"},{"key":"36_CR36","unstructured":"Romanov, M., Miller, M., Savant, S., Seydi, M.: Open Islamicate texts initiative: a machine-readable corpus of texts produced in the premodern Islamicate world (Poster). In: Digital Humanities 2019 Conference Papers (9-12 July 2019). Utrecht University, 2019 (2019)"},{"key":"36_CR37","unstructured":"Serin, M.: T\u00fcrk Hat \u00dcstadlar\u0131 1: Hattat Aziz Efendi. Kubbealt\u0131 Akademisi K\u00fclt\u00fcr ve San\u2019at Vakf\u0131 (1999)"},{"key":"36_CR38","unstructured":"Sultan \u2019Ali Al-Mashhadi: Divan of Sultan Husayn Mirza. https:\/\/www.loc.gov\/item\/2019714483\/ (1492). manuscript\/Mixed Material, retrieved from the Library of Congress"},{"key":"36_CR39","unstructured":"led\u00a0by Suphan\u00a0Kirmizialtin, D.O.C.T.: Ottoman Turkish Print Model. https:\/\/readcoop.eu\/model\/ottoman-turkish-print\/. Accessed 07 Mar 2025"},{"key":"36_CR40","doi-asserted-by":"crossref","unstructured":"Vogler, N., Allen, J.P., Miller, M.T., Berg-Kirkpatrick, T.: Lacuna Reconstruction: Self-supervised Pre-training for Low-Resource Historical Document Transcription. arXiv preprint arXiv:2112.08692 (2021)","DOI":"10.18653\/v1\/2022.findings-naacl.15"},{"key":"36_CR41","unstructured":"Wrisley, D.: The HTR Working Group\u00a0at NYU Abu\u00a0Dhabi: Arabic Khat 17-20 Century Handwritten Model (2025). https:\/\/www.transkribus.org\/model\/arabic-khat-17-20-century-handwritten, HTR model for Arabic manuscripts from the 17th to 20th centuries"},{"key":"36_CR42","doi-asserted-by":"crossref","unstructured":"Zahour, A., Likforman-Sulem, L., Boussalaa, W., Taconet, B.: Text line segmentation of historical arabic documents. In: Ninth International Conference on Document Analysis and Recognition (ICDAR 2007). vol.\u00a01, pp. 138\u2013142. IEEE (2007)","DOI":"10.1109\/ICDAR.2007.4378691"}],"container-title":["Lecture Notes in Computer Science","Document Analysis and Recognition \u2013 ICDAR 2025"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-04627-7_36","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T02:07:33Z","timestamp":1757988453000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-04627-7_36"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,16]]},"ISBN":["9783032046260","9783032046277"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-04627-7_36","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025,9,16]]},"assertion":[{"value":"16 September 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICDAR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Document Analysis and Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Wuhan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 September 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icdar2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/iapr.org\/icdar2025","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}