{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T22:15:20Z","timestamp":1781820920455,"version":"3.54.5"},"publisher-location":"Cham","reference-count":30,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032046239","type":"print"},{"value":"9783032046246","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T00:00:00Z","timestamp":1758067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T00:00:00Z","timestamp":1758067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-04624-6_28","type":"book-chapter","created":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T05:34:39Z","timestamp":1758000879000},"page":"476-492","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Ar-Q-Former: Historical Newspaper Article Separation Based on\u00a0Multimodal Transformer Structure"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-7857-8737","authenticated-orcid":false,"given":"Wenjun","family":"Sun","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1009-3875","authenticated-orcid":false,"given":"Nancy","family":"Girdhar","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5993-1630","authenticated-orcid":false,"given":"Hanh Thi Hong","family":"Tran","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0787-2990","authenticated-orcid":false,"given":"Carlos-Emiliano","family":"Gonz\u00e1lez-Gallardo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0123-439X","authenticated-orcid":false,"given":"Micka\u00ebl","family":"Coustaty","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6160-3356","authenticated-orcid":false,"given":"Antoine","family":"Doucet","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,9,17]]},"reference":[{"issue":"9","key":"28_CR1","doi-asserted-by":"publisher","first-page":"767","DOI":"10.1080\/08839510600903858","volume":"20","author":"M Aiello","year":"2006","unstructured":"Aiello, M., Pegoretti, A.: Textual article clustering in newspaper pages. Appl. Artif. Intell. 20(9), 767\u2013796 (2006)","journal-title":"Appl. Artif. Intell."},{"key":"28_CR2","doi-asserted-by":"crossref","unstructured":"Bansal, A., Chaudhury, S., Roy, S.D., Srivastava, J.: Newspaper article extraction using hierarchical fixed point model. In: 2014 11th IAPR International Workshop on Document Analysis Systems, pp. 257\u2013261. IEEE (2014)","DOI":"10.1109\/DAS.2014.42"},{"key":"28_CR3","doi-asserted-by":"crossref","unstructured":"Barman, R., Ehrmann, M., Clematide, S., Oliveira, S.A., Kaplan, F.: Combining visual and textual features for semantic segmentation of historical newspapers. J. Data Mining Digit. Humanit. (HistoInformatics) (2021)","DOI":"10.46298\/jdmdh.6107"},{"key":"28_CR4","doi-asserted-by":"crossref","unstructured":"Boro\u015f, E., et al.: Alleviating digitization errors in named entity recognition for historical documents. In: Proceedings of the 24th Conference on Computational Natural Language Learning, pp. 431\u2013441 (2020)","DOI":"10.18653\/v1\/2020.conll-1.35"},{"issue":"20","key":"28_CR5","doi-asserted-by":"publisher","first-page":"24314","DOI":"10.1007\/s10489-023-04782-3","volume":"53","author":"X Canhui","year":"2023","unstructured":"Canhui, X., Yuteng, L., Cao, S., Honghong, Z., Hengyue, B., Yinong, C.: Him: hierarchical multimodal network for document layout analysis. Appl. Intell. 53(20), 24314\u201324326 (2023)","journal-title":"Appl. Intell."},{"key":"28_CR6","doi-asserted-by":"crossref","unstructured":"Da, C., Luo, C., Zheng, Q., Yao, C.: Vision grid transformer for document layout analysis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 19462\u201319472 (2023)","DOI":"10.1109\/ICCV51070.2023.01783"},{"key":"28_CR7","unstructured":"Dosovitskiy, A., et al.: An image is worth 16x16 words: transformers for image recognition at scale. In: International Conference on Learning Representations (2020)"},{"key":"28_CR8","unstructured":"Doucet, A., et al.: Newseye: a digital investigator for historical newspapers. In: 15th Annual International Conference of the Alliance of Digital Humanities Organizations, DH 2020 (2020)"},{"key":"28_CR9","doi-asserted-by":"crossref","unstructured":"Furmaniak, R.: Unsupervised newspaper segmentation using language context. In: Ninth International Conference on Document Analysis and Recognition (ICDAR 2007), vol.\u00a02, pp. 1263\u20131267. IEEE (2007)","DOI":"10.1109\/ICDAR.2007.4377118"},{"issue":"2","key":"28_CR10","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1109\/THMS.2016.2634920","volume":"47","author":"A Garz","year":"2016","unstructured":"Garz, A., Seuret, M., Fischer, A., Ingold, R.: A user-centered segmentation method for complex historical manuscripts based on document graphs. IEEE Trans. Hum.-Mach. Syst. 47(2), 181\u2013193 (2016)","journal-title":"IEEE Trans. Hum.-Mach. Syst."},{"key":"28_CR11","doi-asserted-by":"crossref","unstructured":"Gatos, B., Mantzaris, S., Chandrinos, K., Tsigris, A., Perantonis, S.J.: Integrated algorithms for newspaper page decomposition and article tracking. In: Proceedings of the Fifth International Conference on Document Analysis and Recognition. ICDAR 1999 (Cat. No. PR00318), pp. 559\u2013562. IEEE (1999)","DOI":"10.1109\/ICDAR.1999.791849"},{"key":"28_CR12","doi-asserted-by":"crossref","unstructured":"Girdhar, N., Coustaty, M., Doucet, A.: STRAS: a semantic textual-cues leveraged rule-based approach for article separation in historical newspapers. In: International Conference on Asian Digital Libraries, pp. 89\u2013105. Springer (2023)","DOI":"10.1007\/978-981-99-8085-7_8"},{"key":"28_CR13","doi-asserted-by":"crossref","unstructured":"Girdhar, N., Coustaty, M., Doucet, A.: Digitizing history: transitioning historical paper documents to digital content for information retrieval and mining\u2014a comprehensive survey. IEEE Trans. Comput. Soc. Syst. (2024)","DOI":"10.1109\/TCSS.2024.3378419"},{"key":"28_CR14","doi-asserted-by":"crossref","unstructured":"Girdhar, N., Sharma, D., Coustaty, M., Doucet, A.: Leveraging transfer learning for article segmentation in historical newspapers. In: International Conference on Theory and Practice of Digital Libraries, pp. 222\u2013238. Springer (2024)","DOI":"10.1007\/978-3-031-72437-4_13"},{"key":"28_CR15","doi-asserted-by":"crossref","unstructured":"Gr\u00fcning, T., Labahn, R., Diem, M., Kleber, F., Fiel, S.: Read-bad: a new dataset and evaluation scheme for baseline detection in archival documents. In: 2018 13th IAPR International Workshop on Document Analysis Systems (DAS), pp. 351\u2013356. IEEE (2018)","DOI":"10.1109\/DAS.2018.38"},{"key":"28_CR16","unstructured":"Hadjar, K., Hitz, O., Ingold, R.: Newspaper page decomposition using a split and merge approach. In: Proceedings of Sixth International Conference on Document Analysis and Recognition, pp. 1186\u20131189. IEEE (2001)"},{"key":"28_CR17","doi-asserted-by":"crossref","unstructured":"Huang, Y., Lv, T., Cui, L., Lu, Y., Wei, F.: Layoutlmv3: pre-training for document AI with unified text and image masking. In: Proceedings of the 30th ACM International Conference on Multimedia, pp. 4083\u20134091 (2022)","DOI":"10.1145\/3503161.3548112"},{"key":"28_CR18","doi-asserted-by":"crossref","unstructured":"Isaac, A., Haslhofer, B.: Europeana linked open data\u2013data. europeana. eu. Semantic Web 4(3), 291\u2013297 (2013)","DOI":"10.3233\/SW-120092"},{"key":"28_CR19","unstructured":"Kastanas, S., Tan, S., He, Y.: Document AI: a comparative study of transformer-based, graph-based models, and convolutional neural networks for document layout analysis. arXiv preprint arXiv:2308.15517 (2023)"},{"key":"28_CR20","doi-asserted-by":"crossref","unstructured":"Kettunen, K., Ruokolainen, T., Liukkonen, E., Tranouez, P., Antelme, D., Paquet, T.: Detecting articles in a digitized finnish historical newspaper collection 1771-1929: early results using the pivaj software. In: Proceedings of the 3rd International Conference on Digital Access to Textual Cultural Heritage, pp. 59\u201364 (2019)","DOI":"10.1145\/3322905.3322911"},{"key":"28_CR21","unstructured":"Li, J., Li, D., Savarese, S., Hoi, S.: Blip-2: bootstrapping language-image pre-training with frozen image encoders and large language models. In: International Conference on Machine Learning, pp. 19730\u201319742. PMLR (2023)"},{"key":"28_CR22","doi-asserted-by":"crossref","unstructured":"Luo, C., Cheng, C., Zheng, Q., Yao, C.: Geolayoutlm: geometric pre-training for visual information extraction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7092\u20137101 (2023)","DOI":"10.1109\/CVPR52729.2023.00685"},{"key":"28_CR23","doi-asserted-by":"crossref","unstructured":"Meier, B., Stadelmann, T., Stampfli, J., Arnold, M., Cieliebak, M.: Fully convolutional neural networks for newspaper article segmentation. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol.\u00a01, pp. 414\u2013419. IEEE (2017)","DOI":"10.1109\/ICDAR.2017.75"},{"key":"28_CR24","doi-asserted-by":"crossref","unstructured":"Palfray, T., Hebert, D., Nicolas, S., Tranouez, P., Paquet, T.: Logical segmentation for article extraction in digitized old newspapers. In: Proceedings of the 2012 ACM Symposium on Document Engineering, pp. 129\u2013132 (2012)","DOI":"10.1145\/2361354.2361383"},{"key":"28_CR25","doi-asserted-by":"crossref","unstructured":"Pillai, P., Mangsuli, P.: Document layout analysis using detection transformers. In: Abu Dhabi International Petroleum Exhibition and Conference, p. D031S102R001. SPE (2021)","DOI":"10.2118\/207266-MS"},{"key":"28_CR26","unstructured":"Schweter, S., M\u00e4rz, L., Schmid, K., \u00c7ano, E.: hmbert: historical multilingual language models for named entity recognition. arXiv preprint arXiv:2205.15575 (2022)"},{"key":"28_CR27","doi-asserted-by":"crossref","unstructured":"Sun, W., Tran, H.T.H., Gonz\u00e1lez-Gallardo, C.E., Coustaty, M., Doucet, A.: Global-seg: text semantic segmentation based on global semantic pair relations. In: International Conference on Document Analysis and Recognition, pp. 253\u2013269. Springer (2024)","DOI":"10.1007\/978-3-031-70546-5_15"},{"key":"28_CR28","doi-asserted-by":"crossref","unstructured":"Sun, W., Tran, H.T.H., Gonz\u00e1lez-Gallardo, C.E., Coustaty, M., Doucet, A.: Lias: layout information-based article separation in historical newspapers. In: International Conference on Theory and Practice of Digital Libraries, pp. 256\u2013272. Springer (2024)","DOI":"10.1007\/978-3-031-72437-4_15"},{"key":"28_CR29","doi-asserted-by":"crossref","unstructured":"Tang, Z., et al.: Unifying vision, text, and layout for universal document processing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19254\u201319264 (2023)","DOI":"10.1109\/CVPR52729.2023.01845"},{"key":"28_CR30","doi-asserted-by":"crossref","unstructured":"Girdhar, N., Coustaty, M., Doucet, A.: Benchmarking NAS for article separation in historical newspapers. In: International Conference on Asian Digital Libraries, pp. 76\u201388. Springer (2023)","DOI":"10.1007\/978-981-99-8085-7_7"}],"container-title":["Lecture Notes in Computer Science","Document Analysis and Recognition \u2013 ICDAR 2025"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-04624-6_28","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T05:34:49Z","timestamp":1758000889000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-04624-6_28"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,17]]},"ISBN":["9783032046239","9783032046246"],"references-count":30,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-04624-6_28","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,17]]},"assertion":[{"value":"17 September 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICDAR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Document Analysis and Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Wuhan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 September 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icdar2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/iapr.org\/icdar2025","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}