{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,7]],"date-time":"2026-05-07T12:07:26Z","timestamp":1778155646677,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":23,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,8,14]],"date-time":"2022-08-14T00:00:00Z","timestamp":1660435200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,8,14]]},"DOI":"10.1145\/3534678.3539043","type":"proceedings-article","created":{"date-parts":[[2022,8,12]],"date-time":"2022-08-12T19:06:12Z","timestamp":1660331172000},"page":"3743-3751","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":106,"title":["DocLayNet: A Large Human-Annotated Dataset for Document-Layout Segmentation"],"prefix":"10.1145","author":[{"given":"Birgit","family":"Pfitzmann","sequence":"first","affiliation":[{"name":"IBM Research, Rueschlikon, Switzerland"}]},{"given":"Christoph","family":"Auer","sequence":"additional","affiliation":[{"name":"IBM Research, Rueschlikon, Switzerland"}]},{"given":"Michele","family":"Dolfi","sequence":"additional","affiliation":[{"name":"IBM Research, Rueschlikon, Switzerland"}]},{"given":"Ahmed S.","family":"Nassar","sequence":"additional","affiliation":[{"name":"IBM Research, Rueschlikon, Switzerland"}]},{"given":"Peter","family":"Staar","sequence":"additional","affiliation":[{"name":"IBM Research, Rueschlikon, Switzerland"}]}],"member":"320","published-online":{"date-parts":[[2022,8,14]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2013.292"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2017.229"},{"key":"e_1_3_2_1_3_1","volume-title":"Eva-Maria Lang. 
ICDAR 2019 Competition on Table Detection and Recognition (cTDaR)","author":"D\u00e9jean Herv\u00e9","year":"2019","unstructured":"Herv\u00e9 D\u00e9jean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), April 2019. http:\/\/sac.founderit.com\/."},{"key":"e_1_3_2_1_4_1","first-page":"605","volume-title":"Proceedings of the International Conference on Document Analysis and Recognition, ICDAR","author":"Yepes Antonio Jimeno","year":"2021","unstructured":"Antonio Jimeno Yepes, Peter Zhong, and Douglas Burdick. Competition on scientific literature parsing. In Proceedings of the International Conference on Document Analysis and Recognition, ICDAR, pages 605--617. LNCS 12824, Springer-Verlag, sep 2021."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10032-021-00391-3"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00166"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.coling-main.82"},{"key":"e_1_3_2_1_8_1","volume-title":"SemWebEval@ESWC","author":"Ahmad Riaz","year":"2016","unstructured":"Riaz Ahmad, Muhammad Tanvir Afzal, and M. Qadir. Information extraction from pdf sources based on rule-based system using integrated formats. In SemWebEval@ESWC, 2016."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"e_1_3_2_1_10_1","first-page":"1440","volume-title":"Girshick. Fast R-CNN. In 2015 IEEE International Conference on Computer Vision, ICCV","author":"Ross","year":"2015","unstructured":"Ross B. Girshick. Fast R-CNN. In 2015 IEEE International Conference on Computer Vision, ICCV, pages 1440--1448. IEEE Computer Society, dec 2015."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"e_1_3_2_1_12_1","first-page":"2980","volume-title":"Girshick. Mask R-CNN. 
In IEEE International Conference on Computer Vision, ICCV","author":"He Kaiming","year":"2017","unstructured":"Kaiming He, Georgia Gkioxari, Piotr Doll\u00e1r, and Ross B. Girshick. Mask R-CNN. In IEEE International Conference on Computer Vision, ICCV, pages 2980--2988. IEEE Computer Society, Oct 2017."},{"key":"e_1_3_2_1_13_1","unstructured":"Glenn Jocher Alex Stoken Ayush Chaurasia Jirka Borovec NanoCode012 TaoXie Yonghye Kwon Kalen Michael Liu Changyu Jiacong Fang Abhiram V Laughing tkianai yxNONG Piotr Skalski Adam Hogan Jebastin Nadar imyhxy Lorenzo Mammana Alex Wang Cristi Fati Diego Montes Jan Hajek Laurentiu Diaconu Mai Thanh Minh Marc albinxavi fatih oleg and wanghao yang. ultralytics\/yolov5: v6.0 - yolov5n nano models roboflow integration tensorflow export opencv dnn support October 2021."},{"key":"e_1_3_2_1_14_1","volume-title":"End-to-end object detection with transformers. CoRR, abs\/2005.12872","author":"Carion Nicolas","year":"2020","unstructured":"Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-end object detection with transformers. CoRR, abs\/2005.12872, 2020."},{"key":"e_1_3_2_1_15_1","volume-title":"Efficientdet: Scalable and efficient object detection. CoRR, abs\/1911.09070","author":"Tan Mingxing","year":"2019","unstructured":"Mingxing Tan, Ruoming Pang, and Quoc V. Le. Efficientdet: Scalable and efficient object detection. CoRR, abs\/1911.09070, 2019."},{"key":"e_1_3_2_1_16_1","volume-title":"Piotr Doll\u00e1r, and C. Lawrence Zitnick. Microsoft COCO: common objects in context","author":"Lin Tsung-Yi","year":"2014","unstructured":"Tsung-Yi Lin, Michael Maire, Serge J. Belongie, Lubomir D. Bourdev, Ross B. Girshick, James Hays, Pietro Perona, Deva Ramanan, Piotr Doll\u00e1r, and C. Lawrence Zitnick. Microsoft COCO: common objects in context, 2014."},{"key":"e_1_3_2_1_17_1","unstructured":"Yuxin Wu Alexander Kirillov Francisco Massa Wan-Yen Lo and Ross Girshick. 
Detectron2 2019."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i17.17777"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403172"},{"key":"e_1_3_2_1_20_1","volume-title":"Vtlayout: Fusion of visual and text features for document layout analysis","author":"Li Shoubin","year":"2021","unstructured":"Shoubin Li, Xuyan Ma, Shuaiqun Pan, Jun Hu, Lin Shi, and Qing Wang. Vtlayout: Fusion of visual and text features for document layout analysis, 2021."},{"key":"e_1_3_2_1_21_1","volume-title":"Vsr: A unified framework for document layout analysis combining vision, semantics and relations","author":"Zhang Peng","year":"2021","unstructured":"Peng Zhang, Can Li, Liang Qiao, Zhanzhan Cheng, Shiliang Pu, Yi Niu, and Fei Wu. Vsr: A unified framework for document layout analysis combining vision, semantics and relations, 2021."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219834"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1186\/s40537-019-0197-0"}],"event":{"name":"KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Washington DC USA","acronym":"KDD '22","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data 
Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3534678.3539043","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3534678.3539043","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T18:09:50Z","timestamp":1750183790000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3534678.3539043"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,14]]},"references-count":23,"alternative-id":["10.1145\/3534678.3539043","10.1145\/3534678"],"URL":"https:\/\/doi.org\/10.1145\/3534678.3539043","relation":{},"subject":[],"published":{"date-parts":[[2022,8,14]]},"assertion":[{"value":"2022-08-14","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}