{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:19:44Z","timestamp":1757618384819,"version":"3.44.0"},"reference-count":55,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T00:00:00Z","timestamp":1750118400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T00:00:00Z","timestamp":1750118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"Shaanxi Key Research Project in 2021","award":["2021GY-102"],"award-info":[{"award-number":["2021GY-102"]}]},{"name":"Xi\u2019an Science & Technology Project","award":["21RGZN0012, 23ZDCYTSGG0026-2022"],"award-info":[{"award-number":["21RGZN0012, 23ZDCYTSGG0026-2022"]}]},{"name":"Xianyang Key Research Project","award":["2021ZDYF-GY-0031"],"award-info":[{"award-number":["2021ZDYF-GY-0031"]}]},{"name":"Shaanxi Key Project of Department-City Linkage","award":["2022GD-TSLD-61-3"],"award-info":[{"award-number":["2022GD-TSLD-61-3"]}]},{"name":"Hangzhou Research Institute Conception Fund of Xidian University","award":["GNYZ2023GY0402"],"award-info":[{"award-number":["GNYZ2023GY0402"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Complex Intell. Syst."],"published-print":{"date-parts":[[2025,8]]},"DOI":"10.1007\/s40747-025-01975-w","type":"journal-article","created":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T04:35:40Z","timestamp":1750134940000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["TableStructureFormer: an improved masked-attention mask transformer model with long-distance feature aggregation and deep detail supervision for table structure recognition"],"prefix":"10.1007","volume":"11","author":[{"given":"Chenglong","family":"Yu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0047-8955","authenticated-orcid":false,"given":"Weibin","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zixuan","family":"Zhu","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Li","sequence":"additional","affiliation":[]},{"given":"Jianchao","family":"Du","sequence":"additional","affiliation":[]},{"given":"Shiwei","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,6,17]]},"reference":[{"key":"1975_CR1","doi-asserted-by":"crossref","unstructured":"Xue W, Baosheng Y, Wang W, Tao D, Li Q (2021) TGRNet: a table graph reconstruction network for table structure recognition. In: IEEE\/CVF international conference on computer vision, pp 1275\u20131284","DOI":"10.1109\/ICCV48922.2021.00133"},{"key":"1975_CR2","first-page":"2992","volume":"37","author":"H Xing","year":"2023","unstructured":"Xing H, Gao F, Long R, Jiajun B, Zheng Q, Li L, Yao C, Zhi Y (2023) LORE: logical location regression network for table structure recognition. AAAI Conf Artif Intell 37:2992\u20133000","journal-title":"AAAI Conf Artif Intell"},{"key":"1975_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110816","volume":"157","author":"R Long","year":"2025","unstructured":"Long R, Xing H, Yang Z, Zheng Q, Zhi Y, Huang F, Yao C (2025) LORE++: logical location regression network for table structure recognition with pre-training. Pattern Recognit 157:110816","journal-title":"Pattern Recognit"},{"key":"1975_CR4","doi-asserted-by":"crossref","unstructured":"Qiao L, Li Z, Cheng Z, Zhang P, Shiliang P, Niu Y, Ren W, Tan W, Fei W (2021) LGPMA: complicated table structure recognition with local and global pyramid mask alignment. In: IEEE international conference on document analysis and recognition","DOI":"10.1007\/978-3-030-86549-8_7"},{"key":"1975_CR5","unstructured":"Chi Z, Huang H, Xu H-D, Yu H, Yin W, Mao X-L (2019) Complicated table structure recognition. arXiv:abs\/1908.04729"},{"key":"1975_CR6","doi-asserted-by":"crossref","unstructured":"Zheng X, Burdick D, Lucian PX, Zhong NX, Wang R (2020) Global table extractor (GTE): a framework for joint table identification and cell structure recognition using visual context. In: IEEE winter conference on applications of computer vision, pp 697\u2013706","DOI":"10.1109\/WACV48630.2021.00074"},{"key":"1975_CR7","doi-asserted-by":"crossref","unstructured":"Baek Y, Nam D, Surh J, Shin S, Kim S (2023) TRACE: table reconstruction aligned to corner and edges. arXiv:abs\/2305.00630","DOI":"10.1007\/978-3-031-41734-4_29"},{"key":"1975_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.109006","volume":"133","author":"C Ma","year":"2022","unstructured":"Ma C, Lin W, Sun L, Huo Q (2022) Robust table detection and structure recognition from heterogeneous document images. Pattern Recognit 133:109006","journal-title":"Pattern Recognit"},{"key":"1975_CR9","doi-asserted-by":"crossref","unstructured":"Lin W, Sun Z, Ma C, Li M, Wang J, Sun L, Huo Q (2022) TSRFormer: table structure recognition with transformers. In: Proceedings of the 30th ACM international conference on multimedia","DOI":"10.1145\/3503161.3548038"},{"key":"1975_CR10","unstructured":"Guo Z, Yu Y, Lv P, Zhang C, Li H, Wang Z, Yao K, Liu J, Wang J (2022) TRUST: an accurate and end-to-end table structure recognizer using splitting-based transformers. arXiv:abs\/2208.14687"},{"key":"1975_CR11","unstructured":"Liu H, Li X, Gong M, Liu B, Wu Y, Jiang D, Liu Y, Sun X (2023) Grab what you need: rethinking complex table structure recognition with flexible components deliberation. arXiv: abs\/2303.09174"},{"key":"1975_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.108565","volume":"126","author":"Z Zhang","year":"2021","unstructured":"Zhang Z, Zhang J, Jun D (2021) Split, embed and merge: an accurate table structure recognizer. Pattern Recognit 126:108565","journal-title":"Pattern Recognit"},{"key":"1975_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110279","volume":"149","author":"Z Zhang","year":"2023","unstructured":"Zhang Z, Pengfei H, Ma J, Jun D, Zhang J, Zhu H, Yin B, Yin B, Liu C (2023) SEMv2: table separation line detection based on instance segmentation. Pattern Recognit 149:110279","journal-title":"Pattern Recognit"},{"key":"1975_CR14","doi-asserted-by":"crossref","unstructured":"Paliwal S, Vishwanath D, Rahul R, Sharma M, Vig L (2019) TableNet: deep Learning model for end-to-end table detection and tabular data extraction from scanned document images. In: International conference on document analysis and recognition (ICDAR)","DOI":"10.1109\/ICDAR.2019.00029"},{"key":"1975_CR15","doi-asserted-by":"crossref","unstructured":"Schreiber S, Agne S, Wolf I, Dengel A, Ahmedd S (2017) DeepDeSRT: deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition, pp 1162\u20131167","DOI":"10.1109\/ICDAR.2017.192"},{"key":"1975_CR16","doi-asserted-by":"crossref","unstructured":"Siddiqui SA, Fateh IA, Rizvi STR, Dengel A, Ahmed S (2019) DeepTabStR: deep learning based table structure recognition. In: International conference on document analysis and recognition, pp 1403\u20131409","DOI":"10.1109\/ICDAR.2019.00226"},{"key":"1975_CR17","doi-asserted-by":"publisher","first-page":"113521","DOI":"10.1109\/ACCESS.2021.3103413","volume":"9","author":"K Azeem Hashmi","year":"2021","unstructured":"Azeem Hashmi K, Stricker D, Liwicki M, Afzal MN, Afzal MZ (2021) Guided table structure recognition through anchor optimization. IEEE Access 9:113521\u2013113534","journal-title":"IEEE Access"},{"key":"1975_CR18","doi-asserted-by":"crossref","unstructured":"Siddiqui SA, Khan PI, Dengel A, Ahmed S (2019) Rethinking semantic segmentation for table structure recognition in documents. In: International conference on document analysis and recognition (ICDAR), pp 1397\u20131402","DOI":"10.1109\/ICDAR.2019.00225"},{"key":"1975_CR19","doi-asserted-by":"crossref","unstructured":"Anand A, Jaiswal R, Bhuyan P, Gupta M, Bangar S, Imam Md.M, Shah RR, Satoh S (2023) TC-OCR: TableCraft OCR for efficient detection & recognition of table structure & content. In: Proceedings of the 1st international workshop on deep multimodal learning for information retrieval, pp 11\u201318","DOI":"10.1145\/3606040.3617444"},{"key":"1975_CR20","doi-asserted-by":"crossref","unstructured":"Huang Y, Ning L, Chen D, Li Y, Xie Z, Zhu S, Gao L, Peng W (2023) Improving table structure recognition with visual-alignment sequential coordinate modeling. In: IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 11134\u201311143","DOI":"10.1109\/CVPR52729.2023.01071"},{"key":"1975_CR21","doi-asserted-by":"crossref","unstructured":"Jain A, Paliwal S, Sharma M, Vig L (2022) TSR-DSAW: table structure recognition via deep spatial association of words. arXiv:abs\/2203.06873","DOI":"10.14428\/esann\/2021.ES2021-109"},{"key":"1975_CR22","doi-asserted-by":"crossref","unstructured":"Ly NT, Takasu A, Nguyen P, Takeda H (2023) Rethinking image-based table recognition using weakly supervised methods. In: International conference on pattern recognition applications and methods","DOI":"10.5220\/0011682600003411"},{"key":"1975_CR23","doi-asserted-by":"crossref","unstructured":"Zhong X, ShafieiBavani E, Yepes AJ (2019) Image-based table recognition: data, model, and evaluation. In: European conference on computer vision","DOI":"10.1007\/978-3-030-58589-1_34"},{"key":"1975_CR24","doi-asserted-by":"crossref","unstructured":"Nassar A, Livathinos N, Lysak M, Staar P (2022) TableFormer: table structure understanding with transformers. In: IEEE\/CVF conference on computer vision and pattern Recognition (CVPR), pp 4604\u20134613","DOI":"10.1109\/CVPR52688.2022.00457"},{"key":"1975_CR25","unstructured":"Li C, Guo R, Zhou J, An M, Du Y, Zhu L, Liu Y, Hu X, Yu D (2022) Pp-structurev2: a stronger document analysis system. arXiv:abs\/2210.05391"},{"key":"1975_CR26","unstructured":"Cui C, Gao T, Wei S, Du Y, Guo R, Dong S, Lu B, Zhou Y, Lv X, Liu Q, Hu X, Yu D, Ma Y (2021) PP-LCNet: a lightweight CPU convolutional neural network. arXiv:abs\/2109.15099"},{"key":"1975_CR27","doi-asserted-by":"crossref","unstructured":"Ly NT, Takasu A (2023) An end-to-end multi-task learning model for image-based table recognition. arXiv:abs\/2303.08648","DOI":"10.5220\/0011685000003417"},{"key":"1975_CR28","unstructured":"Peng SY, Chakravarthy A, Lee S, Wang X, BR, Chau Duen H (2024) UniTable: towards a unified framework for table recognition via self-supervised pretraining. arXiv:abs\/2403.04822"},{"key":"1975_CR29","doi-asserted-by":"crossref","unstructured":"Kudale D, Kasuba BV, Subramanian V, Chaudhuri P, Ramakrishnan G (2024) SPRINT: script-agnostic structure recognition in tables. In: International conference on document analysis and recognition, pp 350\u2013367","DOI":"10.1007\/978-3-031-70549-6_21"},{"key":"1975_CR30","doi-asserted-by":"crossref","unstructured":"Wan J, Song S, Wenwen Y, Liu Y, Cheng W, Huang F, Bai X, Yao C, Yang Z (2024) OmniParser: a unified framework for text spotting, key information extraction and table recognition. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 15641\u201315653","DOI":"10.1109\/CVPR52733.2024.01481"},{"key":"1975_CR31","doi-asserted-by":"crossref","unstructured":"Qin C, Zhang Z, Hu P, Liu C, Ma J, Du J (2024) SEMv3: a fast and robust approach to table separation line detection. arXiv:abs\/2405.11862","DOI":"10.24963\/ijcai.2024\/132"},{"key":"1975_CR32","unstructured":"Li M, Cui L, Huang S, Wei F, Zhou M, Li Z (2019) TableBank: a benchmark dataset for table detection and recognition. arXiv:abs\/1903.01949"},{"key":"1975_CR33","doi-asserted-by":"crossref","unstructured":"Long R, Wang W, Xue N, Gao F, Yang Z, Wang Y, Xia G-S (2021) Parsing table structures in the wild. In: IEEE\/CVF international conference on computer vision (ICCV), pp 924\u2013932","DOI":"10.1109\/ICCV48922.2021.00098"},{"key":"1975_CR34","doi-asserted-by":"crossref","unstructured":"Smock B, Pesala R, Abraham R (2021) PubTables-1M: towards comprehensive table extraction from unstructured documents. In: IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 4624-4632","DOI":"10.1109\/CVPR52688.2022.00459"},{"key":"1975_CR35","unstructured":"Ye J, Qi X, He Y, Chen Y, Gu D, Gao P, Xiao R (2021) PingAn-VCGroup\u2019s solution for ICDAR 2021 competition on scientific literature parsing task B: table recognition to HTML. arXiv:abs\/2105.01848"},{"key":"1975_CR36","doi-asserted-by":"crossref","unstructured":"Newell A, Yang K, Deng J (2016) Stacked hourglass networks for human pose estimation. In: European conference on computer vision","DOI":"10.1007\/978-3-319-46484-8_29"},{"key":"1975_CR37","first-page":"1","volume":"32","author":"X Pan","year":"2018","unstructured":"Pan X, Shi J, Luo P, Wang X, Tang X (2018) Spatial as deep: spatial CNN for traffic scene understanding. Proc AAAI Conf Artif Intell 32:1","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1975_CR38","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: IEEE conference on computer vision and pattern recognition (CVPR), pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"1975_CR39","doi-asserted-by":"crossref","unstructured":"Wang J, Lin W, Ma C, Li M, Sun Z, Sun L, Huo Q (2023) Robust table structure recognition with dynamic queries enhanced detection transformer. Pattern Recognit 144:109817","DOI":"10.1016\/j.patcog.2023.109817"},{"key":"1975_CR40","doi-asserted-by":"crossref","unstructured":"Huang Y-X, Liu H-I, Shuai H-H, Cheng W-H (2024) DQ-DETR: DETR with dynamic query for tiny object detection. arXiv:abs\/2404.03507","DOI":"10.1007\/978-3-031-73116-7_17"},{"key":"1975_CR41","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster R-CNN: towards real-time object detection with region proposal networks. In: Advances in neural information processing systems, vol 28"},{"key":"1975_CR42","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"1975_CR43","doi-asserted-by":"crossref","unstructured":"Xiong Y, Li Z, Chen Y, Wang F, Zhu X, Luo J, Wang W, Tong L, Li H, Qiao Y, Lu L, Zhou J, Dai J (2024) Efficient deformable ConvNets: rethinking dynamic and sparse operator for vision applications. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5652\u20135661","DOI":"10.1109\/CVPR52733.2024.00540"},{"key":"1975_CR44","doi-asserted-by":"crossref","unstructured":"Hou Q, Zhang L, Cheng M-M, Feng J (2020) Strip pooling: rethinking spatial pooling for scene parsing. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 4003\u20134012","DOI":"10.1109\/CVPR42600.2020.00406"},{"key":"1975_CR45","unstructured":"Cheng B, Schwing Alexander G, Kirillov A (2021) Per-pixel classification is not all you need for semantic segmentation. In: Neural information processing systems"},{"key":"1975_CR46","doi-asserted-by":"crossref","unstructured":"Cheng B, Misra I, Schwing Alexander G, Kirillov A, Girdhar R (2022) Masked-attention mask transformer for universal image segmentation. In: IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 1280\u20131289","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"1975_CR47","doi-asserted-by":"crossref","unstructured":"Kirillov A, Yuxin W, He K, Girshick R (2020) PointRend: image segmentation as rendering. In: IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 9796\u20139805","DOI":"10.1109\/CVPR42600.2020.00982"},{"key":"1975_CR48","doi-asserted-by":"crossref","unstructured":"Fan M, Lai S, Huang J, Wei X, Chai Z, Luo J, Wei X (2021) Rethinking BiSeNet for real-time semantic segmentation. In: IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 9711\u20139720","DOI":"10.1109\/CVPR46437.2021.00959"},{"key":"1975_CR49","doi-asserted-by":"crossref","unstructured":"Shrivastava A, Gupta A, Girshick R (2016) Training region-based object detectors with online hard example mining. In: IEEE conference on computer vision and pattern recognition (CVPR), pp 761\u2013769","DOI":"10.1109\/CVPR.2016.89"},{"key":"1975_CR50","unstructured":"Loshchilov I, Hutter F (2017) Decoupled weight decay regularization. arXiv: abs\/1711.05101"},{"key":"1975_CR51","doi-asserted-by":"crossref","unstructured":"Ronneberger O, Fischer P, Brox T (2015) U-Net: convolutional networks for biomedical image segmentation. arXiv:abs\/1505.04597","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"1975_CR52","doi-asserted-by":"crossref","unstructured":"Chen L-C, Zhu Y, Papandreou G, Schroff F, Adam H (2018) Encoder-decoder with Atrous separable convolution for semantic image segmentation. In: European conference on computer vision","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"1975_CR53","unstructured":"Xie E, Wang W, Yu Z, Anandkumar A, Alvarez JM, Luo P (2021) SegFormer: simple and efficient design for semantic segmentation with transformers. In: Neural information processing systems"},{"key":"1975_CR54","unstructured":"Guo M-H, Lu C-Z, Hou Q, Liu Z, Cheng M-M, Hu S-M (2022) SegNeXt: rethinking convolutional attention design for semantic segmentation. arXiv:abs\/2209.08575"},{"key":"1975_CR55","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, Han H, Wei Y, Zhang Z, Lin S, Guo B (2021) Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF international conference on computer vision (ICCV), pp 9992\u201310002","DOI":"10.1109\/ICCV48922.2021.00986"}],"container-title":["Complex &amp; Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-025-01975-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s40747-025-01975-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-025-01975-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T20:53:02Z","timestamp":1757191982000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s40747-025-01975-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,17]]},"references-count":55,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2025,8]]}},"alternative-id":["1975"],"URL":"https:\/\/doi.org\/10.1007\/s40747-025-01975-w","relation":{},"ISSN":["2199-4536","2198-6053"],"issn-type":[{"type":"print","value":"2199-4536"},{"type":"electronic","value":"2198-6053"}],"subject":[],"published":{"date-parts":[[2025,6,17]]},"assertion":[{"value":"1 January 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 May 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 June 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This manuscript did not involve human participants or animal-related research, so the informed consent statement and welfare of animals are not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and informed consent for data used"}}],"article-number":"343"}}