{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,10]],"date-time":"2025-10-10T07:21:03Z","timestamp":1760080863484,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":57,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,8,22]],"date-time":"2023-08-22T00:00:00Z","timestamp":1692662400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,8,22]]},"DOI":"10.1145\/3573128.3604901","type":"proceedings-article","created":{"date-parts":[[2023,8,4]],"date-time":"2023-08-04T10:15:41Z","timestamp":1691144141000},"page":"1-10","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["WEATHERGOV+"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8654-1593","authenticated-orcid":false,"given":"Amanda","family":"Dash","sequence":"first","affiliation":[{"name":"University of Victoria, Victoria, British Columbia, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5594-977X","authenticated-orcid":false,"given":"Melissa","family":"Cote","sequence":"additional","affiliation":[{"name":"University of Victoria, Victoria, British Columbia, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8991-0999","authenticated-orcid":false,"given":"Alexandra Branzan","family":"Albu","sequence":"additional","affiliation":[{"name":"University of Victoria, Victoria, British Columbia, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2023,8,22]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"R. Barzilay and M. Lapata. 2005. Collective content selection for concept-to-text generation. In EMNLP. ACL 331--8.","key":"e_1_3_2_1_1_1","DOI":"10.3115\/1220575.1220617"},{"unstructured":"Z. Chi H. Huang H.-D. Xu et al. 2019. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019).","key":"e_1_3_2_1_2_1"},{"doi-asserted-by":"crossref","unstructured":"B. Co\u00fcasnon and A. Lemaitre. 2014. Recognition of tables and forms. In Handb. Doc. Image Process. Recognit. D. Doermann and K. Tombre (Eds.). Springer 647--77.","key":"e_1_3_2_1_3_1","DOI":"10.1007\/978-0-85729-859-1_20"},{"doi-asserted-by":"crossref","unstructured":"Y. Deng D. Rosenberg and G. Mann. 2019. Challenges in end-to-end neural scientific table recognition. In ICDAR. IEEE 894--901.","key":"e_1_3_2_1_4_1","DOI":"10.1109\/ICDAR.2019.00148"},{"doi-asserted-by":"crossref","unstructured":"P. A. Duboue and K. R. McKeown. 2003. Statistical acquisition of content selection rules for natural language generation. In EMNLP. 121--8.","key":"e_1_3_2_1_5_1","DOI":"10.3115\/1119355.1119371"},{"doi-asserted-by":"crossref","unstructured":"J. Fang X. Tao Z. Tang et al. 2012. Dataset ground-truth and performance metrics for table detection evaluation. In DAS. IEEE 445--9.","key":"e_1_3_2_1_6_1","DOI":"10.1109\/DAS.2012.29"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_7_1","DOI":"10.1007\/978-3-030-87626-5_8"},{"key":"e_1_3_2_1_8_1","volume-title":"ICDAR 2019 competition on table detection and recognition (cTDaR). In ICDAR. IEEE, 1510--5.","author":"Gao L.","year":"2019","unstructured":"L. Gao, Y. Huang, H. D\u00e9jean, et al. 2019. ICDAR 2019 competition on table detection and recognition (cTDaR). In ICDAR. IEEE, 1510--5."},{"key":"e_1_3_2_1_9_1","volume-title":"ICDAR2017 competition on","author":"Gao L.","year":"2017","unstructured":"L. Gao, X. Yi, Z. Jiang, et al. 2017. ICDAR2017 competition on page object detection. In ICDAR, Vol. 1. IEEE, 1417--22."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_10_1","DOI":"10.1613\/jair.5477"},{"key":"e_1_3_2_1_11_1","volume-title":"ICDAR 2013 table competition. In ICDAR. IEEE, 1449--53","author":"G\u00f6bel M.","year":"2013","unstructured":"M. G\u00f6bel, T. Hassan, E. Oro, et al. 2013. ICDAR 2013 table competition. In ICDAR. IEEE, 1449--53."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_12_1","DOI":"10.1109\/ACCESS.2021.3087865"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_13_1","DOI":"10.3390\/jimaging7100214"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_14_1","DOI":"10.18653\/v1\/N18-2098"},{"volume-title":"ICDAR 2021 competition on scientific literature parsing. In ICDAR. Springer, 605--17","author":"Jimeno Yepes A.","unstructured":"A. Jimeno Yepes, P. Zhong, and D. Burdick. 2021. ICDAR 2021 competition on scientific literature parsing. In ICDAR. Springer, 605--17.","key":"e_1_3_2_1_15_1"},{"key":"e_1_3_2_1_16_1","volume-title":"ICDAR 2021 competition on scientific table image recognition to LaTeX. In ICDAR. Springer, 754--66","author":"Kayal P.","year":"2021","unstructured":"P. Kayal, M. Anand, H. Desai, et al. 2021. ICDAR 2021 competition on scientific table image recognition to LaTeX. In ICDAR. Springer, 754--66."},{"unstructured":"P. Kayal M. Anand H. Desai et al. 2022. Tables to LaTeX: structure and content extraction from scientific tables. Int. J. Doc. Anal. Recognit. (2022) 1--10.","key":"e_1_3_2_1_17_1"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_18_1","DOI":"10.3390\/jimaging9030062"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_19_1","DOI":"10.5555\/2591248.2591256"},{"doi-asserted-by":"crossref","unstructured":"R. Lebret D. Grangier and M. Auli. 2016. Neural text generation from structured data with application to the biography domain. In EMNLP. 1203--13.","key":"e_1_3_2_1_20_1","DOI":"10.18653\/v1\/D16-1128"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_21_1","DOI":"10.1007\/s11042-021-11819-7"},{"unstructured":"M. Li L. Cui S. Huang et al. 2020. TableBank: Table benchmark for image-based table detection and recognition. In LREC. 1918--25.","key":"e_1_3_2_1_22_1"},{"doi-asserted-by":"crossref","unstructured":"P. Liang M. I. Jordan and D. Klein. 2009. Learning semantic correspondences with less supervision. In AFNLP. ACL and AFNLP 91--9.","key":"e_1_3_2_1_23_1","DOI":"10.3115\/1687878.1687893"},{"unstructured":"C.-Y. Lin and E. Hovy. 2003. Automatic evaluation of summaries using n-gram co-occurrence statistics. In HLT-NAACL. 150--7.","key":"e_1_3_2_1_24_1"},{"unstructured":"J. Liu X. Liu J. Sheng et al. 2019. Pyramid mask text detector. arXiv preprint arXiv:1903.11800 (2019).","key":"e_1_3_2_1_25_1"},{"doi-asserted-by":"crossref","unstructured":"S. Liu J. Cao R. Yang et al. 2022. Long text and multi-table summarization: Dataset and method. In EMNLP. 1995--2010.","key":"e_1_3_2_1_26_1","DOI":"10.18653\/v1\/2022.findings-emnlp.145"},{"doi-asserted-by":"crossref","unstructured":"D. Lopresti and G. Nagy. 2001. A tabular survey of automated table processing. In GREC. Springer 93--120.","key":"e_1_3_2_1_27_1","DOI":"10.1007\/3-540-40953-X_9"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_28_1","DOI":"10.1016\/j.patcog.2021.107980"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_29_1","DOI":"10.1016\/j.patcog.2022.109006"},{"doi-asserted-by":"crossref","unstructured":"H. Mei M. Bansal and M. R. Walter. 2016. What to talk about and how? Selective generation using LSTMs with coarse-to-fine alignment. In NAACL. 720--30.","key":"e_1_3_2_1_30_1","DOI":"10.18653\/v1\/N16-1086"},{"doi-asserted-by":"crossref","unstructured":"K. Papineni S. Roukos T. Ward et al. 2002. BLEU: a method for automatic evaluation of machine translation. In ACL. 311--8.","key":"e_1_3_2_1_31_1","DOI":"10.3115\/1073083.1073135"},{"doi-asserted-by":"crossref","unstructured":"A. Parikh X. Wang S. Gehrmann et al. 2020. ToTTo: A controlled table-to-text generation dataset. In EMNLP. 1173--86.","key":"e_1_3_2_1_32_1","DOI":"10.18653\/v1\/2020.emnlp-main.89"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_33_1","DOI":"10.1609\/aaai.v33i01.33016908"},{"doi-asserted-by":"crossref","unstructured":"R. Puduppully L. Dong and M. Lapata. 2019. Data-to-text generation with entity modeling. In ACL. 2023--35.","key":"e_1_3_2_1_34_1","DOI":"10.18653\/v1\/P19-1195"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_35_1","DOI":"10.1162\/tacl_a_00381"},{"doi-asserted-by":"crossref","unstructured":"S. R. Qasim H. Mahmood and F. Shafait. 2019. Rethinking table recognition using graph neural networks. In ICDAR. IEEE 142--7.","key":"e_1_3_2_1_36_1","DOI":"10.1109\/ICDAR.2019.00031"},{"key":"e_1_3_2_1_37_1","volume-title":"LGPMA: Complicated table structure recognition with local and global pyramid mask alignment","author":"Qiao L.","year":"2021","unstructured":"L. Qiao, Z. Li, Z. Cheng, et al. 2021. LGPMA: Complicated table structure recognition with local and global pyramid mask alignment. In ICDAR. Springer, 99--114."},{"doi-asserted-by":"crossref","unstructured":"C. Rebuffel M. Roberti L. Soulier et al. 2022. Controlling hallucinations at word level in data-to-text generation. Data Min. Knowl. Discov. (2022) 1--37.","key":"e_1_3_2_1_38_1","DOI":"10.1007\/s10618-021-00801-4"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_39_1","DOI":"10.1016\/j.artint.2005.06.006"},{"doi-asserted-by":"crossref","unstructured":"K. Sel\u00e7uk Candan H. Cao Y. Qi et al. 2009. AlphaSum: Size-constrained table summarization using value lattices. In EDBT. 96--107.","key":"e_1_3_2_1_40_1","DOI":"10.1145\/1516360.1516373"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_41_1","DOI":"10.1609\/aaai.v32i1.11947"},{"doi-asserted-by":"crossref","unstructured":"A. Shahab F. Shafait T. Kieninger et al. 2010. An open approach towards the benchmarking of table structure recognition systems. In DAS. 113--20.","key":"e_1_3_2_1_42_1","DOI":"10.1145\/1815330.1815345"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_43_1","DOI":"10.1002\/widm.1482"},{"doi-asserted-by":"crossref","unstructured":"S. A. Siddiqui I. A. Fateh S. T. R. Rizvi et al. 2019. DeepTabStR: Deep learning based table structure recognition. In ICDAR. IEEE 1403--9.","key":"e_1_3_2_1_44_1","DOI":"10.1109\/ICDAR.2019.00226"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_45_1","DOI":"10.1109\/ACCESS.2018.2880211"},{"doi-asserted-by":"crossref","unstructured":"B. Smock R. Pesala and R. Abraham. 2022. PubTables-1M: Towards comprehensive table extraction from unstructured documents. In CVPR. 4634--42.","key":"e_1_3_2_1_46_1","DOI":"10.1109\/CVPR52688.2022.00459"},{"doi-asserted-by":"crossref","unstructured":"T. Tang J. Li Z. Chen et al. 2022. TextBox 2.0: a text generation library with pre-trained language models. In EMNLP. ACL 435--44.","key":"e_1_3_2_1_47_1","DOI":"10.18653\/v1\/2022.emnlp-demos.42"},{"key":"e_1_3_2_1_48_1","volume-title":"MVP: Multi-task supervised pre-training for natural language generation. arXiv preprint arXiv:2206.12131","author":"Tang T.","year":"2022","unstructured":"T. Tang, J. Li, W. X. Zhao, and other. 2022. MVP: Multi-task supervised pre-training for natural language generation. arXiv preprint arXiv:2206.12131 (2022)."},{"key":"e_1_3_2_1_49_1","volume-title":"PASS: A Dutch data-to-text system for soccer, targeted towards specific audiences. In NLG. 95--104.","author":"van der Lee C.","year":"2017","unstructured":"C. van der Lee, E. Krahmer, and S. Wubben. 2017. PASS: A Dutch data-to-text system for soccer, targeted towards specific audiences. In NLG. 95--104."},{"unstructured":"A. Vaswani N. Shazeer N. Parmar et al. 2017. Attention is all you need. Adv. Neural. Inf. Process. Syst. 30 (2017).","key":"e_1_3_2_1_50_1"},{"doi-asserted-by":"crossref","unstructured":"W. Wang E. Xie X. Li et al. 2019. Shape robust text detection with progressive scale expansion network. In CVPR. 9336--45.","key":"e_1_3_2_1_51_1","DOI":"10.1109\/CVPR.2019.00956"},{"doi-asserted-by":"crossref","unstructured":"S. Wiseman S. M. Shieber and A. M. Rush. 2017. Challenges in data-to-document generation. In EMNLP. 2253--63.","key":"e_1_3_2_1_52_1","DOI":"10.18653\/v1\/D17-1239"},{"unstructured":"Y. W. Wong and R. Mooney. 2007. Generation by inverting a semantic parser that uses statistical machine translation. In HLT-NAACL. 172--9.","key":"e_1_3_2_1_53_1"},{"key":"e_1_3_2_1_54_1","first-page":"110","article-title":"A large-scale dataset for end-to-end table recognition in the wild. Sci","volume":"10","author":"Yang F.","year":"2023","unstructured":"F. Yang, L. Hu, X. Liu, et al. 2023. A large-scale dataset for end-to-end table recognition in the wild. Sci. Data 10, 1 (2023), 110.","journal-title":"Data"},{"key":"e_1_3_2_1_55_1","volume-title":"B: Table recognition to HTML. arXiv preprint arXiv:2105.01848","author":"Ye J.","year":"2021","unstructured":"J. Ye, X. Qi, Y. He, et al. 2021. PingAn-VCGroup's solution for ICDAR 2021 competition on scientific literature parsing task B: Table recognition to HTML. arXiv preprint arXiv:2105.01848 (2021)."},{"doi-asserted-by":"crossref","unstructured":"X. Zheng D. Burdick L. Popa et al. 2021. Global table extractor (GTE): A framework for joint table identification and cell structure recognition using visual context. In WACV. 697--706.","key":"e_1_3_2_1_56_1","DOI":"10.1109\/WACV48630.2021.00074"},{"volume-title":"Image-based table recognition: data, model, and evaluation","author":"Zhong X.","unstructured":"X. Zhong, E. ShafieiBavani, and A. Jimeno Yepes. 2020. Image-based table recognition: data, model, and evaluation. In ECCV. Springer, 564--80.","key":"e_1_3_2_1_57_1"}],"event":{"sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"acronym":"DocEng '23","name":"DocEng '23: ACM Symposium on Document Engineering 2023","location":"Limerick Ireland"},"container-title":["Proceedings of the ACM Symposium on Document Engineering 2023"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3573128.3604901","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3573128.3604901","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:45:38Z","timestamp":1750178738000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3573128.3604901"}},"subtitle":["A Table Recognition and Summarization Dataset to Bridge the Gap Between Document Image Analysis and Natural Language Generation"],"short-title":[],"issued":{"date-parts":[[2023,8,22]]},"references-count":57,"alternative-id":["10.1145\/3573128.3604901","10.1145\/3573128"],"URL":"https:\/\/doi.org\/10.1145\/3573128.3604901","relation":{},"subject":[],"published":{"date-parts":[[2023,8,22]]},"assertion":[{"value":"2023-08-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}