{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T10:34:15Z","timestamp":1763202855597,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":47,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,3,4]],"date-time":"2024-03-04T00:00:00Z","timestamp":1709510400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"the National Natural Science Foundation of China","award":["U21B2009"],"award-info":[{"award-number":["U21B2009"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,3,4]]},"DOI":"10.1145\/3616855.3635777","type":"proceedings-article","created":{"date-parts":[[2024,3,4]],"date-time":"2024-03-04T18:18:12Z","timestamp":1709576292000},"page":"181-189","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["TTC-QuAli: A Text-Table-Chart Dataset for Multimodal Quantity Alignment"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0692-2228","authenticated-orcid":false,"given":"Haoyu","family":"Dong","sequence":"first","affiliation":[{"name":"Institute of Information Engineering, Chinese Academy of Sciences &amp; School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6272-7545","authenticated-orcid":false,"given":"Haochen","family":"Wang","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9707-7272","authenticated-orcid":false,"given":"Anda","family":"Zhou","sequence":"additional","affiliation":[{"name":"University of Edinburgh, Edinburgh, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4416-3974","authenticated-orcid":false,"given":"Yue","family":"Hu","sequence":"additional","affiliation":[{"name":"Institute of Information Engineering, Chinese Academy of Sciences &amp; School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2024,3,4]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"https:\/\/www.bls.gov","author":"Accessed","year":"2023","unstructured":"Accessed 2023 BLS, https:\/\/www.bls.gov. 2023. U.S. Bureau of Labor Statistics."},{"key":"e_1_3_2_1_2_1","unstructured":"https:\/\/www.cdc.gov Accessed 2023 CDC. 2023. Centers for Disease Control and Prevention."},{"volume-title":"ttps:\/\/www.census.gov","year":"2023","key":"e_1_3_2_1_3_1","unstructured":"2023 Census, ttps:\/\/www.census.gov. 2023. Census Bureau."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093269"},{"key":"e_1_3_2_1_5_1","volume-title":"Hitab: A hierarchical table dataset for question answering and natural language generation. arXiv preprint arXiv:2108.06712","author":"Cheng Zhoujun","year":"2021","unstructured":"Zhoujun Cheng, Haoyu Dong, Zhiruo Wang, Ran Jia, Jiaqi Guo, Yan Gao, Shi Han, Jian-Guang Lou, and Dongmei Zhang. 2021. Hitab: A hierarchical table dataset for question answering and natural language generation. arXiv preprint arXiv:2108.06712 (2021)."},{"key":"e_1_3_2_1_6_1","volume-title":"ChartReader: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules. arXiv preprint arXiv:2304.02173","author":"Cheng Zhi-Qi","year":"2023","unstructured":"Zhi-Qi Cheng, Qi Dai, Siyao Li, Jingdong Sun, Teruko Mitamura, and Alexander G Hauptmann. 2023. ChartReader: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules. arXiv preprint arXiv:2304.02173 (2023)."},{"key":"e_1_3_2_1_7_1","volume-title":"International Conference on Machine Learning. PMLR","author":"Cho Jaemin","year":"2021","unstructured":"Jaemin Cho, Jie Lei, Hao Tan, and Mohit Bansal. 2021. Unifying vision-and-language tasks via text generation. In International Conference on Machine Learning. PMLR, 1931--1942."},{"key":"e_1_3_2_1_8_1","volume-title":"Bhargava Urala Kota, and Venu Govindaraju","author":"Davila Kenny","year":"2020","unstructured":"Kenny Davila, Srirangaraj Setlur, David Doermann, Bhargava Urala Kota, and Venu Govindaraju. 2020. Chart mining: A survey of methods for automated chart analysis. IEEE transactions on pattern analysis and machine intelligence, Vol. 43, 11 (2020), 3799--3819."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.14778\/3430915.3430921"},{"key":"e_1_3_2_1_10_1","volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805","author":"Devlin Jacob","year":"2018","unstructured":"Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2018. Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805 (2018)."},{"key":"e_1_3_2_1_11_1","volume-title":"Table pretraining: A survey on model architectures, pretraining objectives, and downstream tasks. arXiv preprint arXiv:2201.09745","author":"Dong Haoyu","year":"2022","unstructured":"Haoyu Dong, Zhoujun Cheng, Xinyi He, Mengyu Zhou, Anda Zhou, Fan Zhou, Ao Liu, Shi Han, and Dongmei Zhang. 2022. Table pretraining: A survey on model architectures, pretraining objectives, and downstream tasks. arXiv preprint arXiv:2201.09745 (2022)."},{"key":"e_1_3_2_1_12_1","volume-title":"Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision. 6213--6221","author":"Hassan Muhammad Yusuf","year":"2023","unstructured":"Muhammad Yusuf Hassan, Mayank Singh, et al. 2023. LineEX: Data Extraction From Scientific Line Charts. In Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision. 6213--6221."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.398"},{"volume-title":"Computer Graphics Forum","author":"Hoque Enamul","key":"e_1_3_2_1_15_1","unstructured":"Enamul Hoque, Parsa Kavehzadeh, and Ahmed Masry. 2022. Chart question answering: State of the art and future directions. In Computer Graphics Forum, Vol. 41. Wiley Online Library, 555--572."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2983323.2983772"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2019.00094"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.270"},{"key":"e_1_3_2_1_19_1","unstructured":"https:\/\/www.imf.org IMF. 2023. International Monetary Fund."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00592"},{"key":"e_1_3_2_1_21_1","volume-title":"Figureqa: An annotated figure dataset for visual reasoning. arXiv preprint arXiv:1710.07300","author":"Kahou Samira Ebrahimi","year":"2017","unstructured":"Samira Ebrahimi Kahou, Vincent Michalski, Adam Atkinson, \u00c1kos K\u00e1d\u00e1r, Adam Trischler, and Yoshua Bengio. 2017. Figureqa: An annotated figure dataset for visual reasoning. arXiv preprint arXiv:1710.07300 (2017)."},{"key":"e_1_3_2_1_22_1","volume-title":"Rixie Tiffany Ko Leong, Jia Qing Tan, Enamul Hoque, and Shafiq Joty.","author":"Kantharaj Shankar","year":"2022","unstructured":"Shankar Kantharaj, Xuan Long Do, Rixie Tiffany Ko Leong, Jia Qing Tan, Enamul Hoque, and Shafiq Joty. 2022. OpenCQA: Open-ended Question Answering with Charts. arXiv preprint arXiv:2210.06628 (2022)."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV51458.2022.00261"},{"key":"e_1_3_2_1_24_1","volume-title":"The measurement of observer agreement for categorical data. biometrics","author":"Richard Landis J","year":"1977","unstructured":"J Richard Landis and Gary G Koch. 1977. The measurement of observer agreement for categorical data. biometrics (1977), 159--174."},{"key":"e_1_3_2_1_25_1","volume-title":"Bart: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. arXiv preprint arXiv:1910.13461","author":"Lewis Mike","year":"2019","unstructured":"Mike Lewis, Yinhan Liu, Naman Goyal, Marjan Ghazvininejad, Abdelrahman Mohamed, Omer Levy, Ves Stoyanov, and Luke Zettlemoyer. 2019. Bart: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. arXiv preprint arXiv:1910.13461 (2019)."},{"key":"e_1_3_2_1_26_1","volume-title":"Francesco Piccinno, Syrine Krichene, Chenxi Pang, Kenton Lee, Mandar Joshi, Wenhu Chen, Nigel Collier, and Yasemin Altun.","author":"Liu Fangyu","year":"2022","unstructured":"Fangyu Liu, Julian Martin Eisenschlos, Francesco Piccinno, Syrine Krichene, Chenxi Pang, Kenton Lee, Mandar Joshi, Wenhu Chen, Nigel Collier, and Yasemin Altun. 2022a. DePlot: One-shot visual language reasoning by plot-to-table translation. arXiv preprint arXiv:2212.10505 (2022)."},{"key":"e_1_3_2_1_27_1","volume-title":"MatCha: Enhancing Visual Language Pretraining with Math Reasoning and Chart Derendering. arXiv preprint arXiv:2212.09662","author":"Liu Fangyu","year":"2022","unstructured":"Fangyu Liu, Francesco Piccinno, Syrine Krichene, Chenxi Pang, Kenton Lee, Mandar Joshi, Yasemin Altun, Nigel Collier, and Julian Martin Eisenschlos. 2022b. MatCha: Enhancing Visual Language Pretraining with Math Reasoning and Chart Derendering. arXiv preprint arXiv:2212.09662 (2022)."},{"key":"e_1_3_2_1_28_1","volume-title":"Tapex: Table pre-training via learning a neural sql executor. arXiv preprint arXiv:2107.07653","author":"Liu Qian","year":"2021","unstructured":"Qian Liu, Bei Chen, Jiaqi Guo, Zeqi Lin, and Jian-guang Lou. 2021. Tapex: Table pre-training via learning a neural sql executor. arXiv preprint arXiv:2107.07653 (2021)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00196"},{"key":"e_1_3_2_1_30_1","volume-title":"Jia Qing Tan, Shafiq Joty, and Enamul Hoque.","author":"Masry Ahmed","year":"2022","unstructured":"Ahmed Masry, Do Xuan Long, Jia Qing Tan, Shafiq Joty, and Enamul Hoque. 2022. Chartqa: A benchmark for question answering about charts with visual and logical reasoning. arXiv preprint arXiv:2203.10244 (2022)."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093523"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDIM.2011.6093320"},{"volume-title":"https:\/\/www.nsf.gov","year":"2023","key":"e_1_3_2_1_33_1","unstructured":"2023 NSF, https:\/\/www.nsf.gov. 2023. National Science Foundation."},{"key":"e_1_3_2_1_34_1","volume-title":"Compositional semantic parsing on semi-structured tables. arXiv preprint arXiv:1508.00305","author":"Pasupat Panupong","year":"2015","unstructured":"Panupong Pasupat and Percy Liang. 2015. Compositional semantic parsing on semi-structured tables. arXiv preprint arXiv:1508.00305 (2015)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.5555\/3455716.3455856"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/IRI51335.2021.00050"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623749"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3069205"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.264"},{"key":"e_1_3_2_1_40_1","volume-title":"Proc. of NeurIPS, D. Lee, M. Sugiyama, U. Luxburg, I. Guyon, and R. Garnett (Eds.)","volume":"29","author":"Sohn Kihyuk","year":"2016","unstructured":"Kihyuk Sohn. 2016. Improved Deep Metric Learning with Multi-class N-pair Loss Objective. In Proc. of NeurIPS, D. Lee, M. Sugiyama, U. Luxburg, I. Guyon, and R. Garnett (Eds.), Vol. 29. Curran Associates, Inc., 1857--1865."},{"key":"e_1_3_2_1_41_1","unstructured":"https:\/\/www150.statcan.gc.ca StatCan. 2023. Statistics Canada. (2023)."},{"key":"e_1_3_2_1_42_1","volume-title":"Representing numbers in NLP: a survey and a vision. arXiv preprint arXiv:2103.13136","author":"Thawani Avijit","year":"2021","unstructured":"Avijit Thawani, Jay Pujara, Pedro A Szekely, and Filip Ilievski. 2021. Representing numbers in NLP: a survey and a vision. arXiv preprint arXiv:2103.13136 (2021)."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467434"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"crossref","unstructured":"Chenyu Yang Ruixue Fan Nan Tang Meihui Zhang Xiaoman Zhao Ju Fan and Xiaoyong Du. 2023. Pay \"Attention\" to Chart Images for What You Read on Text. (2023).","DOI":"10.1145\/3555041.3589714"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.745"},{"key":"e_1_3_2_1_46_1","unstructured":"Mingyang Zhou Yi R. Fung Long Chen Christopher Thomas Heng Ji and Shih-Fu Chang. 2023. Enhanced Chart Understanding in Vision and Language Task via Cross-modal Pre-training on Plot Table Pairs."},{"key":"e_1_3_2_1_47_1","volume-title":"TAT-QA: A Question Answering Benchmark on a Hybrid of Tabular and Textual Content in Finance. arXiv preprint arXiv:2105.07624","author":"Zhu Fengbin","year":"2021","unstructured":"Fengbin Zhu, Wenqiang Lei, Youcheng Huang, Chao Wang, Shuo Zhang, Jiancheng Lv, Fuli Feng, and Tat-Seng Chua. 2021. TAT-QA: A Question Answering Benchmark on a Hybrid of Tabular and Textual Content in Finance. arXiv preprint arXiv:2105.07624 (2021). io"}],"event":{"name":"WSDM '24: The 17th ACM International Conference on Web Search and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Merida Mexico","acronym":"WSDM '24"},"container-title":["Proceedings of the 17th ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3616855.3635777","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3616855.3635777","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:52:43Z","timestamp":1755823963000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3616855.3635777"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,4]]},"references-count":47,"alternative-id":["10.1145\/3616855.3635777","10.1145\/3616855"],"URL":"https:\/\/doi.org\/10.1145\/3616855.3635777","relation":{},"subject":[],"published":{"date-parts":[[2024,3,4]]},"assertion":[{"value":"2024-03-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}