{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,19]],"date-time":"2026-03-19T02:23:40Z","timestamp":1773887020455,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":63,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,6,9]],"date-time":"2024-06-09T00:00:00Z","timestamp":1717891200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,6,9]]},"DOI":"10.1145\/3626246.3653376","type":"proceedings-article","created":{"date-parts":[[2024,5,23]],"date-time":"2024-05-23T10:26:39Z","timestamp":1716459999000},"page":"41-54","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["ByteCard: Enhancing ByteDance's Data Warehouse with Learned Cardinality Estimation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-4696-8572","authenticated-orcid":false,"given":"Yuxing","family":"Han","sequence":"first","affiliation":[{"name":"Data Platform, ByteDance, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-9407-8651","authenticated-orcid":false,"given":"Haoyu","family":"Wang","sequence":"additional","affiliation":[{"name":"Data Platform, ByteDance &amp; East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-3448-3831","authenticated-orcid":false,"given":"Lixiang","family":"Chen","sequence":"additional","affiliation":[{"name":"Data Platform, ByteDance &amp; East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-1121-617X","authenticated-orcid":false,"given":"Yifeng","family":"Dong","sequence":"additional","affiliation":[{"name":"Data Platform, ByteDance, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-6294-0967","authenticated-orcid":false,"given":"Xing","family":"Chen","sequence":"additional","affiliation":[{"name":"Data Platform, ByteDance, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-6052-9434","authenticated-orcid":false,"given":"Benquan","family":"Yu","sequence":"additional","affiliation":[{"name":"Data Platform, ByteDance, San Jose, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5128-8882","authenticated-orcid":false,"given":"Chengcheng","family":"Yang","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4132-8630","authenticated-orcid":false,"given":"Weining","family":"Qian","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2024,6,9]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.14778\/1687553.1687625"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"Daniel J Abadi Daniel S Myers David J DeWitt and Samuel R Madden. 2006. Materialization Strategies in a Column-Oriented DBMS. In ICDE. 466--475.","DOI":"10.1109\/ICDE.2007.367892"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"Nikos Armenatzoglou Sanuj Basu Naga Bhanoori Mengchu Cai Naresh Chainani Kiran Chinta Venkatraman Govindaraju Todd J Green Monish Gupta Sebastian Hillig et al. 2022. Amazon Redshift re-invented. In SIGMOD. 2205--2217.","DOI":"10.1145\/3514221.3526045"},{"key":"e_1_3_2_1_4_1","volume-title":"Understanding the Python. In PyCON Python Conference","author":"Beazley David","year":"2010","unstructured":"David Beazley. 2010. Understanding the Python. In PyCON Python Conference. Atlanta, Georgia. 1--62."},{"key":"e_1_3_2_1_5_1","first-page":"1877","article-title":"Language models are few-shot learners","volume":"33","author":"Brown Tom","year":"2020","unstructured":"Tom Brown, Benjamin Mann, Nick Ryder, Melanie Subbiah, Jared D Kaplan, Prafulla Dhariwal, Arvind Neelakantan, Pranav Shyam, Girish Sastry, Amanda Askell, et al. 2020. Language models are few-shot learners. NIPS , Vol. 33 (2020), 1877--1901.","journal-title":"NIPS"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.1992.10475194"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Moses Charikar Surajit Chaudhuri Rajeev Motwani and Vivek Narasayya. 2000. Towards estimation error guarantees for distinct values. In SIGMOD. 268--279.","DOI":"10.1145\/335168.335230"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Lixiang Chen Ruihao Chen Chengcheng Yang Yuxing Han Rong Zhang Xuan Zhou Peiquan Jin and Weining Qian. 2023. Workload-Aware Log-Structured Merge Key-Value Store for NVM-SSD Hybrid Storage. In ICDE. 2198--2210.","DOI":"10.1109\/ICDE55515.2023.00171"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1968.1054142"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2019.2940705"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Benoit Dageville Thierry Cruanes Marcin Zukowski Vadim Antonov Artin Avanes Jon Bock Jonathan Claybaugh Daniel Engovatov Martin Hentschel Jiansheng Huang et al. 2016. The snowflake elastic data warehouse. In SIGMOD. 215--226.","DOI":"10.1145\/2882903.2903741"},{"key":"e_1_3_2_1_12_1","unstructured":"Yifan Dai Yien Xu Aishwarya Ganesan Ramnatthan Alagappan Brian Kroth Andrea Arpaci-Dusseau and Remzi Arpaci-Dusseau. 2020. From $$WiscKey$$ to Bourbon: A Learned Index for $$Log-Structured$$ Merge Trees. In OSDI. 155--171."},{"key":"e_1_3_2_1_13_1","first-page":"4062","article-title":"SageDB","volume":"15","author":"Ding Jialin","year":"2022","unstructured":"Jialin Ding, Ryan Marcus, Andreas Kipf, Vikram Nathan, Aniruddha Nrusimha, Kapil Vaidya, Alexander van Renen, and Tim Kraska. 2022. SageDB: An Instance-Optimized Data Analytics System. PVLDB, Vol. 15, 13 (2022), 4062--4078.","journal-title":"An Instance-Optimized Data Analytics System. PVLDB"},{"key":"e_1_3_2_1_14_1","volume-title":"What is the expectation maximization algorithm? Nature biotechnology","author":"Do Chuong B","year":"2008","unstructured":"Chuong B Do and Serafim Batzoglou. 2008. What is the expectation maximization algorithm? Nature biotechnology, Vol. 26, 8 (2008), 897--899."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.14778\/3329772.3329780"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"crossref","unstructured":"Philippe Flajolet \u00c9ric Fusy Olivier Gandouet and Fr\u00e9d\u00e9ric Meunier. 2007. Hyperloglog: the analysis of a near-optimal cardinality estimation algorithm. In Discrete Mathematics and Theoretical Computer Science. 137--156.","DOI":"10.46298\/dmtcs.3545"},{"key":"e_1_3_2_1_17_1","volume-title":"aGrUM: a Graphical Universal Model framework","author":"Gonzales Christophe","unstructured":"Christophe Gonzales, Lionel Torti, and Pierre-Henri Wuillemin. 2017. aGrUM: a Graphical Universal Model framework. In IEA\/AIE. 171--177."},{"key":"e_1_3_2_1_18_1","first-page":"19","article-title":"The cascades framework for query optimization","volume":"18","author":"Graefe Goetz","year":"1995","unstructured":"Goetz Graefe. 1995. The cascades framework for query optimization. IEEE Data Eng. Bull. , Vol. 18, 3 (1995), 19--29.","journal-title":"IEEE Data Eng. Bull."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Yue Han Guoliang Li Haitao Yuan and Ji Sun. 2021a. An autonomous materialized view management system with deep reinforcement learning. In ICDE. 2159--2164.","DOI":"10.1109\/ICDE51399.2021.00217"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.14778\/3503585.3503586"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"crossref","unstructured":"Stefan Heule Marc Nunkesser and Alexander Hall. 2013. Hyperloglog in practice: Algorithmic engineering of a state of the art cardinality estimation algorithm. In EDBT\/ICDT. 683--692.","DOI":"10.1145\/2452376.2452456"},{"key":"e_1_3_2_1_22_1","volume-title":"One model to rule them all: towards zero-shot learning for databases. arXiv:2105.00642","author":"Hilprecht Benjamin","year":"2021","unstructured":"Benjamin Hilprecht and Carsten Binnig. 2021. One model to rule them all: towards zero-shot learning for databases. arXiv:2105.00642 (2021)."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.14778\/3551793.3551799"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.14778\/3384345.3384349"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.14778\/3415478.3415535"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"crossref","unstructured":"Zachary G Ives and Nicholas E Taylor. 2008. Sideways information passing for push-style query processing. In ICDE. 774--783.","DOI":"10.1109\/ICDE.2008.4497486"},{"key":"e_1_3_2_1_27_1","unstructured":"Andreas Kipf Thomas Kipf Bernhard Radke Viktor Leis Peter Boncz and Alfons Kemper. 2019. Learned cardinalities: Estimating correlated joins with deep learning. In CIDR."},{"key":"e_1_3_2_1_28_1","volume-title":"Probabilistic graphical models: principles and techniques","author":"Koller Daphne","unstructured":"Daphne Koller and Nir Friedman. 2009. Probabilistic graphical models: principles and techniques. MIT press."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.14778\/2367502.2367518"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.14778\/3611479.3611494"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.14778\/2850583.2850594"},{"key":"e_1_3_2_1_32_1","first-page":"643","article-title":"Query optimization through the looking glass, and what we found running the join order benchmark","volume":"27","author":"Leis Viktor","year":"2018","unstructured":"Viktor Leis, Bernhard Radke, Andrey Gubichev, Atanas Mirchev, Peter Boncz, Alfons Kemper, and Thomas Neumann. 2018. Query optimization through the looking glass, and what we found running the join order benchmark. PVLDB, Vol. 27, 5 (2018), 643--668.","journal-title":"PVLDB"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476311.3476380"},{"key":"e_1_3_2_1_34_1","volume-title":"Opportunistic view materialization with deep reinforcement learning. arXiv:1903.01363","author":"Liang Xi","year":"2019","unstructured":"Xi Liang, Aaron J Elmore, and Sanjay Krishnan. 2019. Opportunistic view materialization with deep reinforcement learning. arXiv:1903.01363 (2019)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476249.3476254"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2004.1267047"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.14778\/3583140.3583164"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476249.3476274"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3555041.3589677"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.14778\/1920841.1920902"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"crossref","unstructured":"P Griffiths Selinger Morton M Astrahan Donald D Chamberlin Raymond A Lorie and Thomas G Price. 1979. Access path selection in a relational database management system. In SIGMOD. 23--34.","DOI":"10.1145\/582095.582099"},{"key":"e_1_3_2_1_42_1","volume-title":"Raghu Ramakrishnan, Divesh Srivastava, Peter J Stuckey, and S Sudarshan.","author":"Seshadri Praveen","year":"1996","unstructured":"Praveen Seshadri, Joseph M Hellerstein, Hamid Pirahesh, TY Cliff Leung, Raghu Ramakrishnan, Divesh Srivastava, Peter J Stuckey, and S Sudarshan. 1996. Cost-based optimization for magic: Algebra and implementation. In SIGMOD. 435--446."},{"key":"e_1_3_2_1_43_1","volume-title":"Rover: An online Spark SQL tuning service via generalized transfer learning. In SIGKDD. 4800--4812.","author":"Shen Yu","year":"2023","unstructured":"Yu Shen, Xinyuyang Ren, Yupeng Lu, Huaijun Jiang, Huanyong Xu, Di Peng, Yang Li, Wentao Zhang, and Bin Cui. 2023. Rover: An online Spark SQL tuning service via generalized transfer learning. In SIGKDD. 4800--4812."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"crossref","unstructured":"Lakshmikant Shrinivas Sreenath Bodagala Ramakrishna Varadarajan Ariel Cary Vivek Bharathan and Chuck Bear. 2013. Materialization Strategies in the Vertica Analytic Database: Lessons Learned. In ICDE. 1196--1207.","DOI":"10.1109\/ICDE.2013.6544909"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"crossref","unstructured":"Tarique Siddiqui Alekh Jindal Shi Qiao Hiren Patel and Wangchao Le. 2020. Cost models for big data query processing: Learning retrofitting and our findings. In SIGMOD. 99--113.","DOI":"10.1145\/3318464.3380584"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.14778\/3368289.3368296"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.14778\/3485450.3485459"},{"key":"e_1_3_2_1_48_1","first-page":"1","article-title":"Presto: A Decade of SQL Analytics at Meta","volume":"1","author":"Sun Yutian","year":"2023","unstructured":"Yutian Sun, Tim Meehan, Rebecca Schlussel, Wenlei Xie, Masha Basmanova, Orri Erling, Andrii Rosa, Shixuan Fan, Rongrong Zhong, Arun Thirupathi, et al. 2023. Presto: A Decade of SQL Analytics at Meta. SIGMOD, Vol. 1, 2 (2023), 1--25.","journal-title":"SIGMOD"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"crossref","unstructured":"Chuzhe Tang Youyun Wang Zhiyuan Dong Gansen Hu Zhaoguo Wang Minjie Wang and Haibo Chen. 2020. XIndex: a scalable learned index for multicore data storage. In PPoPP. 308--320.","DOI":"10.1145\/3332466.3374547"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"crossref","unstructured":"Saravanan Thirumuruganathan Suraj Shetiya Nick Koudas and Gautam Das. 2022. Prediction Intervals for Learned Cardinality Estimation: An Experimental Evaluation. In ICDE. 3051--3064.","DOI":"10.1109\/ICDE53745.2022.00274"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"crossref","unstructured":"Dana Van Aken Andrew Pavlo Geoffrey J Gordon and Bohan Zhang. 2017. Automatic database management system tuning through large-scale machine learning. In SIGMOD. 1009--1024.","DOI":"10.1145\/3035918.3064029"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.14778\/3485450.3485458"},{"key":"e_1_3_2_1_53_1","unstructured":"Jason Wei Yi Tay Rishi Bommasani Colin Raffel Barret Zoph Sebastian Borgeaud Dani Yogatama Maarten Bosma Denny Zhou Donald Metzler et al. 2022. Emergent abilities of large language models. arXiv:2206.07682 (2022)."},{"key":"e_1_3_2_1_54_1","first-page":"272","article-title":"Learning to Be a Statistician","volume":"15","author":"Wu Renzhi","year":"2021","unstructured":"Renzhi Wu, Bolin Ding, Xu Chu, Zhewei Wei, Xiening Dai, Tao Guan, and Jingren Zhou. 2021. Learning to Be a Statistician: Learned Estimator for Number of Distinct Values. PVLDB, Vol. 15, 2 (2021), 272--284.","journal-title":"Learned Estimator for Number of Distinct Values. PVLDB"},{"key":"e_1_3_2_1_55_1","first-page":"1","article-title":"FactorJoin","volume":"1","author":"Wu Ziniu","year":"2023","unstructured":"Ziniu Wu, Parimarjan Negi, Mohammad Alizadeh, Tim Kraska, and Samuel Madden. 2023. FactorJoin: A New Cardinality Estimation Framework for Join Queries. SIGMOD, Vol. 1, 1 (2023), 1--27.","journal-title":"A New Cardinality Estimation Framework for Join Queries. SIGMOD"},{"key":"e_1_3_2_1_56_1","volume-title":"BayesCard: A Unified Bayesian Framework for Cardinality Estimation. arXiv:2012.14743","author":"Wu Ziniu","year":"2020","unstructured":"Ziniu Wu and Amir Shaikhha. 2020. BayesCard: A Unified Bayesian Framework for Cardinality Estimation. arXiv:2012.14743 (2020)."},{"key":"e_1_3_2_1_57_1","volume-title":"A Unified Transferable Model for ML-Enhanced DBMS. CIDR","author":"Wu Ziniu","year":"2022","unstructured":"Ziniu Wu, Peilun Yang, Pei Yu, Rong Zhu, Yuxing Han, Yaliang Li, Defu Lian, Kai Zeng, and Jingren Zhou. 2022. A Unified Transferable Model for ML-Enhanced DBMS. CIDR (2022)."},{"key":"e_1_3_2_1_58_1","first-page":"61","article-title":"NeuroCard","volume":"14","author":"Yang Zongheng","year":"2021","unstructured":"Zongheng Yang, Amog Kamsetty, Sifei Luan, Eric Liang, Yan Duan, Xi Chen, and Ion Stoica. 2021. NeuroCard: One Cardinality Estimator for All Tables. PVLDB, Vol. 14, 1 (2021), 61--73.","journal-title":"One Cardinality Estimator for All Tables. PVLDB"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.14778\/3368289.3368294"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.14778\/3352063.3352124"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"crossref","unstructured":"Ji Zhang Yu Liu Ke Zhou Guoliang Li Zhili Xiao Bin Cheng Jiashu Xing Yangtao Wang Tianheng Cheng Li Liu et al. 2019. An end-to-end automatic cloud database tuning system using deep reinforcement learning. In SIGMOD. 415--432.","DOI":"10.1145\/3299869.3300085"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"crossref","unstructured":"Xinyi Zhang Hong Wu Zhuo Chang Shuowei Jin Jian Tan Feifei Li Tieying Zhang and Bin Cui. 2021. ResTune: Resource Oriented Tuning Boosted by Meta-Learning for Cloud Databases. In SIGMOD. 2102--2114.","DOI":"10.1145\/3448016.3457291"},{"key":"e_1_3_2_1_63_1","first-page":"1489","article-title":"FLAT","volume":"14","author":"Zhu Rong","year":"2021","unstructured":"Rong Zhu, Ziniu Wu, Yuxing Han, Kai Zeng, Andreas Pfadler, Zhengping Qian, Jingren Zhou, and Bin Cui. 2021. FLAT: Fast, Lightweight and Accurate Method for Cardinality Estimation. PVLDB, Vol. 14, 9 (2021), 1489--1502. io","journal-title":"Fast, Lightweight and Accurate Method for Cardinality Estimation. PVLDB"}],"event":{"name":"SIGMOD\/PODS '24: International Conference on Management of Data","location":"Santiago AA Chile","acronym":"SIGMOD\/PODS '24","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Companion of the 2024 International Conference on Management of Data"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3626246.3653376","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3626246.3653376","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T11:29:56Z","timestamp":1755862196000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3626246.3653376"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,9]]},"references-count":63,"alternative-id":["10.1145\/3626246.3653376","10.1145\/3626246"],"URL":"https:\/\/doi.org\/10.1145\/3626246.3653376","relation":{},"subject":[],"published":{"date-parts":[[2024,6,9]]},"assertion":[{"value":"2024-06-09","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}