{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,26]],"date-time":"2026-05-26T20:02:48Z","timestamp":1779825768841,"version":"3.53.1"},"publisher-location":"New York, NY, USA","reference-count":80,"publisher":"ACM","funder":[{"name":"National Key R&#x5c;&#x5c;&amp;D Program of China","award":["2023YFB4502400"],"award-info":[{"award-number":["2023YFB4502400"]}]},{"name":"Fundamental and Interdisciplinary Disciplines Breakthrough Plan of the Ministry of Education of China","award":["JYB2025XDXM103"],"award-info":[{"award-number":["JYB2025XDXM103"]}]},{"name":"Shenzhen Project","award":["CJGJZD20230724093403007"],"award-info":[{"award-number":["CJGJZD20230724093403007"]}]},{"name":"NSF of China","award":["62441236, 62372296, 62432007, U25A6024, 62502304, U25A20437, 62525202, 62232009"],"award-info":[{"award-number":["62441236, 62372296, 62432007, U25A6024, 62502304, U25A20437, 62525202, 62232009"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,5,31]]},"DOI":"10.1145\/3788853.3803080","type":"proceedings-article","created":{"date-parts":[[2026,5,26]],"date-time":"2026-05-26T19:14:47Z","timestamp":1779822887000},"page":"320-333","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["ByteHouse: ByteDance's Cloud-Native Data Warehouse for Real-Time Multimodal Data Analytics"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-4696-8572","authenticated-orcid":false,"given":"Yuxing","family":"Han","sequence":"first","affiliation":[{"name":"ByteDance, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-2204-8040","authenticated-orcid":false,"given":"Yu","family":"Lin","sequence":"additional","affiliation":[{"name":"ByteDance, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-1121-617X","authenticated-orcid":false,"given":"Yifeng","family":"Dong","sequence":"additional","affiliation":[{"name":"ByteDance, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2285-7836","authenticated-orcid":false,"given":"Xuanhe","family":"Zhou","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong Univ., Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-3302-1753","authenticated-orcid":false,"given":"Xindong","family":"Peng","sequence":"additional","affiliation":[{"name":"ByteDance, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-6000-227X","authenticated-orcid":false,"given":"Xinhui","family":"Tian","sequence":"additional","affiliation":[{"name":"ByteDance, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-7336-0280","authenticated-orcid":false,"given":"Zhiyuan","family":"You","sequence":"additional","affiliation":[{"name":"Bytedance, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-0177-7497","authenticated-orcid":false,"given":"Yingzhong","family":"Guo","sequence":"additional","affiliation":[{"name":"ByteDance, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9859-4147","authenticated-orcid":false,"given":"Xi","family":"Chen","sequence":"additional","affiliation":[{"name":"ByteDance, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-1748-2881","authenticated-orcid":false,"given":"Weiping","family":"Qu","sequence":"additional","affiliation":[{"name":"ByteDance, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-9540-6093","authenticated-orcid":false,"given":"Tao","family":"Meng","sequence":"additional","affiliation":[{"name":"ByteDance, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-6484-1979","authenticated-orcid":false,"given":"Dayue","family":"Gao","sequence":"additional","affiliation":[{"name":"ByteDance, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-9407-8651","authenticated-orcid":false,"given":"Haoyu","family":"Wang","sequence":"additional","affiliation":[{"name":"ByteDance, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-5007-7535","authenticated-orcid":false,"given":"Liuxi","family":"Wei","sequence":"additional","affiliation":[{"name":"Bytedance, Singapore, Singapore"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-4821-1558","authenticated-orcid":false,"given":"Huanchen","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0965-9058","authenticated-orcid":false,"given":"Fan","family":"Wu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong Univ., Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,5,30]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2025. Amazon Redshift. https:\/\/aws.amazon.com\/redshift\/. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_2_1","first-page":"1","article-title":"ALP: Adaptive lossless floating-point compression","volume":"1","author":"Afroozeh Azim","year":"2023","unstructured":"Azim Afroozeh, Leonardo X Kuffo, and Peter Boncz. 2023. ALP: Adaptive lossless floating-point compression. SIGMOD 1, 4 (2023), 1-26.","journal-title":"SIGMOD"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476311.3476377"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3589776"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Allen Institute for AI. 2020. C4 Dataset: Colossal Clean Crawled Corpus. https: \/\/huggingface.co\/datasets\/allenai\/c4. Accessed: 2025-10-27.","DOI":"10.1109\/MMUL.2020.3016438"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3314047"},{"key":"e_1_3_2_1_7_1","volume-title":"Apache Doris: An MPP Analytical Database for Real-Time Analytics. https:\/\/github.com\/apache\/doris. Accessed: 2025-10-27.","author":"Community Apache Doris","year":"2017","unstructured":"Apache Doris Community. 2017. Apache Doris: An MPP Analytical Database for Real-Time Analytics. https:\/\/github.com\/apache\/doris. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_8_1","volume-title":"MS MARCO: A human generated machine reading comprehension dataset. arXiv preprint arXiv:1611.09268","author":"Bajaj Payal","year":"2016","unstructured":"Payal Bajaj, Daniel Campos, Nick Craswell, Li Deng, Jianfeng Gao, Xiaodong Liu, Rangan Majumder, Andrew McNamara, Bhaskar Mitra, Tri Nguyen, et al. 2016. MS MARCO: A human generated machine reading comprehension dataset. arXiv preprint arXiv:1611.09268 (2016)."},{"key":"e_1_3_2_1_9_1","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI . 753-768","author":"Berg Benjamin","year":"2020","unstructured":"Benjamin Berg, Daniel S Berger, Sara McAllister, Isaac Grosof, Sathya Gunasekar, Jimmy Lu, Michael Uhlar, Jim Carrig, Nathan Beckmann, Mor Harchol-Balter, et al. 2020. The {CacheLib} caching engine: Design and experiences at scale. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI . 753-768."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.14778\/3407790.3407851"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.14778\/3587136.3587137"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2566486.2567977"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Jianlv Chen Shitao Xiao Peitian Zhang Kun Luo Defu Lian and Zheng Liu. 2024. BGE M3-Embedding: Multi-Lingual Multi-Functionality Multi-Granularity Text Embeddings Through Self-Knowledge Distillation. arXiv:2402.03216 [cs.CL]","DOI":"10.18653\/v1\/2024.findings-acl.137"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.137"},{"key":"e_1_3_2_1_15_1","unstructured":"Cohere Team. 2022. Wikipedia Dataset (December 2022). https:\/\/huggingface.co\/datasets\/Cohere\/wikipedia-22-12. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2491245"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1571941.1572114"},{"key":"e_1_3_2_1_18_1","volume-title":"The Snowflake Elastic Data Warehouse. In SIGMOD Conference. ACM, 215-226","author":"Dageville Beno\u00eet","year":"2016","unstructured":"Beno\u00eet Dageville, Thierry Cruanes, Marcin Zukowski, Vadim Antonov, Artin Avanes, Jon Bock, Jonathan Claybaugh, Daniel Engovatov, Martin Hentschel, Jiansheng Huang, AllisonW. Lee, Ashish Motivala, Abdul Q. Munir, Steven Pelley, Peter Povinec, Greg Rahn, Spyridon Triantafyllis, and Philipp Unterbrunner. 2016. The Snowflake Elastic Data Warehouse. In SIGMOD Conference. ACM, 215-226."},{"key":"e_1_3_2_1_19_1","first-page":"1704","article-title":"Optimization of common table expressions in mpp database systems","volume":"8","author":"El-Helw Amr","year":"2015","unstructured":"Amr El-Helw, Venkatesh Raghavan, Mohamed A Soliman, George Caragea, Zhongxian Gu, and Michalis Petropoulos. 2015. Optimization of common table expressions in mpp database systems. VLDB 8, 12 (2015), 1704-1715.","journal-title":"VLDB"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2011.5767901"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-012722442-8\/50089-6"},{"key":"e_1_3_2_1_22_1","unstructured":"Pengfei Gao Zhao Tian Xiangxin Meng XinchenWang Ruida Hu Yuanan Xiao Yizhou Liu Zhao Zhang Junjie Chen Cuiyun Gao et al. 2025. Trae agent: An llm-based agent for software engineering with test-time scaling. arXiv preprint arXiv:2507.23370 (2025)."},{"key":"e_1_3_2_1_23_1","volume-title":"Pooling methods in deep neural networks, a review. arXiv preprint arXiv:2009.07485","author":"Gholamalinezhad Hossein","year":"2020","unstructured":"Hossein Gholamalinezhad and Hossein Khosravi. 2020. Pooling methods in deep neural networks, a review. arXiv preprint arXiv:2009.07485 (2020)."},{"key":"e_1_3_2_1_24_1","first-page":"19","article-title":"The cascades framework for query optimization","volume":"18","author":"Graefe Goetz","year":"1995","unstructured":"Goetz Graefe. 1995. The cascades framework for query optimization. IEEE Data Eng. Bull. 18, 3 (1995), 19-29.","journal-title":"IEEE Data Eng. Bull."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.1993.344061"},{"key":"e_1_3_2_1_26_1","volume-title":"AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lakes. In Companion of the 2025 International Conference on Management of Data. 404-417","author":"Gruenheid Anja","year":"2025","unstructured":"Anja Gruenheid, Jes\u00fas Camacho-Rodr\u00edguez, Carlo Curino, Raghu Ramakrishnan, Stanislav Pak, Sumedh Sakdeo, Lenisha Gandhi, Sandeep K Singhal, Pooja Nilangekar, and Daniel J Abadi. 2025. AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lakes. In Companion of the 2025 International Conference on Management of Data. 404-417."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3626246.3653376"},{"key":"e_1_3_2_1_28_1","volume-title":"Ravishankar Krishnawamy, and Rohan Kadekodi.","author":"Subramanya Suhas Jayaram","year":"2019","unstructured":"Suhas Jayaram Subramanya, Fnu Devvrit, Harsha Vardhan Simhadri, Ravishankar Krishnawamy, and Rohan Kadekodi. 2019. DiskAnn: Fast accurate billion-point nearest neighbor search on a single node. Advances in neural information processing Systems 32 (2019)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731005"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.14778\/3415478.3415550"},{"key":"e_1_3_2_1_31_1","unstructured":"Andreas Kipf Thomas Kipf Bernhard Radke Viktor Leis Peter Boncz and Alfons Kemper. 2019. Learned cardinalities: Estimating correlated joins with deep learning. In CIDR."},{"key":"e_1_3_2_1_32_1","volume-title":"Probabilistic graphical models: principles and techniques","author":"Koller Daphne","unstructured":"Daphne Koller and Nir Friedman. 2009. Probabilistic graphical models: principles and techniques. MIT press."},{"key":"e_1_3_2_1_33_1","first-page":"1","article-title":"Btrblocks: Efficient columnar compression for data lakes","volume":"1","author":"Kuschewski Maximilian","year":"2023","unstructured":"Maximilian Kuschewski, David Sauerwein, Adnan Alhomssi, and Viktor Leis. 2023. Btrblocks: Efficient columnar compression for data lakes. SIGMOD 1, 2 (2023), 1-26.","journal-title":"SIGMOD"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.14778\/2367502.2367518"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.14778\/3712221.3712224"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1002\/spe.2203"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.14778\/3685800.3685806"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3539618.3591977"},{"key":"e_1_3_2_1_39_1","volume-title":"UNIFY: Unified Index for Range Filtered Approximate Nearest Neighbors Search. arXiv preprint arXiv:2412.02448","author":"Liang Anqi","year":"2024","unstructured":"Anqi Liang, Pengcheng Zhang, Bin Yao, Zhongpu Chen, Yitong Song, and Guangxu Cheng. 2024. UNIFY: Unified Index for Range Filtered Approximate Nearest Neighbors Search. arXiv preprint arXiv:2412.02448 (2024)."},{"key":"e_1_3_2_1_40_1","volume-title":"Efficient and robust approximate nearest neighbor search using hierarchical navigable small world graphs","author":"Malkov Yu A","year":"2018","unstructured":"Yu A Malkov and Dmitry A Yashunin. 2018. Efficient and robust approximate nearest neighbor search using hierarchical navigable small world graphs. IEEE transactions on pattern analysis and machine intelligence 42, 4 (2018), 824-836."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.14778\/3342263.3342644"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.14778\/3342263.3342644"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.14778\/1920841.1920886"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.14778\/3415478.3415568"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.14778\/3750601.3750636"},{"key":"e_1_3_2_1_46_1","volume-title":"BlendHouse: A Cloud-Native Vector Database System in ByteHouse. In 2025 IEEE 41st International Conference on Data Engineering (ICDE). IEEE, 4332-4345","author":"Niu Zhaojie","year":"2025","unstructured":"Zhaojie Niu, Xinhui Tian, Xindong Peng, and Xing Chen. 2025. BlendHouse: A Cloud-Native Vector Database System in ByteHouse. In 2025 IEEE 41st International Conference on Data Engineering (ICDE). IEEE, 4332-4345."},{"key":"e_1_3_2_1_47_1","unstructured":"pgvector Team. 2023. pgvector: Open-source vector similarity search for PostgreSQL. https:\/\/github.com\/pgvector\/pgvector. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_48_1","volume-title":"Towards Functional Decomposition of Storage Formats. In Conference on Innovative Data Systems Research (CIDR).","author":"Prammer Martin","year":"2025","unstructured":"Martin Prammer, Xinyu Zeng, Ruijun Meng, Wes McKinney, Huanchen Zhang, Andrew Pavlo, and Jignesh M Patel. 2025. Towards Functional Decomposition of Storage Formats. In Conference on Innovative Data Systems Research (CIDR)."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3555041.3589677"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.14778\/3681954.3682001"},{"key":"e_1_3_2_1_51_1","volume-title":"Semantic word clouds with background corpus normalization and tdistributed stochastic neighbor embedding. arXiv preprint arXiv:1708.03569","author":"Schubert Erich","year":"2017","unstructured":"Erich Schubert, Andreas Spitz, Michael Weiler, Johanna Gei\u00df, and Michael Gertz. 2017. Semantic word clouds with background corpus normalization and tdistributed stochastic neighbor embedding. arXiv preprint arXiv:1708.03569 (2017)."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.14778\/3685800.3685802"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376673"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/235968.233360"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.14778\/3685800.3685828"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2012.106"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2595637"},{"key":"e_1_3_2_1_58_1","volume-title":"Streaming Democratized: Ease Across the Latency Spectrum with Delayed View Semantics and Snowflake Dynamic Tables. In Companion of the 2025 International Conference on Management of Data. 622-634","author":"Sotolongo Daniel","year":"2025","unstructured":"Daniel Sotolongo, Daniel Mills, Tyler Akidau, Anirudh Santhiar, Attila-P\u00e9ter T\u00f3th, Botong Huang, Boyuan Zhang, Igor Belianski, Ling Geng, Matt Uhlar, et al. 2025. Streaming Democratized: Ease Across the Latency Spectrum with Delayed View Semantics and Snowflake Dynamic Tables. In Companion of the 2025 International Conference on Management of Data. 622-634."},{"key":"e_1_3_2_1_59_1","unstructured":"StarRocks Team. 2020. StarRocks: A High-Performance MPP Database for Analytics. https:\/\/github.com\/StarRocks\/starrocks. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.14778\/3368289.3368296"},{"key":"e_1_3_2_1_61_1","unstructured":"ClickHouse Team. 2021. ClickBench: A Benchmark for Analytical DBMS. https: \/\/github.com\/ClickHouse\/ClickBench. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_62_1","volume-title":"Apache Arrow: A cross-language development platform for in-memory data. https:\/\/arrow.apache.org\/. Accessed: 2025-10-24.","author":"Software Foundation The Apache","year":"2025","unstructured":"The Apache Software Foundation. 2025. Apache Arrow: A cross-language development platform for in-memory data. https:\/\/arrow.apache.org\/. Accessed: 2025-10-24."},{"key":"e_1_3_2_1_63_1","unstructured":"Transaction Processing Performance Council. 2018. TPC-DS Benchmark (Version 3.2). http:\/\/www.tpc.org\/tpcds\/. Accessed: 2025-10-27."},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3300088"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3056101"},{"key":"e_1_3_2_1_66_1","volume-title":"Vortex: A Next-Generation High-Performance Data Format for AI and Analytics. https:\/\/vortex.dev.","author":"Team Vortex Project","year":"2024","unstructured":"Vortex Project Team. 2024. Vortex: A Next-Generation High-Performance Data Format for AI and Analytics. https:\/\/vortex.dev."},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1145\/3448016.3457550"},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.14778\/3421424.3421427"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1467-8659.2011.01923.x"},{"key":"e_1_3_2_1_70_1","volume-title":"Bayescard: Revitilizing bayesian frameworks for cardinality estimation. arXiv preprint arXiv:2012.14743","author":"Wu Ziniu","year":"2020","unstructured":"Ziniu Wu, Amir Shaikhha, Rong Zhu, Kai Zeng, Yuxing Han, and Jingren Zhou. 2020. Bayescard: Revitilizing bayesian frameworks for cardinality estimation. arXiv preprint arXiv:2012.14743 (2020)."},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1145\/3589281"},{"key":"e_1_3_2_1_72_1","doi-asserted-by":"publisher","DOI":"10.1145\/3600006.3613147"},{"key":"e_1_3_2_1_73_1","doi-asserted-by":"publisher","DOI":"10.1145\/3626246.3653377"},{"key":"e_1_3_2_1_74_1","doi-asserted-by":"crossref","unstructured":"Xinyu Zeng Ruijun Meng Martin Prammer Wes McKinney Jignesh M. Patel Andrew Pavlo and Huanchen Zhang. 2026. F3: The Open-Source Data File Format for the Future. (2026). SIGMOD).","DOI":"10.1145\/3749163"},{"key":"e_1_3_2_1_75_1","doi-asserted-by":"publisher","DOI":"10.14778\/3352063.3352124"},{"key":"e_1_3_2_1_76_1","volume-title":"Proceedings of the MSST","author":"Zhang Yiwen","year":"2024","unstructured":"Yiwen Zhang, Guokuan Li, Kai Lu, Jiguang Wan, Ting Yao, Huatao Wu, and Daohui Wang. 2024. PhatKV: Towards an Efficient Metadata Engine for KVbased File Systems on Modern SSD. In Proceedings of the MSST 2024. IEEE."},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2010.5447802"},{"key":"e_1_3_2_1_78_1","doi-asserted-by":"publisher","DOI":"10.14778\/3583140.3583160"},{"key":"e_1_3_2_1_79_1","first-page":"1489","article-title":"FLAT: Fast, Lightweight and Accurate Method for Cardinality Estimation","volume":"14","author":"Zhu Rong","year":"2021","unstructured":"Rong Zhu, Ziniu Wu, Yuxing Han, Kai Zeng, Andreas Pfadler, Zhengping Qian, Jingren Zhou, and Bin Cui. 2021. FLAT: Fast, Lightweight and Accurate Method for Cardinality Estimation. VLDB 14, 9 (2021), 1489-1502.","journal-title":"VLDB"},{"key":"e_1_3_2_1_80_1","unstructured":"Zilliz. 2023. VectorDBBench: A Benchmark Suite for Vector Databases. https:\/\/github.com\/zilliztech\/VectorDBBench. Accessed: 2025-11-17."}],"event":{"name":"SIGMOD\/PODS '26: International Conference on Management of Data","location":"Bengaluru India","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Companion of the International Conference on Management of Data"],"original-title":[],"deposited":{"date-parts":[[2026,5,26]],"date-time":"2026-05-26T19:15:55Z","timestamp":1779822955000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3788853.3803080"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,5,30]]},"references-count":80,"alternative-id":["10.1145\/3788853.3803080","10.1145\/3788853"],"URL":"https:\/\/doi.org\/10.1145\/3788853.3803080","relation":{},"subject":[],"published":{"date-parts":[[2026,5,30]]},"assertion":[{"value":"2026-05-30","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}