{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T13:40:13Z","timestamp":1755870013245,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":65,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,8]]},"DOI":"10.1145\/3721145.3725752","type":"proceedings-article","created":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T12:57:17Z","timestamp":1755867437000},"page":"868-883","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["ORION: Optimizing OLAP Query Execution with Proactive Caching and Separate Operators"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-3220-3685","authenticated-orcid":false,"given":"Zhixin","family":"Tong","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5470-210X","authenticated-orcid":false,"given":"Jiuchen","family":"Shi","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China and The Hong Kong Polytechnic University, Hong Kong, Hong Kong"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5832-0347","authenticated-orcid":false,"given":"Quan","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-3685-0901","authenticated-orcid":false,"given":"Pu","family":"Pang","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4060-9438","authenticated-orcid":false,"given":"Shixuan","family":"Sun","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-4974-3761","authenticated-orcid":false,"given":"Jie","family":"Meng","sequence":"additional","affiliation":[{"name":"Huawei Cloud, Chengdu, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-7130-3330","authenticated-orcid":false,"given":"Jiang","family":"Liu","sequence":"additional","affiliation":[{"name":"Huawei Cloud, Chengdu, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9678-7228","authenticated-orcid":false,"given":"En","family":"Shao","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0034-2302","authenticated-orcid":false,"given":"Minyi","family":"Guo","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,8,22]]},"reference":[{"key":"e_1_3_3_2_2_2","doi-asserted-by":"crossref","unstructured":"Daniel Abadi Peter Boncz Stavros Harizopoulos Stratos Idreos Samuel Madden et\u00a0al. 2013. The design and implementation of modern column-oriented database systems. Foundations and Trends\u00ae in Databases 5 3 (2013) 197\u2013280.","DOI":"10.1561\/1900000024"},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376712"},{"key":"e_1_3_3_2_4_2","volume-title":"cuDF: GPU DataFrame Library","author":"AI RAPIDS","year":"2024","unstructured":"RAPIDS AI. 2024. cuDF: GPU DataFrame Library. https:\/\/github.com\/rapidsai\/cudf"},{"key":"e_1_3_3_2_5_2","volume-title":"RAPIDS","author":"AI RAPIDS","year":"2024","unstructured":"RAPIDS AI. 2024. RAPIDS. https:\/\/rapids.ai\/"},{"key":"e_1_3_3_2_6_2","volume-title":"Alluxio","year":"2024","unstructured":"Alluxio. 2024. Alluxio. https:\/\/www.alluxio.io\/"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3514221.3517876"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"crossref","unstructured":"Jiashen Cao Rathijit Sen Matteo Interlandi Joy Arulraj and Hyesoon Kim. 2023. GPU Database Systems Characterization and Optimization. Proceedings of the VLDB Endowment 17 3 (2023) 441\u2013454.","DOI":"10.14778\/3632093.3632107"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"Surajit Chaudhuri and Umeshwar Dayal. 1997. An overview of data warehousing and OLAP technology. ACM Sigmod record 26 1 (1997) 65\u201374.","DOI":"10.1145\/248603.248616"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"crossref","unstructured":"Surajit Chaudhuri and Umeshwar Dayal. 1997. An overview of data warehousing and OLAP technology. ACM Sigmod record 26 1 (1997) 65\u201374.","DOI":"10.1145\/248603.248616"},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"crossref","unstructured":"Mohamed\u00a0L Chouder Stefano Rizzi and Rachid Chalal. 2019. EXODuS: exploratory OLAP over document stores. Information Systems 79 (2019) 44\u201357.","DOI":"10.1016\/j.is.2017.11.004"},{"key":"e_1_3_3_2_12_2","volume-title":"Alibaba Cloud Object Storage Service","author":"Cloud Alibaba","year":"2024","unstructured":"Alibaba Cloud. 2024. Alibaba Cloud Object Storage Service. https:\/\/www.alibabacloud.com\/product\/oss"},{"key":"e_1_3_3_2_13_2","volume-title":"Ceph: A Scalable, High-Performance Distributed Storage System","author":"Community Ceph","year":"2024","unstructured":"Ceph Community. 2024. Ceph: A Scalable, High-Performance Distributed Storage System. https:\/\/ceph.io\/en\/"},{"key":"e_1_3_3_2_14_2","volume-title":"SQLite Home Page","author":"Consortium SQLite","year":"2024","unstructured":"SQLite Consortium. 2024. SQLite Home Page. https:\/\/www.sqlite.org\/"},{"key":"e_1_3_3_2_15_2","volume-title":"TPC-H Benchmark","author":"Council Transaction Processing\u00a0Performance","year":"2024","unstructured":"Transaction Processing\u00a0Performance Council. 2024. TPC-H Benchmark. http:\/\/www.tpc.org\/tpch\/"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2735377"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"crossref","unstructured":"Markus Dreseler Martin Boissier Tilmann Rabl and Matthias Uflacker. 2020. Quantifying TPC-H choke points and their optimizations. Proceedings of the VLDB Endowment 13 8 (2020) 1206\u20131220.","DOI":"10.14778\/3389133.3389138"},{"key":"e_1_3_3_2_18_2","volume-title":"Apache Arrow","author":"Foundation Apache\u00a0Software","year":"2024","unstructured":"Apache\u00a0Software Foundation. 2024. Apache Arrow. https:\/\/arrow.apache.org\/"},{"key":"e_1_3_3_2_19_2","volume-title":"Apache Parquet","author":"Foundation Apache\u00a0Software","year":"2024","unstructured":"Apache\u00a0Software Foundation. 2024. Apache Parquet. https:\/\/parquet.apache.org\/ July 31, 2024."},{"key":"e_1_3_3_2_20_2","volume-title":"Apache Spark Official Website","author":"Foundation Apache\u00a0Software","year":"2024","unstructured":"Apache\u00a0Software Foundation. 2024. Apache Spark Official Website. https:\/\/spark.apache.org\/"},{"key":"e_1_3_3_2_21_2","volume-title":"Spark SQL, DataFrames and Datasets Guide","author":"Foundation Apache\u00a0Software","year":"2024","unstructured":"Apache\u00a0Software Foundation. 2024. Spark SQL, DataFrames and Datasets Guide. https:\/\/spark.apache.org\/docs\/latest\/sql-data-sources.html"},{"key":"e_1_3_3_2_22_2","volume-title":"Connectors","author":"Foundation Presto","year":"2024","unstructured":"Presto Foundation. 2024. Connectors. https:\/\/prestodb.io\/docs\/current\/develop\/connectors.html"},{"key":"e_1_3_3_2_23_2","volume-title":"Presto","author":"Foundation Presto","year":"2024","unstructured":"Presto Foundation. 2024. Presto. https:\/\/prestodb.io\/"},{"key":"e_1_3_3_2_24_2","volume-title":"Trino","author":"Foundation Trino","year":"2024","unstructured":"Trino Foundation. 2024. Trino. https:\/\/trino.io\/"},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.5555\/3571885.3571976"},{"key":"e_1_3_3_2_26_2","volume-title":"JuiceFS: A Distributed POSIX File System built on top of Redis and S3","author":"Inc. Juicedata","year":"2024","unstructured":"Juicedata Inc.2024. JuiceFS: A Distributed POSIX File System built on top of Redis and S3. https:\/\/github.com\/juicedata\/juicefs"},{"key":"e_1_3_3_2_27_2","volume-title":"RubiX: A caching library that can be used to cache data from cloud stores such as Amazon S3, Azure Blob Storage, Google Cloud Storage, and others.","author":"Inc. Qubole","year":"2017","unstructured":"Qubole Inc.2017. RubiX: A caching library that can be used to cache data from cloud stores such as Amazon S3, Azure Blob Storage, Google Cloud Storage, and others.https:\/\/github.com\/qubole\/rubix"},{"key":"e_1_3_3_2_28_2","unstructured":"Intel Corporation. 2020. Intel\u00aeAVX-512 Instructions. Intel\u00aeDeveloper Zone (2020). Available at https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/intel-avx-512-instructions.html."},{"key":"e_1_3_3_2_29_2","unstructured":"Tomas Karnagel Ren\u00e9 M\u00fcller and Guy\u00a0M Lohman. 2015. Optimizing GPU-accelerated Group-By and Aggregation. ADMS@ VLDB 8 (2015) 20."},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDEW53142.2021.00015"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"crossref","unstructured":"Guoliang Li Haowen Dong and Chao Zhang. 2022. Cloud databases: New techniques challenges and opportunities. Proceedings of the VLDB Endowment 15 12 (2022) 3758\u20133761.","DOI":"10.14778\/3554821.3554893"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"crossref","unstructured":"Jing Li Hung-Wei Tseng Chunbin Lin Yannis Papakonstantinou and Steven Swanson. 2016. Hippogriffdb: Balancing i\/o and gpu bandwidth in big data analytics. Proceedings of the VLDB Endowment 9 14 (2016) 1647\u20131658.","DOI":"10.14778\/3007328.3007331"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563503"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"publisher","DOI":"10.1145\/3514221.3520166"},{"key":"e_1_3_3_2_35_2","unstructured":"Wes McKinney et\u00a0al. 2011. pandas: a foundational Python library for data analysis and statistics. Python for high performance and scientific computing 14 9 (2011) 1\u20139."},{"key":"e_1_3_3_2_36_2","unstructured":"J\u00e9r\u00f4me Meinke. 2015. In-memory OLAP aggregation on GPUs using CUDA Dynamic Parallelism. (2015)."},{"key":"e_1_3_3_2_37_2","volume-title":"MinIO","author":"MinIO Inc.","year":"2024","unstructured":"Inc. MinIO. 2024. MinIO. https:\/\/min.io\/"},{"key":"e_1_3_3_2_38_2","first-page":"561","volume-title":"13th USENIX symposium on operating systems design and implementation (OSDI 18)","author":"Moritz Philipp","year":"2018","unstructured":"Philipp Moritz, Robert Nishihara, Stephanie Wang, Alexey Tumanov, Richard Liaw, Eric Liang, Melih Elibol, Zongheng Yang, William Paul, Michael\u00a0I Jordan, et\u00a0al. 2018. Ray: A distributed framework for emerging { AI} applications. In 13th USENIX symposium on operating systems design and implementation (OSDI 18). 561\u2013577."},{"key":"e_1_3_3_2_39_2","volume-title":"Spark-RAPIDS","year":"2024","unstructured":"NVIDIA. 2024. Spark-RAPIDS. https:\/\/nvidia.github.io\/spark-rapids\/"},{"key":"e_1_3_3_2_40_2","volume-title":"OmniSci Documentation: Overview","year":"2020","unstructured":"OmniSci. 2020. OmniSci Documentation: Overview. https:\/\/docs.omnisci.com\/v5.1.1\/1_overview.html"},{"key":"e_1_3_3_2_41_2","volume-title":"Presto Administration: Configuration Properties","year":"2024","unstructured":"PrestoDB. 2024. Presto Administration: Configuration Properties. https:\/\/prestodb.io\/docs\/current\/admin\/properties.html"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3514221.3526055"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"publisher","DOI":"10.1145\/3575693.3575748"},{"key":"e_1_3_3_2_44_2","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3320212"},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS54860.2022.00067"},{"key":"e_1_3_3_2_46_2","volume-title":"Amazon EMR: Use Presto with Amazon S3 Select","author":"Services Amazon\u00a0Web","year":"2024","unstructured":"Amazon\u00a0Web Services. 2024. Amazon EMR: Use Presto with Amazon S3 Select. https:\/\/docs.aws.amazon.com\/emr\/latest\/ReleaseGuide\/emr-presto-s3select.html"},{"key":"e_1_3_3_2_47_2","volume-title":"Amazon Simple Storage Service","author":"Services Amazon\u00a0Web","year":"2024","unstructured":"Amazon\u00a0Web Services. 2024. Amazon Simple Storage Service. https:\/\/aws.amazon.com\/s3\/"},{"key":"e_1_3_3_2_48_2","volume-title":"Getting Started with Amazon Redshift Spectrum","author":"Services Amazon\u00a0Web","year":"2024","unstructured":"Amazon\u00a0Web Services. 2024. Getting Started with Amazon Redshift Spectrum. https:\/\/docs.aws.amazon.com\/redshift\/latest\/dg\/c-getting-started-using-spectrum.html"},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3380595"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563490"},{"key":"e_1_3_3_2_51_2","unstructured":"Jiuchen Shi Kaihua Fu Jiawen Wang Quan Chen Deze Zeng and Minyi Guo. 2024. Adaptive QoS-aware microservice deployment with excessive loads via intra-and inter-datacenter scheduling. IEEE Transactions on Parallel and Distributed Systems (2024)."},{"key":"e_1_3_3_2_52_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS53621.2022.00039"},{"key":"e_1_3_3_2_53_2","first-page":"403","volume-title":"2023 USENIX Annual Technical Conference (USENIX ATC 23)","author":"Shi Jiuchen","year":"2023","unstructured":"Jiuchen Shi, Hang Zhang, Zhixin Tong, Quan Chen, Kaihua Fu, and Minyi Guo. 2023. Nodens: Enabling resource efficient and fast { QoS} recovery of dynamic microservice applications in datacenters. In 2023 USENIX Annual Technical Conference (USENIX ATC 23). 403\u2013417."},{"key":"e_1_3_3_2_54_2","volume-title":"Substrait: Cross-Language Serialization for Relational Algebra","year":"2024","unstructured":"Substrait. 2024. Substrait: Cross-Language Serialization for Relational Algebra. https:\/\/substrait.io\/"},{"key":"e_1_3_3_2_55_2","first-page":"901","volume-title":"2024 USENIX Annual Technical Conference (USENIX ATC 24)","author":"Tang Chunxu","year":"2024","unstructured":"Chunxu Tang, Bin Fan, Jing Zhao, Chen Liang, Yi Wang, Beinan Wang, Ziyue Qiu, Lu Qiu, Bowen Ding, Shouzhuo Sun, Saiguang Che, Jiaming Mai, Shouwei Chen, Yu Zhu, Jianjian Xie, Yutian\u00a0(James) Sun, Yao Li, Yangjun Zhang, Ke Wang, and Mingmin Chen. 2024. Data Caching for Enterprise-Grade Petabyte-Scale OLAP. In 2024 USENIX Annual Technical Conference (USENIX ATC 24). USENIX Association, Santa Clara, CA, 901\u2013915. https:\/\/www.usenix.org\/conference\/atc24\/presentation\/tang"},{"key":"e_1_3_3_2_56_2","volume-title":"Ray: Actors","author":"Team Ray","year":"2024","unstructured":"Ray Team. 2024. Ray: Actors. https:\/\/docs.ray.io\/en\/latest\/ray-core\/actors.html"},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"crossref","unstructured":"Ashish Thusoo Joydeep\u00a0Sen Sarma Namit Jain Zheng Shao Prasad Chakka Suresh Anthony Hao Liu Pete Wyckoff and Raghotham Murthy. 2009. Hive: a warehousing solution over a map-reduce framework. Proceedings of the VLDB Endowment 2 2 (2009) 1626\u20131629.","DOI":"10.14778\/1687553.1687609"},{"key":"e_1_3_3_2_58_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-54420-0_40"},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"crossref","unstructured":"Tobias Vin\u00e7on Christian Kn\u00f6dler Leonardo Solis-Vasquez Arthur Bernhardt Sajjad Tamimi Lukas Weber Florian Stock Andreas Koch and Ilia Petrov. 2022. Near-data processing in database systems on native computational storage under htap workloads. Proceedings of the VLDB Endowment 15 10 (2022) 1991\u20132004.","DOI":"10.14778\/3547305.3547307"},{"key":"e_1_3_3_2_60_2","doi-asserted-by":"crossref","unstructured":"Jialun Wang Wenhao Pang Chuliang Weng and Aoying Zhou. 2023. D-Cubicle: boosting data transfer dynamically for large-scale analytical queries in single-GPU systems. Frontiers of Computer Science 17 4 (2023) 174610.","DOI":"10.1007\/s11704-022-2160-z"},{"key":"e_1_3_3_2_61_2","doi-asserted-by":"publisher","DOI":"10.4018\/978-1-59904-364-7"},{"key":"e_1_3_3_2_62_2","doi-asserted-by":"crossref","unstructured":"Yifei Yang Matt Youill Matthew Woicik Yizhou Liu Xiangyao Yu Marco Serafini Ashraf Aboulnaga and Michael Stonebraker. 2021. Flexpushdowndb: Hybrid pushdown and caching in a cloud dbms. Proceedings of the VLDB Endowment 14 11 (2021).","DOI":"10.14778\/3476249.3476265"},{"key":"e_1_3_3_2_63_2","doi-asserted-by":"publisher","unstructured":"Yifei Yang Xiangyao Yu Marco Serafini Ashraf Aboulnaga and Michael Stonebraker. 2024. FlexpushdownDB: rethinking computation pushdown for cloud OLAP DBMSs. The VLDB Journal (10 Jul 2024). 10.1007\/s00778-024-00867-8","DOI":"10.1007\/s00778-024-00867-8"},{"key":"e_1_3_3_2_64_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE48307.2020.00174"},{"key":"e_1_3_3_2_65_2","first-page":"293","volume-title":"2020 USENIX Annual Technical Conference (USENIX ATC 20)","author":"Yuan Gina","year":"2020","unstructured":"Gina Yuan, Shoumik Palkar, Deepak Narayanan, and Matei Zaharia. 2020. Offload Annotations: Bringing Heterogeneous Computing to Existing Libraries and Workloads. In 2020 USENIX Annual Technical Conference (USENIX ATC 20). USENIX Association, 293\u2013306. https:\/\/www.usenix.org\/conference\/atc20\/presentation\/yuan"},{"key":"e_1_3_3_2_66_2","doi-asserted-by":"crossref","unstructured":"Yansong Zhang Yu Zhang Jiaheng Lu Shan Wang Zhuan Liu and Ruichen Han. 2020. One size does not fit all: accelerating OLAP workloads with GPUs. Distributed and Parallel Databases 38 (2020) 995\u20131037.","DOI":"10.1007\/s10619-020-07304-z"}],"event":{"name":"ICS '25: 2025 International Conference on Supercomputing","location":"Salt Lake City USA","acronym":"ICS '25","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 39th ACM International Conference on Supercomputing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3721145.3725752","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T13:00:35Z","timestamp":1755867635000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3721145.3725752"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,8]]},"references-count":65,"alternative-id":["10.1145\/3721145.3725752","10.1145\/3721145"],"URL":"https:\/\/doi.org\/10.1145\/3721145.3725752","relation":{},"subject":[],"published":{"date-parts":[[2025,6,8]]},"assertion":[{"value":"2025-08-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}