{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T07:54:34Z","timestamp":1776930874881,"version":"3.51.2"},"publisher-location":"New York, NY, USA","reference-count":52,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,16]]},"DOI":"10.1145\/3731599.3767371","type":"proceedings-article","created":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T16:20:02Z","timestamp":1762532402000},"page":"290-299","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Integrating Distributed SQL Query Engines with Object-Based Computational Storage"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-0634-7923","authenticated-orcid":false,"given":"Junghyun","family":"Ryu","sequence":"first","affiliation":[{"name":"Sogang University, South Korea, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0091-3507","authenticated-orcid":false,"given":"Soon","family":"Hwang","sequence":"additional","affiliation":[{"name":"Sogang University, South Korea, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-9293-173X","authenticated-orcid":false,"given":"Junhyeok","family":"Park","sequence":"additional","affiliation":[{"name":"Sogang University, South Korea, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-5259-8960","authenticated-orcid":false,"given":"Seonghoon","family":"Ahn","sequence":"additional","affiliation":[{"name":"Sogang University, South Korea, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-8937-7653","authenticated-orcid":false,"given":"JeoungAhn","family":"Park","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-4535-0269","authenticated-orcid":false,"given":"Jeongjin","family":"Lee","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-7332-6762","authenticated-orcid":false,"given":"Jinna","family":"Yang","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5944-4453","authenticated-orcid":false,"given":"Soonyeal","family":"Yang","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-8803-5016","authenticated-orcid":false,"given":"Jungki","family":"Noh","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7457-9874","authenticated-orcid":false,"given":"Qing","family":"Zheng","sequence":"additional","affiliation":[{"name":"Los Alamos National Laboratory (LANL), Los Alamos, NM, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9375-8931","authenticated-orcid":false,"given":"Woosuk","family":"Chung","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4017-8124","authenticated-orcid":false,"given":"Hoshik","family":"Kim","sequence":"additional","affiliation":[{"name":"SK hynix Inc., Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8786-3850","authenticated-orcid":false,"given":"Youngjae","family":"Kim","sequence":"additional","affiliation":[{"name":"Sogang University, South Korea, Seoul, Republic of Korea"}]}],"member":"320","published-online":{"date-parts":[[2025,11,15]]},"reference":[{"key":"e_1_3_3_2_2_2","doi-asserted-by":"crossref","unstructured":"Mark Ainsworth Ozan Tugluk Ben Whitney and Scott Klasky. 2018. Multilevel techniques for compression and reduction of scientific data\u2014the univariate case. Springer Computing and Visualization in Science 19 5\u20136 (2018).","DOI":"10.1007\/s00791-018-00303-9"},{"key":"e_1_3_3_2_3_2","unstructured":"Amazon Web Services. 2024. Amazon Athena Documentation. https:\/\/docs.aws.amazon.com\/athena\/latest\/ug\/what-is.html."},{"key":"e_1_3_3_2_4_2","unstructured":"Amazon Web Services Inc.2006. Amazon S3. https:\/\/aws.amazon.com\/s3\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_5_2","unstructured":"Apache Foundation. 2010. Apache Hive. https:\/\/hive.apache.org\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_6_2","unstructured":"Apache Foundation. 2010. Apache Spark. https:\/\/spark.apache.org\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_7_2","unstructured":"Apache Foundation. 2013. Apache ORC. https:\/\/orc.apache.org\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_8_2","unstructured":"Apache Foundation. 2013. Apache Parquet. https:\/\/parquet.apache.org\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_9_2","unstructured":"Apache Foundation. 2013. HDFS Architecture Guide. https:\/\/hadoop.apache.org\/docs\/r1.2.1\/hdfs_design.html. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_10_2","unstructured":"Apache Foundation. 2016. Apache Arrow. https:\/\/arrow.apache.org\/. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/2828612.2828624"},{"key":"e_1_3_3_2_12_2","unstructured":"Zbigniew Baranowski and Vasileios Dimakopoulos. 2020. Introduction to Presto. CERN Indico Event 869037. https:\/\/indico.cern.ch\/event\/869037\/contributions\/3663775\/attachments\/1960650\/3258410\/Introduction_to_Presto.pdf"},{"key":"e_1_3_3_2_13_2","unstructured":"Yann Collet and Chip Turner. 2016. Zstandard - Real-time Data Compression Algorithm. https:\/\/github.com\/facebook\/zstd."},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","unstructured":"Matthieu Dorier Gabriel Antoniu Franck Cappello Marc Snir Robert Sisneros Orcun Yildiz Shadi Ibrahim Tom Peterka and Leigh Orf. 2016. Damaris: Addressing performance variability in data management for post-petascale simulations. ACM Transactions on Parallel Computing 3 3 (2016). 10.1145\/2987371","DOI":"10.1145\/2987371"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"publisher","unstructured":"Dominik Durner Viktor Leis and Thomas Neumann. 2023. Exploiting Cloud Object Storage for High-Performance Analytics. Proceedings of the VLDB Endowment 16 11 (2023). 10.14778\/3603581.3603592","DOI":"10.14778\/3603581.3603592"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3669940.3707234"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","unstructured":"Frank Gadban and Julian Kunkel. 2021. Analyzing the Performance of the S3 Object Storage API for HPC Workloads. MDPI Applied Sciences 11 18 (2021). 10.3390\/app11188540","DOI":"10.3390\/app11188540"},{"key":"e_1_3_3_2_18_2","unstructured":"GNU Project. 2022. GNU Gzip: General-Purpose Data Compression Software. https:\/\/www.gnu.org\/software\/gzip\/."},{"key":"e_1_3_3_2_19_2","unstructured":"Google. 2011. Snappy. https:\/\/github.com\/google\/snappy. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_20_2","unstructured":"Google. 2015. gRPC. https:\/\/grpc.io. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-69953-04"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","unstructured":"Insoon Jo Duck-Ho Bae Andre\u00a0S. Yoon Jeong-Uk Kang Sangyeun Cho Daniel D.\u00a0G. Lee and Jaeheon Jeong. 2016. YourSQL: a high-performance database system leveraging in-storage computing. Proc. VLDB Endow. 9 12 (2016). 10.14778\/2994509.2994512","DOI":"10.14778\/2994509.2994512"},{"key":"e_1_3_3_2_23_2","unstructured":"Patchett John Samsel Francesca Tsai Karen Gisler Galen Rogers David Abram Greg and Turton Terece. 2016. Visualization and analysis of threats from asteroid ocean impacts. Los Alamos National Laboratory Technical Report."},{"key":"e_1_3_3_2_24_2","unstructured":"Jongryool Kim. 2023. Accelerating Data Analytics Using Object Based Computational Storage in a HPC. https:\/\/sc23.supercomputing.org\/proceedings\/exhibitor_forum\/exhibitor_forum_pages\/exforum116.html The International Conference for High Performance Computing Networking Storage and Analysis (SC)."},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1109\/DCC50243.2021.00018"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2018.8622520"},{"key":"e_1_3_3_2_27_2","doi-asserted-by":"publisher","unstructured":"Peter Lindstrom. 2014. Fixed-Rate Compressed Floating-Point Arrays. IEEE Transactions on Visualization and Computer Graphics 20 12 (2014). 10.1109\/TVCG.2014.2346458","DOI":"10.1109\/TVCG.2014.2346458"},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"publisher","unstructured":"Peter Lindstrom and Martin Isenburg. 2006. Fast and Efficient Compression of Floating-Point Data. IEEE Transactions on Visualization and Computer Graphics 12 5 (2006). 10.1109\/TVCG.2006.143","DOI":"10.1109\/TVCG.2006.143"},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/1383529.1383533"},{"key":"e_1_3_3_2_30_2","unstructured":"Los Alamos National Laboratory. 2024. Laghos Sample Dataset. https:\/\/github.com\/lanl-ocs\/laghos-sample-dataset. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE53745.2022.00165"},{"key":"e_1_3_3_2_32_2","unstructured":"LZ4. 2011. LZ4 - Extremely fast compression. https:\/\/github.com\/lz4\/lz4. [Online; accessed 2025-08-24]."},{"key":"e_1_3_3_2_33_2","unstructured":"Dominic Manno. 2023. Improving Storage Systems for Simulation Science with Computational Storage. Compute+Memory+Storage Summit."},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"publisher","unstructured":"Sergey Melnik Andrey Gubarev Jing\u00a0Jing Long Geoffrey Romer Shiva Shivakumar Matt Tolton Theo Vassilakis Hossein Ahmadi Dan Delorey Slava Min Mosha Pasumansky and Jeff Shute. 2020. Dremel: A Decade of Interactive SQL Analysis at Web Scale. Proceedings of the VLDB Endowment 13 12 (2020). 10.14778\/3415478.3415568","DOI":"10.14778\/3415478.3415568"},{"key":"e_1_3_3_2_35_2","unstructured":"MinIO Inc.2016. MinIO: S3 Compatible Exascale Object Store for AI. https:\/\/min.io\/. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_36_2","unstructured":"MinIO Inc.2019. MinIO Select: S3 Select API Support. https:\/\/github.com\/minio\/minio\/blob\/master\/docs\/select\/README.md. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654983"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER52292.2023.00019"},{"key":"e_1_3_3_2_39_2","unstructured":"Presto Foundation. 2013. Hive Connector. https:\/\/prestodb.io\/docs\/current\/connector\/hive.html. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_40_2","unstructured":"Presto Foundation. 2013. SPI Overview. https:\/\/prestodb.io\/docs\/current\/develop\/spi-overview.html. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_41_2","unstructured":"Randall Hunt. 2017. S3 Select and Glacier Select \u2013 Retrieving Subsets of Objects. https:\/\/aws.amazon.com\/ko\/blogs\/aws\/s3-glacier-select\/"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2019.00196"},{"key":"e_1_3_3_2_43_2","unstructured":"Nick Smith Bo Jayatilaka David Mason Oliver Gutsche Alison Peisker Robert Illingworth and Chris Jones. 2023. A Ceph S3 Object Data Store for HEP. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.16321 (2023). https:\/\/arxiv.org\/abs\/2311.16321"},{"key":"e_1_3_3_2_44_2","unstructured":"Snowflake Inc.2014. Snowflake AI Data Cloud. https:\/\/www.snowflake.com\/. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"crossref","unstructured":"James\u00a0A Storer and Thomas\u00a0G Szymanski. 1982. Data compression via textual substitution. Journal of the ACM (JACM) 29 4 (1982).","DOI":"10.1145\/322344.322346"},{"key":"e_1_3_3_2_46_2","unstructured":"Substrait Project. 2021. Substrait. https:\/\/substrait.io\/. Accessed: 2025-08-23."},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2017.115"},{"key":"e_1_3_3_2_48_2","unstructured":"Transaction Processing Performance Council. 2017. TPC Benchmark H (Decision Support). http:\/\/www.tpc.org\/tpch\/. Revision 2.17.3."},{"key":"e_1_3_3_2_49_2","unstructured":"Andrew Waldman. 2018. Evaluation of the Presto Query Engine for integrating relational databases with big data platforms at scale. CERN openlab Summer Student Lightning Talk. https:\/\/cds.cern.ch\/record\/2634287"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"crossref","unstructured":"Yifei Yang Xiangyao Yu Marco Serafini Ashraf Aboulnaga and Michael Stonebraker. 2024. FlexpushdownDB: Rethinking Computation Pushdown for Cloud OLAP DBMSs. The VLDB Journal 33 5 (2024).","DOI":"10.1007\/s00778-024-00867-8"},{"key":"e_1_3_3_2_51_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE48307.2020.00174"},{"key":"e_1_3_3_2_52_2","unstructured":"Qing Zheng. 2023. Toward Open Object-Based Computational Storage For Analysis Query Pushdown. The 9th International Parallel Data Systems Workshop (PDSW) Work-in-Progress (WIP) Session."},{"key":"e_1_3_3_2_53_2","doi-asserted-by":"crossref","unstructured":"Jacob Ziv and Abraham Lempel. 1977. A universal algorithm for sequential data compression. IEEE Transactions on Information Theory 23 3 (1977).","DOI":"10.1109\/TIT.1977.1055714"}],"event":{"name":"SC Workshops '25: Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis","location":"St Louis MO USA","acronym":"SC Workshops '25","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing"]},"container-title":["Proceedings of the SC '25 Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3731599.3767371","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T19:35:50Z","timestamp":1767987350000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3731599.3767371"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,15]]},"references-count":52,"alternative-id":["10.1145\/3731599.3767371","10.1145\/3731599"],"URL":"https:\/\/doi.org\/10.1145\/3731599.3767371","relation":{},"subject":[],"published":{"date-parts":[[2025,11,15]]},"assertion":[{"value":"2025-11-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}