{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T03:04:18Z","timestamp":1767841458821,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":110,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,3,30]],"date-time":"2025-03-30T00:00:00Z","timestamp":1743292800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100006374","name":"NSF (National Science Foundation)","doi-asserted-by":"publisher","award":["2106530"],"award-info":[{"award-number":["2106530"]}],"id":[{"id":"10.13039\/501100006374","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,3,30]]},"DOI":"10.1145\/3669940.3707234","type":"proceedings-article","created":{"date-parts":[[2025,2,6]],"date-time":"2025-02-06T12:28:01Z","timestamp":1738844881000},"page":"540-556","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Fusion: An Analytics Object Store Optimized for Query Pushdown"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0741-1913","authenticated-orcid":false,"given":"Jianan","family":"Lu","sequence":"first","affiliation":[{"name":"Princeton University, Princeton, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3367-009X","authenticated-orcid":false,"given":"Ashwini","family":"Raina","sequence":"additional","affiliation":[{"name":"Princeton University, Princeton, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-4046-2022","authenticated-orcid":false,"given":"Asaf","family":"Cidon","sequence":"additional","affiliation":[{"name":"Columbia University, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5305-2395","authenticated-orcid":false,"given":"Michael J.","family":"Freedman","sequence":"additional","affiliation":[{"name":"Princeton University, Princeton, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,3,30]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"[n. d.]. Amazon S3. https:\/\/aws.amazon.com\/s3\/."},{"key":"e_1_3_2_1_2_1","unstructured":"[n. d.]. Apache arrowparquet. https:\/\/arrow.apache.org\/docs\/python\/parquet.html."},{"key":"e_1_3_2_1_3_1","unstructured":"[n. d.]. Apache Avro. https:\/\/avro.apache.org\/."},{"key":"e_1_3_2_1_4_1","unstructured":"[n. d.]. Apache Parquet. https:\/\/parquet.apache.org\/."},{"key":"e_1_3_2_1_5_1","unstructured":"[n. d.]. Azure Data Lake Storage Query Acceleration. https:\/\/learn.microsoft.com\/en-us\/azure\/storage\/blobs\/datalake-storage-query-acceleration."},{"key":"e_1_3_2_1_6_1","unstructured":"[n. d.]. Cloudlab. https:\/\/www.cloudlab.us."},{"key":"e_1_3_2_1_7_1","unstructured":"[n. d.]. Filtering and retrieving data using Amazon S3 Select. https:\/\/docs.aws.amazon.com\/AmazonS3\/latest\/userguide\/selecting-content-from-objects.html."},{"key":"e_1_3_2_1_8_1","unstructured":"[n. d.]. gurobipy 11.0.0. https:\/\/pypi.org\/project\/gurobipy\/."},{"key":"e_1_3_2_1_9_1","unstructured":"[n. d.]. HDFS erasure coding. https:\/\/hadoop.apache.org\/docs\/stable\/hadoop-project-dist\/hadoop-hdfs\/HDFSErasureCoding.html."},{"key":"e_1_3_2_1_10_1","unstructured":"[n. d.]. Lance: modern columnar data format for ML. https:\/\/lancedb.github.io\/lance\/."},{"key":"e_1_3_2_1_11_1","unstructured":"[n. d.]. MinIO Select API Quickstart Guide. https:\/\/github.com\/minio\/minio\/blob\/master\/docs\/select\/README.md."},{"key":"e_1_3_2_1_12_1","unstructured":"[n. d.]. NYC yellow taxi dataset queries. https:\/\/docs.timescale.com\/tutorials\/latest\/nyc-taxi-cab\/query-nyc\/."},{"key":"e_1_3_2_1_13_1","unstructured":"[n. d.]. NYC yellow taxi trip record data. https:\/\/www.nyc.gov\/site\/tlc\/about\/tlc-trip-record-data.page."},{"key":"e_1_3_2_1_14_1","unstructured":"[n. d.]. pyarrow. https:\/\/pypi.org\/project\/pyarrow\/."},{"key":"e_1_3_2_1_15_1","unstructured":"[n. d.]. TPC-H specification. https:\/\/www.tpc.org\/TPC_Documents_Current_Versions\/pdf\/TPC-H_v3.0.1.pdf."},{"key":"e_1_3_2_1_16_1","unstructured":"[n. d.]. Using Lua in the Ceph distributed storage system. https:\/\/www.lua.org\/wshop17\/Watkins.pdf."},{"key":"e_1_3_2_1_17_1","unstructured":"[n. d.]. Wondershaper. https:\/\/github.com\/magnific0\/wondershaper."},{"key":"e_1_3_2_1_18_1","volume-title":"10th USENIX Conference on File and Storage Technologies (FAST 12)","unstructured":"2012. Rethinking Erasure Codes for Cloud File Systems: Minimizing I\/O for Recovery and Degraded Reads. In 10th USENIX Conference on File and Storage Technologies (FAST 12). USENIX Association, San Jose, CA. https:\/\/www.usenix.org\/conference\/fast12\/rethinking-erasurecodes-cloud-file-systems-minimizing-io-recovery-and-degraded"},{"key":"e_1_3_2_1_19_1","unstructured":"2017. Backblaze Vaults: Zettabyte-Scale Cloud Storage Architecture. https:\/\/www.backblaze.com\/blog\/vault-cloud-storage-architecture\/."},{"key":"e_1_3_2_1_20_1","unstructured":"2021. Benchmarking Cloud Data-warehouse Bigquery to Scale Fast. https:\/\/cloud.google.com\/blog\/products\/data-analytics\/benchmarking-cloud-data-warehouse-bigquery-to-scale-fast."},{"key":"e_1_3_2_1_21_1","unstructured":"2021. Run queries 3x faster with up to 70% cost savings on the latest Amazon Athena engine. https:\/\/aws.amazon.com\/blogs\/bigdata\/run-queries-3x-faster-with-up-to-70-cost-savings-on-thelatest-amazon-athena-engine\/."},{"key":"e_1_3_2_1_22_1","unstructured":"2022. Upgrade to Athena engine version 3 to increase query performance and access more analytics features. https:\/\/aws.amazon.com\/blogs\/big-data\/upgrade-to-athenaengine-version-3-to-increase-query-performance-and-accessmore-analytics-features\/."},{"key":"e_1_3_2_1_23_1","unstructured":"2023. Apache Zookeeper. https:\/\/zookeeper.apache.org."},{"key":"e_1_3_2_1_24_1","unstructured":"2023. AQUA (Advanced Query Accelerator) for Amazon Redshift. https:\/\/pages.awscloud.com\/AQUA_Preview.html\/."},{"key":"e_1_3_2_1_25_1","unstructured":"2023. AWS S3 select command. https:\/\/docs.aws.amazon.com\/AmazonS3\/latest\/userguide\/s3-select-sql-reference-select.html."},{"key":"e_1_3_2_1_26_1","unstructured":"2023. Azure Data Lake Storage query acceleration. https:\/\/docs.microsoft.com\/en-us\/azure\/storage\/blobs\/datalake-storage-query-acceleration\/."},{"key":"e_1_3_2_1_27_1","unstructured":"2023. etccd. https:\/\/etcd.io\/."},{"key":"e_1_3_2_1_28_1","unstructured":"2023. JavaScript Object Notation. https:\/\/www.json.org\/json-en.html."},{"key":"e_1_3_2_1_29_1","unstructured":"2023. Minio erasure coding parameters. https:\/\/blog.min.io\/erasurecoding-cpu-utilization\/."},{"key":"e_1_3_2_1_30_1","unstructured":"2023. Samsung SmartSSD Computational Storage. https:\/\/news.samsung.com\/global\/samsung-electronics-developssecond-generation-smartssd-computational-storage-drive-withupgraded-processing-functionality."},{"key":"e_1_3_2_1_31_1","unstructured":"2023. TPC-H benchmark. https:\/\/www.tpc.org\/tpch\/."},{"key":"e_1_3_2_1_32_1","unstructured":"[n. d.]. Amazon Athena. https:\/\/aws.amazon.com\/athena."},{"key":"e_1_3_2_1_33_1","unstructured":"[n. d.]. Ceph erasure coding parameters. https:\/\/docs.ceph.com\/en\/quincy\/rados\/operations\/erasure-code-profile\/."},{"key":"e_1_3_2_1_34_1","unstructured":"[n. d.]. Google Cloud BigQuery. https:\/\/cloud.google.com\/bigquery."},{"key":"e_1_3_2_1_35_1","unstructured":"[n. d.]. MinIO: High Performance Object Storage for Modern Data Lakes. https:\/\/min.io\/."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3465332.3470881"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1002\/jos.74"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-002-0074--9"},{"key":"e_1_3_2_1_39_1","unstructured":"ORC Apache. 2018. Apache ORC: High-Performance Columnar Storage for Hadoop."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1016\/0196--6774(84)90004-X"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6377(83)90042-1"},{"key":"e_1_3_2_1_42_1","volume-title":"Pelican: A Building Block for Exascale Cold Data Storage. In 11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14)","author":"Balakrishnan Shobana","year":"2014","unstructured":"Shobana Balakrishnan, Richard Black, Austin Donnelly, Paul England, Adam Glass, Dave Harper, Sergey Legtchenko, Aaron Ogus, Eric Peterson, and Antony Rowstron. 2014. Pelican: A Building Block for Exascale Cold Data Storage. In 11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14). USENIX Association, Broomfield, CO, 351--365. https:\/\/www.usenix.org\/conference\/osdi14\/technical-sessions\/presentation\/balakrishnan"},{"key":"e_1_3_2_1_43_1","volume-title":"Adaptive Placement for In-memory Storage Functions. In 2020 USENIX Annual Technical Conference (USENIX ATC 20)","author":"Bhardwaj Ankit","year":"2020","unstructured":"Ankit Bhardwaj, Chinmay Kulkarni, and Ryan Stutsman. 2020. Adaptive Placement for In-memory Storage Functions. In 2020 USENIX Annual Technical Conference (USENIX ATC 20). USENIX Association, 127--141. https:\/\/www.usenix.org\/conference\/atc20\/presentation\/bhardwaj"},{"key":"e_1_3_2_1_44_1","first-page":"1","article-title":"Bounded space online variable-sized bin packing","volume":"13","author":"Burkard Rainer E.","year":"1997","unstructured":"Rainer E. Burkard and Guochuan Zhang. 1997. Bounded space online variable-sized bin packing. Acta Cybernetica 13, 1 (Jan. 1997), 63--76. https:\/\/cyber.bibl.u-szeged.hu\/index.php\/actcybern\/article\/view\/3480","journal-title":"Acta Cybernetica"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10479-015--2082--3"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0097539799356265"},{"key":"e_1_3_2_1_47_1","volume-title":"2017 USENIX Annual Technical Conference (USENIX ATC 17)","author":"Chen Yu Lin","year":"2017","unstructured":"Yu Lin Chen, Shuai Mu, Jinyang Li, Cheng Huang, Jin Li, Aaron Ogus, and Douglas Phillips. 2017. Giza: Erasure Coding Objects across Global Data Centers. In 2017 USENIX Annual Technical Conference (USENIX ATC 17). USENIX Association, Santa Clara, CA, 539-- 551. https:\/\/www.usenix.org\/conference\/atc17\/technical-sessions\/presentation\/chen-yu-lin"},{"key":"e_1_3_2_1_48_1","unstructured":"Henrik I. Christensen A. Khan Sebastian Pokutta and Prasad Tetali. 2016. Multidimensional Bin Packing and Other Related Problems : A Survey. https:\/\/api.semanticscholar.org\/CorpusID:9048170"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cosrev.2016.12.001"},{"key":"e_1_3_2_1_50_1","volume-title":"Bin packing approximation algorithms: Survey and classification","author":"Coffman Edward G.","unstructured":"Edward G. Coffman, J\u00e1nos Csirik, G\u00e1bor Galambos, Silvano Martello, and Daniele Vigo. 2013. Bin packing approximation algorithms: Survey and classification. Vol. 1--5. Springer, 455--531. https:\/\/doi.org\/10.1007\/ 978--1--4419--7997--1_35"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00288885"},{"key":"e_1_3_2_1_52_1","unstructured":"E. G. Coffman M. R. Garey and D. S. Johnson. 1996. Approximation algorithms for bin packing: a survey. PWS Publishing Co. USA 46--93."},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00289157"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1016\/0166-218X(88)90052--2"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/2882903.2903741"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/1327452.1327492"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2010.2054295"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2465295"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476311.3476385"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jda.2010.07.002"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-77918--6_19"},{"key":"e_1_3_2_1_62_1","unstructured":"Andrew Fikes. 2010. Storage Architecture and Challenges. https:\/\/cloud.google.com\/files\/storage_architecture_and_challenges.pdf."},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","unstructured":"Luke Finlay and Prabhu Manyem. 2005. Online LIB problems: Heuristics for Bin Covering and lower bounds for Bin Packing. http:\/\/dx.doi.org\/10.1051\/ro:2006001 39 (07 2005). https:\/\/doi.org\/10.1051\/ro:2006001","DOI":"10.1051\/ro:2006001"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1137\/0215016"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10479-015-1973-7"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1016\/0097-3165(76)90001-7"},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1145\/800152.804907"},{"key":"e_1_3_2_1_68_1","unstructured":"Martin Josef Geiger. 2008. Bin Packing Under Multiple Objectives - a Heuristic Approximation Approach. arXiv:0809.0755 [cs.AI] https:\/\/arxiv.org\/abs\/0809.0755"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2012.2208937"},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.1137\/0117039"},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1145\/2740070.2626334"},{"key":"e_1_3_2_1_72_1","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2742795"},{"key":"e_1_3_2_1_73_1","volume-title":"Exploiting Combined Locality for Wide- Stripe Erasure Coding in Distributed Storage. In 19th USENIX Conference on File and Storage Technologies (FAST 21)","author":"Hu Yuchong","year":"2021","unstructured":"Yuchong Hu, Liangfeng Cheng, Qiaori Yao, Patrick P. C. Lee,Weichun Wang, and Wei Chen. 2021. Exploiting Combined Locality for Wide- Stripe Erasure Coding in Distributed Storage. In 19th USENIX Conference on File and Storage Technologies (FAST 21). USENIX Association, 233--248. https:\/\/www.usenix.org\/conference\/fast21\/presentation\/hu"},{"key":"e_1_3_2_1_74_1","volume-title":"Exploiting Combined Locality for Wide- Stripe Erasure Coding in Distributed Storage. In 19th USENIX Conference on File and Storage Technologies (FAST 21)","author":"Hu Yuchong","year":"2021","unstructured":"Yuchong Hu, Liangfeng Cheng, Qiaori Yao, Patrick P. C. Lee,Weichun Wang, and Wei Chen. 2021. Exploiting Combined Locality for Wide- Stripe Erasure Coding in Distributed Storage. In 19th USENIX Conference on File and Storage Technologies (FAST 21). USENIX Association, 233--248. https:\/\/www.usenix.org\/conference\/fast21\/presentation\/hu"},{"key":"e_1_3_2_1_75_1","doi-asserted-by":"publisher","DOI":"10.1145\/2435204.2435207"},{"key":"e_1_3_2_1_76_1","volume-title":"Erasure Coding in Windows Azure Storage. In 2012 USENIX Annual Technical Conference (USENIX ATC 12)","author":"Huang Cheng","year":"2012","unstructured":"Cheng Huang, Huseyin Simitci, Yikang Xu, Aaron Ogus, Brad Calder, Parikshit Gopalan, Jin Li, and Sergey Yekhanin. 2012. Erasure Coding in Windows Azure Storage. In 2012 USENIX Annual Technical Conference (USENIX ATC 12). USENIX Association, Boston, MA, 15--26. https:\/\/www.usenix.org\/conference\/atc12\/technicalsessions\/presentation\/huang"},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0377-2217(02)00247-3"},{"key":"e_1_3_2_1_78_1","doi-asserted-by":"publisher","DOI":"10.1145\/321906.321917"},{"key":"e_1_3_2_1_79_1","volume-title":"Splinter: Bare-Metal Extensions for Multi-Tenant Low-Latency Storage. In 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18)","author":"Kulkarni Chinmay","year":"2018","unstructured":"Chinmay Kulkarni, Sara Moore, Mazhar Naqvi, Tian Zhang, Robert Ricci, and Ryan Stutsman. 2018. Splinter: Bare-Metal Extensions for Multi-Tenant Low-Latency Storage. In 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18). USENIX Association, Carlsbad, CA, 627--643. https:\/\/www.usenix.org\/conference\/osdi18\/presentation\/kulkarni"},{"key":"e_1_3_2_1_80_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSST.2015.7208288"},{"key":"e_1_3_2_1_81_1","volume-title":"OpenEC: Toward Unified and Configurable Erasure Coding Management in Distributed Storage Systems. In 17th USENIX Conference on File and Storage Technologies (FAST 19)","author":"Li Xiaolu","year":"2019","unstructured":"Xiaolu Li, Runhui Li, Patrick P. C. Lee, and Yuchong Hu. 2019. OpenEC: Toward Unified and Configurable Erasure Coding Management in Distributed Storage Systems. In 17th USENIX Conference on File and Storage Technologies (FAST 19). USENIX Association, Boston, MA, 331--344. https:\/\/www.usenix.org\/conference\/fast19\/presentation\/li"},{"key":"e_1_3_2_1_82_1","doi-asserted-by":"publisher","DOI":"10.1145\/3589323"},{"key":"e_1_3_2_1_83_1","doi-asserted-by":"publisher","DOI":"10.1109\/IWQoS.2013.6550268"},{"key":"e_1_3_2_1_84_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0898-1221(98)00087-X"},{"key":"e_1_3_2_1_85_1","doi-asserted-by":"publisher","DOI":"10.14778\/3415478.3415568"},{"key":"e_1_3_2_1_86_1","doi-asserted-by":"crossref","unstructured":"Nir Menakerman and Raphael Rom. 2001. Bin Packing with Item Fragmentation. 313--324.","DOI":"10.1007\/3-540-44634-6_29"},{"key":"e_1_3_2_1_87_1","volume-title":"11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14)","author":"Muralidhar Subramanian","year":"2014","unstructured":"Subramanian Muralidhar, Wyatt Lloyd, Sabyasachi Roy, Cory Hill, Ernest Lin, Weiwen Liu, Satadru Pan, Shiva Shankar, Viswanath Sivakumar, Linpeng Tang, and Sanjeev Kumar. 2014. f4: Facebook's Warm BLOB Storage System. In 11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14). USENIX Association, Broomfield, CO, 383--398. https:\/\/www.usenix.org\/conference\/osdi14\/technical-sessions\/presentation\/muralidhar"},{"key":"e_1_3_2_1_88_1","doi-asserted-by":"crossref","unstructured":"Aniket Murhekar David Arbour Tung Mai and Anup Rao. 2023. Dynamic Vector Bin Packing for Online Resource Allocation in the Cloud. arXiv:2304.08648 [cs.DS] https:\/\/arxiv.org\/abs\/2304.08648","DOI":"10.1145\/3558481.3591314"},{"key":"e_1_3_2_1_89_1","unstructured":"Rina Panigrahy Kunal Talwar Lincoln K. Uyeda and Udi Wieder. 2011. Heuristics for Vector Bin Packing. https:\/\/api.semanticscholar.org\/CorpusID:17946270"},{"key":"e_1_3_2_1_90_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2014.2325570"},{"key":"e_1_3_2_1_91_1","doi-asserted-by":"publisher","DOI":"10.1145\/2740070.2626325"},{"key":"e_1_3_2_1_92_1","doi-asserted-by":"publisher","DOI":"10.1145\/2619239.2626325"},{"key":"e_1_3_2_1_93_1","volume-title":"Low-Latency Cluster Caching with Online Erasure Coding. In 12th USENIX Symposium on Operating Systems Design and Implementation (OSDI 16)","author":"Rashmi K. V.","year":"2016","unstructured":"K. V. Rashmi, Mosharaf Chowdhury, Jack Kosaian, Ion Stoica, and Kannan Ramchandran. 2016. EC-Cache: Load-Balanced, Low-Latency Cluster Caching with Online Erasure Coding. In 12th USENIX Symposium on Operating Systems Design and Implementation (OSDI 16). USENIX Association, Savannah, GA, 401--417. https:\/\/www.usenix.org\/conference\/osdi16\/technical-sessions\/presentation\/rashmi"},{"key":"e_1_3_2_1_94_1","volume-title":"5th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage . USENIX Association","author":"Rashmi K. V.","year":"2013","unstructured":"K. V. Rashmi, Nihar B. Shah, Dikang Gu, Hairong Kuang, Dhruba Borthakur, and Kannan Ramchandran. 2013. A Solution to the Network Challenges of Data Recovery in Erasure-coded Distributed Storage Systems: A Study on the Facebook Warehouse Cluster. In 5th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage . USENIX Association, San Jose, CA. https:\/\/www.usenix.org\/conference\/hotstorage13\/workshop-program\/presentation\/rashmi"},{"key":"e_1_3_2_1_95_1","doi-asserted-by":"publisher","DOI":"10.14778\/2535573.2488339"},{"key":"e_1_3_2_1_96_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0895480100369948"},{"key":"e_1_3_2_1_97_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0097539702412908"},{"key":"e_1_3_2_1_98_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00224-007-9082-x"},{"key":"e_1_3_2_1_99_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483558"},{"key":"e_1_3_2_1_100_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSST.2010.5496972"},{"key":"e_1_3_2_1_101_1","doi-asserted-by":"publisher","DOI":"10.14569\/IJACSA.2017.081034"},{"key":"e_1_3_2_1_102_1","volume-title":"Albis: High-Performance File Format for Big Data Systems. In 2018 USENIX Annual Technical Conference (USENIX ATC 18)","author":"Trivedi Animesh","year":"2018","unstructured":"Animesh Trivedi, Patrick Stuedi, Jonas Pfefferle, Adrian Schuepbach, and Bernard Metzler. 2018. Albis: High-Performance File Format for Big Data Systems. In 2018 USENIX Annual Technical Conference (USENIX ATC 18). USENIX Association, Boston, MA, 615--630. https:\/\/www.usenix.org\/conference\/atc18\/presentation\/trivedi"},{"key":"e_1_3_2_1_103_1","volume-title":"Proceedings of the 7th Symposium on Operating Systems Design and Implementation","author":"Weil Sage A.","year":"2006","unstructured":"Sage A. Weil, Scott A. Brandt, Ethan L. Miller, Darrell D. E. Long, and Carlos Maltzahn. 2006. Ceph: A Scalable, High-Performance Distributed File System. In Proceedings of the 7th Symposium on Operating Systems Design and Implementation (Seattle,Washington) (OSDI'06). USENIX Association, USA, 307--320."},{"key":"e_1_3_2_1_104_1","volume-title":"13th USENIX Conference on File and Storage Technologies (FAST 15)","author":"Xia Mingyuan","unstructured":"Mingyuan Xia, Mohit Saxena, Mario Blaum, and David A. Pease. 2015. A Tale of Two Erasure Codes in HDFS. In 13th USENIX Conference on File and Storage Technologies (FAST 15). USENIX Association, Santa Clara, CA, 213--226. https:\/\/www.usenix.org\/conference\/fast15\/technical-sessions\/presentation\/xia"},{"key":"e_1_3_2_1_105_1","doi-asserted-by":"publisher","DOI":"10.14778\/3476249.3476265"},{"key":"e_1_3_2_1_106_1","volume-title":"Enhancing Computation Pushdown for Cloud OLAP Databases. https:\/\/arxiv.org\/pdf\/2312.15405.pdf","author":"Yang Yifei","year":"2023","unstructured":"Yifei Yang, Xiangyao Yu, Marco Serafini, Ashraf Aboulnaga, and Michael Stonebraker. 2023. Enhancing Computation Pushdown for Cloud OLAP Databases. https:\/\/arxiv.org\/pdf\/2312.15405.pdf (2023)."},{"key":"e_1_3_2_1_107_1","volume-title":"18th USENIX Symposium on Networked Systems Design and Implementation (NSDI 21)","author":"You Jie","year":"2021","unstructured":"Jie You, Jingfeng Wu, Xin Jin, and Mosharaf Chowdhury. 2021. Ship Compute or Ship Data? Why Not Both?. In 18th USENIX Symposium on Networked Systems Design and Implementation (NSDI 21). USENIX Association, 633--651. https:\/\/www.usenix.org\/conference\/nsdi21\/presentation\/you"},{"key":"e_1_3_2_1_108_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE48307.2020.00174"},{"key":"e_1_3_2_1_109_1","volume-title":"Spark: Cluster Computing with Working Sets. In 2nd USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 10)","author":"Zaharia Matei","year":"2010","unstructured":"Matei Zaharia, Mosharaf Chowdhury, Michael J. Franklin, Scott Shenker, and Ion Stoica. 2010. Spark: Cluster Computing with Working Sets. In 2nd USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 10). USENIX Association, Boston, MA. https:\/\/www.usenix.org\/conference\/hotcloud-10\/spark-clustercomputing-working-sets"},{"key":"e_1_3_2_1_110_1","doi-asserted-by":"publisher","DOI":"10.14778\/3626292.3626298"}],"event":{"name":"ASPLOS '25: 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems","location":"Rotterdam Netherlands","acronym":"ASPLOS '25","sponsor":["SIGPLAN ACM Special Interest Group on Programming Languages","SIGOPS ACM Special Interest Group on Operating Systems","SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 1"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3669940.3707234","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3669940.3707234","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T14:48:47Z","timestamp":1755787727000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3669940.3707234"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,30]]},"references-count":110,"alternative-id":["10.1145\/3669940.3707234","10.1145\/3669940"],"URL":"https:\/\/doi.org\/10.1145\/3669940.3707234","relation":{},"subject":[],"published":{"date-parts":[[2025,3,30]]},"assertion":[{"value":"2025-03-30","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}