{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T08:56:25Z","timestamp":1773392185496,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,6,12]],"date-time":"2022-06-12T00:00:00Z","timestamp":1654992000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Swiss National Science Foundation (SNSF)","award":["178894"],"award-info":[{"award-number":["178894"]}]},{"DOI":"10.13039\/100010667","name":"H2020 Industrial Leadership","doi-asserted-by":"publisher","award":["825041"],"award-info":[{"award-number":["825041"]}],"id":[{"id":"10.13039\/100010667","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,6,12]]},"DOI":"10.1145\/3533737.3535095","type":"proceedings-article","created":{"date-parts":[[2022,6,13]],"date-time":"2022-06-13T13:12:09Z","timestamp":1655125929000},"page":"1-8","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["Sampling-Based AQP in Modern Analytical Engines"],"prefix":"10.1145","author":[{"given":"Viktor","family":"Sanca","sequence":"first","affiliation":[{"name":"DIAS Lab, EPFL, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anastasia","family":"Ailamaki","sequence":"additional","affiliation":[{"name":"DIAS Lab, EPFL, Switzerland and RAW Labs SA, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2022,6,13]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2465351.2465355"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/SSDBM.2007.29"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/3399666.3399924"},{"key":"e_1_3_2_1_4_1","volume-title":"Second Biennial Conference on Innovative Data Systems Research, CIDR 2005, Asilomar, CA, USA, January 4-7, 2005, Online Proceedings. CIDR, 225\u2013237","author":"Boncz A.","year":"2005","unstructured":"Peter\u00a0 A. Boncz , Marcin Zukowski , and Niels Nes . 2005 . MonetDB\/X100: Hyper-Pipelining Query Execution . In Second Biennial Conference on Innovative Data Systems Research, CIDR 2005, Asilomar, CA, USA, January 4-7, 2005, Online Proceedings. CIDR, 225\u2013237 . http:\/\/cidrdb.org\/cidr2005\/papers\/P19.pdf Peter\u00a0A. Boncz, Marcin Zukowski, and Niels Nes. 2005. MonetDB\/X100: Hyper-Pipelining Query Execution. In Second Biennial Conference on Innovative Data Systems Research, CIDR 2005, Asilomar, CA, USA, January 4-7, 2005, Online Proceedings. CIDR, 225\u2013237. http:\/\/cidrdb.org\/cidr2005\/papers\/P19.pdf"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/375663.375694"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1007568.1007602"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3056097"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.14778\/3303753.3303760"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1561\/1900000004"},{"key":"e_1_3_2_1_10_1","unstructured":"Intel\u00ae corporation. 2021. Intel product specifications. Retrieved 2021-09-01 from https:\/\/ark.intel.com\/  Intel\u00ae corporation. 2021. Intel product specifications. Retrieved 2021-09-01 from https:\/\/ark.intel.com\/"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2021.3125165"},{"key":"e_1_3_2_1_12_1","volume-title":"Practically Random: C++ library of statistical tests for RNGs. URL: https:\/\/sourceforge. net\/projects\/pracrand","author":"Doty-Humphrey Chris","year":"2010","unstructured":"Chris Doty-Humphrey . 2010 . Practically Random: C++ library of statistical tests for RNGs. URL: https:\/\/sourceforge. net\/projects\/pracrand (2010). Chris Doty-Humphrey. 2010. Practically Random: C++ library of statistical tests for RNGs. URL: https:\/\/sourceforge. net\/projects\/pracrand (2010)."},{"key":"e_1_3_2_1_13_1","volume-title":"Algorithms, Probability, Networks, and Games - Scientific Papers and Essays Dedicated to Paul G. Spirakis on the Occasion of His 60th Birthday(Lecture Notes in Computer Science, Vol.\u00a09295), Christos\u00a0D","author":"Efraimidis S.","unstructured":"Pavlos\u00a0 S. Efraimidis . 2015. Weighted Random Sampling over Data Streams . In Algorithms, Probability, Networks, and Games - Scientific Papers and Essays Dedicated to Paul G. Spirakis on the Occasion of His 60th Birthday(Lecture Notes in Computer Science, Vol.\u00a09295), Christos\u00a0D . Zaroliagis, Grammati\u00a0E. Pantziou, and Spyros\u00a0C. Kontogiannis (Eds.). Springer , 183\u2013195. https:\/\/doi.org\/10.1007\/978-3-319-24024-4_12 Pavlos\u00a0S. Efraimidis. 2015. Weighted Random Sampling over Data Streams. In Algorithms, Probability, Networks, and Games - Scientific Papers and Essays Dedicated to Paul G. Spirakis on the Occasion of His 60th Birthday(Lecture Notes in Computer Science, Vol.\u00a09295), Christos\u00a0D. Zaroliagis, Grammati\u00a0E. Pantziou, and Spyros\u00a0C. Kontogiannis (Eds.). Springer, 183\u2013195. https:\/\/doi.org\/10.1007\/978-3-319-24024-4_12"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/377674.377676"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/93605.98720"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/69.273032"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/3186728.3164145"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/253262.253291"},{"key":"e_1_3_2_1_19_1","first-page":"7","article-title":"DeepDB: Learn from Data, Not from Queries!Proc","volume":"13","author":"Hilprecht Benjamin","year":"2020","unstructured":"Benjamin Hilprecht , Andreas Schmidt , Moritz Kulessa , Alejandro Molina , Kristian Kersting , and Carsten Binnig . 2020 . DeepDB: Learn from Data, Not from Queries!Proc . VLDB Endow. 13 , 7 (March 2020), 992\u20131005. https:\/\/doi.org\/10.14778\/3384345.3384349 Benjamin Hilprecht, Andreas Schmidt, Moritz Kulessa, Alejandro Molina, Kristian Kersting, and Carsten Binnig. 2020. DeepDB: Learn from Data, Not from Queries!Proc. VLDB Endow. 13, 7 (March 2020), 992\u20131005. https:\/\/doi.org\/10.14778\/3384345.3384349","journal-title":"VLDB Endow."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.14778\/3352063.3352130"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/2882903.2882940"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.14778\/2994509.2994516"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.14778\/2735479.2735485"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3056099"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-99-00996-5"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/1268776.1268777"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3230636"},{"key":"e_1_3_2_1_28_1","unstructured":"Daniel Lemire. 2021. testingRNG : testing popular random-number generators. Retrieved 2021-09-01 from https:\/\/github.com\/lemire\/testingRNG  Daniel Lemire. 2021. testingRNG : testing popular random-number generators. Retrieved 2021-09-01 from https:\/\/github.com\/lemire\/testingRNG"},{"key":"e_1_3_2_1_29_1","first-page":"379","article-title":"Approximate Query Processing: What is New and Where to Go? - A Survey on Approximate Query Processing. Data Sci","volume":"3","author":"Li Kaiyu","year":"2018","unstructured":"Kaiyu Li and Guoliang Li . 2018 . Approximate Query Processing: What is New and Where to Go? - A Survey on Approximate Query Processing. Data Sci . Eng. 3 , 4 (2018), 379 \u2013 397 . https:\/\/doi.org\/10.1007\/s41019-018-0074-4 Kaiyu Li and Guoliang Li. 2018. Approximate Query Processing: What is New and Where to Go? - A Survey on Approximate Query Processing. Data Sci. Eng. 3, 4 (2018), 379\u2013397. https:\/\/doi.org\/10.1007\/s41019-018-0074-4","journal-title":"Eng."},{"key":"e_1_3_2_1_30_1","volume-title":"Sampling: design and analysis","author":"Lohr L","unstructured":"Sharon\u00a0 L Lohr . 2019. Sampling: design and analysis . Chapman and Hall\/CRC. Sharon\u00a0L Lohr. 2019. Sampling: design and analysis. Chapman and Hall\/CRC."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3324958"},{"key":"e_1_3_2_1_32_1","volume-title":"Proceedings of the 30th International Conference on Machine Learning(Proceedings of Machine Learning Research, Vol.\u00a028)","author":"Meng Xiangrui","year":"2013","unstructured":"Xiangrui Meng . 2013 . Scalable Simple Random Sampling and Stratified Sampling . In Proceedings of the 30th International Conference on Machine Learning(Proceedings of Machine Learning Research, Vol.\u00a028) , Sanjoy Dasgupta and David McAllester (Eds.). PMLR, Atlanta, Georgia, USA, 531\u2013539. https:\/\/proceedings.mlr.press\/v28\/meng13a.html Xiangrui Meng. 2013. Scalable Simple Random Sampling and Stratified Sampling. In Proceedings of the 30th International Conference on Machine Learning(Proceedings of Machine Learning Research, Vol.\u00a028), Sanjoy Dasgupta and David McAllester (Eds.). PMLR, Atlanta, Georgia, USA, 531\u2013539. https:\/\/proceedings.mlr.press\/v28\/meng13a.html"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/1476589.1476628"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.14778\/2002938.2002940"},{"key":"e_1_3_2_1_35_1","volume-title":"Umbra: A Disk-Based System with In-Memory Performance. In 10th Conference on Innovative Data Systems Research, CIDR","author":"Neumann Thomas","year":"2020","unstructured":"Thomas Neumann and Michael\u00a0 J. Freitag . 2020 . Umbra: A Disk-Based System with In-Memory Performance. In 10th Conference on Innovative Data Systems Research, CIDR 2020, Amsterdam, The Netherlands , January 12-15, 2020, Online Proceedings. CIDR. http:\/\/cidrdb.org\/cidr2020\/papers\/p29-neumann-cidr20.pdf Thomas Neumann and Michael\u00a0J. Freitag. 2020. Umbra: A Disk-Based System with In-Memory Performance. In 10th Conference on Innovative Data Systems Research, CIDR 2020, Amsterdam, The Netherlands, January 12-15, 2020, Online Proceedings. CIDR. http:\/\/cidrdb.org\/cidr2020\/papers\/p29-neumann-cidr20.pdf"},{"key":"e_1_3_2_1_36_1","volume-title":"Elastic and Online Approximate Query Processing. In 35th IEEE International Conference on Data Engineering, ICDE 2019","author":"Olma Matthaios","year":"2019","unstructured":"Matthaios Olma , Odysseas Papapetrou , Raja Appuswamy , and Anastasia Ailamaki . 2019 . Taster: Self-Tuning , Elastic and Online Approximate Query Processing. In 35th IEEE International Conference on Data Engineering, ICDE 2019 , Macao, China , April 8-11, 2019. IEEE, 482\u2013493. https:\/\/doi.org\/10.1109\/ICDE.2019.00050 Matthaios Olma, Odysseas Papapetrou, Raja Appuswamy, and Anastasia Ailamaki. 2019. Taster: Self-Tuning, Elastic and Online Approximate Query Processing. In 35th IEEE International Conference on Data Engineering, ICDE 2019, Macao, China, April 8-11, 2019. IEEE, 482\u2013493. https:\/\/doi.org\/10.1109\/ICDE.2019.00050"},{"key":"e_1_3_2_1_37_1","volume-title":"The Star Schema Benchmark and Augmented Fact Table Indexing","author":"O\u2019Neil Patrick","unstructured":"Patrick O\u2019Neil , Elizabeth O\u2019Neil , Xuedong Chen , and Stephen Revilak . 2009. The Star Schema Benchmark and Augmented Fact Table Indexing . Springer-Verlag , Berlin, Heidelberg , 237\u2013252. https:\/\/doi.org\/10.1007\/978-3-642-10424-4_17 Patrick O\u2019Neil, Elizabeth O\u2019Neil, Xuedong Chen, and Stephen Revilak. 2009. The Star Schema Benchmark and Augmented Fact Table Indexing. Springer-Verlag, Berlin, Heidelberg, 237\u2013252. https:\/\/doi.org\/10.1007\/978-3-642-10424-4_17"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/63039.63042"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3196905"},{"key":"e_1_3_2_1_40_1","volume-title":"The digitization of the world from edge to core","author":"Reinsel-John David","year":"2018","unstructured":"David Reinsel-John Gantz-John Rydning . 2018. The digitization of the world from edge to core . Framingham : International Data Corporation( 2018 ), 16. David Reinsel-John Gantz-John Rydning. 2018. The digitization of the world from edge to core. Framingham: International Data Corporation(2018), 16."},{"key":"e_1_3_2_1_41_1","unstructured":"Allen Samuels. 2018. The Consequences of Infinite Storage Bandwidth. https:\/\/events.static.linuxfound.org\/sites\/events\/files\/slides\/Keynote_Allen%20Samuels_Final.pdf  Allen Samuels. 2018. The Consequences of Infinite Storage Bandwidth. https:\/\/events.static.linuxfound.org\/sites\/events\/files\/slides\/Keynote_Allen%20Samuels_Final.pdf"},{"key":"e_1_3_2_1_42_1","unstructured":"Peter Sanders Sebastian Lamm Lorenz H\u00fcbschle-Schneider Emanuel Schrade and Carsten Dachsbacher. 2016. Efficient Random Sampling - Parallel Vectorized Cache-Efficient and Online. CoRR abs\/1610.05141(2016). arXiv:1610.05141http:\/\/arxiv.org\/abs\/1610.05141  Peter Sanders Sebastian Lamm Lorenz H\u00fcbschle-Schneider Emanuel Schrade and Carsten Dachsbacher. 2016. Efficient Random Sampling - Parallel Vectorized Cache-Efficient and Online. CoRR abs\/1610.05141(2016). arXiv:1610.05141http:\/\/arxiv.org\/abs\/1610.05141"},{"key":"e_1_3_2_1_43_1","volume-title":"The Flash Transformed Data Center. In Fifth Annual Non-Volatile Memories Workshop. https:\/\/www.flashmemorysummit.com\/English\/Collaterals\/Proceedings\/2014\/20140805_Keynote5_SanDisk_Scaramuzzo.pdf","author":"Scaramuzzo J","year":"2014","unstructured":"J Scaramuzzo . 2014 . The Flash Transformed Data Center. In Fifth Annual Non-Volatile Memories Workshop. https:\/\/www.flashmemorysummit.com\/English\/Collaterals\/Proceedings\/2014\/20140805_Keynote5_SanDisk_Scaramuzzo.pdf J Scaramuzzo. 2014. The Flash Transformed Data Center. In Fifth Annual Non-Volatile Memories Workshop. https:\/\/www.flashmemorysummit.com\/English\/Collaterals\/Proceedings\/2014\/20140805_Keynote5_SanDisk_Scaramuzzo.pdf"},{"key":"e_1_3_2_1_44_1","unstructured":"Panagiotis Sioulas Viktor Sanca Ioannis Mytilinis and Anastasia Ailamaki. 2021. Accelerating Complex Analytics using Speculation.. In CIDR.  Panagiotis Sioulas Viktor Sanca Ioannis Mytilinis and Anastasia Ailamaki. 2021. Accelerating Complex Analytics using Speculation.. In CIDR."},{"key":"e_1_3_2_1_45_1","first-page":"6","article-title":"Micro-Architectural Analysis of OLAP","volume":"13","author":"Sirin Utku","year":"2020","unstructured":"Utku Sirin and Anastasia Ailamaki . 2020 . Micro-Architectural Analysis of OLAP : Limitations and Opportunities. Proc. VLDB Endow. 13 , 6 (Feb. 2020), 840\u2013853. https:\/\/doi.org\/10.14778\/3380750.3380755 Utku Sirin and Anastasia Ailamaki. 2020. Micro-Architectural Analysis of OLAP: Limitations and Opportunities. Proc. VLDB Endow. 13, 6 (Feb. 2020), 840\u2013853. https:\/\/doi.org\/10.14778\/3380750.3380755","journal-title":"Limitations and Opportunities. Proc. VLDB Endow."},{"key":"e_1_3_2_1_46_1","volume-title":"DISC 2011, Rome, Italy, September 20-22, 2011. Proceedings(Lecture Notes in Computer Science, Vol.\u00a06950)","author":"Tirthapura Srikanta","year":"2011","unstructured":"Srikanta Tirthapura and David\u00a0 P. Woodruff . 2011 . Optimal Random Sampling from Distributed Streams Revisited. In Distributed Computing - 25th International Symposium , DISC 2011, Rome, Italy, September 20-22, 2011. Proceedings(Lecture Notes in Computer Science, Vol.\u00a06950) , David Peleg (Ed.). Springer, 283\u2013297. https:\/\/doi.org\/10.1007\/978-3-642-24100-0_27 Srikanta Tirthapura and David\u00a0P. Woodruff. 2011. Optimal Random Sampling from Distributed Streams Revisited. In Distributed Computing - 25th International Symposium, DISC 2011, Rome, Italy, September 20-22, 2011. Proceedings(Lecture Notes in Computer Science, Vol.\u00a06950), David Peleg (Ed.). Springer, 283\u2013297. https:\/\/doi.org\/10.1007\/978-3-642-24100-0_27"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/3147.3165"},{"key":"e_1_3_2_1_48_1","first-page":"345","article-title":"Ray Tracing Gems II: Next Generation Real-Time Rendering with DXR, Vulkan, and OptiX. Apress, Berkeley, CA","author":"Wyman Chris","year":"2021","unstructured":"Chris Wyman . 2021 . Ray Tracing Gems II: Next Generation Real-Time Rendering with DXR, Vulkan, and OptiX. Apress, Berkeley, CA , Chapter 22, Weighted Reservoir Sampling: Randomly Sampling Streams , 345 \u2013 349 . https:\/\/doi.org\/10.1007\/978-1-4842-7185-8_22 Chris Wyman. 2021. Ray Tracing Gems II: Next Generation Real-Time Rendering with DXR, Vulkan, and OptiX. Apress, Berkeley, CA, Chapter 22, Weighted Reservoir Sampling: Randomly Sampling Streams, 345\u2013349. https:\/\/doi.org\/10.1007\/978-1-4842-7185-8_22","journal-title":"Chapter 22, Weighted Reservoir Sampling: Randomly Sampling Streams"}],"event":{"name":"SIGMOD\/PODS '22: International Conference on Management of Data","location":"Philadelphia PA USA","acronym":"SIGMOD\/PODS '22","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Data Management on New Hardware"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3533737.3535095","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3533737.3535095","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T18:43:40Z","timestamp":1750272220000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3533737.3535095"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,6,12]]},"references-count":48,"alternative-id":["10.1145\/3533737.3535095","10.1145\/3533737"],"URL":"https:\/\/doi.org\/10.1145\/3533737.3535095","relation":{},"subject":[],"published":{"date-parts":[[2022,6,12]]},"assertion":[{"value":"2022-06-13","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}