{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T18:58:09Z","timestamp":1778266689686,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":66,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,6,10]],"date-time":"2022-06-10T00:00:00Z","timestamp":1654819200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"Shenzhen Institute of Artificial Intelligence and Robotics for Society (AIRS) Chinese University of Hong Kong Shenzhen"},{"name":"Key-Area Research and Development Program of Guangdong Province","award":["2019B010155003"],"award-info":[{"award-number":["2019B010155003"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,6,10]]},"DOI":"10.1145\/3514221.3526157","type":"proceedings-article","created":{"date-parts":[[2022,6,12]],"date-time":"2022-06-12T02:33:49Z","timestamp":1655001229000},"page":"674-684","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":26,"title":["LOCAT: Low-Overhead Online Configuration Auto-Tuning of Spark SQL Applications"],"prefix":"10.1145","author":[{"given":"Jinhan","family":"Xin","sequence":"first","affiliation":[{"name":"Shenzhen Institute of Advanced Technology (SIAT), Chinese Academy of Sciences (CAS) &amp; University of Chinese Academy of Sciences (UCAS), Shenzhen, China"}]},{"given":"Kai","family":"Hwang","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"}]},{"given":"Zhibin","family":"Yu","sequence":"additional","affiliation":[{"name":"Shenzhen Institute of Advanced Technology (SIAT), Chinese Academy of Sciences (CAS) &amp; Shenzhen Huawei Cloud Computing Co.,Ltd., Shenzhen, China"}]}],"member":"320","published-online":{"date-parts":[[2022,6,11]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.tjem.2018.08.001"},{"key":"e_1_3_2_1_2_1","volume-title":"Proceedings of the 14th USENIX Conference on Networked Systems Design and Implementation","author":"Alipourfard Omid","year":"2017","unstructured":"Omid Alipourfard, Hongqiang Harry Liu, Jianshu Chen, Shivaram Venkataraman, Minlan Yu, and Ming Zhang. 2017. Cherrypick: Adaptively Unearthing the Best Cloud Configurations for Big Data Analytics. In Proceedings of the 14th USENIX Conference on Networked Systems Design and Implementation (Boston, MA, USA) (NSDI'17). USENIX Association, USA, 469--482. https:\/\/www.usenix.org\/conference\/nsdi17\/technical-sessions\/presentation\/alipourfard"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11227-020-03307-w"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2742797"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2018.2850339"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2018.8622018"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--319--16486--1_61"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.2307\/2287012"},{"key":"e_1_3_2_1_9_1","first-page":"179","article-title":"Pearson versus Spearman, Kendall's tau correlation analysis on structure-activity relationships of biologic active compounds","volume":"5","author":"Bolboaca Sorana-Daniela","year":"2006","unstructured":"Sorana-Daniela Bolboaca and Lorentz J\u00e4ntschi. 2006. Pearson versus Spearman, Kendall's tau correlation analysis on structure-activity relationships of biologic active compounds. Leonardo Journal of Sciences 5, 9 (2006), 179--200. http:\/\/ljs.academicdirect.org\/A09\/179_200.htm","journal-title":"Leonardo Journal of Sciences"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--319-04936--6_5"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2013.11.024"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/tbdata.2019.2948338"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3358090"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2016.7482079"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLOUD.2018.00038"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1504\/IJBPIM.2015.073665"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/DISTRA.2018.8601018"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2019.8761785"},{"key":"e_1_3_2_1_19_1","volume-title":"Tuneful: An Online Significance-Aware Configuration Tuner for Big Data Analytics. arXiv preprint arXiv:2001.08002","author":"Fekry Ayat","year":"2020","unstructured":"Ayat Fekry, Lucian Carata, Thomas Pasquier, Andrew Rice, and Andy Hopper. 2020. Tuneful: An Online Significance-Aware Configuration Tuner for Big Data Analytics. arXiv preprint arXiv:2001.08002 (2020). arXiv:2001.08002 http:\/\/arxiv.org\/abs\/2001.08002"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2017.2647939"},{"key":"e_1_3_2_1_21_1","volume-title":"Feature extraction: foundations and applications","author":"Guyon Isabelle","year":"1922","unstructured":"Isabelle Guyon, Steve Gunn, Masoud Nikravesh, and Lofti A Zadeh. 2008. Feature extraction: foundations and applications. Vol. 207. Springer. https:\/\/eprints.soton.ac.uk\/261922\/"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--642--39678--6_24"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0951--8320(03)00058--9"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3381027"},{"key":"e_1_3_2_1_25_1","unstructured":"Matthew Hoffman Eric Brochu Nando de Freitas et al. 2011. Portfolio Allocation for Bayesian Optimization. In UAI. Citeseer 327--336. https:\/\/dl.acm.org\/doi\/abs\/10.5555\/3020548.3020587"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2018.00070"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDEW.2010.5452747"},{"key":"e_1_3_2_1_28_1","volume-title":"Evaluating Hive and Spark SQL with BigBench. arXiv preprint arXiv:1512.08417","author":"Ivanov Todor","year":"2015","unstructured":"Todor Ivanov and Max-Georg Beer. 2015. Evaluating Hive and Spark SQL with BigBench. arXiv preprint arXiv:1512.08417 (2015). arXiv:1512.08417 http:\/\/arxiv.org\/abs\/1512.08417"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2967938.2967957"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1008306431147"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3-030--33495--6_34"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3380591"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.14778\/3352063.3352129"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.15835\/nbha4319881"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1049\/cp.2015.0832"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2018.00056"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--94-009-0909-0"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--319--47898--2_24"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/PADSW.2018.8644891"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--540--28650--9_4"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.5815\/ijeme.2020.04.02"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2019.00196"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2015.2494218"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--3--319--72401-0_10"},{"key":"e_1_3_2_1_45_1","volume-title":"Weinberger (Eds.)","volume":"25","author":"Snoek Jasper","year":"2012","unstructured":"Jasper Snoek, Hugo Larochelle, and Ryan P Adams. 2012. Practical Bayesian Optimization of Machine Learning Algorithms. In Advances in Neural Information Processing Systems, F. Pereira, C. J. C. Burges, L. Bottou, and K. Q. Weinberger (Eds.), Vol. 25. Curran Associates, Inc. https:\/\/proceedings.neurips.cc\/paper\/2012\/file\/05311655a15b75fab86956663e1819cd-Paper.pdf"},{"key":"e_1_3_2_1_46_1","volume-title":"Retrieved","year":"2022","unstructured":"SparkConf 2022. Configuration - Spark 3.2.1 Documentation. Retrieved March 28, 2022 from https:\/\/spark.apache.org\/docs\/latest\/configuration.html"},{"key":"e_1_3_2_1_47_1","volume-title":"Retrieved","year":"2022","unstructured":"SparkTuning 2022. Tuning - Spark 3.2.1 Documentation. Retrieved March 28, 2022 from https:\/\/spark.apache.org\/docs\/latest\/tuning.html"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1007\/3--540--47987--2_41"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.14778\/1687553.1687609"},{"key":"e_1_3_2_1_50_1","unstructured":"TPC Benchmark DS. 2020. http:\/\/www.tpc.org\/tpc_documents_current_versions\\\/pdf\/tpc-ds_v2.3.0.pdf."},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1145\/2523616.2523633"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1590\/0103--8478cr20160946"},{"key":"e_1_3_2_1_53_1","volume-title":"Ernest: Efficient Performance Prediction for Large-Scale Advanced Analytics. In 13th USENIX Symposium on Networked Systems Design and Implementation (NSDI 16)","author":"Venkataraman Shivaram","year":"2016","unstructured":"Shivaram Venkataraman, Zongheng Yang, Michael Franklin, Benjamin Recht, and Ion Stoica. 2016. Ernest: Efficient Performance Prediction for Large-Scale Advanced Analytics. In 13th USENIX Symposium on Networked Systems Design and Implementation (NSDI 16). USENIX Association, Santa Clara, CA, 363--378. https:\/\/www.usenix.org\/conference\/nsdi16\/technical-sessions\/presentation\/venkataraman"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC-SmartCity-DSS.2016.0088"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC-CSS-ICESS.2015.246"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1109\/34.735807"},{"key":"e_1_3_2_1_57_1","volume-title":"LOCAT: Low-Overhead Online Configuration Auto-Tuning of Spark SQL Applications. arXiv:2203.14889 [cs.DC] https:\/\/arxiv.org\/abs\/2203.14889","author":"Xin Jinhan","year":"2022","unstructured":"Jinhan Xin, Kai Hwang, and Zhibin Yu. 2022. LOCAT: Low-Overhead Online Configuration Auto-Tuning of Spark SQL Applications. arXiv:2203.14889 [cs.DC] https:\/\/arxiv.org\/abs\/2203.14889"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1145\/3296957.3173187"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2017.8257950"},{"key":"e_1_3_2_1_60_1","volume-title":"Proceedings of the 2nd USENIX Conference on Hot Topics in Cloud Computing","author":"Zaharia Matei","year":"2010","unstructured":"Matei Zaharia, Mosharaf Chowdhury, Michael J. Franklin, Scott Shenker, and Ion Stoica. 2010. Spark: Cluster Computing with Working Sets. In Proceedings of the 2nd USENIX Conference on Hot Topics in Cloud Computing (Boston, MA) (HotCloud'10). USENIX Association, USA, 10. https:\/\/dl.acm.org\/doi\/abs\/10.5555\/1863103.1863113"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1002\/0470011815.b2a15150"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.38094\/jastt1224"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3300085"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1109\/SmartCloud.2016.33"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1145\/3127479.3128605"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2017.07.003"}],"event":{"name":"SIGMOD\/PODS '22: International Conference on Management of Data","location":"Philadelphia PA USA","acronym":"SIGMOD\/PODS '22","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 2022 International Conference on Management of Data"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3514221.3526157","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3514221.3526157","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T18:10:13Z","timestamp":1750183813000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3514221.3526157"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,6,10]]},"references-count":66,"alternative-id":["10.1145\/3514221.3526157","10.1145\/3514221"],"URL":"https:\/\/doi.org\/10.1145\/3514221.3526157","relation":{},"subject":[],"published":{"date-parts":[[2022,6,10]]},"assertion":[{"value":"2022-06-11","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}