{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T21:17:58Z","timestamp":1743110278915,"version":"3.40.3"},"publisher-location":"Cham","reference-count":51,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031151156"},{"type":"electronic","value":"9783031151163"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-15116-3_1","type":"book-chapter","created":{"date-parts":[[2022,8,18]],"date-time":"2022-08-18T17:17:53Z","timestamp":1660843073000},"page":"3-21","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Serving Hybrid-Cloud SQL Interactive Queries at\u00a0Twitter"],"prefix":"10.1007","author":[{"given":"Chunxu","family":"Tang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Beinan","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huijun","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenzhao","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yao","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vrushali","family":"Channapattan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenxiao","family":"Luo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruchin","family":"Kabra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mainak","family":"Ghosh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nikhil Kantibhai","family":"Navadiya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Prachi","family":"Mishra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Prateek","family":"Mukhedkar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anneliese","family":"Lu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,8,19]]},"reference":[{"unstructured":"Aurora configuration (2017). http:\/\/aurora.apache.org\/documentation\/latest\/reference\/configuration-tutorial\/","key":"1_CR1"},{"unstructured":"Apache Beam SQL (2021). https:\/\/beam.apache.org\/documentation\/dsls\/sql\/overview\/","key":"1_CR2"},{"unstructured":"Apache Druid SQL (2021). https:\/\/druid.apache.org\/docs\/latest\/querying\/sql.html","key":"1_CR3"},{"unstructured":"Apache Zeppelin (2021). https:\/\/zeppelin.apache.org\/","key":"1_CR4"},{"unstructured":"Google BigQuery (2021). https:\/\/cloud.google.com\/bigquery","key":"1_CR5"},{"unstructured":"Hadoop ViewFs (2021). https:\/\/hadoop.apache.org\/docs\/stable\/hadoop-project-dist\/hadoop-hdfs\/ViewFs.html","key":"1_CR6"},{"unstructured":"Helium packages (2021). https:\/\/zeppelin.apache.org\/helium_packages.html","key":"1_CR7"},{"unstructured":"Jupyter project (2021). https:\/\/jupyter.org\/","key":"1_CR8"},{"unstructured":"TPC-H benchmark (2021). http:\/\/www.tpc.org\/tpch\/","key":"1_CR9"},{"unstructured":"Agrawal, P.: A new collaboration with Google Cloud (2018). https:\/\/blog.twitter.com\/engineering\/en_us\/topics\/infrastructure\/2018\/a-new-collaboration-with-google-cloud.html","key":"1_CR10"},{"issue":"12","key":"1_CR11","doi-asserted-by":"publisher","first-page":"3204","DOI":"10.14778\/3415478.3415545","volume":"13","author":"J Aguilar-Saborit","year":"2020","unstructured":"Aguilar-Saborit, J., et al.: POLARIS: the distributed SQL engine in azure synapse. Proc. VLDB Endow. 13(12), 3204\u20133216 (2020)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Aleyasen, A., Soliman, M.A., Antova, L., Waas, F.M., Winslett, M.: High-throughput adaptive data virtualization via context-aware query routing. In: 2018 IEEE International Conference on Big Data (Big Data), pp. 1709\u20131718. IEEE (2018)","key":"1_CR12","DOI":"10.1109\/BigData.2018.8622277"},{"doi-asserted-by":"crossref","unstructured":"Armbrust, M., et al.: Spark SQL: relational data processing in Spark. In: Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data, pp. 1383\u20131394 (2015)","key":"1_CR13","DOI":"10.1145\/2723372.2742797"},{"unstructured":"Barga, R.: Hadoop filesystem at Twitter (2015). https:\/\/blog.twitter.com\/engineering\/en_us\/a\/2015\/hadoop-filesystem-at-twitter","key":"1_CR14"},{"issue":"12","key":"1_CR15","doi-asserted-by":"publisher","first-page":"2022","DOI":"10.14778\/3352063.3352121","volume":"12","author":"B Chattopadhyay","year":"2019","unstructured":"Chattopadhyay, B., et al.: Procella: unifying serving and analytical data at YouTube. Proc. VLDB Endow. 12(12), 2022\u20132034 (2019)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Dageville, B., et al.: The snowflake elastic data warehouse. In: Proceedings of the 2016 International Conference on Management of Data, pp. 215\u2013226 (2016)","key":"1_CR16","DOI":"10.1145\/2882903.2903741"},{"issue":"1","key":"1_CR17","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008)","journal-title":"Commun. ACM"},{"issue":"1","key":"1_CR18","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1145\/1629175.1629198","volume":"53","author":"J Dean","year":"2010","unstructured":"Dean, J., Ghemawat, S.: MapReduce: a flexible data processing tool. Commun. ACM 53(1), 72\u201377 (2010)","journal-title":"Commun. ACM"},{"unstructured":"Dem, J.L.: Graduating apache parquet (2015). https:\/\/blog.twitter.com\/engineering\/en_us\/a\/2015\/graduating-apache-parquet.html","key":"1_CR19"},{"doi-asserted-by":"crossref","unstructured":"Gupta, A., et al.: Amazon redshift and the case for simpler data warehouses. In: Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data, pp. 1917\u20131923 (2015)","key":"1_CR20","DOI":"10.1145\/2723372.2742795"},{"unstructured":"Hashemi, M.: The infrastructure behind Twitter: efficiency and optimization (2016). https:\/\/blog.twitter.com\/engineering\/en_us\/topics\/infrastructure\/2016\/the-infrastructure-behind-twitter-efficiency-and-optimization","key":"1_CR21"},{"unstructured":"Hindman, B., et al.: Mesos: a platform for fine-grained resource sharing in the data center. In: NSDI, vol. 11, p. 22 (2011)","key":"1_CR22"},{"unstructured":"Krishnan, S.: Discovery and consumption of analytics data at Twitter (2016). https:\/\/blog.twitter.com\/engineering\/en_us\/topics\/insights\/2016\/discovery-and-consumption-of-analytics-data-at-twitter.html","key":"1_CR23"},{"issue":"12","key":"1_CR24","doi-asserted-by":"publisher","first-page":"1790","DOI":"10.14778\/2367502.2367518","volume":"5","author":"A Lamb","year":"2012","unstructured":"Lamb, A., et al.: The vertica analytic database: C-store 7 years later. Proc. VLDB Endow. 5(12), 1790\u20131801 (2012)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Lawrence, R.: Integration and virtualization of relational SQL and NoSQL systems including MySQL and MongoDB. In: 2014 International Conference on Computational Science and Computational Intelligence, vol. 1, pp. 285\u2013290. IEEE (2014)","key":"1_CR25","DOI":"10.1109\/CSCI.2014.56"},{"doi-asserted-by":"crossref","unstructured":"Lawrence, R.: Faster querying for database integration and virtualization with distributed semi-joins. In: 2017 International Conference on Computational Science and Computational Intelligence (CSCI), pp. 1406\u20131410. IEEE (2017)","key":"1_CR26","DOI":"10.1109\/CSCI.2017.246"},{"doi-asserted-by":"crossref","unstructured":"Li, Y., et al.: A performance evaluation of spark graphframes for fast and scalable graph analytics at Twitter. In: 2021 IEEE International Conference on Big Data (Big Data), pp. 5959\u20135959. IEEE (2021)","key":"1_CR27","DOI":"10.1109\/BigData52589.2021.9671499"},{"doi-asserted-by":"crossref","unstructured":"Luo, Z., et al.: From batch processing to real time analytics: running presto at scale. In: 2022 IEEE 38th International Conference on Data Engineering (ICDE). IEEE (2022) (in press)","key":"1_CR28","DOI":"10.1109\/ICDE53745.2022.00165"},{"doi-asserted-by":"crossref","unstructured":"Mami, M.N., Graux, D., Scerri, S., Jabeen, H., Auer, S., Lehmann, J.: Uniform access to multiform data lakes using semantic technologies. In: Proceedings of the 21st International Conference on Information Integration and Web-Based Applications & Services, pp. 313\u2013322 (2019)","key":"1_CR29","DOI":"10.1145\/3366030.3366054"},{"issue":"1\u20132","key":"1_CR30","doi-asserted-by":"publisher","first-page":"330","DOI":"10.14778\/1920841.1920886","volume":"3","author":"S Melnik","year":"2010","unstructured":"Melnik, S., et al.: Dremel: interactive analysis of web-scale datasets. Proc. VLDB Endow. 3(1\u20132), 330\u2013339 (2010)","journal-title":"Proc. VLDB Endow."},{"issue":"12","key":"1_CR31","doi-asserted-by":"publisher","first-page":"3461","DOI":"10.14778\/3415478.3415568","volume":"13","author":"S Melnik","year":"2020","unstructured":"Melnik, S., et al.: Dremel: a decade of interactive SQL analysis at web scale. Proc. VLDB Endow. 13(12), 3461\u20133472 (2020)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Mousa, A.H., Shiratuddin, N.: Data warehouse and data virtualization comparative study. In: 2015 International Conference on Developments of E-Systems Engineering (DeSE), pp. 369\u2013372. IEEE (2015)","key":"1_CR32","DOI":"10.1109\/DeSE.2015.26"},{"key":"1_CR33","doi-asserted-by":"publisher","first-page":"419","DOI":"10.1007\/978-1-4842-6186-6_19","volume-title":"BigQuery for Data Warehousing","author":"M Mucchetti","year":"2020","unstructured":"Mucchetti, M.: BigQuery ML. In: Mucchetti, M. (ed.) BigQuery for Data Warehousing, pp. 419\u2013468. Springer, Berkeley (2020). https:\/\/doi.org\/10.1007\/978-1-4842-6186-6_19"},{"unstructured":"Rottinghuis, J.: Partly Cloudy: the start of a journey into the cloud (2019). https:\/\/blog.twitter.com\/engineering\/en_us\/topics\/infrastructure\/2019\/the-start-of-a-journey-into-the-cloud.html","key":"1_CR34"},{"doi-asserted-by":"crossref","unstructured":"Schwarzkopf, M., Konwinski, A., Abd-El-Malek, M., Wilkes, J.: Omega: flexible, scalable schedulers for large compute clusters. In: Proceedings of the 8th ACM European Conference on Computer Systems, pp. 351\u2013364 (2013)","key":"1_CR35","DOI":"10.1145\/2465351.2465386"},{"doi-asserted-by":"crossref","unstructured":"Sethi, R., et al.: Presto: SQL on everything. In: 2019 IEEE 35th International Conference on Data Engineering (ICDE), pp. 1802\u20131813. IEEE (2019)","key":"1_CR36","DOI":"10.1109\/ICDE.2019.00196"},{"issue":"12","key":"1_CR37","doi-asserted-by":"publisher","first-page":"2170","DOI":"10.14778\/3352063.3352133","volume":"12","author":"J Tan","year":"2019","unstructured":"Tan, J., et al.: Choosing a cloud DBMS: architectures and tradeoffs. Proc. VLDB Endow. 12(12), 2170\u20132182 (2019)","journal-title":"Proc. VLDB Endow."},{"unstructured":"Tang, C., et al.: Twine: a unified cluster management system for shared infrastructure. In: 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 2020), pp. 787\u2013803 (2020)","key":"1_CR38"},{"doi-asserted-by":"crossref","unstructured":"Tang, C., et al.: Taming hybrid-cloud fast and scalable graph analytics at Twitter. arXiv preprint arXiv:2204.11338 (2022)","key":"1_CR39","DOI":"10.1109\/GLOBECOM48099.2022.10000674"},{"doi-asserted-by":"crossref","unstructured":"Tang, C., et al.: Forecasting SQL query cost at Twitter. In: 2021 IEEE International Conference on Cloud Engineering (IC2E), pp. 154\u2013160. IEEE (2021)","key":"1_CR40","DOI":"10.1109\/IC2E52221.2021.00030"},{"unstructured":"Tang, C., et al.: Hybrid-cloud SQL federation system at Twitter. In: ECSA (Companion) (2021)","key":"1_CR41"},{"issue":"2","key":"1_CR42","doi-asserted-by":"publisher","first-page":"1626","DOI":"10.14778\/1687553.1687609","volume":"2","author":"A Thusoo","year":"2009","unstructured":"Thusoo, A., et al.: Hive: a warehousing solution over a map-reduce framework. Proc. VLDB Endow. 2(2), 1626\u20131629 (2009)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Tirmazi, M., et al.: Borg: the next generation. In: Proceedings of the Fifteenth European Conference on Computer Systems, pp. 1\u201314 (2020)","key":"1_CR43","DOI":"10.1145\/3342195.3387517"},{"key":"1_CR44","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1016\/j.is.2017.04.002","volume":"69","author":"\u00c1 Vathy-Fogarassy","year":"2017","unstructured":"Vathy-Fogarassy, \u00c1., Hugy\u00e1k, T.: Uniform data access platform for SQL and NoSQL database systems. Inf. Syst. 69, 93\u2013105 (2017)","journal-title":"Inf. Syst."},{"doi-asserted-by":"crossref","unstructured":"Vavilapalli, V.K., et al.: Apache Hadoop YARN: yet another resource negotiator. In: Proceedings of the 4th Annual Symposium on Cloud Computing, pp. 1\u201316 (2013)","key":"1_CR45","DOI":"10.1145\/2523616.2523633"},{"doi-asserted-by":"crossref","unstructured":"Verma, A., Pedrosa, L., Korupolu, M., Oppenheimer, D., Tune, E., Wilkes, J.: Large-scale cluster management at Google with Borg. In: Proceedings of the Tenth European Conference on Computer Systems, pp. 1\u201317 (2015)","key":"1_CR46","DOI":"10.1145\/2741948.2741964"},{"doi-asserted-by":"crossref","unstructured":"VijayaRenu, L., Wang, Z., Rottinghuis, J.: Scaling event aggregation at Twitter to handle billions of events per minute. In: 2020 IEEE Infrastructure Conference, pp. 1\u20134. IEEE (2020)","key":"1_CR47","DOI":"10.1109\/IEEECONF47748.2020.9377618"},{"issue":"12","key":"1_CR48","doi-asserted-by":"publisher","first-page":"3152","DOI":"10.14778\/3415478.3415541","volume":"13","author":"C Wei","year":"2020","unstructured":"Wei, C., et al.: AnalyticDB-V: a hybrid analytical engine towards query fusion for structured and unstructured data. Proc. VLDB Endow. 13(12), 3152\u20133165 (2020)","journal-title":"Proc. VLDB Endow."},{"doi-asserted-by":"crossref","unstructured":"Wu, H., et al.: Migrate on-premises real-time data analytics jobs into the cloud. In: 2021 IEEE 8th International Conference on Data Science and Advanced Analytics (DSAA), pp. 1\u20132. IEEE (2021)","key":"1_CR49","DOI":"10.1109\/DSAA53316.2021.9564177"},{"doi-asserted-by":"crossref","unstructured":"Wu, H., et al.: Move real-time data analytics to the cloud: a case study on heron to dataflow migration. In: 2021 IEEE International Conference on Big Data (Big Data), pp. 2064\u20132067. IEEE (2021)","key":"1_CR50","DOI":"10.1109\/BigData52589.2021.9671294"},{"issue":"12","key":"1_CR51","doi-asserted-by":"publisher","first-page":"2059","DOI":"10.14778\/3352063.3352124","volume":"12","author":"C Zhan","year":"2019","unstructured":"Zhan, C., et al.: AnalyticDB: real-time OLAP database system at Alibaba cloud. Proc. VLDB Endow. 12(12), 2059\u20132070 (2019)","journal-title":"Proc. VLDB Endow."}],"container-title":["Lecture Notes in Computer Science","Software Architecture"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-15116-3_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,15]],"date-time":"2023-02-15T06:00:55Z","timestamp":1676440855000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-15116-3_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031151156","9783031151163"],"references-count":51,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-15116-3_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"19 August 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECSA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Software Architecture","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"V\u00e4xj\u00f6","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Sweden","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 September 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecsa2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/conf.researchr.org\/home\/ecsa-2021","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"58","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"11","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"19% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Workshops were held virtually. For the workshop, 17 papers were submitted and 15 papers were selected.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}