{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T22:33:53Z","timestamp":1743028433021,"version":"3.40.3"},"publisher-location":"Cham","reference-count":22,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031812255"},{"type":"electronic","value":"9783031812262"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-81226-2_24","type":"book-chapter","created":{"date-parts":[[2025,2,5]],"date-time":"2025-02-05T16:19:17Z","timestamp":1738772357000},"page":"275-285","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Strainer: Windowing-Based Advanced Sampling in\u00a0Stream Processing Systems"],"prefix":"10.1007","author":[{"given":"Nikola","family":"Koevski","sequence":"first","affiliation":[]},{"given":"S\u00e9rgio","family":"Esteves","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9285-0736","authenticated-orcid":false,"given":"Lu\u00eds","family":"Veiga","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,6]]},"reference":[{"key":"24_CR1","doi-asserted-by":"crossref","unstructured":"Acharya, S., Gibbons, P.B., Poosala, V.: Congressional samples for approximate answering of group-by queries. In: Proceedings of the 2000 ACM SIGMOD International Conference on Management of Data, SIGMOD \u201900, pp. 487\u2013498. ACM, New York (2000)","DOI":"10.1145\/342009.335450"},{"key":"24_CR2","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Das, G., Datar, M., Motwani, R., Narasayya, V.: Overcoming limitations of sampling for aggregation queries. In: Proceedings of the 17th International Conference on Data Engineering, pp. 534\u2013542. IEEE (2001)","DOI":"10.1109\/ICDE.2001.914867"},{"issue":"1","key":"24_CR3","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1186\/s40537-022-00565-8","volume":"9","author":"ME Coimbra","year":"2022","unstructured":"Coimbra, M.E., Esteves, S., Francisco, A.P., Veiga, L.: Veilgraph: incremental graph stream processing. J. Big Data 9(1), 23 (2022)","journal-title":"J. Big Data"},{"key":"24_CR4","doi-asserted-by":"crossref","unstructured":"Cormode, G., Duffield, N.: Sampling for big data: A tutorial. In Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2014, pp. 1975\u20131975, New York, NY, USA, (2014)","DOI":"10.1145\/2623330.2630811"},{"key":"24_CR5","doi-asserted-by":"crossref","unstructured":"Das, T., Zhong, Y., Stoica, I., Shenker, S.: Adaptive stream processing using dynamic batch sizing. In: Proceedings of the ACM Symposium on Cloud Computing, SOCC \u201914, pp. 16:1\u201316:13. ACM, New York ( 2014)","DOI":"10.1145\/2670979.2670995"},{"key":"24_CR6","doi-asserted-by":"crossref","unstructured":"Esteves, S., Galhardas, H., Veiga, L.: Adaptive execution of continuous and data-intensive workflows with machine learning. In: Proceedings of the 19th International Middleware Conference, Middleware \u201918, pp. 239\u2013252. Association for Computing Machinery, New York (2018)","DOI":"10.1145\/3274808.3274827"},{"key":"24_CR7","unstructured":"Gibbons, P.B.: Distinct sampling for highly-accurate answers to distinct values queries and event reports. In: Proceedings of the 27th International Conference on Very Large Data Bases, VLDB \u201901, pp. 541\u2013550. Morgan Kaufmann Publishers Inc., San Francisco (2001)"},{"key":"24_CR8","doi-asserted-by":"crossref","unstructured":"Gibbons, P.B., Matias, Y.: New sampling-based summary statistics for improving approximate query answers. In: Proceedings of the 1998 ACM SIGMOD International Conference on Management of Data, SIGMOD \u201998, pp. 331\u2013342. ACM, New York (1998)","DOI":"10.1145\/276304.276334"},{"key":"24_CR9","doi-asserted-by":"crossref","unstructured":"Goiri, I., Bianchini, R.,\u00a0Nagarakatte, S., Nguyen, T.D.: Approxhadoop: Bringing approximations to mapreduce frameworks. In Proceedings of the Twentieth International Conference on Architectural Support for Programming Languages and Operating Systems, ASPLOS \u201915, pp. 383\u2013397. ACM, New York (2015)","DOI":"10.1145\/2694344.2694351"},{"key":"24_CR10","doi-asserted-by":"crossref","unstructured":"Ha, S.-H., Brown, P., Michiardi, P.: Resource management for parallel processing frameworks with load awareness at worker side. In: 2017 IEEE International Congress on Big Data (BigData Congress), pp. 161\u2013168. IEEE (2017)","DOI":"10.1109\/BigDataCongress.2017.30"},{"key":"24_CR11","doi-asserted-by":"crossref","unstructured":"Hu, W.,\u00a0Zhang, B.: Study of sampling techniques and algorithms in data stream environments. In 2012 9th International Conference on Fuzzy Systems and Knowledge Discovery (FSKD), pp. 1028\u20131034. IEEE (2012)","DOI":"10.1109\/FSKD.2012.6234278"},{"key":"24_CR12","doi-asserted-by":"crossref","unstructured":"Krishnan, D.R., Quoc, D.L., Bhatotia, P., Fetzer, C., Rodrigues, R.: Incapprox: a data analytics system for incremental approximate computing. In: Proceedings of the 25th International Conference on World Wide Web, WWW \u201916, pp. 1133\u20131144, Republic and Canton of Geneva, Switzerland, 2016. International World Wide Web Conferences Steering Committee","DOI":"10.1145\/2872427.2883026"},{"key":"24_CR13","doi-asserted-by":"crossref","unstructured":"Liu, C.-M., Liao, K.-T.: Efficiently predicting frequent patterns over uncertain data streams. Procedia Comput. Sci. 160, 15 \u2013 22 (2019). The 10th International Conference on Emerging Ubiquitous Systems and Pervasive Networks (EUSPN-2019) \/ The 9th International Conference on Current and Future Trends of Information and Communication Technologies in Healthcare (ICTH-2019) \/ Affiliated Workshops","DOI":"10.1016\/j.procs.2019.09.438"},{"issue":"12","key":"24_CR14","doi-asserted-by":"publisher","first-page":"1970","DOI":"10.14778\/3352063.3352112","volume":"12","author":"J Lu","year":"2019","unstructured":"Lu, J., Chen, Y., Herodotou, H., Babu, S.: Speedup your analytics: Automatic parameter tuning for databases and big data systems. Proc. VLDB Endow. 12(12), 1970\u20131973 (2019)","journal-title":"Proc. VLDB Endow."},{"issue":"2","key":"24_CR15","doi-asserted-by":"publisher","first-page":"989","DOI":"10.1007\/s10462-019-09685-9","volume":"53","author":"A Mohamed","year":"2020","unstructured":"Mohamed, A., Najafabadi, M.K., Wah, Y.B., Zaman, E.A.K., Maskat, R.: The state of the art and taxonomy of big data analytics: view from new big data framework. Artif. Intell. Rev. 53(2), 989\u20131037 (2020)","journal-title":"Artif. Intell. Rev."},{"key":"24_CR16","doi-asserted-by":"crossref","unstructured":"Morais, B., Coimbra, M.E., Veiga, L.: pk-graph: Partitioned k 2-trees to enable compact and dynamic graphs in spark graphx. In: International Conference on Cooperative Information Systems, pp. 149\u2013167. Springer (2022)","DOI":"10.1007\/978-3-031-17834-4_9"},{"key":"24_CR17","series-title":"Cloud and Grid Computing (CCGRID)","first-page":"312","volume-title":"2019 19th IEEE\/ACM International Symposium on Cluster","author":"O Runsewe","year":"2019","unstructured":"Runsewe, O., Samaan, N.: Cram: a container resource allocation mechanism for big data streaming applications. In: 2019 19th IEEE\/ACM International Symposium on Cluster. Cloud and Grid Computing (CCGRID), pp. 312\u2013320. IEEE Computer Society, Los Alamitos (2019)"},{"key":"24_CR18","doi-asserted-by":"crossref","unstructured":"Shukla, A., Simmhan, Y.L.: Model-driven scheduling for distributed stream processing systems. CoRR, abs\/1702.01785 (2017)","DOI":"10.1002\/cpe.4257"},{"key":"24_CR19","doi-asserted-by":"crossref","unstructured":"Sun, L., Franklin, M.J., Krishnan, S., Xin, R.S.: Fine-grained partitioning for aggressive data skipping. In: Proceedings of the 2014 ACM SIGMOD International Conference on Management of Data, SIGMOD \u201914, pp. 1115\u20131126. ACM, New York (2014)","DOI":"10.1145\/2588555.2610515"},{"key":"24_CR20","unstructured":"Tatbul, N., \u00c7etintemel, U., Zdonik, S.: Staying fit: Efficient load shedding techniques for distributed stream processing. In: Proceedings of the 33rd International Conference on Very Large Data Bases, VLDB \u201907, pp. 159\u2013170. VLDB Endowment (2007)"},{"key":"24_CR21","unstructured":"Tatbul, N., Zdonik, S.: Window-aware load shedding for aggregation queries over data streams. In: Proceedings of the 32Nd International Conference on Very Large Data Bases, VLDB \u201906, pp. 799\u2013810. VLDB Endowment (2006)"},{"issue":"1","key":"24_CR22","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1145\/3147.3165","volume":"11","author":"JS Vitter","year":"1985","unstructured":"Vitter, J.S.: Random sampling with a reservoir. ACM Trans. Math. Softw. 11(1), 37\u201357 (1985)","journal-title":"ACM Trans. Math. Softw."}],"container-title":["Lecture Notes in Computer Science","Economics of Grids, Clouds, Systems, and Services"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-81226-2_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,5]],"date-time":"2025-02-05T16:19:34Z","timestamp":1738772374000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-81226-2_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031812255","9783031812262"],"references-count":22,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-81226-2_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"6 February 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"GECON","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on the Economics of Grids, Clouds, Systems, and Services","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Rome","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"gecon2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/gecon2024.gecon-conference.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}