{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:49:09Z","timestamp":1773481749631,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":86,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,10,14]],"date-time":"2017-10-14T00:00:00Z","timestamp":1507939200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,10,14]]},"DOI":"10.1145\/3132747.3132758","type":"proceedings-article","created":{"date-parts":[[2017,10,12]],"date-time":"2017-10-12T12:51:09Z","timestamp":1507812669000},"page":"647-664","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":26,"title":["Low-Latency Analytics on Colossal Data Streams with SummaryStore"],"prefix":"10.1145","author":[{"given":"Nitin","family":"Agrawal","sequence":"first","affiliation":[{"name":"Samsung Research"}]},{"given":"Ashish","family":"Vulimiri","sequence":"additional","affiliation":[{"name":"Samsung Research"}]}],"member":"320","published-online":{"date-parts":[[2017,10,14]]},"reference":[{"key":"e_1_3_2_2_1_1","unstructured":"Green Button Initiative. http\/\/:www.greenbuttondata.org. Green Button Initiative. http\/\/:www.greenbuttondata.org."},{"key":"e_1_3_2_2_2_1","unstructured":"Protocol Buffers. http:\/\/code.google.com\/p\/protobuf. Protocol Buffers. http:\/\/code.google.com\/p\/protobuf."},{"key":"e_1_3_2_2_3_1","unstructured":"Stratified sampling. Wikipedia. Posted at https:\/\/en.wikipedia.org\/wiki\/Stratified_sampling#Disadvantages. Stratified sampling. Wikipedia. Posted at https:\/\/en.wikipedia.org\/wiki\/Stratified_sampling#Disadvantages."},{"key":"e_1_3_2_2_4_1","unstructured":"Three sigma rule. Wikipedia. Posted at https:\/\/en.wikipedia.org\/wiki\/Three_sigma_rule. Three sigma rule. Wikipedia. Posted at https:\/\/en.wikipedia.org\/wiki\/Three_sigma_rule."},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"crossref","unstructured":"Introducing Kale. https:\/\/codeascraft.com\/2013\/06\/11\/introducing-kale\/ 2013. Introducing Kale. https:\/\/codeascraft.com\/2013\/06\/11\/introducing-kale\/ 2013.","DOI":"10.1063\/pt.4.2491"},{"key":"e_1_3_2_2_6_1","unstructured":"Ganglia Monitoring System. http:\/\/ganglia.info\/ 2016. Ganglia Monitoring System. http:\/\/ganglia.info\/ 2016."},{"key":"e_1_3_2_2_7_1","unstructured":"IBM Informix TimeSeries. https:\/\/www-01.ibm.com\/software\/data\/informix\/timeseries 2016. IBM Informix TimeSeries. https:\/\/www-01.ibm.com\/software\/data\/informix\/timeseries 2016."},{"key":"e_1_3_2_2_8_1","unstructured":"InfluxDB:Downsampling and Data Retention. https:\/\/docs.influxdata.com\/influxdb\/v0.9\/guides\/downsampling_and_retention\/ 2016. InfluxDB:Downsampling and Data Retention. https:\/\/docs.influxdata.com\/influxdb\/v0.9\/guides\/downsampling_and_retention\/ 2016."},{"key":"e_1_3_2_2_9_1","unstructured":"Netflix Atlas time-series telemetry platform. https:\/\/github.com\/Netflix\/atlas 2016. Netflix Atlas time-series telemetry platform. https:\/\/github.com\/Netflix\/atlas 2016."},{"key":"e_1_3_2_2_10_1","unstructured":"Netflix Edda. https:\/\/github.com\/Netflix\/edda 2016. Netflix Edda. https:\/\/github.com\/Netflix\/edda 2016."},{"key":"e_1_3_2_2_11_1","unstructured":"SQL for IBM Tivoli Storage Manager. http:\/\/thobias.org\/tsm\/sql\/ 2016. SQL for IBM Tivoli Storage Manager. http:\/\/thobias.org\/tsm\/sql\/ 2016."},{"key":"e_1_3_2_2_12_1","unstructured":"Multivariate normal distribution. https:\/\/en.wikipedia.org\/wiki\/Multivariate_normal_distribution 2017. Multivariate normal distribution. https:\/\/en.wikipedia.org\/wiki\/Multivariate_normal_distribution 2017."},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/1055709.1055714"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/2500128"},{"key":"e_1_3_2_2_15_1","first-page":"337","volume-title":"12th USENIX Symposium on Networked Systems Design and Implementation (NSDI15)","author":"Agarwal R.","year":"2015"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2593667"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/2465351.2465355"},{"key":"e_1_3_2_2_18_1","first-page":"39","volume-title":"14th USENIX Conference on File and Storage Technologies (FAST 16)","author":"Andersen M. P.","year":"2016"},{"key":"e_1_3_2_2_19_1","first-page":"13","volume-title":"KDD workshop on temporal data mining","volume":"1","author":"Antunes CM.","year":"2001"},{"key":"e_1_3_2_2_20_1","unstructured":"Apache. Apache Commons Math library. http:\/\/commons.apache. org\/proper\/commons-math\/ 2016. Apache. Apache Commons Math library. http:\/\/commons.apache. org\/proper\/commons-math\/ 2016."},{"key":"e_1_3_2_2_21_1","unstructured":"P. Bailis D. Narayanan and S. Madden. Macrobase: Analytic monitoring for the internet of things. arXivpreprint arXiv: 1603.00567 2016. P. Bailis D. Narayanan and S. Madden. Macrobase: Analytic monitoring for the internet of things. arXivpreprint arXiv: 1603.00567 2016."},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/277858.277897"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/1345448.1345465"},{"key":"e_1_3_2_2_24_1","volume-title":"Workshop on Hot Topics in System Dependability (HotDep)","author":"Bhagwan R.","year":"2005"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/11841036_16"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/362686.362692"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2003.814614"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1137\/0916069"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11257-012-9136-x"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2168836.2168854"},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.1016\/S1389-1286(99)00018-3"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/773153.773175"},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/1376916.1376930"},{"key":"e_1_3_2_2_34_1","unstructured":"C. Cortes and D. Pregibon. Giga-mining. C. Cortes and D. Pregibon. Giga-mining."},{"key":"e_1_3_2_2_35_1","unstructured":"Cory Watson. Observability at Twitter. https:\/\/blog.twitter.com\/2013\/observability-at-twitter 2013. Cory Watson. Observability at Twitter. https:\/\/blog.twitter.com\/2013\/observability-at-twitter 2013."},{"key":"e_1_3_2_2_36_1","volume-title":"Methuen","author":"Cox D. R.","year":"1962"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/90.650143"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/2806777.2806839"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1137\/S0097539701398363"},{"key":"e_1_3_2_2_40_1","volume-title":"NSDI","author":"Dawson-Haggerty S.","year":"2013"},{"key":"e_1_3_2_2_41_1","unstructured":"Dennis Shasha. Time Series in Finance: the array database approach. http:\/\/cs.nyu.edu\/shasha\/papers\/jagtalk.html 1997. Dennis Shasha. Time Series in Finance: the array database approach. http:\/\/cs.nyu.edu\/shasha\/papers\/jagtalk.html 1997."},{"key":"e_1_3_2_2_42_1","first-page":"45","volume-title":"USENIX Annual Technical Conference","author":"Desnoyers P.","year":"2007"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/1133572.1133593"},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/1823844.1823853"},{"key":"e_1_3_2_2_45_1","unstructured":"Federal Reserve Economic Data. https:\/\/en.wikipedia.org\/wiki\/Federal_Reserve_Economic_Data 2017. Federal Reserve Economic Data. https:\/\/en.wikipedia.org\/wiki\/Federal_Reserve_Economic_Data 2017."},{"key":"e_1_3_2_2_46_1","first-page":"243","volume-title":"11th USENIX Symposium on Networked Systems Design and Implementation (NSDI 14)","author":"Gupta T","year":"2014"},{"key":"e_1_3_2_2_47_1","volume-title":"Proc. of Symposium on Simulation for Architecture and Urban Design","author":"Hailemariam E.","year":"2011"},{"key":"e_1_3_2_2_48_1","unstructured":"Price Trends: Internal Hard Drives. https:\/\/pcpartpicker.com\/trends\/internal-hard-drive\/. Price Trends: Internal Hard Drives. https:\/\/pcpartpicker.com\/trends\/internal-hard-drive\/."},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/253260.253274"},{"key":"e_1_3_2_2_50_1","unstructured":"InfluxData. Influxdb time-series database. http:\/\/influxdb.com 2015. InfluxData. Influxdb time-series database. http:\/\/influxdb.com 2015."},{"key":"e_1_3_2_2_51_1","unstructured":"K. J. Jacob and D. Shasha. Fintime -- a financial benchmark. K. J. Jacob and D. Shasha. Fintime -- a financial benchmark."},{"key":"e_1_3_2_2_52_1","unstructured":"Jamie Wilkinson. Google Prometheus: A practical guide to alerting at scale. https:\/\/docs.google.com\/presentation\/d\/1X1rKozAUuF2MVc1YXElFWq9wkcWv3Axdldl8LOH9Vik\/edit#slide=id.g598ef96a6_0_341 2016. Jamie Wilkinson. Google Prometheus: A practical guide to alerting at scale. https:\/\/docs.google.com\/presentation\/d\/1X1rKozAUuF2MVc1YXElFWq9wkcWv3Axdldl8LOH9Vik\/edit#slide=id.g598ef96a6_0_341 2016."},{"key":"e_1_3_2_2_53_1","unstructured":"Jason Kincaid. Facebook EdgeRank: The Secret Sauce That Makes Facebook's News Feed Tick. https:\/\/techcrunch.com\/2010\/04\/22\/facebook-edgerank 2010. Jason Kincaid. Facebook EdgeRank: The Secret Sauce That Makes Facebook's News Feed Tick. https:\/\/techcrunch.com\/2010\/04\/22\/facebook-edgerank 2010."},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"crossref","unstructured":"S. Kandula A. Shanbhag A. Vitorovic M. Olma R. Grandl S. Chaudhuri and B. Ding. Quickr: Lazily approximating complex adhoc queries in bigdata clusters. 2016. S. Kandula A. Shanbhag A. Vitorovic M. Olma R. Grandl S. Chaudhuri and B. Ding. Quickr: Lazily approximating complex adhoc queries in bigdata clusters. 2016.","DOI":"10.1145\/2882903.2882940"},{"key":"e_1_3_2_2_55_1","first-page":"485","volume-title":"13th USENIX Symposium on Networked Systems Design and Implementation (NSDI16)","author":"Khandelwal A.","year":"2016"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/1557019.1557072"},{"key":"e_1_3_2_2_57_1","unstructured":"D. M. Lane. Online statistics education: A multimedia course of study. http:\/\/onlinestatbook.com\/. D. M. Lane. Online statistics education: A multimedia course of study. http:\/\/onlinestatbook.com\/."},{"key":"e_1_3_2_2_58_1","first-page":"229","volume-title":"15th USENIX Conference on File and Storage Technologies (FAST 17)","author":"Lautenschlager F.","year":"2017"},{"key":"e_1_3_2_2_59_1","unstructured":"D. Leary. Nimble Storage Blog: Why Does Enterprise Storage Cost So Much?. https:\/\/www.nimblestorage.com\/blog\/why-does-enterprise-storage-cost-so-much\/ 2010. D. Leary. Nimble Storage Blog: Why Does Enterprise Storage Cost So Much?. https:\/\/www.nimblestorage.com\/blog\/why-does-enterprise-storage-cost-so-much\/ 2010."},{"key":"e_1_3_2_2_60_1","doi-asserted-by":"publisher","DOI":"10.1145\/1772690.1772758"},{"key":"e_1_3_2_2_61_1","unstructured":"Mike Keane. 1.5 million Log Lines per Second. http\/\/:www.bigdataeverywhere.com\/files\/chicago\/BDE-15millionLogLinesPerSecond-KEANE.pdf 2014. Mike Keane. 1.5 million Log Lines per Second. http\/\/:www.bigdataeverywhere.com\/files\/chicago\/BDE-15millionLogLinesPerSecond-KEANE.pdf 2014."},{"key":"e_1_3_2_2_62_1","volume-title":"DTIC Document","author":"Mitchell T","year":"2010"},{"key":"e_1_3_2_2_63_1","unstructured":"M. Natrella. NIST\/SEMATECH e-handbook of statistical methods. 2010. M. Natrella. NIST\/SEMATECH e-handbook of statistical methods. 2010."},{"key":"e_1_3_2_2_64_1","unstructured":"NOAA Global Surface Summary of the Day Weather Data. https:\/\/cloud.google.com\/bigquery\/public-data\/noaa-gsod. NOAA Global Surface Summary of the Day Weather Data. https:\/\/cloud.google.com\/bigquery\/public-data\/noaa-gsod."},{"key":"e_1_3_2_2_65_1","volume-title":"Cengage Learning","author":"Peck R.","year":"2015"},{"key":"e_1_3_2_2_66_1","doi-asserted-by":"publisher","DOI":"10.14778\/2824032.2824078"},{"key":"e_1_3_2_2_67_1","unstructured":"Power Law. https:\/\/en.wikipedia.org\/wiki\/Power_law. Power Law. https:\/\/en.wikipedia.org\/wiki\/Power_law."},{"key":"e_1_3_2_2_68_1","unstructured":"Prophet: forecasting at scale. https:\/\/research.fb.com\/prophet-forecasting-at-scale\/ Feb 2017. Prophet: forecasting at scale. https:\/\/research.fb.com\/prophet-forecasting-at-scale\/ Feb 2017."},{"key":"e_1_3_2_2_69_1","first-page":"275","volume-title":"11th USENIX Symposium on Networked Systems Design andImplemen-tation (NSDI 14)","author":"Rabkin A.","year":"2014"},{"key":"e_1_3_2_2_70_1","doi-asserted-by":"publisher","DOI":"10.1145\/1689239.1689243"},{"key":"e_1_3_2_2_71_1","volume-title":"Google Inc.","author":"Reiss C.","year":"2011"},{"key":"e_1_3_2_2_72_1","unstructured":"RocksDB. RocksDB. http:\/\/rocksdb.org\/ 2016. RocksDB. RocksDB. http:\/\/rocksdb.org\/ 2016."},{"key":"e_1_3_2_2_73_1","first-page":"127","volume-title":"HotOS","author":"Roscoe T","year":"2003"},{"key":"e_1_3_2_2_74_1","unstructured":"B. Sigoure. Opentsdb scalable time series database (tsdb). http:\/\/opentsdb.net 2012. B. Sigoure. Opentsdb scalable time series database (tsdb). http:\/\/opentsdb.net 2012."},{"key":"e_1_3_2_2_75_1","doi-asserted-by":"publisher","DOI":"10.1145\/2487166.2487174"},{"key":"e_1_3_2_2_76_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1022633531479"},{"key":"e_1_3_2_2_77_1","doi-asserted-by":"crossref","unstructured":"S. J. Taylor and B. Letham. Facebook open source project: Forecasting at scale. https:\/\/github.com\/facebookincubator\/prophet 2017. S. J. Taylor and B. Letham. Facebook open source project: Forecasting at scale. https:\/\/github.com\/facebookincubator\/prophet 2017.","DOI":"10.7287\/peerj.preprints.3190v2"},{"key":"e_1_3_2_2_78_1","unstructured":"Ted Friedman. Gartner Report: \"Internet of Things: Biggest Impact Ever on Information and Master Data\". http\/\/:www.gartner.com\/webinar\/3291728?srcId=1-7389946120 2016. Ted Friedman. Gartner Report: \"Internet of Things: Biggest Impact Ever on Information and Master Data\". http\/\/:www.gartner.com\/webinar\/3291728?srcId=1-7389946120 2016."},{"key":"e_1_3_2_2_79_1","volume-title":"Springer Science & Business Media","author":"Thrun S.","year":"2012"},{"key":"e_1_3_2_2_80_1","unstructured":"M. van Rijmenam. Self-driving cars will create 2 petabytes of data what are the big data opportunities for the car industry? https:\/\/datafloq.com\/read\/self-driving-cars-create-2-petabytes-data-annually\/172 2017. M. van Rijmenam. Self-driving cars will create 2 petabytes of data what are the big data opportunities for the car industry? https:\/\/datafloq.com\/read\/self-driving-cars-create-2-petabytes-data-annually\/172 2017."},{"key":"e_1_3_2_2_81_1","doi-asserted-by":"publisher","DOI":"10.1145\/3147.3165"},{"key":"e_1_3_2_2_82_1","volume-title":"FAST","author":"Wallace G","year":"2012"},{"key":"e_1_3_2_2_83_1","unstructured":"W. W.-S. Wei. Time series analysis. Addison-Wesley publ Reading 1994. W. W.-S. Wei. Time series analysis. Addison-Wesley publ Reading 1994."},{"key":"e_1_3_2_2_84_1","unstructured":"Wikipedia Traffic Statistics V2. https:\/\/aws.amazon.com\/datasets\/wikipedia-traffic-statistics-v2\/. Wikipedia Traffic Statistics V2. https:\/\/aws.amazon.com\/datasets\/wikipedia-traffic-statistics-v2\/."},{"key":"e_1_3_2_2_85_1","unstructured":"J. Wilkes. More Google cluster data. Google research blog. Posted at http:\/\/googleresearch.blogspot.com\/2011\/11\/more-google-cluster-data.html. J. Wilkes. More Google cluster data. Google research blog. Posted at http:\/\/googleresearch.blogspot.com\/2011\/11\/more-google-cluster-data.html."},{"key":"e_1_3_2_2_86_1","first-page":"2","volume-title":"Proceedings of the 2012 Symposium on Simulation for Architecture and Urban Design","author":"Yang Z."}],"event":{"name":"SOSP '17: ACM SIGOPS 26th Symposium on Operating Systems Principles","location":"Shanghai China","acronym":"SOSP '17","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems","USENIX Assoc USENIX Assoc"]},"container-title":["Proceedings of the 26th Symposium on Operating Systems Principles"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3132747.3132758","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3132747.3132758","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,26]],"date-time":"2025-06-26T11:23:32Z","timestamp":1750937012000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3132747.3132758"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,10,14]]},"references-count":86,"alternative-id":["10.1145\/3132747.3132758","10.1145\/3132747"],"URL":"https:\/\/doi.org\/10.1145\/3132747.3132758","relation":{},"subject":[],"published":{"date-parts":[[2017,10,14]]},"assertion":[{"value":"2017-10-14","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}