{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T05:05:27Z","timestamp":1780376727120,"version":"3.54.1"},"reference-count":84,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2019,9,3]],"date-time":"2019-09-03T00:00:00Z","timestamp":1567468800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2019,9,3]],"date-time":"2019-09-03T00:00:00Z","timestamp":1567468800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["The VLDB Journal"],"published-print":{"date-parts":[[2019,10]]},"DOI":"10.1007\/s00778-019-00565-w","type":"journal-article","created":{"date-parts":[[2019,9,3]],"date-time":"2019-09-03T09:03:23Z","timestamp":1567501403000},"page":"821-846","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["On the performance and convergence of distributed stream processing via approximate fault tolerance"],"prefix":"10.1007","volume":"28","author":[{"given":"Zhinan","family":"Cheng","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qun","family":"Huang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4501-4364","authenticated-orcid":false,"given":"Patrick P. C.","family":"Lee","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2019,9,3]]},"reference":[{"key":"565_CR1","doi-asserted-by":"publisher","first-page":"120","DOI":"10.1007\/s00778-003-0095-z","volume":"12","author":"DJ Abadi","year":"2003","unstructured":"Abadi, D.J., Carney, D., Cetintemel, U., Cherniack, M., Convey, C., Lee, S., Stonebraker, M., Tatbul, N., Zdonik, S.: Aurora: a new model and architecture for data stream management. VLDB J. 12, 120\u2013139 (2003)","journal-title":"VLDB J."},{"key":"565_CR2","doi-asserted-by":"crossref","unstructured":"Agarwal, S., Mozafari, B., Panda, A., Milner, H., Madden, S., Stoica, I.: BlinkDB: queries with bounded errors and bounded response times on very large data. In: Proceedings of EuroSys, pp. 29\u201342 (2013)","DOI":"10.1145\/2465351.2465355"},{"key":"565_CR3","unstructured":"Agarwal, S., Zeng, K.: BlinkDB and G-OLA: supporting continuous answers with error bars in SparkSQL. In: Spark Summit (2015)"},{"key":"565_CR4","doi-asserted-by":"crossref","unstructured":"Ahmed, A., Aly, M., Gonzalez, J., Narayanamurthy, S., Smola, A.J.: Scalable inference in latent variable models. In: Proceedings of WSDM (2012)","DOI":"10.1145\/2124295.2124312"},{"key":"565_CR5","doi-asserted-by":"publisher","first-page":"1033","DOI":"10.14778\/2536222.2536229","volume":"6","author":"T Akidau","year":"2013","unstructured":"Akidau, T., Balikov, A., Bekiro, K., Chernyak, S., Haberman, J., Lax, R., Mcveety, S., Mills, D., Nordstrom, P., Whittle, S.: MillWheel: fault-tolerant stream processing at internet scale. Proc. VLDB Endow. 6, 1033\u20131044 (2013)","journal-title":"Proc. VLDB Endow."},{"key":"565_CR6","unstructured":"Apache Flume. http:\/\/flume.apache.org . Accessed 1 June 2019"},{"key":"565_CR7","doi-asserted-by":"crossref","unstructured":"Apache Kafka. http:\/\/kafka.apache.org . Accessed 1 June 2019","DOI":"10.1007\/978-3-319-63962-8_196-1"},{"key":"565_CR8","doi-asserted-by":"crossref","unstructured":"Balazinska, M., Balakrishnan, H., Madden, S.R., Stonebraker, M.: Fault-tolerance in the borealis distributed stream processing system. In: Proceedings of SIGMOD, pp. 13\u201324 (2005)","DOI":"10.1145\/1066157.1066160"},{"key":"565_CR9","doi-asserted-by":"crossref","unstructured":"Baldi, P., Sadowski, P., Whiteson, D.: Searching for exotic particles in high-energy physics with deep learning. Nat. Commun. 5, 4308:1\u20134308:9 (2014)","DOI":"10.1038\/ncomms5308"},{"key":"565_CR10","unstructured":"Bellavista, P., Corradi, A., Kotoulas, S., Reale, A.: Adaptive fault-tolerance for dynamic resource provisioning in distributed stream processing systems. In: Proceedings of IEEE EDBT, pp. 85\u201396 (2014)"},{"key":"565_CR11","doi-asserted-by":"crossref","unstructured":"Bhatotia, P., Wieder, A., Rodrigues, R., Acar, U., Pasquin, R.: Incoop: Mapreduce for incremental computations. In: Proceedings of SoCC, pp. 7:1\u20137:14 (2011)","DOI":"10.1145\/2038916.2038923"},{"key":"565_CR12","volume-title":"Online Learning and Neural Networks","author":"L Bottou","year":"1998","unstructured":"Bottou, L.: Online algorithms and stochastic approximations. In: Saad, D. (ed.) Online Learning and Neural Networks. Cambridge University Press, Cambridge, UK (1998)"},{"key":"565_CR13","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1007\/978-3-7908-2604-3_16","volume-title":"Proceedings of COMPSTAT'2010","author":"L\u00e9on Bottou","year":"2010","unstructured":"Bottou, L.: Large-scale machine learning with stochastic gradient descent. In: Proceedings of COMPSTAT (2010)"},{"key":"565_CR14","unstructured":"Bottou, L., Bousquet, O.: The tradeoffs of large scale learning. In: Proceedings of NIPS (2007)"},{"key":"565_CR15","unstructured":"Bradley, J.K., Kyrola, A., Bickson, D., Guestrin, C.: Parallel coordinate descent for L1-regularized loss minimization. In: Proceedings of ICML (2011)"},{"key":"565_CR16","first-page":"181","volume-title":"Lecture Notes in Computer Science","author":"Steven Busuttil","year":"2007","unstructured":"Busuttil, S., Kalnishkan, Y.: Online regression competitive with changing predictors. In: Proceedings of Alogrithmic Learning Theory, pp. 181\u2013195 (2007)"},{"key":"565_CR17","unstructured":"CAIDA Anonymized Internet Traces 2014. http:\/\/www.caida.org\/data\/passive\/passive_2014_dataset.xml . Accessed 1 June 2019"},{"key":"565_CR18","unstructured":"Canini, K.R.K., Shi, L., Griffiths, T.L.: Online inference of topics with latent Dirichlet allocation. In: Proceedings of AISTATS (2009)"},{"key":"565_CR19","unstructured":"Carbone, P., Katsifodimos, A., Ewen, S., Markl, V., Haridi, S., Tzoumas, K.: Apache Flink: stream and batch processing in a single engine. In: Bulletin of the IEEE Computer Society Technical Committee on Data Engineering (2015)"},{"key":"565_CR20","unstructured":"Cherniack, M., Balakrishnan, H., Balazinska, M., Carney, D., Cetintemel, U., Xing, Y., Zdonik, S.: Scalable distributed stream processing. In: CIDR (2003)"},{"key":"565_CR21","unstructured":"Condie, T., Conway, N., Alvaro, P., Hellerstein, J.M., Elmeleegy, K., Sears, R.: MapReduce online. In: Proceedings of NSDI, pp. 21\u201321 (2010)"},{"key":"565_CR22","volume-title":"Synopses for Massive Data: Samples, Histograms, Wavelets, Sketches","author":"G Cormode","year":"2012","unstructured":"Cormode, G., Garofalakis, M., Haas, P.J., Jermaine, C.: Synopses for Massive Data: Samples, Histograms, Wavelets, Sketches. Now Publishers Inc., Hanover (2012)"},{"key":"565_CR23","unstructured":"Cormode, G., Muthukrishnan, S.: What\u2019s new: finding significant differences in network data streams. In: Proceedings of INFOCOM, pp. 1534\u20131545 (2004)"},{"issue":"1","key":"565_CR24","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1016\/j.jalgor.2003.12.001","volume":"55","author":"G Cormode","year":"2005","unstructured":"Cormode, G., Muthukrishnan, S.: An improved data stream summary: the count-min sketch and its applications. J. Algorithms 55(1), 58\u201375 (2005)","journal-title":"J. Algorithms"},{"key":"565_CR25","doi-asserted-by":"crossref","unstructured":"Dai, W., Kumar, A., Wei, J., Ho, Q., Gibson, G., Xing, E.P.: High-performance distributed ML at scale through parameter server consistency models. In: Proceedings of AAAI (2015)","DOI":"10.1609\/aaai.v29i1.9195"},{"key":"565_CR26","doi-asserted-by":"crossref","unstructured":"Das, T., Zhong, Y., Stoica, I., Shenker, S.: Adaptive stream processing using dynamic batch sizing. In: Proceedings of SoCC, pp. 16:1\u201316:13 (2014)","DOI":"10.1145\/2670979.2670995"},{"issue":"1","key":"565_CR27","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"Jeffrey Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. In: Proceedings of OSDI, pp. 107\u2013113 (2004)","journal-title":"Communications of the ACM"},{"issue":"4","key":"565_CR28","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1145\/964725.633056","volume":"32","author":"Cristian Estan","year":"2002","unstructured":"Estan, C., Varghese, G.: New directions in traffic measurement and accounting. In: Proceedings of SIGCOMM, pp. 323\u2013336 (2002)","journal-title":"ACM SIGCOMM Computer Communication Review"},{"key":"565_CR29","unstructured":"Fernandez, R.C., Migliavacca, M., Kalyvianaki, E., Pietzuch, P.: Integrating scale out and fault tolerance in stream processing using operator state management. In: Proceedings of SIGMOD, pp. 725\u2013736 (2013)"},{"key":"565_CR30","unstructured":"Fernandez, R.C., Migliavacca, M., Kalyvianaki, E., Pietzuch, P.: Making state explicit for imperative big data processing. In: Proceedings of USENIX ATC, pp. 49\u201360 (2014)"},{"key":"565_CR31","doi-asserted-by":"crossref","unstructured":"Gulisano, V., Jimenez-Peris, R., Patino-Martinez, M., Valduriez, P.: StreamCloud: a large scale data streaming system. In: Proceedings of ICDCS, pp. 126\u2013137 (2010)","DOI":"10.1109\/ICDCS.2010.72"},{"issue":"2","key":"565_CR32","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1145\/304181.304208","volume":"28","author":"Peter J. Haas","year":"1999","unstructured":"Haas, P.J., Hellerstein, J.M.: Ripple joins for online aggregation. In: Proceedings of SIGMOD, pp. 287\u2013298 (1999)","journal-title":"ACM SIGMOD Record"},{"issue":"2\u20133","key":"565_CR33","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/s10994-007-5016-8","volume":"69","author":"E Hazan","year":"2007","unstructured":"Hazan, E., Agarwal, A., Kale, S.: Logarithmic regret algorithms for online convex optimization. J. Mach. Learn. 69(2\u20133), 169\u2013192 (2007)","journal-title":"J. Mach. Learn."},{"key":"565_CR34","doi-asserted-by":"crossref","unstructured":"He, B., Yang, M., Guo, Z., Chen, R., Su, B., Lin, W., Zhou, L.: Comet : Batched stream processing for data intensive distributed computing. In: Proceedings of SoCC, pp. 63\u201374 (2010)","DOI":"10.1145\/1807128.1807139"},{"key":"565_CR35","unstructured":"Ho, Q., Cipar, J., Cui, H., Kim, J.K., Lee, S., Gibbons, P.B., Gibson, G.A., Ganger, G.R., Xing, E.P.: More effective distributed ML via a stale synchronous parallel parameter server. In: Proceedings of NIPS, pp. 1223\u20131231 (2013)"},{"key":"565_CR36","unstructured":"Hoffman, M., Blei, D., Bach, F.: Online learning for latent Dirichlet allocation. In: Proceedings of NIPS, pp. 856\u2013864 (2010)"},{"issue":"1","key":"565_CR37","first-page":"1303","volume":"14","author":"MD Hoffman","year":"2013","unstructured":"Hoffman, M.D., Blei, D.M., Wang, C., Paisley, J.: Stochastic variational inference. J. Mach. Learn. Res. 14(1), 1303\u20131347 (2013)","journal-title":"J. Mach. Learn. Res."},{"key":"565_CR38","unstructured":"Hu, L., Schwan, K., Amur, H., Chen, X.: ELF: efficient lightweight fast stream processing at scale. In: Proceedings of USENIX ATC, pp. 25\u201336 (2014)"},{"issue":"3","key":"565_CR39","doi-asserted-by":"publisher","first-page":"73","DOI":"10.14778\/3021924.3021925","volume":"10","author":"Q Huang","year":"2016","unstructured":"Huang, Q., Lee, P.P.C.: Toward high-performance distributed stream processing via approximate fault tolerance. Proc. VLDB Endow. 10(3), 73\u201384 (2016)","journal-title":"Proc. VLDB Endow."},{"key":"565_CR40","unstructured":"Hunt, P., Konar, M., Junqueira, F.P., Reed, B.: ZooKeeper: wait-free coordination for internet-scale systems. In: Proceedings of USENIX ATC, pp. 11\u201311 (2010)"},{"key":"565_CR41","unstructured":"Hwang, J.-H., Balazinska, M., Rasin, A., \u00c7etintemel, U., Stonebraker, M., Zdonik, S.: High-availability algorithms for distributed stream processing. In: Proceedings of ICDE, pp. 779\u2013790 (2005)"},{"key":"565_CR42","doi-asserted-by":"crossref","unstructured":"Hwang, J.-H., Xing, Y., Cetintemel, U., Zdonik, S.: A cooperative, self-configuring high-availability solution for stream processing. In: Proceedings of ICDE, pp. 176 \u2013 185 (2007)","DOI":"10.1109\/ICDE.2007.367863"},{"key":"565_CR43","unstructured":"Jain, N., Mahajan, P., Kit, D., Yalagandula, P., Dahlin, M., Zhang, Y.: Network imprecision: a new consistency metric for scalable monitoring. In: Proceedings of OSDI, pp. 87\u2013102 (2008)"},{"key":"565_CR44","doi-asserted-by":"crossref","unstructured":"Krishnamurthy, S., Franklin, M.J., Davis, J., Farina, D., Golovko, P., Li, A., Thombre, N.: Continuous analytics over discontinuous streams. In: Proceedings of SIGMOD, pp. 1081\u20131092 (2010)","DOI":"10.1145\/1807167.1807290"},{"key":"565_CR45","doi-asserted-by":"crossref","unstructured":"Kulkarni, S., Bhagat, N., Fu, M., Kedigehalli, V., Kellogg, C., Mittal, S., Patel, J.M., Ramasamy, K., Taneja, S.: Twitter Heron: stream processing at scale. In: Proceedings of SIGMOD, pp. 239\u2013250 (2015)","DOI":"10.1145\/2723372.2742788"},{"key":"565_CR46","unstructured":"Langford, J., Smola, A., Zinkevich, M.: Slow learners are fast. In: Proceedings of NIPS, pp. 2331\u20132339 (2009)"},{"key":"565_CR47","doi-asserted-by":"crossref","unstructured":"Li, M., Andersen, D.G., Park, J.W., Smola, A.J., Ahmed, A., Josifovski, V., Long, J., Shekita, E.J., Su, B.-Y.: Scaling distributed machine learning with the parameter server. In: Proceedings of OSDI, pp. 583\u2013598 (2014)","DOI":"10.1145\/2640087.2644155"},{"key":"565_CR48","unstructured":"Lin, W., Qian, Z., Xu, J., Yang, S., Zhou, J., Zhou, L.: StreamScope: continuous reliable distributed processing of big data streams. In: Proceedings of NSDI, pp. 439\u2013454 (2016)"},{"key":"565_CR49","doi-asserted-by":"crossref","unstructured":"Liu, Q., Lui, J.C., He, C., Pan, L., Fan, W., Shi, Y.: SAND: a fault-tolerant streaming architecture for network traffic analytics. In: Proceedings of DSN, pp. 80\u201387 (2014)","DOI":"10.1109\/DSN.2014.91"},{"key":"565_CR50","doi-asserted-by":"crossref","unstructured":"Logothetis, D., Olston, C., Reed, B., Webb, K.C., Yocum, K.: Stateful bulk processing for incremental analytics. In: Proceedings of SoCC, pp. 51\u201362 (2010)","DOI":"10.1145\/1807128.1807138"},{"key":"565_CR51","unstructured":"Logothetis, D., Trezzo, C., Webb, K.C., Yocum, K.: In-situ MapReduce for log processing. In: Proceedings of USENIX ATC, pp. 9\u20139 (2011)"},{"key":"565_CR52","doi-asserted-by":"crossref","unstructured":"Luo, G., Ellmann, C.J., Haas, P.J., Naughton, J.F.: A scalable hash ripple join algorithm. In: Proceedings of SIGMOD, pp. 252\u2013262 (2002)","DOI":"10.1145\/564691.564721"},{"key":"565_CR53","doi-asserted-by":"crossref","unstructured":"Martin, A., Knauth, T., Creutz, S., Becker, D., Weigert, S., Fetzer, C., Brito, A.: Low-overhead fault tolerance for high-throughput data processing systems. In: Proceedings of ICDCS, pp. 689\u2013699 (2011)","DOI":"10.1109\/ICDCS.2011.29"},{"issue":"34","key":"565_CR54","first-page":"1","volume":"17","author":"X Meng","year":"2016","unstructured":"Meng, X., Bradley, J., Yavuz, B., Sparks, E., Venkataraman, S., Liu, D., Freeman, J., Tsai, D., Amde, M., Owen, S., et al.: Mllib: machine learning in apache spark. J. Mach. Learn. Res. 17(34), 1\u20137 (2016)","journal-title":"J. Mach. Learn. Res."},{"key":"565_CR55","doi-asserted-by":"crossref","unstructured":"Murray, D.G., McSherry, F., Isaacs, R., Isard, M., Barham, P., Abadi, M.: Naiad: a timely dataflow system. In: Proceedings of SOSP, pp. 439\u2013455 (2013)","DOI":"10.1145\/2517349.2522738"},{"key":"565_CR56","unstructured":"NatSys Lab. http:\/\/natsys-lab.com . Accessed 1 June 2019"},{"key":"565_CR57","doi-asserted-by":"crossref","unstructured":"Neumeyer, L., Robbins, B., Nair, A., Kesari, A.: S4: distributed stream computing platform. In: KDCloud, pp. 170 \u2013 177 (2010)","DOI":"10.1109\/ICDMW.2010.172"},{"key":"565_CR58","unstructured":"Niu, Y., Wang, Y., Sun, G., Yue, A., Dalessandro, B., Perlich, C., Hamner, B.: The tencent dataset and KDD-Cup\u201912. In: KDD-Cup Workshop (2012)"},{"key":"565_CR59","unstructured":"Project Gutenberg. http:\/\/www.gutenberg.org . Accessed 1 June 2019"},{"key":"565_CR60","doi-asserted-by":"crossref","unstructured":"Pundir, M., Leslie, L.M., Gupta, I., Campbell, R.H.: Zorro: zero-cost reactive failure recovery in distributed graph processing. In: Proceedings of SoCC, pp. 195\u2013208 (2015)","DOI":"10.1145\/2806777.2806934"},{"key":"565_CR61","doi-asserted-by":"crossref","unstructured":"Qian, Z., He, Y., Su, C., Wu, Z., Zhu, H., Zhang, T., Zhou, L., Yu, Y., Zhang, Z.: TimeStream: reliable stream computation in the cloud. In: Proceedings of EuroSys, pp. 1\u201314 (2013)","DOI":"10.1145\/2465351.2465353"},{"key":"565_CR62","unstructured":"Quanrud, K., Khashabi, D.: Online learning with adversarial delays. In: Proceedings of NIPS (2015)"},{"key":"565_CR63","unstructured":"Rabkin, A., Arye, M., Sen, S., Pai, V.S., Freedman, M.J.: Aggregation and degradation in JetStream: streaming analytics in the wide area. In: Proceedings of NSDI, pp. 275\u2013288 (2014)"},{"key":"565_CR64","doi-asserted-by":"crossref","unstructured":"Shah, M.a., Hellerstein, J.M., Brewer, E.: highly available, fault-tolerant, parallel dataflows. In: Proceedings of SIGMOD, pp. 827\u2013838 (2004)","DOI":"10.1145\/1007568.1007662"},{"key":"565_CR65","doi-asserted-by":"crossref","unstructured":"Shvachko, K., Kuang, H., Radia, S., Chansler, R.: The Hadoop distributed file system. In: Proceedings of IEEE MSST, pp. 1\u201310 (2010)","DOI":"10.1109\/MSST.2010.5496972"},{"key":"565_CR66","doi-asserted-by":"publisher","first-page":"703","DOI":"10.14778\/1920841.1920931","volume":"3","author":"A Smola","year":"2010","unstructured":"Smola, A., Narayanamurthy, S.: An architecture for parallel topic models. Proc. VLDB Endow. 3, 703\u2013710 (2010)","journal-title":"Proc. VLDB Endow."},{"key":"565_CR67","doi-asserted-by":"crossref","unstructured":"Song, H.H., Cho, T.W., Dave, V., Zhang, Y., Qiu, L.: Scalable proximity estimation and link prediction in online social networks. In: Proceedings of IMC, pp. 322\u2013335 (2009)","DOI":"10.1145\/1644893.1644932"},{"key":"565_CR68","unstructured":"Spark Kafka Integration Guide. http:\/\/spark.apache.org\/docs\/latest\/streaming-kafka-integration.html . Accessed 1 June 2019"},{"key":"565_CR69","unstructured":"Storm. http:\/\/storm.apache.org . Accessed 1 June 2019"},{"key":"565_CR70","unstructured":"Storm Kafka Integration Guide. http:\/\/storm.apache.org\/releases\/2.0.0-SNAPSHOT\/storm-kafka.html . Accessed 1 June 2019"},{"key":"565_CR71","first-page":"309","volume":"29","author":"N Tatbul","year":"2003","unstructured":"Tatbul, N., \u00c7etintemel, U., Zdonik, S., Cherniack, M., Stonebraker, M.: Load shedding in a data stream manager. Proc. VLDB 29, 309\u2013320 (2003)","journal-title":"Proc. VLDB"},{"key":"565_CR72","unstructured":"Tatbul, N., Zdonik, S.: Staying FIT: efficient load shedding techniques for distributed stream processing. In: Proceedings of VLDB, pp. 159\u2013170 (2007)"},{"key":"565_CR73","doi-asserted-by":"crossref","unstructured":"Toshniwal, A., Taneja, S., Shukla, A., Ramasamy, K., Patel, J.M., Kulkarni, S., Jackson, J., Gade, K., Fu, M., Donham, J., et al.: Storm@Twitter. In: Proceedings of ACM SIGMOD (2014)","DOI":"10.1145\/2588555.2595641"},{"key":"565_CR74","unstructured":"Trident. http:\/\/storm.apache.org\/documentation\/Trident-tutorial.html . Accessed 1 June 2019"},{"key":"565_CR75","doi-asserted-by":"crossref","unstructured":"Wang, H., Peh, L.S., Koukoumidis, E., Tao, S., Chan, M.C.: Meteor shower: a reliable stream processing system for commodity data centers. In: Proceedings of IPDPS, pp. 1180\u20131191 (2012)","DOI":"10.1109\/IPDPS.2012.108"},{"key":"565_CR76","doi-asserted-by":"crossref","unstructured":"Wei, J., Dai, W., Qiao, A., Ho, Q., Cui, H., Ganger, G.R., Gibbons, P.B., Gibson, G.A., Xing, E.P.: Managed communication and consistency for fast data-parallel iterative analytics. In: SoCC, pp. 381\u2013394 (2015)","DOI":"10.1145\/2806777.2806778"},{"issue":"2","key":"565_CR77","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1109\/TBDATA.2015.2472014","volume":"1","author":"Eric P. Xing","year":"2015","unstructured":"Xing, E.P., Ho, Q., Dai, W., Kim, J.K., Wei, J., Lee, S., Zheng, X.: Petuum: a new platform for distributed machine learning on big data. In: Proceedings of KDD, pp. 49\u201367 (2015)","journal-title":"IEEE Transactions on Big Data"},{"key":"565_CR78","doi-asserted-by":"crossref","unstructured":"Yao, L., Mimno, D., McCallum, A.: Efficient methods for topic model inference on streaming document collections. In: Proceedings of KDD (2009)","DOI":"10.1145\/1557019.1557121"},{"key":"565_CR79","unstructured":"Yu, M., Jose, L., Miao, R.: Software defined traffic measurement with OpenSketch. In: Proceedings of NSDI, pp. 29\u201342 (2013)"},{"key":"565_CR80","doi-asserted-by":"crossref","unstructured":"Zaharia, M., Das, T., Li, H., Hunter, T., Shenker, S., Stoica, I.: Discretized streams: fault-tolerant streaming computation at scale. In: Proceedings of SOSP, pp. 423\u2013438 (2013)","DOI":"10.1145\/2517349.2522737"},{"key":"565_CR81","unstructured":"Zero Data Loss in Spark Streaming. http:\/\/databricks.com\/blog\/2015\/01\/15\/improved-driver-fault-tolerance-and-zero-data-loss-in-spark-streaming.html . Accessed 1 June 2019"},{"key":"565_CR82","unstructured":"ZeroMQ. http:\/\/zeromq.org . Accessed 1 June 2019"},{"key":"565_CR83","unstructured":"Zinkevich, M.: Online convex programming and generalized infinitesimal gradient ascent. In: Proceedings of ICML, pp. 928\u2013936 (2003)"},{"key":"565_CR84","unstructured":"Zinkevich, M., Weimer, M., Smola, A.J., Li, L.: Parallelized stochastic gradient descent. In: Proceedings of NIPS (2010)"}],"container-title":["The VLDB Journal"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-019-00565-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00778-019-00565-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-019-00565-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,27]],"date-time":"2022-09-27T07:07:55Z","timestamp":1664262475000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00778-019-00565-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,9,3]]},"references-count":84,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2019,10]]}},"alternative-id":["565"],"URL":"https:\/\/doi.org\/10.1007\/s00778-019-00565-w","relation":{},"ISSN":["1066-8888","0949-877X"],"issn-type":[{"value":"1066-8888","type":"print"},{"value":"0949-877X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,9,3]]},"assertion":[{"value":"9 November 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 June 2019","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2019","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 September 2019","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}