{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T10:13:05Z","timestamp":1761559985851,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":27,"publisher":"ACM","license":[{"start":{"date-parts":[[2010,6,10]],"date-time":"2010-06-10T00:00:00Z","timestamp":1276128000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2010,6,10]]},"DOI":"10.1145\/1807128.1807138","type":"proceedings-article","created":{"date-parts":[[2010,6,11]],"date-time":"2010-06-11T18:52:58Z","timestamp":1276282378000},"page":"51-62","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":98,"title":["Stateful bulk processing for incremental analytics"],"prefix":"10.1145","author":[{"given":"Dionysios","family":"Logothetis","sequence":"first","affiliation":[{"name":"UCSD, La Jolla, CA, USA"}]},{"given":"Christopher","family":"Olston","sequence":"additional","affiliation":[{"name":"Yahoo! Research, Santa Clara, USA"}]},{"given":"Benjamin","family":"Reed","sequence":"additional","affiliation":[{"name":"Yahoo! Research, Santa Clara, USA"}]},{"given":"Kevin C.","family":"Webb","sequence":"additional","affiliation":[{"name":"UCSD, La Jolla, USA"}]},{"given":"Ken","family":"Yocum","sequence":"additional","affiliation":[{"name":"UCSD, La Jolla, USA"}]}],"member":"320","published-online":{"date-parts":[[2010,6,10]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"The Hive project. http:\/\/hadoop.apache.org\/hive\/.  The Hive project. http:\/\/hadoop.apache.org\/hive\/."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/543613.543615"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/16856.16861"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/988672.988752"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0169-7552(98)00110-X"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.14778\/1454159.1454166"},{"key":"e_1_3_2_1_7_1","first-page":"205","volume-title":"Proceedings of OSDI","author":"Chang F.","year":"2006","unstructured":"F. Chang , J. Dean , S. Ghemawat , W. C. Hsieh , D. A. Wallach , M. Burrows , T. Ch , A. Fikes , and R. E. Gruber . Bigtable: A Distributed Storage System for Structured Data . In Proceedings of OSDI , pages 205 -- 218 , Seattle, WA , November 2006 . F. Chang, J. Dean, S. Ghemawat, W. C. Hsieh, D. A. Wallach, M. Burrows, T. Ch, A. Fikes, and R. E. Gruber. Bigtable: A Distributed Storage System for Structured Data. In Proceedings of OSDI, pages 205--218, Seattle, WA, November 2006."},{"key":"e_1_3_2_1_8_1","volume-title":"November","author":"Chien S.","year":"2004","unstructured":"S. Chien , C. Dwork , R. Kumar , D. R. Simon , and D. Sivakumar . Link evolution: Analysis and algorithms. Internet Mathematics, 1(3) , November 2004 . S. Chien, C. Dwork, R. Kumar, D. R. Simon, and D. Sivakumar. Link evolution: Analysis and algorithms. Internet Mathematics, 1(3), November 2004."},{"key":"e_1_3_2_1_9_1","volume-title":"Proceedings of NSDI","author":"Condie T.","year":"2010","unstructured":"T. Condie , N. Conway , P. Alvaro , and J. M. Hellerstein . MapReduce online . In Proceedings of NSDI , April 2010 . T. Condie, N. Conway, P. Alvaro, and J. M. Hellerstein. MapReduce online. In Proceedings of NSDI, April 2010."},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of OSDI","author":"Dean J.","year":"2004","unstructured":"J. Dean and S. Ghemawat . Mapreduce: Simplified data processing on large clusters . In Proceedings of OSDI , San Francisco, CA , December 2004 . J. Dean and S. Ghemawat. Mapreduce: Simplified data processing on large clusters. In Proceedings of OSDI, San Francisco, CA, December 2004."},{"key":"e_1_3_2_1_11_1","volume-title":"1st International Conference on Cloud Computing (CloudComp09)","author":"Ekanayake J.","year":"2009","unstructured":"J. Ekanayake and G. Fox . High performance parallel computing with clouds and cloud technologies . In 1st International Conference on Cloud Computing (CloudComp09) , 2009 . J. Ekanayake and G. Fox. High performance parallel computing with clouds and cloud technologies. In 1st International Conference on Cloud Computing (CloudComp09), 2009."},{"key":"e_1_3_2_1_12_1","volume-title":"Proceedings of VLDB","author":"Ester M.","year":"1998","unstructured":"M. Ester , H. Kriegal , J. Sander , M. Wimmer , and X. Xu . Incremental clustering and mining in a data warehousing environment . In Proceedings of VLDB , 1998 . M. Ester, H. Kriegal, J. Sander, M. Wimmer, and X. Xu. Incremental clustering and mining in a data warehousing environment. In Proceedings of VLDB, 1998."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/945445.945450"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/1272996.1273005"},{"key":"e_1_3_2_1_16_1","volume-title":"Proceedings of NetDB","author":"Logothetis D.","year":"2009","unstructured":"D. Logothetis and K. Yocum . Data indexing for stateful, large-scale data processing . In Proceedings of NetDB , October 2009 . D. Logothetis and K. Yocum. Data indexing for stateful, large-scale data processing. In Proceedings of NetDB, October 2009."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1582716.1582723"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.5555\/1287369.1287400"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/1007568.1007638"},{"key":"e_1_3_2_1_20_1","unstructured":"C. Monash. Facebook Hadoop and Hive May 2009. http:\/\/www.dbms2.com\/2009\/05\/11\/facebook-hadoop-and-hive.  C. Monash. Facebook Hadoop and Hive May 2009. http:\/\/www.dbms2.com\/2009\/05\/11\/facebook-hadoop-and-hive."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611972771.24"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376726"},{"key":"e_1_3_2_1_23_1","unstructured":"B. Pariseau. IDC unstructured data will become the primary task for storage October 2008. http:\/\/itknowledgeexchange.techtarget.com\/storage-soup\/idc-unstructured-data-willbecome-the-primary-task-for-storage\/.  B. Pariseau. IDC unstructured data will become the primary task for storage October 2008. http:\/\/itknowledgeexchange.techtarget.com\/storage-soup\/idc-unstructured-data-willbecome-the-primary-task-for-storage\/."},{"key":"e_1_3_2_1_24_1","volume-title":"HotCloud Workshop","author":"Popa L.","year":"2009","unstructured":"L. Popa , M. Budiu , Y. Yu , and M. Isard . DryadInc:reusing work in large-scale computations . In HotCloud Workshop , June 2009 . L. Popa, M. Budiu, Y. Yu, and M. Isard. DryadInc:reusing work in large-scale computations. In HotCloud Workshop, June 2009."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/69.91063"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/1519065.1519089"},{"key":"e_1_3_2_1_27_1","volume-title":"August","author":"Azure Windows","year":"2008","unstructured":"Windows Azure and Facebook teams. Personal communications , August 2008 . Windows Azure and Facebook teams. Personal communications, August 2008."},{"key":"e_1_3_2_1_28_1","volume-title":"Proceedings of OSDI","author":"Yu Y.","year":"2008","unstructured":"Y. Yu , M. Isard , D. Fetterly , M. Budiu , U. Erlingsson , P. K. Gunda ,, and J. Currey . DryadLINQ: A System for General-Purpose Distributed Data-Parallel Computing Using a High-Level Language . In Proceedings of OSDI , San Diego, CA , December 2008 . Y. Yu, M. Isard, D. Fetterly, M. Budiu, U. Erlingsson, P. K. Gunda,, and J. Currey. DryadLINQ: A System for General-Purpose Distributed Data-Parallel Computing Using a High-Level Language. In Proceedings of OSDI, San Diego, CA, December 2008."}],"event":{"name":"SOCC '10: ACM SIGMOD-SIGOPS Workshop on Cloud Computing in conjunction with SIGMOD 2010","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"],"location":"Indianapolis Indiana USA","acronym":"SOCC '10"},"container-title":["Proceedings of the 1st ACM symposium on Cloud computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1807128.1807138","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1807128.1807138","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T12:17:34Z","timestamp":1750249054000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1807128.1807138"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,6,10]]},"references-count":27,"alternative-id":["10.1145\/1807128.1807138","10.1145\/1807128"],"URL":"https:\/\/doi.org\/10.1145\/1807128.1807138","relation":{},"subject":[],"published":{"date-parts":[[2010,6,10]]},"assertion":[{"value":"2010-06-10","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}