{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T08:55:41Z","timestamp":1778921741611,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":24,"publisher":"ACM","license":[{"start":{"date-parts":[[2013,10,1]],"date-time":"2013-10-01T00:00:00Z","timestamp":1380585600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000143","name":"Division of Computing and Communication Foundations","doi-asserted-by":"publisher","award":["CCF-1048296, CNS-1219220"],"award-info":[{"award-number":["CCF-1048296, CNS-1219220"]}],"id":[{"id":"10.13039\/100000143","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000144","name":"Division of Computer and Network Systems","doi-asserted-by":"publisher","award":["CCF-1048296, CNS-1219220"],"award-info":[{"award-number":["CCF-1048296, CNS-1219220"]}],"id":[{"id":"10.13039\/100000144","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2013,10]]},"DOI":"10.1145\/2523616.2523619","type":"proceedings-article","created":{"date-parts":[[2014,1,6]],"date-time":"2014-01-06T20:44:07Z","timestamp":1389041047000},"page":"1-15","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":32,"title":["Scalable lineage capture for debugging DISC analytics"],"prefix":"10.1145","author":[{"given":"Dionysios","family":"Logothetis","sequence":"first","affiliation":[{"name":"Telefonica Research"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Soumyarupa","family":"De","sequence":"additional","affiliation":[{"name":"Microsoft, Inc."}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kenneth","family":"Yocum","sequence":"additional","affiliation":[{"name":"U.C. San Diego and Illumina, Inc."}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2013,10]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Apache Mahout: Scalable Machine Learning and Data Mining. http:\/\/mahout.apache.org.  Apache Mahout: Scalable Machine Learning and Data Mining. http:\/\/mahout.apache.org."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.14778\/2095686.2095693"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gks251"},{"key":"e_1_3_2_1_4_1","volume-title":"De novo genome assembly: what every biologist should know. Nature methods, 9","author":"Baker M.","year":"2012","unstructured":"M. Baker . De novo genome assembly: what every biologist should know. Nature methods, 9 , 2012 . M. Baker. De novo genome assembly: what every biologist should know. Nature methods, 9, 2012."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2011.5767921"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1561\/1900000006"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-002-0083-8"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1101\/gr.126599.111"},{"issue":"3","key":"e_1_3_2_1_9_1","first-page":"249","article-title":"1 emp meeting on sample selection and acquisition","volume":"3","author":"Gilbert G. A.","year":"1992","unstructured":"G. A. Gilbert , F. Meyer , J. Janson , 1 emp meeting on sample selection and acquisition . At Argonne National Laboratory , 3 ( 3 ): 249 -- 253 , October 1992 . G. A. Gilbert, F. Meyer, J. Janson, et al. 1 emp meeting on sample selection and acquisition. At Argonne National Laboratory, 3(3): 249--53, October 1992.","journal-title":"At Argonne National Laboratory"},{"key":"e_1_3_2_1_10_1","volume-title":"USENIX OSDI","author":"Gonzalez J. E.","year":"2012","unstructured":"J. E. Gonzalez , Y. Low , H. Gu , D. Bickson , and C. Guestrin . PowerGraph: distributed graphparallel computation on natural graphs . In USENIX OSDI , October 2012 . J. E. Gonzalez, Y. Low, H. Gu, D. Bickson, and C. Guestrin. PowerGraph: distributed graphparallel computation on natural graphs. In USENIX OSDI, October 2012."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1080\/00401706.1969.10490657"},{"key":"e_1_3_2_1_12_1","volume-title":"Proc. of CIDR","author":"Ikeda R.","year":"2011","unstructured":"R. Ikeda , H. Park , and J. Widom . Provenance for generalized map and reduce workflows . In Proc. of CIDR , January 2011 . R. Ikeda, H. Park, and J. Widom. Provenance for generalized map and reduce workflows. In Proc. of CIDR, January 2011."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2063576.2063816"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/1272996.1273005"},{"key":"e_1_3_2_1_15_1","volume-title":"Ultrafast and memory-efficient alignment of short dna sequences to the human genome. Genome Biology, (10: R25)","author":"Langmead B.","year":"2009","unstructured":"B. Langmead , C. Trapnell , M. Pop , and S. L. Salzberg . Ultrafast and memory-efficient alignment of short dna sequences to the human genome. Genome Biology, (10: R25) , 2009 . B. Langmead, C. Trapnell, M. Pop, and S. L. Salzberg. Ultrafast and memory-efficient alignment of short dna sequences to the human genome. Genome Biology, (10: R25), 2009."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/1989323.1989459"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376726"},{"key":"e_1_3_2_1_18_1","volume-title":"Proc. of CIDR","author":"Olston C.","year":"2011","unstructured":"C. Olston and A. D. Sarma . Ibis: A provenance manager for multi-layer systems . In Proc. of CIDR , January 2011 . C. Olston and A. D. Sarma. Ibis: A provenance manager for multi-layer systems. In Proc. of CIDR, January 2011."},{"key":"e_1_3_2_1_19_1","volume-title":"Yahoo","author":"Sarma A. D.","year":"2010","unstructured":"A. D. Sarma , A. Jain , and P. Bohannon . PROBER: Ad-Hoc Debugging of Extraction and Integration Pipelines. Technical report , Yahoo , April 2010 . A. D. Sarma, A. Jain, and P. Bohannon. PROBER: Ad-Hoc Debugging of Extraction and Integration Pipelines. Technical report, Yahoo, April 2010."},{"key":"e_1_3_2_1_20_1","unstructured":"M. Schatz A. Gupta R. Gupta D. Kelley J. Lewi D. Nettem D. Sommer and M. Pop. Contrail: Assembly of Large Genomes using Cloud Computing. http:\/\/sourceforge.net\/apps\/mediawiki\/contrial-bio.  M. Schatz A. Gupta R. Gupta D. Kelley J. Lewi D. Nettem D. Sommer and M. Pop. Contrail: Assembly of Large Genomes using Cloud Computing. http:\/\/sourceforge.net\/apps\/mediawiki\/contrial-bio."},{"key":"e_1_3_2_1_21_1","volume-title":"Genome Research","author":"Simpson J.","year":"2011","unstructured":"J. Simpson and R. Durbin . Efficient de novo assembly of large genomes using compressed data structures . Genome Research , 2011 . J. Simpson and R. Durbin. Efficient de novo assembly of large genomes using compressed data structures. Genome Research, 2011."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/2043556.2043584"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.14778\/2535568.2448939"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/1807167.1807234"}],"event":{"name":"SOCC '13: ACM Symposium on Cloud Computing","location":"Santa Clara California","acronym":"SOCC '13","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"]},"container-title":["Proceedings of the 4th annual Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2523616.2523619","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2523616.2523619","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T07:34:02Z","timestamp":1750232042000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2523616.2523619"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,10]]},"references-count":24,"alternative-id":["10.1145\/2523616.2523619","10.1145\/2523616"],"URL":"https:\/\/doi.org\/10.1145\/2523616.2523619","relation":{},"subject":[],"published":{"date-parts":[[2013,10]]},"assertion":[{"value":"2013-10-01","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}