{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,11]],"date-time":"2025-11-11T15:43:02Z","timestamp":1762875782449,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":12,"publisher":"ACM","license":[{"start":{"date-parts":[[2016,6,19]],"date-time":"2016-06-19T00:00:00Z","timestamp":1466294400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"European Research Council","award":["ERC 339233"],"award-info":[{"award-number":["ERC 339233"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2016,6,19]]},"DOI":"10.1145\/2910896.2910902","type":"proceedings-article","created":{"date-parts":[[2016,6,10]],"date-time":"2016-06-10T13:09:57Z","timestamp":1465564197000},"page":"83-92","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":23,"title":["ArchiveSpark"],"prefix":"10.1145","author":[{"given":"Helge","family":"Holzmann","sequence":"first","affiliation":[{"name":"L3S Research Center, Hannover, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vinay","family":"Goel","sequence":"additional","affiliation":[{"name":"Internet Archive, San Francisco, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Avishek","family":"Anand","sequence":"additional","affiliation":[{"name":"L3S Research Center, Hannover, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2016,6,19]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"(Internet Archive). Web archiving in the united states: A 2013 survey","author":"Jefferson Bailey","year":"2014","unstructured":"Jefferson Bailey et al. (Internet Archive). Web archiving in the united states: A 2013 survey , 2014 . URL http:\/\/www.digitalpreservation.gov\/ndsa\/working_groups\/documents\/NDSA_USWebArchivingSurvey_2013.pdf. A report of the National Digital Stewardship Alliance. {Accessed: 11\/01\/2016}. Jefferson Bailey et al. (Internet Archive). Web archiving in the united states: A 2013 survey, 2014. URL http:\/\/www.digitalpreservation.gov\/ndsa\/working_groups\/documents\/NDSA_USWebArchivingSurvey_2013.pdf. A report of the National Digital Stewardship Alliance. {Accessed: 11\/01\/2016}."},{"volume-title":"Proceedings of TPDL'11","author":"Gomes Daniel","key":"e_1_3_2_1_2_1","unstructured":"Daniel Gomes , Joao Miranda , and Miguel Costa . A survey on web archiving initiatives . In Proceedings of TPDL'11 . Daniel Gomes, Joao Miranda, and Miguel Costa. A survey on web archiving initiatives. In Proceedings of TPDL'11."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.7227\/ALX.0023"},{"volume-title":"Alexandria Workshop on Foundations for Temporal Retrieval, Exploration and Analytics in Web Archives on 03\/11\/2015 {Accessed: 17\/01\/2016}.","author":"Br\u00fcgger Niels","key":"e_1_3_2_1_4_1","unstructured":"Niels Br\u00fcgger . Web history, web archives, and web research infrastructure - between close and distant reading, 2015. URL http:\/\/alexandria-project.eu\/events\/2nd-int-alexandria-workshop-2015. Keynote at the 2nd Int . Alexandria Workshop on Foundations for Temporal Retrieval, Exploration and Analytics in Web Archives on 03\/11\/2015 {Accessed: 17\/01\/2016}. Niels Br\u00fcgger. Web history, web archives, and web research infrastructure - between close and distant reading, 2015. URL http:\/\/alexandria-project.eu\/events\/2nd-int-alexandria-workshop-2015. Keynote at the 2nd Int. Alexandria Workshop on Foundations for Temporal Retrieval, Exploration and Analytics in Web Archives on 03\/11\/2015 {Accessed: 17\/01\/2016}."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2567948.2579045"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/2009916.2009991"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/2756406.2756920"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1629175.1629198"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/1773912.1773922"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/1365815.1365816"},{"key":"e_1_3_2_1_12_1","first-page":"10","volume-title":"Proceedings of the 2nd USENIX conference on Hot topics in cloud computing","volume":"10","author":"Zaharia Matei","year":"2010","unstructured":"Matei Zaharia , Mosharaf Chowdhury , Michael J Franklin , Scott Shenker , and Ion Stoica . Spark : cluster computing with working sets . In Proceedings of the 2nd USENIX conference on Hot topics in cloud computing , volume 10 , page 10 , 2010 . Matei Zaharia, Mosharaf Chowdhury, Michael J Franklin, Scott Shenker, and Ion Stoica. Spark: cluster computing with working sets. In Proceedings of the 2nd USENIX conference on Hot topics in cloud computing, volume 10, page 10, 2010."},{"key":"e_1_3_2_1_13_1","unstructured":"Jimmy Lin. Warcbase on github. URL https:\/\/github.com\/lintool\/warcbase. {Accessed: 11\/01\/2016}.  Jimmy Lin. Warcbase on github. URL https:\/\/github.com\/lintool\/warcbase. {Accessed: 11\/01\/2016}."}],"event":{"name":"JCDL '16: The 16th ACM\/IEEE-CS Joint Conference on Digital Libraries","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval","IEEE Technical Committee on Digital Libraries (TC DL)"],"location":"Newark New Jersey USA","acronym":"JCDL '16"},"container-title":["Proceedings of the 16th ACM\/IEEE-CS on Joint Conference on Digital Libraries"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2910896.2910902","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2910896.2910902","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:54:57Z","timestamp":1750222497000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2910896.2910902"}},"subtitle":["Efficient Web Archive Access, Extraction and Derivation"],"short-title":[],"issued":{"date-parts":[[2016,6,19]]},"references-count":12,"alternative-id":["10.1145\/2910896.2910902","10.1145\/2910896"],"URL":"https:\/\/doi.org\/10.1145\/2910896.2910902","relation":{},"subject":[],"published":{"date-parts":[[2016,6,19]]},"assertion":[{"value":"2016-06-19","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}