{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2022,12,29]],"date-time":"2022-12-29T05:21:31Z","timestamp":1672291291302},"reference-count":9,"publisher":"Association for Computing Machinery (ACM)","issue":"2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Proc. VLDB Endow."],"published-print":{"date-parts":[[2008,8]]},"abstract":"<jats:p>\n            Archived web data is a great resource for scientific research, but poses serious challenges in data processing and management. We demonstrate the\n            <jats:italic>Web Lab Collaboration Server<\/jats:italic>\n            , a platform and service for large-scale collaborative web data analysis in a distributed computing environment, and show how it seamlessly supports non-technical users during search, data extraction and analysis.\n          <\/jats:p>","DOI":"10.14778\/1454159.1454205","type":"journal-article","created":{"date-parts":[[2014,6,24]],"date-time":"2014-06-24T12:17:57Z","timestamp":1403612277000},"page":"1476-1479","source":"Crossref","is-referenced-by-count":3,"title":["Large-scale collaborative analysis and extraction of web data"],"prefix":"10.14778","volume":"1","author":[{"given":"Felix","family":"Weigel","sequence":"first","affiliation":[{"name":"Cornell University"}]},{"given":"Biswanath","family":"Panda","sequence":"additional","affiliation":[{"name":"Cornell University"}]},{"given":"Mirek","family":"Riedewald","sequence":"additional","affiliation":[{"name":"Cornell University"}]},{"given":"Johannes","family":"Gehrke","sequence":"additional","affiliation":[{"name":"Cornell University"}]},{"given":"Manuel","family":"Calimlim","sequence":"additional","affiliation":[{"name":"Cornell University"}]}],"member":"320","published-online":{"date-parts":[[2008,8]]},"reference":[{"key":"e_1_2_1_1_1","volume-title":"Proc. OSDI","author":"Dean J.","year":"2004","unstructured":"J. Dean and S. Ghemawat . MapReduce: Simplified Data Proc. on Large Clusters . In Proc. OSDI , 2004 . J. Dean and S. Ghemawat. MapReduce: Simplified Data Proc. on Large Clusters. In Proc. OSDI, 2004."},{"key":"e_1_2_1_2_1","unstructured":"The Hadoop Project. hadoop.apache.org.  The Hadoop Project. hadoop.apache.org."},{"key":"e_1_2_1_3_1","unstructured":"Internet Archive. www.archive.org.  Internet Archive. www.archive.org."},{"key":"e_1_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/1272996.1273005"},{"key":"e_1_2_1_5_1","unstructured":"Lixto Software GmbH. www.lixto.com.  Lixto Software GmbH. www.lixto.com."},{"key":"e_1_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1376616.1376726"},{"issue":"4","key":"e_1_2_1_7_1","first-page":"227","volume":"13","author":"Pike R.","year":"2005","unstructured":"R. Pike , S. Dorward , R. Griesemer , and S. Quinlan . Interpreting the Data: Parallel Analysis with Sawzall. Scientific Programming , 13 ( 4 ): 227 -- 298 , 2005 . R. Pike, S. Dorward, R. Griesemer, and S. Quinlan. Interpreting the Data: Parallel Analysis with Sawzall. Scientific Programming, 13(4):227--298, 2005.","journal-title":"Interpreting the Data: Parallel Analysis with Sawzall. Scientific Programming"},{"key":"e_1_2_1_8_1","unstructured":"Flash video of the Visual Wrapper Generator. www.cs.cornell.edu\/~weigel\/WrapperDemo.  Flash video of the Visual Wrapper Generator. www.cs.cornell.edu\/~weigel\/WrapperDemo."},{"key":"e_1_2_1_9_1","unstructured":"The Cornell Web Lab Project. weblab.infosci.cornell.edu.  The Cornell Web Lab Project. weblab.infosci.cornell.edu."}],"container-title":["Proceedings of the VLDB Endowment"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.14778\/1454159.1454205","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,28]],"date-time":"2022-12-28T09:59:23Z","timestamp":1672221563000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.14778\/1454159.1454205"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008,8]]},"references-count":9,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2008,8]]}},"alternative-id":["10.14778\/1454159.1454205"],"URL":"https:\/\/doi.org\/10.14778\/1454159.1454205","relation":{},"ISSN":["2150-8097"],"issn-type":[{"value":"2150-8097","type":"print"}],"subject":[],"published":{"date-parts":[[2008,8]]}}}