{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T05:51:02Z","timestamp":1750830662893,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":30,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,2,2]],"date-time":"2017-02-02T00:00:00Z","timestamp":1485993600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"European Union's - Seventh Framework Programme (FP7)","award":["615688 ERC-COG-PRIME"],"award-info":[{"award-number":["615688 ERC-COG-PRIME"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,2,2]]},"DOI":"10.1145\/3018661.3018740","type":"proceedings-article","created":{"date-parts":[[2017,2,2]],"date-time":"2017-02-02T20:09:48Z","timestamp":1486066188000},"page":"385-394","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":13,"title":["Synthesis of Forgiving Data Extractors"],"prefix":"10.1145","author":[{"given":"Adi","family":"Omari","sequence":"first","affiliation":[{"name":"Technion, Haifa, Israel"}]},{"given":"Sharon","family":"Shoham","sequence":"additional","affiliation":[{"name":"Tel Aviv University, Tel Aviv , Israel"}]},{"given":"Eran","family":"Yahav","sequence":"additional","affiliation":[{"name":"Technion, Haifa, Israel"}]}],"member":"320","published-online":{"date-parts":[[2017,2,2]]},"reference":[{"key":"e_1_3_2_1_1_1","first-page":"126","volume-title":"GI Workshops","author":"Anton T.","year":"2005"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/872757.872799"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-31750-2_38"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/371920.372182"},{"key":"e_1_3_2_1_5_1","unstructured":"Cohen J. P. Ding W. and Bagherjeiran A. Semi-supervised web wrapper repair via recursive tree matching. arXiv preprint arXiv:1505.01303 (2015).  Cohen J. P. Ding W. and Bagherjeiran A. Semi-supervised web wrapper repair via recursive tree matching. arXiv preprint arXiv:1505.01303 (2015)."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1559845.1559882"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.14778\/1938545.1938547"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30115-8_13"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Hall M. Frank E. Holmes G. Pfahringer B. Reutemann P. and Witten I. H. The weka data mining software: an update. ACM SIGKDD explorations newsletter 11 1 (2009) 10--18.  Hall M. Frank E. Holmes G. Pfahringer B. Reutemann P. and Witten I. H. The weka data mining software: an update. ACM SIGKDD explorations newsletter 11 1 (2009) 10--18.","DOI":"10.1145\/1656274.1656278"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/2009916.2010020"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.5555\/2074158.2074196"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"Kayed M. and Chang C.-H. Fivatech: Page-level web data extraction from template pages. Knowledge and Data Engineering IEEE Transactions on 22 2 (2010) 249--263.  Kayed M. and Chang C.-H. Fivatech: Page-level web data extraction from template pages. Knowledge and Data Engineering IEEE Transactions on 22 2 (2010) 249--263.","DOI":"10.1109\/TKDE.2009.82"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00100-9"},{"volume-title":"IJCAI'97","author":"Kushmerick N.","key":"e_1_3_2_1_14_1"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISSREW.2014.17"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956826"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.proeng.2012.01.098"},{"key":"e_1_3_2_1_18_1","unstructured":"Mitchell T. M. Machine Learning 1 ed. McGraw-Hill Inc. New York NY USA 1997.  Mitchell T. M. Machine Learning 1 ed. McGraw-Hill Inc. New York NY USA 1997."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2015.12.040"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.5220\/0005124504920500"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939858"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/2884781.2884842"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00116251"},{"volume-title":"Elsevier","year":"2014","author":"Quinlan J. R.","key":"e_1_3_2_1_24_1"},{"volume-title":"WWW","year":"2004","author":"Reis D. D. C.","key":"e_1_3_2_1_25_1"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/2350190.2350199"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"crossref","unstructured":"Thamviset W. and Wongthanavasu S. Information extraction for deep web using repetitive subject pattern. World Wide Web (2013).  Thamviset W. and Wongthanavasu S. Information extraction for deep web using repetitive subject pattern. World Wide Web (2013).","DOI":"10.1109\/ECTICon.2012.6254247"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/775152.775179"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/1060745.1060761"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/1645953.1645962"}],"event":{"name":"WSDM 2017: Tenth ACM International Conference on Web Search and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Cambridge United Kingdom","acronym":"WSDM 2017"},"container-title":["Proceedings of the Tenth ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3018661.3018740","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3018661.3018740","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:24:09Z","timestamp":1750220649000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3018661.3018740"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,2,2]]},"references-count":30,"alternative-id":["10.1145\/3018661.3018740","10.1145\/3018661"],"URL":"https:\/\/doi.org\/10.1145\/3018661.3018740","relation":{},"subject":[],"published":{"date-parts":[[2017,2,2]]},"assertion":[{"value":"2017-02-02","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}