{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:35:31Z","timestamp":1750307731931,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":25,"publisher":"ACM","license":[{"start":{"date-parts":[[2009,6,28]],"date-time":"2009-06-28T00:00:00Z","timestamp":1246147200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2009,6,28]]},"DOI":"10.1145\/1557019.1557163","type":"proceedings-article","created":{"date-parts":[[2009,6,30]],"date-time":"2009-06-30T13:10:54Z","timestamp":1246367454000},"page":"1345-1354","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":31,"title":["Can we learn a template-independent wrapper for news article extraction from a single training site?"],"prefix":"10.1145","author":[{"given":"Junfeng","family":"Wang","sequence":"first","affiliation":[{"name":"Zhejiang Key Lab. of Service Robot, College of Computer Science, Zhejiang University, Hangzhou, China"}]},{"given":"Chun","family":"Chen","sequence":"additional","affiliation":[{"name":"Zhejiang Key Lab. of Service Robot, College of Computer Science, Zhejiang University, Hangzhou, China"}]},{"given":"Can","family":"Wang","sequence":"additional","affiliation":[{"name":"Zhejiang Key Lab. of Service Robot, College of Computer Science, Zhejiang University, Hangzhou, China"}]},{"given":"Jian","family":"Pei","sequence":"additional","affiliation":[{"name":"School of Computer Science, Simon Fraser University, Vancouver, Canada"}]},{"given":"Jiajun","family":"Bu","sequence":"additional","affiliation":[{"name":"Zhejiang Key Lab. of Service Robot, College of Computer Science, Zhejiang University, Hangzhou, China"}]},{"given":"Ziyu","family":"Guan","sequence":"additional","affiliation":[{"name":"Zhejiang Key Lab. of Service Robot, College of Computer Science, Zhejiang University, Hangzhou, China"}]},{"given":"Wei Vivian","family":"Zhang","sequence":"additional","affiliation":[{"name":"Microsoft Research, Redmond, WA, USA"}]}],"member":"320","published-online":{"date-parts":[[2009,6,28]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/872757.872799"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.5555\/1025132.1026338"},{"key":"e_1_3_2_2_3_1","volume-title":"VLDB'01","author":"Crescenzi G. M. P.","year":"2001","unstructured":"G. M. P. Crescenzi , V. Mecca . Roadrunner : Towards automatic data extraction from large web sites . In VLDB'01 , 2001 . G. M. P. Crescenzi, V. Mecca. Roadrunner: Towards automatic data extraction from large web sites. In VLDB'01, 2001."},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.5555\/1218702.1218707"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/775152.775182"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/306766.306775"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/1076034.1076079"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1135777.1135859"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/1242572.1242759"},{"key":"e_1_3_2_2_10_1","volume-title":"WWW'95","author":"Kamba K. A. M. C.","year":"1995","unstructured":"K. A. M. C. Kamba , T. Bharat . An interactive, personalized, newspaper on the www . In WWW'95 , 1995 . K. A. M. C. Kamba, T. Bharat. An interactive, personalized, newspaper on the www. In WWW'95, 1995."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00100-9"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/565117.565137"},{"key":"e_1_3_2_2_13_1","volume-title":"WWW'05","author":"Liu B.","year":"2005","unstructured":"B. Liu . Web content mining (tutorial) . In WWW'05 , 2005 . B. Liu. Web content mining (tutorial). In WWW'05, 2005."},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/301136.301191"},{"key":"e_1_3_2_2_15_1","volume-title":"Advances in Large Margin Classifiers","author":"Platt J. C.","year":"1999","unstructured":"J. C. Platt . Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods . Advances in Large Margin Classifiers , 1999 . J. C. Platt. Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods. Advances in Large Margin Classifiers, 1999."},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/988672.988740"},{"key":"e_1_3_2_2_17_1","volume-title":"VLDB'02","author":"Sarawagi S.","year":"2002","unstructured":"S. Sarawagi . Automation in information extraction and data integration (tutorial) . In VLDB'02 , 2002 . S. Sarawagi. Automation in information extraction and data integration (tutorial). In VLDB'02, 2002."},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1016\/0020-0190(77)90064-3"},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/354384.376098"},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/988672.988700"},{"key":"e_1_3_2_2_21_1","first-page":"831","volume-title":"NIPS'91","author":"Vapnik V.","year":"1991","unstructured":"V. Vapnik . Principles of risk minimization for learning theory . In NIPS'91 , pages 831 -- 838 , 1991 . V. Vapnik. Principles of risk minimization for learning theory. In NIPS'91, pages 831--838, 1991."},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/1060745.1060761"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/1060745.1060760"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/1281192.1281286"},{"key":"e_1_3_2_2_25_1","first-page":"1507","volume-title":"AAAI'07","volume":"22","author":"Zheng S.","year":"2007","unstructured":"S. Zheng , R. Song , and J. Wen . Template-independent news extraction based on visual consistency . In AAAI'07 , volume 22 , pages 1507 -- 1513 , 2007 . S. Zheng, R. Song, and J. Wen. Template-independent news extraction based on visual consistency. In AAAI'07, volume 22, pages 1507--1513, 2007."}],"event":{"name":"KDD09: The 15th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","ACM Association for Computing Machinery"],"location":"Paris France","acronym":"KDD09"},"container-title":["Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1557019.1557163","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1557019.1557163","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T13:38:42Z","timestamp":1750253922000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1557019.1557163"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,6,28]]},"references-count":25,"alternative-id":["10.1145\/1557019.1557163","10.1145\/1557019"],"URL":"https:\/\/doi.org\/10.1145\/1557019.1557163","relation":{},"subject":[],"published":{"date-parts":[[2009,6,28]]},"assertion":[{"value":"2009-06-28","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}