{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T05:12:11Z","timestamp":1755925931021,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":38,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,8,9]],"date-time":"2015-08-09T00:00:00Z","timestamp":1439078400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,8,9]]},"DOI":"10.1145\/2766462.2767739","type":"proceedings-article","created":{"date-parts":[[2015,8,4]],"date-time":"2015-08-04T13:57:50Z","timestamp":1438696670000},"page":"423-432","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":32,"title":["Learning to Extract Local Events from the Web"],"prefix":"10.1145","author":[{"given":"John","family":"Foley","sequence":"first","affiliation":[{"name":"University of Massachusetts, Amherst, MA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michael","family":"Bendersky","sequence":"additional","affiliation":[{"name":"Google, Mountain View, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vanja","family":"Josifovski","sequence":"additional","affiliation":[{"name":"Pinterest, San Francisco, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2015,8,9]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.14778\/2536336.2536343"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-41338-4_2"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/1897816.1897839"},{"key":"e_1_3_2_1_5_1","volume-title":"DTIC Document","author":"Dean-Hall A.","year":"2013","unstructured":"A. Dean-Hall , C. L. Clarke , J. Kamps , P. Thomas , N. Simone , and E. Voorhees . Overview of the trec 2013 contextual suggestion track. Technical report , DTIC Document , 2013 . A. Dean-Hall, C. L. Clarke, J. Kamps, P. Thomas, N. Simone, and E. Voorhees. Overview of the trec 2013 contextual suggestion track. Technical report, DTIC Document, 2013."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/1390681.1442794"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/2479832.2479845"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10816-2_35"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.14778\/1687627.1687661"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/775152.775182"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.artint.2012.06.001"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.datak.2009.10.002"},{"key":"e_1_3_2_1_13_1","volume-title":"Proceedings of the Workshop on Pattern Recognition in Practice","author":"Jelinek F.","year":"1980","unstructured":"F. Jelinek and R. L. Mercer . Interpolated estimation of markov source parameters from sparse data . In Proceedings of the Workshop on Pattern Recognition in Practice , 1980 . F. Jelinek and R. L. Mercer. Interpolated estimation of markov source parameters from sparse data. In Proceedings of the Workshop on Pattern Recognition in Practice, 1980."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ASONAM.2009.41"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/2661829.2661984"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2484028.2484123"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.14778\/1920841.1921005"},{"key":"e_1_3_2_1_18_1","first-page":"788","volume-title":"Communication and Conservation of Energy (ICGCE), 2013 International Conference on","author":"Manjula R.","year":"2013","unstructured":"R. Manjula and A. Chilambuchelvan . Extracting templates from web pages. In Green Computing , Communication and Conservation of Energy (ICGCE), 2013 International Conference on , pages 788 -- 791 . IEEE, 2013 . R. Manjula and A. Chilambuchelvan. Extracting templates from web pages. In Green Computing, Communication and Conservation of Energy (ICGCE), 2013 International Conference on, pages 788--791. IEEE, 2013."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/P14-5010"},{"key":"e_1_3_2_1_20_1","first-page":"646","volume-title":"ACL'12","author":"Metzler D.","year":"2012","unstructured":"D. Metzler , C. Cai , and E. Hovy . Structured event retrieval over microblog archives . In ACL'12 , pages 646 -- 655 . Association for Computational Linguistics , 2012 . D. Metzler, C. Cai, and E. Hovy. Structured event retrieval over microblog archives. In ACL'12, pages 646--655. Association for Computational Linguistics, 2012."},{"key":"e_1_3_2_1_21_1","first-page":"937","article-title":"Web data commons-extracting structured data from two large web corpora","author":"M\u00fchleisen H.","year":"2012","unstructured":"H. M\u00fchleisen and C. Bizer . Web data commons-extracting structured data from two large web corpora . LDOW , 937 , 2012 . H. M\u00fchleisen and C. Bizer. Web data commons-extracting structured data from two large web corpora. LDOW, 937, 2012.","journal-title":"LDOW"},{"key":"e_1_3_2_1_22_1","volume-title":"Learning regular expressions for the extraction of product attributes from e-commerce microdata","author":"Petrovski P.","year":"2014","unstructured":"P. Petrovski , V. Bryl , and C. Bizer . Learning regular expressions for the extraction of product attributes from e-commerce microdata . 2014 . P. Petrovski, V. Bryl, and C. Bizer. Learning regular expressions for the extraction of product attributes from e-commerce microdata. 2014."},{"key":"e_1_3_2_1_23_1","volume-title":"Masarykova univerzita, Fakulta informatiky","author":"Pomik\u00e1lek J.","year":"2011","unstructured":"J. Pomik\u00e1lek . Removing boilerplate and duplicate content from web corpora. Disertacn\u0131 pr\u00e1ce , Masarykova univerzita, Fakulta informatiky , 2011 . J. Pomik\u00e1lek. Removing boilerplate and duplicate content from web corpora. Disertacn\u0131 pr\u00e1ce, Masarykova univerzita, Fakulta informatiky, 2011."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/290941.291008"},{"key":"e_1_3_2_1_25_1","first-page":"40","volume-title":"Corpus linguistics","author":"Gaizauskas R.","year":"2003","unstructured":"J. Pustejovsky, P. Hanks, R. Sauri, A. See, R. Gaizauskas , A. Setzer , D. Radev , B. Sundheim , D. Day , L. Ferro , The timebank corpus . In Corpus linguistics , volume 2003 , page 40 , 2003 . J. Pustejovsky, P. Hanks, R. Sauri, A. See, R. Gaizauskas, A. Setzer, D. Radev, B. Sundheim, D. Day, L. Ferro, et al. The timebank corpus. In Corpus linguistics, volume 2003, page 40, 2003."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/1772690.1772777"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-11964-9_16"},{"key":"e_1_3_2_1_28_1","volume-title":"Trinity: on using trinary trees for unsupervised web data extraction","author":"Sleiman H.","year":"2013","unstructured":"H. Sleiman and R. Corchuelo . Trinity: on using trinary trees for unsupervised web data extraction . 2013 . H. Sleiman and R. Corchuelo. Trinity: on using trinary trees for unsupervised web data extraction. 2013."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2012.135"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2012.10.009"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/564376.564391"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/544220.544260"},{"key":"e_1_3_2_1_33_1","first-page":"321","volume-title":"Workshop on Semantic Evaluation, ACL","author":"Str\u00f6tgen J.","year":"2010","unstructured":"J. Str\u00f6tgen and M. Gertz . Heideltime: High quality rule-based extraction and normalization of temporal expressions . In Workshop on Semantic Evaluation, ACL , pages 321 -- 324 , 2010 . J. Str\u00f6tgen and M. Gertz. Heideltime: High quality rule-based extraction and normalization of temporal expressions. In Workshop on Semantic Evaluation, ACL, pages 321--324, 2010."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11280-013-0248-y"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSEC.2014.6978209"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/2063576.2064014"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1080\/00949658208810560"},{"key":"e_1_3_2_1_38_1","volume-title":"Master's thesis","author":"Z. Yu.","year":"2007","unstructured":"Z. Yu. High accuracy postal address extraction from web pages. Master's thesis , Dalhousie University , Halifax, Nova Scotia, 2007 . Z. Yu. High accuracy postal address extraction from web pages. Master's thesis, Dalhousie University, Halifax, Nova Scotia, 2007."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-11964-9_31"}],"event":{"name":"SIGIR '15: The 38th International ACM SIGIR conference on research and development in Information Retrieval","sponsor":["SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Santiago Chile","acronym":"SIGIR '15"},"container-title":["Proceedings of the 38th International ACM SIGIR Conference on Research and Development in Information Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2766462.2767739","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2766462.2767739","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T09:20:59Z","timestamp":1750238459000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2766462.2767739"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,8,9]]},"references-count":38,"alternative-id":["10.1145\/2766462.2767739","10.1145\/2766462"],"URL":"https:\/\/doi.org\/10.1145\/2766462.2767739","relation":{},"subject":[],"published":{"date-parts":[[2015,8,9]]},"assertion":[{"value":"2015-08-09","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}