{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:13:18Z","timestamp":1750306398478,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,8,10]],"date-time":"2015-08-10T00:00:00Z","timestamp":1439164800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,8,10]]},"DOI":"10.1145\/2783258.2788580","type":"proceedings-article","created":{"date-parts":[[2015,8,7]],"date-time":"2015-08-07T15:38:27Z","timestamp":1438961907000},"page":"2257-2266","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":20,"title":["Annotating Needles in the Haystack without Looking"],"prefix":"10.1145","author":[{"given":"Weinan","family":"Zhang","sequence":"first","affiliation":[{"name":"University College London, London, United Kingdom"}]},{"given":"Amr","family":"Ahmed","sequence":"additional","affiliation":[{"name":"Google Inc., Mountain View, CA, USA"}]},{"given":"Jie","family":"Yang","sequence":"additional","affiliation":[{"name":"Google Inc., Mountain View, CA, USA"}]},{"given":"Vanja","family":"Josifovski","sequence":"additional","affiliation":[{"name":"Pinterest, San Francisco, CA, USA"}]},{"given":"Alex J.","family":"Smola","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, PA, USA"}]}],"member":"320","published-online":{"date-parts":[[2015,8,10]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2433396.2433447"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/18.825794"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/1137983.1138016"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-009-9109-6"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1010933404324"},{"key":"e_1_3_2_1_6_1","first-page":"103","volume-title":"ICML","author":"Brutlag J. D.","year":"2000","unstructured":"J. D. Brutlag and C. Meek . Challenges of the email domain for text classification . In ICML , pages 103 -- 110 , 2000 . J. D. Brutlag and C. Meek. Challenges of the email domain for text classification. In ICML, pages 103--110, 2000."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/876878.879311"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/371920.372182"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1561\/1500000006"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1022627411411"},{"key":"e_1_3_2_1_11_1","first-page":"77","volume-title":"ISMB","volume":"1999","author":"Craven M.","year":"1999","unstructured":"M. Craven , J. Kumlien , Constructing biological knowledge bases by extracting information from text sources . In ISMB , volume 1999 , pages 77 -- 86 , 1999 . M. Craven, J. Kumlien, et al. Constructing biological knowledge bases by extracting information from text sources. In ISMB, volume 1999, pages 77--86, 1999."},{"key":"e_1_3_2_1_12_1","first-page":"109","volume-title":"VLDB","volume":"1","author":"Crescenzi V.","year":"2001","unstructured":"V. Crescenzi , G. Mecca , P. Merialdo , : Towards automatic data extraction from large web sites . In VLDB , volume 1 , pages 109 -- 118 , 2001 . V. Crescenzi, G. Mecca, P. Merialdo, et al. Roadrunner: Towards automatic data extraction from large web sites. In VLDB, volume 1, pages 109--118, 2001."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.14778\/1938545.1938547"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10588-005-5377-0"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/304181.304223"},{"key":"e_1_3_2_1_16_1","first-page":"1","volume-title":"Multivariate adaptive regression splines. The annals of statistics","author":"Friedman J. H.","year":"1991","unstructured":"J. H. Friedman . Multivariate adaptive regression splines. The annals of statistics , pages 1 -- 67 , 1991 . J. H. Friedman. Multivariate adaptive regression splines. The annals of statistics, pages 1--67, 1991."},{"key":"e_1_3_2_1_17_1","first-page":"2001","article-title":"Posterior regularization for structured latent variable models","volume":"99","author":"Ganchev K.","year":"2010","unstructured":"K. Ganchev , J. Graica , J. Gillenwater , and B. Taskar . Posterior regularization for structured latent variable models . JMLR , 99 : 2001 -- 2049 , 2010 . K. Ganchev, J. Graica, J. Gillenwater, and B. Taskar. Posterior regularization for structured latent variable models. JMLR, 99:2001--2049, 2010.","journal-title":"JMLR"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/775152.775182"},{"key":"e_1_3_2_1_19_1","first-page":"1489","volume-title":"EMNLP","author":"Hall K.","year":"2011","unstructured":"K. Hall , R. McDonald , J. Katz-Brown , and M. Ringgaard . Training dependency parsers by jointly optimizing multiple objectives . In EMNLP , pages 1489 -- 1499 , 2011 . K. Hall, R. McDonald, J. Katz-Brown, and M. Ringgaard. Training dependency parsers by jointly optimizing multiple objectives. In EMNLP, pages 1489--1499, 2011."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-21606-5"},{"key":"e_1_3_2_1_21_1","volume-title":"ACL","author":"Hoffmann R.","year":"2011","unstructured":"R. Hoffmann , C. Zhang , X. Ling , L. Zettlemoyer , and D. S. Weld . Knowledge-based weak supervision for information extraction of overlapping relations . In ACL , 2011 . R. Hoffmann, C. Zhang, X. Ling, L. Zettlemoyer, and D. S. Weld. Knowledge-based weak supervision for information extraction of overlapping relations. In ACL, 2011."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1021765131316"},{"key":"e_1_3_2_1_23_1","first-page":"897","volume-title":"NIPS","author":"Jin R.","year":"2002","unstructured":"R. Jin and Z. Ghahramani . Learning with multiple labels . In NIPS , pages 897 -- 904 , 2002 . R. Jin and Z. Ghahramani. Learning with multiple labels. In NIPS, pages 897--904, 2002."},{"key":"e_1_3_2_1_24_1","first-page":"301","volume-title":"CASCON","author":"Kiritchenko S.","year":"2011","unstructured":"S. Kiritchenko and S. Matwin . Email classification with co-training . In CASCON , pages 301 -- 312 . IBM Corp. , 2011 . S. Kiritchenko and S. Matwin. Email classification with co-training. In CASCON, pages 301--312. IBM Corp., 2011."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.3115\/1220175.1220278"},{"key":"e_1_3_2_1_26_1","unstructured":"B. Klimt and Y. Yang. The enron corpus: A new dataset for email classification research.  B. Klimt and Y. Yang. The enron corpus: A new dataset for email classification research."},{"key":"e_1_3_2_1_27_1","first-page":"703","volume-title":"IICAI","author":"Kulkarni A.","year":"2005","unstructured":"A. Kulkarni and T. Pedersen . Name discrimination and email clustering using unsupervised clustering and labeling of similar contexts . In IICAI , pages 703 -- 722 , 2005 . A. Kulkarni and T. Pedersen. Name discrimination and email clustering using unsupervised clustering and labeling of similar contexts. In IICAI, pages 703--722, 2005."},{"key":"e_1_3_2_1_28_1","volume-title":"ICML","author":"Lafferty J.","year":"2001","unstructured":"J. Lafferty , A. McCallum , and F. C. Pereira . Conditional random fields: Probabilistic models for segmenting and labeling sequence data . In ICML , 2001 . J. Lafferty, A. McCallum, and F. C. Pereira. Conditional random fields: Probabilistic models for segmenting and labeling sequence data. In ICML, 2001."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2006.16"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956826"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.5555\/1756006.1756038"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.5555\/1690219.1690287"},{"key":"e_1_3_2_1_33_1","volume-title":"Classification and regression trees","author":"Olshen L. B. J. F. R.","year":"1984","unstructured":"L. B. J. F. R. Olshen and C. J. Stone . Classification and regression trees . Wadsworth International Group , 1984 . L. B. J. F. R. Olshen and C. J. Stone. Classification and regression trees. Wadsworth International Group, 1984."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/1321440.1321536"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1214\/09-AOS691"},{"key":"e_1_3_2_1_36_1","volume-title":"Generalized boosted regression models. Documentation on the R Package 'gbm', version, 1(5):7","author":"Ridgeway G.","year":"2006","unstructured":"G. Ridgeway . Generalized boosted regression models. Documentation on the R Package 'gbm', version, 1(5):7 , 2006 . G. Ridgeway. Generalized boosted regression models. Documentation on the R Package 'gbm', version, 1(5):7, 2006."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.5555\/1889788.1889799"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/1348549.1348562"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"A. M. Rush. A tutorial on dual decomposition and lagrangian relaxation for inference in natural language processing. 2012.  A. M. Rush. A tutorial on dual decomposition and lagrangian relaxation for inference in natural language processing. 2012.","DOI":"10.1613\/jair.3680"},{"key":"e_1_3_2_1_40_1","first-page":"1","volume-title":"EMNLP","author":"Rush A. M.","year":"2010","unstructured":"A. M. Rush , D. Sontag , M. Collins , and T. Jaakkola . On dual decomposition and linear programming relaxations for natural language processing . In EMNLP , pages 1 -- 11 , 2010 . A. M. Rush, D. Sontag, M. Collins, and T. Jaakkola. On dual decomposition and linear programming relaxations for natural language processing. In EMNLP, pages 1--11, 2010."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.5555\/1764441.1764536"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/1557019.1557124"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4020-6264-3_67"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/1060745.1060761"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/1102351.1102483"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/1150402.1150457"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.5555\/1390681.1442784"},{"key":"e_1_3_2_1_48_1","first-page":"3","article-title":"Semi-supervised learning literature survey. Computer Science","volume":"2","author":"Zhu X.","year":"2006","unstructured":"X. Zhu . Semi-supervised learning literature survey. Computer Science , University of Wisconsin-Madison , 2 : 3 , 2006 . X. Zhu. Semi-supervised learning literature survey. Computer Science, University of Wisconsin-Madison, 2:3, 2006.","journal-title":"University of Wisconsin-Madison"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.5555\/1717872"}],"event":{"name":"KDD '15: The 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"],"location":"Sydney NSW Australia","acronym":"KDD '15"},"container-title":["Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2783258.2788580","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2783258.2788580","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T05:07:24Z","timestamp":1750223244000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2783258.2788580"}},"subtitle":["Product Information Extraction from Emails"],"short-title":[],"issued":{"date-parts":[[2015,8,10]]},"references-count":49,"alternative-id":["10.1145\/2783258.2788580","10.1145\/2783258"],"URL":"https:\/\/doi.org\/10.1145\/2783258.2788580","relation":{},"subject":[],"published":{"date-parts":[[2015,8,10]]},"assertion":[{"value":"2015-08-10","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}