{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:53:35Z","timestamp":1750308815144,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2010,4,26]],"date-time":"2010-04-26T00:00:00Z","timestamp":1272240000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2010,4,26]]},"DOI":"10.1145\/1772690.1772738","type":"proceedings-article","created":{"date-parts":[[2010,4,27]],"date-time":"2010-04-27T12:45:48Z","timestamp":1272372348000},"page":"461-470","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":11,"title":["A scalable machine-learning approach for semi-structured named entity recognition"],"prefix":"10.1145","author":[{"given":"Utku","family":"Irmak","sequence":"first","affiliation":[{"name":"Yahoo! Inc, Santa Clara, CA, USA"}]},{"given":"Reiner","family":"Kraft","sequence":"additional","affiliation":[{"name":"Yahoo! Inc, Sunnyvale, CA, USA"}]}],"member":"320","published-online":{"date-parts":[[2010,4,26]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/336597.336644"},{"key":"e_1_3_2_1_2_1","volume-title":"Proc. of the 1st Intl. Workshop on the Web and Databases","author":"Brin S.","year":"1998","unstructured":"S. Brin . Extracting patterns and relations from the world wide web . In Proc. of the 1st Intl. Workshop on the Web and Databases , 1998 . S. Brin. Extracting patterns and relations from the world wide web. In Proc. of the 1st Intl. Workshop on the Web and Databases, 1998."},{"key":"e_1_3_2_1_3_1","volume-title":"Proc. of the WebDB","author":"Buyukkokten O.","year":"1999","unstructured":"O. Buyukkokten , J. Cho , H. Garcia-Molina , L. Gravano , and N. Shivakumar . Exploiting geographical location information of web pages . In Proc. of the WebDB , 1999 . O. Buyukkokten, J. Cho, H. Garcia-Molina, L. Gravano, and N. Shivakumar. Exploiting geographical location information of web pages. In Proc. of the WebDB, 1999."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/1142473.1142505"},{"key":"e_1_3_2_1_5_1","volume-title":"Proc. of the 3rd Conf. on Innovative Data Systems Research (CIDR)","author":"Cheng T.","year":"2007","unstructured":"T. Cheng and K. C.-C. Chang . Entity search engine: Towards agile best-effort information integration over the web . In Proc. of the 3rd Conf. on Innovative Data Systems Research (CIDR) , 2007 . T. Cheng and K. C.-C. Chang. Entity search engine: Towards agile best-effort information integration over the web. In Proc. of the 3rd Conf. on Innovative Data Systems Research (CIDR), 2007."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.3115\/1119176.1119199"},{"key":"e_1_3_2_1_7_1","volume-title":"Proc. of the Joint SIGDAT Conf. on Empirical Methods in Natural Lang. Processing and Very Large Corpora","author":"Collins M.","year":"1999","unstructured":"M. Collins and Y. Singer . Unsupervised models for named entity classification . In Proc. of the Joint SIGDAT Conf. on Empirical Methods in Natural Lang. Processing and Very Large Corpora , 1999 . M. Collins and Y. Singer. Unsupervised models for named entity classification. In Proc. of the Joint SIGDAT Conf. on Empirical Methods in Natural Lang. Processing and Very Large Corpora, 1999."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.artint.2005.03.001"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/1390681.1442794"},{"key":"e_1_3_2_1_10_1","volume-title":"Proc. of AMIA I2B2NLP workshop","author":"Farkas R.","year":"2006","unstructured":"R. Farkas , G. Szarvas , S. Ivan , K. Andras , and R. Busa-Fekete . An iterative method for the de-identification of structured medical text . In Proc. of AMIA I2B2NLP workshop , 2006 . R. Farkas, G. Szarvas, S. Ivan, K. Andras, and R. Busa-Fekete. An iterative method for the de-identification of structured medical text. In Proc. of AMIA I2B2NLP workshop, 2006."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30586-6_59"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2009.76"},{"key":"e_1_3_2_1_13_1","volume-title":"TREC","author":"Ittycheriah A.","year":"2002","unstructured":"A. Ittycheriah and S. Roukos . Ibm's statistical question answering system-trec 11 . In TREC , 2002 . A. Ittycheriah and S. Roukos. Ibm's statistical question answering system-trec 11. In TREC, 2002."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.3115\/980691.980696"},{"key":"e_1_3_2_1_15_1","volume-title":"Foundations of Statistical Natural Language Processing","author":"Manning C.","year":"1999","unstructured":"C. Manning and H. Schutze . Foundations of Statistical Natural Language Processing . MIT Press , 1999 . C. Manning and H. Schutze. Foundations of Statistical Natural Language Processing. MIT Press, 1999."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/371920.372056"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1242572.1242587"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/1321440.1321510"},{"key":"e_1_3_2_1_19_1","volume-title":"Proc. of Natl. Conf. on AI","author":"Pasca M.","year":"2006","unstructured":"M. Pasca , D. Lin , J. Bigham , A. Lifchits , and A. Jain . Organizing and searching the world wide web of facts - step one: the one-million fact extraction challenge . In Proc. of Natl. Conf. on AI , 2006 . M. Pasca, D. Lin, J. Bigham, A. Lifchits, and A. Jain. Organizing and searching the world wide web of facts - step one: the one-million fact extraction challenge. In Proc. of Natl. Conf. on AI, 2006."},{"key":"e_1_3_2_1_20_1","unstructured":"Perl Compatible Regular Expressions. http:\/\/www.pcre.org.  Perl Compatible Regular Expressions. http:\/\/www.pcre.org."},{"key":"e_1_3_2_1_21_1","volume-title":"Proc. of Conf. on Artificial Intelligence","author":"Riloff E.","year":"1993","unstructured":"E. Riloff . Automatically constructing a dictionary for information extraction tasks . In Proc. of Conf. on Artificial Intelligence , 1993 . E. Riloff. Automatically constructing a dictionary for information extraction tasks. In Proc. of Conf. on Artificial Intelligence, 1993."},{"key":"e_1_3_2_1_22_1","volume-title":"Proc. of Conf. on Artificial Intelligence","author":"Riloff E.","year":"1999","unstructured":"E. Riloff and R. Jones . Learning dictionaries for information extraction by multi-level bootstrapping . In Proc. of Conf. on Artificial Intelligence , 1999 . E. Riloff and R. Jones. Learning dictionaries for information extraction by multi-level bootstrapping. In Proc. of Conf. on Artificial Intelligence, 1999."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1016\/0306-4573(88)90021-0"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2008.05.002"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.datak.2005.05.011"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1162\/089976601750264965"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/964442.964521"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.3115\/1118693.1118721"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.5555\/645328.650004"},{"key":"e_1_3_2_1_30_1","first-page":"14","article-title":"Evaluating the state-of-the-art in automatic de-identification","author":"Uzuner O.","year":"2007","unstructured":"O. Uzuner , Y. Luo , and P. Szolovits . Evaluating the state-of-the-art in automatic de-identification . Journal of the American Medical Informatics Association , 14 , 2007 . O. Uzuner, Y. Luo, and P. Szolovits. Evaluating the state-of-the-art in automatic de-identification. Journal of the American Medical Informatics Association, 14, 2007.","journal-title":"Journal of the American Medical Informatics Association"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/1321440.1321537"}],"event":{"name":"WWW '10: The 19th International World Wide Web Conference","acronym":"WWW '10","location":"Raleigh North Carolina USA"},"container-title":["Proceedings of the 19th international conference on World wide web"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1772690.1772738","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1772690.1772738","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T20:26:29Z","timestamp":1750278389000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1772690.1772738"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,4,26]]},"references-count":31,"alternative-id":["10.1145\/1772690.1772738","10.1145\/1772690"],"URL":"https:\/\/doi.org\/10.1145\/1772690.1772738","relation":{},"subject":[],"published":{"date-parts":[[2010,4,26]]},"assertion":[{"value":"2010-04-26","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}