{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T14:45:12Z","timestamp":1725806712493},"publisher-location":"Cham","reference-count":20,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319119878"},{"type":"electronic","value":"9783319119885"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-11988-5_24","type":"book-chapter","created":{"date-parts":[[2014,10,8]],"date-time":"2014-10-08T13:15:40Z","timestamp":1412774140000},"page":"253-264","source":"Crossref","is-referenced-by-count":1,"title":["Entity Recognition for Duplicate Filtering"],"prefix":"10.1007","author":[{"given":"J. A.","family":"Cordero Cruz","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sara E.","family":"Garza","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"S. E.","family":"Schaeffer","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"24_CR1","doi-asserted-by":"crossref","unstructured":"Agarwal, P., Vaithiyanathan, R., Sharma, S., Shroff, G.: Catching the long-tail: Extracting local news events from Twitter. In: Proc. of the 6th International AAAI Conference on Weblogs and Social Media, Palo Alto, CA, USA, pp. 379\u2013382. AAAI (2012)","DOI":"10.1609\/icwsm.v6i1.14317"},{"key":"24_CR2","volume-title":"Modern information retrieval","author":"R. Baeza-Yates","year":"1999","unstructured":"Baeza-Yates, R., Ribeiro-Neto, B.: Modern information retrieval. ACM Press, New York (1999)"},{"key":"24_CR3","series-title":"Information Science and Statistics","volume-title":"Pattern Recognition and Machine Learning","author":"C. Bishop","year":"2006","unstructured":"Bishop, C.: Pattern Recognition and Machine Learning. Information Science and Statistics. Springer, New York (2006)"},{"key":"24_CR4","doi-asserted-by":"crossref","unstructured":"Church, K.: A stochastic parts program and noun phrase parser for unrestricted text. In: Proc. of the 2nd Conference on Applied Natural Language Processing, Stroudsburg, PA, USA, pp. 136\u2013143. Association for Computational Linguistics (1988)","DOI":"10.3115\/974235.974260"},{"key":"24_CR5","volume-title":"Pattern Classification","author":"R. Duda","year":"2000","unstructured":"Duda, R., Hart, P., Stork, D.: Pattern Classification, 2nd edn. Wiley-Interscience, New York (2000)","edition":"2"},{"key":"24_CR6","first-page":"1851","volume":"10","author":"R. Esposito","year":"2009","unstructured":"Esposito, R., Radicioni, D.: CarpeDiem: Optimizing the Viterbi algorithm and applications to supervised sequential learning. The Journal of Machine Learning Research\u00a010, 1851\u20131880 (2009)","journal-title":"The Journal of Machine Learning Research"},{"key":"24_CR7","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"877","DOI":"10.1007\/978-3-540-68125-0_87","volume-title":"Advances in Knowledge Discovery and Data Mining","author":"C. Gong","year":"2008","unstructured":"Gong, C., Huang, Y., Cheng, X., Bai, S.: Detecting near-duplicates in large-scale short text databases. In: Washio, T., Suzuki, E., Ting, K.M., Inokuchi, A. (eds.) PAKDD 2008. LNCS (LNAI), vol.\u00a05012, pp. 877\u2013883. Springer, Heidelberg (2008)"},{"issue":"4","key":"24_CR8","doi-asserted-by":"publisher","first-page":"381","DOI":"10.1145\/356827.356830","volume":"12","author":"P. Hall","year":"1980","unstructured":"Hall, P., Dowling, G.: Approximate string matching. ACM Computing Surveys\u00a012(4), 381\u2013402 (1980)","journal-title":"ACM Computing Surveys"},{"key":"24_CR9","series-title":"Springer Series in Statistics","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-84858-7","volume-title":"The Elements of Statistical Learning: Data Mining, Inference, and Prediction","author":"T. Hastie","year":"2009","unstructured":"Hastie, T., Tibshirani, R., Friedman, J.: The Elements of Statistical Learning: Data Mining, Inference, and Prediction, 2nd edn. Springer Series in Statistics. Springer, New York (2009)","edition":"2"},{"key":"24_CR10","volume-title":"Speech and Language Processing: An Introduction to Natural Language Processing, Computational Linguistics, and Speech Recognition","author":"D. Jurafsky","year":"2000","unstructured":"Jurafsky, D., Martin, J.: Speech and Language Processing: An Introduction to Natural Language Processing, Computational Linguistics, and Speech Recognition. Prentice Hall PTR, Upper Saddle River (2000)"},{"key":"24_CR11","first-page":"707","volume":"10","author":"V. Levenshtein","year":"1966","unstructured":"Levenshtein, V.: Binary codes capable of correcting deletions, insertions and reversals. Soviet Physics Doklady\u00a010, 707 (1966)","journal-title":"Soviet Physics Doklady"},{"key":"24_CR12","doi-asserted-by":"crossref","unstructured":"Manning, C., Raghavan, P., Sch\u00fctze, H.: Introduction to Information Retrieval. Cambridge University Press (2008)","DOI":"10.1017\/CBO9780511809071"},{"key":"24_CR13","unstructured":"Ponomareva, N., Rosso, P., Pla, F., Molina, A.: Conditional random fields vs. hidden Markov models in a biomedical named entity recognition task. In: Proc. of International Conference Recent Advances in Natural Language Processing, Borovets, Bulgaria, pp. 479\u2013483. RANLP 2007 Organising Committee (2007)"},{"key":"24_CR14","doi-asserted-by":"crossref","unstructured":"Ratinov, L., Roth, D.: Design challenges and misconceptions in named entity recognition. In: Proc. of the 13th Conference on Computational Natural Language Learning, Stroudsburg, PA, USA, pp. 147\u2013155. Association for Computational Linguistics (2009)","DOI":"10.3115\/1596374.1596399"},{"key":"24_CR15","unstructured":"Ritter, A., Clark, S., Mausam, Etzioni, O.: Named entity recognition in tweets: An experimental study. In: Proc. of the Conference on Empirical Methods in Natural Language Processing, Stroudsburg, PA, USA, pp. 1524\u20131534. Association for Computational Linguistics (2011)"},{"key":"24_CR16","volume-title":"A first course in probability","author":"S. Ross","year":"2010","unstructured":"Ross, S.: A first course in probability. Pearson Prentice Hall, Harlow (2010)"},{"key":"24_CR17","first-page":"42","volume-title":"Proc. of the 17th ACM SIGSPATIAL International Conference on Advances in Geographic Information Systems","author":"J. Sankaranarayanan","year":"2009","unstructured":"Sankaranarayanan, J., Samet, H., Teitler, B., Lieberman, M., Sperling, J.: TwitterStand: News in tweets. In: Proc. of the 17th ACM SIGSPATIAL International Conference on Advances in Geographic Information Systems, pp. 42\u201351. ACM, New York (2009)"},{"key":"24_CR18","doi-asserted-by":"crossref","unstructured":"Schleimer, S., Wilkerson, D.S., Aiken, A.: Winnowing: local algorithms for document fingerprinting. In: Proc. of the 2003 ACM SIGMOD International Conference on Management of Data, New York, NY, USA, pp. 76\u201385. ACM (2003)","DOI":"10.1145\/872757.872770"},{"key":"24_CR19","doi-asserted-by":"crossref","unstructured":"Tao, K., Abel, F., Hauff, C., Houben, G.-J., Gadiraju, U.: Groundhog Day: Near-duplicate Detection on Twitter. In: Proc. of the 22nd International Conference on World Wide Web, Republic and Canton of Geneva, Switzerland, pp. 1273\u20131284. International World Wide Web Conferences Steering Committee (2013)","DOI":"10.1145\/2488388.2488499"},{"key":"24_CR20","doi-asserted-by":"crossref","unstructured":"Weis, M., Naumann, F.: DogmatiX tracks down duplicates in xml. In: Proc. of the 2005 ACM SIGMOD International Conference on Management of Data, New York, NY, USA, pp. 431\u2013442. ACM (2005)","DOI":"10.1145\/1066157.1066207"}],"container-title":["Lecture Notes in Computer Science","Similarity Search and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-11988-5_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,17]],"date-time":"2023-07-17T03:38:23Z","timestamp":1689565103000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-11988-5_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319119878","9783319119885"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-11988-5_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}