{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T17:56:03Z","timestamp":1725558963848},"publisher-location":"Berlin, Heidelberg","reference-count":16,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642142451"},{"type":"electronic","value":"9783642142468"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2010]]},"DOI":"10.1007\/978-3-642-14246-8_58","type":"book-chapter","created":{"date-parts":[[2010,7,6]],"date-time":"2010-07-06T14:09:26Z","timestamp":1278425366000},"page":"595-607","source":"Crossref","is-referenced-by-count":5,"title":["Efficient Duplicate Record Detection Based on Similarity Estimation"],"prefix":"10.1007","author":[{"given":"Mohan","family":"Li","sequence":"first","affiliation":[]},{"given":"Hongzhi","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Jianzhong","family":"Li","sequence":"additional","affiliation":[]},{"given":"Hong","family":"Gao","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"58_CR1","doi-asserted-by":"crossref","unstructured":"Elmagarmid, A.K., Ipeirotis, P.G., Verykios, V.S.: Duplicate record detection: A survey. IEEE Transactions on Knowledge and Data Engineering (2007)","DOI":"10.1109\/TKDE.2007.250581"},{"key":"58_CR2","doi-asserted-by":"crossref","unstructured":"Ristad, E.S., Yianilos, P.N.: Learning String-Edit Distance. IEEE Transactions on Pattern Analysis and Machine Intelligence (May 1998)","DOI":"10.1109\/34.682181"},{"key":"58_CR3","doi-asserted-by":"crossref","unstructured":"Kuhn, H.W.: The hungarian method for the assignment problem. Naval res. Logist. Quart. (1955)","DOI":"10.1002\/nav.3800020109"},{"key":"58_CR4","doi-asserted-by":"crossref","unstructured":"Munkres, J.: Algorithms for the assignment and transportation problems. J. Soc. Indust. App1. Math. (1957)","DOI":"10.1002\/nav.3800040112"},{"key":"58_CR5","doi-asserted-by":"crossref","unstructured":"Bilenko, M., Mooney, R.J.: Adaptive duplicate detection using learnable string similarity measures. In: SIGKDD, pp. 39\u201348 (August 2003)","DOI":"10.1145\/956750.956759"},{"key":"58_CR6","doi-asserted-by":"crossref","unstructured":"Chandel, Hassanzadeh, O., Koudas, N., et al.: Benchmarking declarative approximate selection predicates. In: SIGMOD, pp. 353\u2013364 (June 2007)","DOI":"10.1145\/1247480.1247521"},{"key":"58_CR7","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Ganjam, K., Ganti, V., Motwani, R.: Robust and efficient fuzzy match for online data cleaning. In: SIGMOD, pp. 313\u2013324 (June 2003)","DOI":"10.1145\/872757.872796"},{"issue":"3","key":"58_CR8","doi-asserted-by":"publisher","first-page":"288","DOI":"10.1145\/352595.352598","volume":"18","author":"W.W. Cohen","year":"2000","unstructured":"Cohen, W.W.: Data integration using similarity joins and a word-based information representation language. ACM Trans. on Information Systems\u00a018(3), 288\u2013321 (2000)","journal-title":"ACM Trans. on Information Systems"},{"key":"58_CR9","doi-asserted-by":"crossref","unstructured":"Borkar, V.R., Deshmukh, K., Sarawagi, S.: Automatic segmentation of text into structured records. In: SIGMOD, pp. 175\u2013186 (May 2001)","DOI":"10.1145\/375663.375682"},{"key":"58_CR10","unstructured":"Sarawagi, S., Cohen, W.W.: Semi-markov conditional random fields for information extraction. In: NIPS (December 2004)"},{"key":"58_CR11","doi-asserted-by":"crossref","unstructured":"Viola, P.A., Narasimhan, M.: Learning to extract information from semi-structured text using a discriminative context free grammar. In: SIGIR, pp. 330\u2013337 (August 2005)","DOI":"10.1145\/1076034.1076091"},{"key":"58_CR12","doi-asserted-by":"crossref","unstructured":"Cohen, W.W., Sarawagi, S.: Exploiting dictionaries in named entity extraction: combining semi-markov extraction processes and data integration methods. In: SIGKDD, pp. 89\u201398 (August 2004)","DOI":"10.1145\/1014052.1014065"},{"key":"58_CR13","doi-asserted-by":"crossref","unstructured":"Arasu, Chaudhuri, S., Kaushik, R.: Transformation-based framework for record matching. In: ICDE, pp. 40-49 (April 2008)","DOI":"10.1109\/ICDE.2008.4497412"},{"key":"58_CR14","doi-asserted-by":"crossref","unstructured":"Arasu, Kaushik, R.: A Grammar-based Entity Representation Framework for Data Cleaning. In: SIGMOD, pp. 233\u2013244 (June 2009)","DOI":"10.1145\/1559845.1559871"},{"key":"58_CR15","unstructured":"Mohan, L., Hongzhi, W., Jianzhong, L., Hong, G.: Duplicate Record Detection Method Based on Optimal Bipartite Graph Matching. In: NDBC (October 2009)"},{"key":"58_CR16","volume-title":"Introduction to Machine Learning","author":"E. Alpaydin","year":"2004","unstructured":"Alpaydin, E.: Introduction to Machine Learning. MIT Press, Cambridge (2004)"}],"container-title":["Lecture Notes in Computer Science","Web-Age Information Management"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-14246-8_58.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,24]],"date-time":"2020-11-24T02:49:55Z","timestamp":1606186195000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-14246-8_58"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010]]},"ISBN":["9783642142451","9783642142468"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-14246-8_58","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2010]]}}}