{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,4]],"date-time":"2025-01-04T22:10:30Z","timestamp":1736028630700,"version":"3.32.0"},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540297383"},{"type":"electronic","value":"9783540321200"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2005]]},"DOI":"10.1007\/11575801_19","type":"book-chapter","created":{"date-parts":[[2005,10,10]],"date-time":"2005-10-10T17:41:20Z","timestamp":1128966080000},"page":"1225-1242","source":"Crossref","is-referenced-by-count":1,"title":["Probabilistic Iterative Duplicate Detection"],"prefix":"10.1007","author":[{"given":"Patrick","family":"Lehti","sequence":"first","affiliation":[]},{"given":"Peter","family":"Fankhauser","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"doi-asserted-by":"crossref","unstructured":"Galhardas, H., Florescu, D., Shasha, D., Simon, E.: An extensible framework for data cleaning. In: Proceddings of the 16th International Conference on Data Engineering (ICDE 2000), p. 312 (2000)","key":"19_CR1","DOI":"10.1109\/ICDE.2000.839429"},{"key":"19_CR2","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1023\/A:1009761603038","volume":"2","author":"M.A. Hernandez","year":"1998","unstructured":"Hernandez, M.A., Stolfo, S.J.: Real-world data is dirty: Data cleansing and the merge\/purge problem. Data Mining and Knowledge Discovery\u00a02, 9\u201337 (1998)","journal-title":"Data Mining and Knowledge Discovery"},{"key":"19_CR3","doi-asserted-by":"crossref","first-page":"414","DOI":"10.1080\/01621459.1989.10478785","volume":"84","author":"M. Jaro","year":"1989","unstructured":"Jaro, M.: Advances in record linkage methodology as applied to matching the 1985 census of tampa. Journal of the American Statistical Society\u00a084, 414\u2013420 (1989)","journal-title":"Journal of the American Statistical Society"},{"unstructured":"Monge, A., Elkan, C.: An efficient domain independent algorithm for detecting approximately duplicate database records. In: Proceedings of the SIGMOD Workshop on Data Mining and Knowledge Discovery (1997)","key":"19_CR4"},{"unstructured":"Cohen, W.W., Ravikumar, P., Fienberg, S.E.: A comparison of string metrics for matching names and records. In: Proceedings of the KDD 2003 Workshop on Data Cleaning, Record Linkage, and Object Consolidation, Washington, DC, pp. 13\u201318 (2003)","key":"19_CR5"},{"unstructured":"Bilenko, M., Mooney, R.J.: Learning to combine trained distance metrics for duplicate detection in databases. Technical Report AI 02-296, Artificial Intelligence Laboratory, University of Texas at Austin, Austin, TX (2002)","key":"19_CR6"},{"key":"19_CR7","doi-asserted-by":"publisher","first-page":"522","DOI":"10.1109\/34.682181","volume":"20","author":"E.S. Ristad","year":"1998","unstructured":"Ristad, E.S., Yianilos, P.N.: Learning string-edit distance. IEEE Transactions on Pattern Analysis and Machine Intelligence\u00a020, 522\u2013532 (1998)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"doi-asserted-by":"crossref","unstructured":"Cohen, W.W., Richman, J.: Learning to match and cluster large high-dimensional data sets for data integration. In: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (KDD 2002), Edmonton, Alberta (2002)","key":"19_CR8","DOI":"10.1145\/775047.775116"},{"doi-asserted-by":"crossref","unstructured":"Sarawagi, S., Bhamidipaty, A.: Interactive deduplication using active learning. In: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (KDD 2002), Edmonton, Alberta (2002)","key":"19_CR9","DOI":"10.1145\/775047.775087"},{"doi-asserted-by":"crossref","unstructured":"Ananthakrishna, R., Chaudhuri, S., Ganti, V.: Eliminating fuzzy duplicates in data warehouses. In: Proceedings of the 28th International Conference on Very Large Data Bases(VLDB 2002) (2002)","key":"19_CR10","DOI":"10.1016\/B978-155860869-6\/50058-5"},{"unstructured":"Pasula, H., Marthi, B., Milch, B., Russell, S., Shpitser, I.: Identity uncertainty and citation matching. In: Advances in Neural Information Processing Systems, vol.\u00a015. MIT Press, Cambridge (2003)","key":"19_CR11"},{"unstructured":"Bhattacharya, I., Getoor, L.: Deduplication and group detection using links. In: Proceedings of the KDD 2004 Workshop on Link Analysis and Group Detection (2004)","key":"19_CR12"},{"unstructured":"Domingos, P., Domingos, P.: Multi-relational record linkage. In: Proceedings of the KDD 2004 Workshop on Multi-Relational Data Mining, pp. 31\u201348 (2004)","key":"19_CR13"},{"key":"19_CR14","doi-asserted-by":"publisher","first-page":"1183","DOI":"10.2307\/2286061","volume":"64","author":"I.P. Fellegi","year":"1969","unstructured":"Fellegi, I.P., Sunter, A.B.: A theory for record linkage. Journal of the American Statistical Association\u00a064, 1183\u20131210 (1969)","journal-title":"Journal of the American Statistical Association"},{"key":"19_CR15","doi-asserted-by":"publisher","first-page":"954","DOI":"10.1126\/science.130.3381.954","volume":"130","author":"H.B. Newcombe","year":"1959","unstructured":"Newcombe, H.B., Kennedy, J.M., Axford, S.J., James, A.P.: Automatic linkage of vital records. Science\u00a0130, 954\u2013959 (1959)","journal-title":"Science"},{"unstructured":"Winkler, W.E.: Using the em algorithm for weight computation in the fellegi-sunter model of record linkage. In: Proceedings of the Section on Survey Research Methods, American Statistical Association, pp. 667\u2013671 (1988)","key":"19_CR16"},{"unstructured":"Winkler, W.E.: Improved decision rules in the fellegi-sunter model of record linkage. In: Proceedings of the Section on Survey Research Methods, American Statistical Association, pp. 274\u2013279 (1993)","key":"19_CR17"},{"key":"19_CR18","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1198\/016214501750332956","volume":"79","author":"M.D. Larsen","year":"2001","unstructured":"Larsen, M.D., Rubin, D.B.: Alternative automated record linkage using mixture models. Journal of the American Statistical Association\u00a079, 32\u201341 (2001)","journal-title":"Journal of the American Statistical Association"},{"unstructured":"Winkler, W.E.: The state of record linkage and current research problems. Technical report, Statistical Research Division, U.S. Census Bureau, Washington, DC (1999)","key":"19_CR19"},{"unstructured":"Ravikumar, P., Cohen, W.W.: A hierarchical graphical model for record linkage. In: AUAI 2004: Proceedings of the 20th conference on Uncertainty in artificial intelligence, pp. 454\u2013461. AUAI Press (2004)","key":"19_CR20"},{"key":"19_CR21","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1007\/11546849_21","volume-title":"Data Warehousing and Knowledge Discovery","author":"P. Lehti","year":"2005","unstructured":"Lehti, P., Fankhauser, P.: A precise blocking method for record linkage. In: Tjoa, A.M., Trujillo, J. (eds.) DaWaK 2005. LNCS, vol.\u00a03589, pp. 210\u2013220. Springer, Heidelberg (2005)"},{"key":"19_CR22","doi-asserted-by":"crossref","first-page":"434","DOI":"10.1007\/978-3-662-05744-5","volume-title":"Angewandte Statistik","author":"L. Sachs","year":"2004","unstructured":"Sachs, L.: Angewandte Statistik, pp. 434\u2013435. Springer, Berlin (2004)"},{"key":"19_CR23","first-page":"74","volume-title":"Modern Information Retrieval","author":"R. Baeza-Yates","year":"1999","unstructured":"Baeza-Yates, R., Ribiero-Neto, B.: Modern Information Retrieval, pp. 74\u201379. Addison Wesley, Reading (1999)"},{"key":"19_CR24","first-page":"707","volume":"10","author":"V.I. Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting insertions and reversals. Soviet Physics Doklady\u00a010, 707\u2013710 (1966)","journal-title":"Soviet Physics Doklady"},{"doi-asserted-by":"crossref","unstructured":"Elfeky, M.G., Verykios, V.S., Elmargarid, A.K.: Tailor: A record linkage toolbox. In: Proceedings of the 18th International Conference on Data Engineering, ICDE 2002 (2002)","key":"19_CR25","DOI":"10.1109\/ICDE.2002.994694"}],"container-title":["Lecture Notes in Computer Science","On the Move to Meaningful Internet Systems 2005: CoopIS, DOA, and ODBASE"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/11575801_19.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,4]],"date-time":"2025-01-04T21:46:57Z","timestamp":1736027217000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/11575801_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005]]},"ISBN":["9783540297383","9783540321200"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/11575801_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2005]]}}}