{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,5]],"date-time":"2025-07-05T05:10:05Z","timestamp":1751692205276,"version":"3.41.0"},"publisher-location":"Cham","reference-count":25,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319930398"},{"type":"electronic","value":"9783319930404"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-93040-4_15","type":"book-chapter","created":{"date-parts":[[2018,6,16]],"date-time":"2018-06-16T13:29:41Z","timestamp":1529155781000},"page":"177-190","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["It Pays to Be Certain: Unsupervised Record Linkage via Ambiguity Minimization"],"prefix":"10.1007","author":[{"given":"Anna","family":"Jurek","sequence":"first","affiliation":[]},{"given":"Deepak","family":"P.","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,6,17]]},"reference":[{"key":"15_CR1","doi-asserted-by":"crossref","unstructured":"Arasu, A., Gotz, M., Kaushik, R.: On active learning of record matching packages. In: SIGMOD, pp. 783\u2013794. ACM (2010)","DOI":"10.1145\/1807167.1807252"},{"key":"15_CR2","doi-asserted-by":"crossref","unstructured":"Christen, P.: Automatic record linkage using seeded nearest neighbour and support vector machine classification. In: SIGKDD, pp. 151\u2013159. ACM (2008)","DOI":"10.1145\/1401890.1401913"},{"key":"15_CR3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-31164-2","volume-title":"Data Matching: Concepts and Techniques for Record Linkage, Entity Resolution, and Duplicate Detection","author":"P Christen","year":"2012","unstructured":"Christen, P.: Data Matching: Concepts and Techniques for Record Linkage, Entity Resolution, and Duplicate Detection. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-31164-2"},{"key":"15_CR4","doi-asserted-by":"crossref","unstructured":"Cohen, W.W., Richman, J.: Learning to match and cluster large high-dimensional data sets for data integration. In: SIGKDD, pp. 475\u2013480. ACM (2002)","DOI":"10.1145\/775047.775116"},{"key":"15_CR5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-21257-9","volume-title":"Operators for Similarity Search: Semantics Techniques and Usage Scenarios","author":"P Deepak","year":"2015","unstructured":"Deepak, P., Deshpande, P.M.: Operators for Similarity Search: Semantics Techniques and Usage Scenarios. Springer, Heidelberg (2015). https:\/\/doi.org\/10.1007\/978-3-319-21257-9"},{"key":"15_CR6","doi-asserted-by":"crossref","unstructured":"Elfeky, M.G., Verykios, V.S., Elmagarmid, A.K.: TAILOR: a record linkage toolbox. In: 2002 Proceedings of 18th International Conference on Data Engineering, pp. 17\u201328. IEEE (2002)","DOI":"10.1109\/ICDE.2002.994694"},{"issue":"11","key":"15_CR7","doi-asserted-by":"publisher","first-page":"1638","DOI":"10.14778\/2350229.2350276","volume":"5","author":"R Isele","year":"2012","unstructured":"Isele, R., Bizer, C.: Learning expressive linkage rules using genetic programming. Proc. VLDB Endow. 5(11), 1638\u20131649 (2012)","journal-title":"Proc. VLDB Endow."},{"key":"15_CR8","first-page":"241","volume":"37","author":"P Jaccard","year":"1901","unstructured":"Jaccard, P.: Distribution de la flore alpine dans le bassin des dranses et dans quelques r\u00e9gions voisines. Bull. Soc. Vaud. Sci. Nat. 37, 241\u2013272 (1901)","journal-title":"Bull. Soc. Vaud. Sci. Nat."},{"issue":"406","key":"15_CR9","doi-asserted-by":"publisher","first-page":"414","DOI":"10.1080\/01621459.1989.10478785","volume":"84","author":"MA Jaro","year":"1989","unstructured":"Jaro, M.A.: Advances in record-linkage methodology as applied to matching the 1985 census of Tampa, Florida. J. Am. Stat. Assoc. 84(406), 414\u2013420 (1989)","journal-title":"J. Am. Stat. Assoc."},{"key":"15_CR10","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1016\/j.is.2017.06.006","volume":"71","author":"A Jurek","year":"2017","unstructured":"Jurek, A., Hong, J., Chi, Y., Liu, W.: A novel ensemble learning approach to unsupervised record linkage. Inf. Syst. 71, 40\u201354 (2017)","journal-title":"Inf. Syst."},{"key":"15_CR11","doi-asserted-by":"crossref","unstructured":"Kejriwal, M., Miranker, D.P.: An unsupervised algorithm for learning blocking schemes. In: IEEE 13th International Conference on Data Mining (ICDM), pp. 340\u2013349 (2013)","DOI":"10.1109\/ICDM.2013.60"},{"key":"15_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1007\/978-3-319-18818-8_24","volume-title":"The Semantic Web. Latest Advances and New Domains","author":"M Kejriwal","year":"2015","unstructured":"Kejriwal, M., Miranker, D.P.: Semi-supervised instance matching using boosted classifiers. In: Gandon, F., Sabou, M., Sack, H., d\u2019Amato, C., Cudr\u00e9-Mauroux, P., Zimmermann, A. (eds.) ESWC 2015. LNCS, vol. 9088, pp. 388\u2013402. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-18818-8_24"},{"key":"15_CR13","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1016\/j.ins.2013.08.045","volume":"261","author":"S Lee","year":"2014","unstructured":"Lee, S., Lee, J., Hwang, S.W.: Efficient entity matching using materialized lists. Inf. Sci. 261, 170\u2013184 (2014)","journal-title":"Inf. Sci."},{"key":"15_CR14","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions, and reversals. In: Soviet Physics Doklady, vol. 10, pp. 707\u2013710 (1966)"},{"key":"15_CR15","unstructured":"Ngomo, A.C.N., Lyko, K.: Unsupervised learning of link specifications: deterministic vs. non-deterministic. In: Proceedings of the 8th International Conference on Ontology Matching, vol. 1111, pp. 25\u201336. CEUR-WS.org (2013)"},{"key":"15_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1007\/978-3-642-30284-8_15","volume-title":"The Semantic Web: Research and Applications","author":"A Nikolov","year":"2012","unstructured":"Nikolov, A., d\u2019Aquin, M., Motta, E.: Unsupervised learning of link discovery configuration. In: Simperl, E., Cimiano, P., Polleres, A., Corcho, O., Presutti, V. (eds.) ESWC 2012. LNCS, vol. 7295, pp. 119\u2013133. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-30284-8_15"},{"key":"15_CR17","doi-asserted-by":"crossref","unstructured":"Deepak, P.: MixKMeans: clustering question-answer archives. In: 2016 Conference on Empirical Methods in Natural Language Processing. In: EMNLP, pp. 1576\u20131585 (2016)","DOI":"10.18653\/v1\/D16-1164"},{"key":"15_CR18","doi-asserted-by":"crossref","unstructured":"Sarawagi, S., Bhamidipaty, A.: Interactive deduplication using active learning. In: SIGKDD, pp. 269\u2013278. ACM (2002)","DOI":"10.1145\/775047.775087"},{"issue":"1","key":"15_CR19","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1145\/584091.584093","volume":"5","author":"CE Shannon","year":"2001","unstructured":"Shannon, C.E.: A mathematical theory of communication. ACM SIGMOBILE Mob. Comput. Commun. Rev. 5(1), 3\u201355 (2001)","journal-title":"ACM SIGMOBILE Mob. Comput. Commun. Rev."},{"issue":"516","key":"15_CR20","doi-asserted-by":"publisher","first-page":"1660","DOI":"10.1080\/01621459.2015.1105807","volume":"111","author":"RC Steorts","year":"2016","unstructured":"Steorts, R.C., Hall, R., Fienberg, S.E.: A Bayesian approach to graphical record linkage and deduplication. J. Am. Stat. Assoc. 111(516), 1660\u20131672 (2016)","journal-title":"J. Am. Stat. Assoc."},{"key":"15_CR21","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1007\/978-3-319-11257-2_20","volume-title":"Privacy in Statistical Databases","author":"RC Steorts","year":"2014","unstructured":"Steorts, R.C., Ventura, S.L., Sadinle, M., Fienberg, S.E.: A comparison of blocking methods for record linkage. In: Domingo-Ferrer, J. (ed.) PSD 2014. LNCS, vol. 8744, pp. 253\u2013268. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-11257-2_20"},{"issue":"6","key":"15_CR22","doi-asserted-by":"publisher","first-page":"946","DOI":"10.1016\/j.is.2012.11.005","volume":"38","author":"D Vatsalan","year":"2013","unstructured":"Vatsalan, D., Christen, P., Verykios, V.S.: A taxonomy of privacy-preserving record linkage techniques. Inf. Syst. 38(6), 946\u2013969 (2013)","journal-title":"Inf. Syst."},{"issue":"10","key":"15_CR23","doi-asserted-by":"publisher","first-page":"622","DOI":"10.14778\/2021017.2021020","volume":"4","author":"J Wang","year":"2011","unstructured":"Wang, J., Li, G., Yu, J.X., Feng, J.: Entity matching: how similar is similar. Proc. VLDB Endow. 4(10), 622\u2013633 (2011)","journal-title":"Proc. VLDB Endow."},{"key":"15_CR24","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"562","DOI":"10.1007\/978-3-319-18032-8_44","volume-title":"Advances in Knowledge Discovery and Data Mining","author":"Q Wang","year":"2015","unstructured":"Wang, Q., Vatsalan, D., Christen, P.: Efficient interactive training selection for large-scale entity resolution. In: Cao, T., Lim, E.-P., Zhou, Z.-H., Ho, T.-B., Cheung, D., Motoda, H. (eds.) PAKDD 2015. LNCS (LNAI), vol. 9078, pp. 562\u2013573. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-18032-8_44"},{"key":"15_CR25","unstructured":"Winkler, W.E.: String comparator metrics and enhanced decision rules in the fellegi-sunter model of record linkage, pp. 354\u2013359 (1990)"}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-93040-4_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,5]],"date-time":"2025-07-05T04:38:51Z","timestamp":1751690331000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-93040-4_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319930398","9783319930404"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-93040-4_15","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"17 June 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PAKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Pacific-Asia Conference on Knowledge Discovery and Data Mining","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Melbourne, VIC","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Australia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3 June 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 June 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"pakdd2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/prada-research.net\/pakdd18\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}