{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T06:20:32Z","timestamp":1772518832365,"version":"3.50.1"},"reference-count":33,"publisher":"Oxford University Press (OUP)","issue":"1","content-domain":{"domain":["bmj.com"],"crossmark-restriction":true},"short-container-title":["J Am Med Inform Assoc"],"published-print":{"date-parts":[[2014,1]]},"DOI":"10.1136\/amiajnl-2013-001744","type":"journal-article","created":{"date-parts":[[2013,5,24]],"date-time":"2013-05-24T04:55:44Z","timestamp":1369371344000},"page":"97-104","update-policy":"https:\/\/doi.org\/10.1136\/crossmarkpolicy","source":"Crossref","is-referenced-by-count":34,"title":["A benchmark comparison of deterministic and probabilistic methods for defining manual review datasets in duplicate records reconciliation"],"prefix":"10.1093","volume":"21","author":[{"given":"Erel","family":"Joffe","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michael J","family":"Byrne","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Phillip","family":"Reeder","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jorge R","family":"Herskovic","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Craig W","family":"Johnson","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Allison B","family":"McCoy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dean F","family":"Sittig","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Elmer V","family":"Bernstam","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2014,1,1]]},"reference":[{"key":"2015062501455481000_21.1.97.1","unstructured":"Wiedemann LA . Fundamentals for Building a Master Patient Index\/Enterprise Master Patient Index (Updated). http:\/\/library.ahima.org\/xpedio\/groups\/public\/documents\/ahima\/bok1_048389.hcsp?dDocName=bok1_048389."},{"key":"2015062501455481000_21.1.97.2","unstructured":"Joffe E Bearden CF Byrne MJ . Duplicate patient records\u2014implication for missed laboratory results. Proceedings of the AMIA Annual Symposium, 2012:1269\u201375."},{"key":"2015062501455481000_21.1.97.3","doi-asserted-by":"publisher","DOI":"10.1136\/bmjqs-2012-001419"},{"key":"2015062501455481000_21.1.97.4","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2007.250581"},{"key":"2015062501455481000_21.1.97.5","doi-asserted-by":"crossref","unstructured":"Christen P Goiser K . Quality and complexity measures for data linkage and deduplication. In: Guillet FJ Hamilton HJ , eds. Quality measures in data mining. Berlin: Springer, 2007:127\u201351.","DOI":"10.1007\/978-3-540-44918-8_6"},{"key":"2015062501455481000_21.1.97.6","unstructured":"Winkler WE . Overview of record linkage and current research directions. Washington, DC: Statistical Research Division of the U.S. Census Bureau, 2006."},{"key":"2015062501455481000_21.1.97.7","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-002-0072-y"},{"key":"2015062501455481000_21.1.97.8","doi-asserted-by":"publisher","DOI":"10.1056\/NEJMsa054479"},{"key":"2015062501455481000_21.1.97.9","doi-asserted-by":"crossref","unstructured":"K\u00f6pcke H Thor A Rahm E . Evaluation of entity resolution approaches on real-world match problems. Proceedings of the VLDB Endowment, 2010:484\u201393.","DOI":"10.14778\/1920841.1920904"},{"key":"2015062501455481000_21.1.97.10","doi-asserted-by":"crossref","unstructured":"Zhu VJ Overhage MJ Egg J . An empiric modification to the probabilistic record linkage algorithm using frequency-based weight scaling. J Am Med Inform Assoc 2000;16:738\u201345.","DOI":"10.1197\/jamia.M3186"},{"key":"2015062501455481000_21.1.97.11","doi-asserted-by":"publisher","DOI":"10.1136\/amiajnl-2011-000461"},{"key":"2015062501455481000_21.1.97.12","doi-asserted-by":"crossref","unstructured":"Sarawagi S Breiman L Friedman JH . Interactive deduplication using active learning. Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 2002:269\u201378.","DOI":"10.1145\/775047.775087"},{"key":"2015062501455481000_21.1.97.13","unstructured":"Grannis SJ Overhage JM McDonald CJ . Analysis of identifier performance using a deterministic linkage algorithm. Proceedings of the AMIA Annual Symposium, 2002:305\u20139."},{"key":"2015062501455481000_21.1.97.14","unstructured":"Salkowitz SM Clyde S . The unique records portfolio. Decatur, GA: Public Health Informatics Institute, 2006."},{"key":"2015062501455481000_21.1.97.15","doi-asserted-by":"crossref","unstructured":"Christen P . Data matching. Berlin: Springer-Verlag, 2012.","DOI":"10.1007\/978-3-642-31164-2"},{"key":"2015062501455481000_21.1.97.16","doi-asserted-by":"publisher","DOI":"10.1177\/1460458208088855"},{"key":"2015062501455481000_21.1.97.17","doi-asserted-by":"crossref","unstructured":"Shahri H Barforush A . A flexible fuzzy expert system for fuzzy duplicate elimination in data cleaning. In: Galindo F Takizawa M Traunmaller R , eds. Database and expert systems applications. Berlin: Springer-Verlag, 2004:161\u201370.","DOI":"10.1007\/978-3-540-30075-5_16"},{"key":"2015062501455481000_21.1.97.18","doi-asserted-by":"publisher","DOI":"10.2307\/2289924"},{"key":"2015062501455481000_21.1.97.19","unstructured":"Grannis SJ Overhage JM Hui S . Analysis of a probabilistic record linkage technique without human review. Proceedings of the AMIA Annual Symposium, 2003:259\u201363."},{"key":"2015062501455481000_21.1.97.20","doi-asserted-by":"publisher","DOI":"10.1038\/nbt1406"},{"key":"2015062501455481000_21.1.97.21","doi-asserted-by":"crossref","unstructured":"Elfeky MG Verykios VS Elmagarmid AK . TAILOR: a record linkage toolbox. Proceedings 18th International Conference on Data Engineering, IEEE Comput. Soc, 17\u201328.","DOI":"10.1109\/ICDE.2002.994694"},{"key":"2015062501455481000_21.1.97.22","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2010.234"},{"key":"2015062501455481000_21.1.97.23","doi-asserted-by":"crossref","unstructured":"Eberhart R Kennedy J . A new optimizer using particle swarm theory. Proceedings of the Sixth International Symposium on Micro Machine and Human Science, 1995:39\u201343.","DOI":"10.1109\/MHS.1995.494215"},{"key":"2015062501455481000_21.1.97.24","doi-asserted-by":"publisher","DOI":"10.1136\/amiajnl-2011-000335"},{"key":"2015062501455481000_21.1.97.25","doi-asserted-by":"publisher","DOI":"10.1006\/jbin.2001.1001"},{"key":"2015062501455481000_21.1.97.26","unstructured":"Duvall SL Fraser AM Kerber RA . The impact of a growing minority population on identification of duplicate records in an enterprise data warehouse. Stud Health Technol Inform 2010;160:1122\u20136."},{"key":"2015062501455481000_21.1.97.27","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2009.08.004"},{"key":"2015062501455481000_21.1.97.28","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2012.02.002"},{"key":"2015062501455481000_21.1.97.29","doi-asserted-by":"publisher","DOI":"10.1002\/sim.1147"},{"key":"2015062501455481000_21.1.97.30","doi-asserted-by":"publisher","DOI":"10.1186\/1472-6963-6-1"},{"key":"2015062501455481000_21.1.97.31","doi-asserted-by":"crossref","unstructured":"Gu L Baxter R . Decision models for record linkage. In: Williams GJ Simoff SJ , eds. Data mining. Berlin: Springer, 2006:146\u201360.","DOI":"10.1007\/11677437_12"},{"key":"2015062501455481000_21.1.97.32","doi-asserted-by":"crossref","unstructured":"Ho VH Compton P Benatallah B . An incremental knowledge acquisition method for improving duplicate invoices detection. IEEE 25th International Conference on Data Engineering. IEEE, 2009:1415\u201318.","DOI":"10.1109\/ICDE.2009.38"},{"key":"2015062501455481000_21.1.97.33","unstructured":"User Manual for the De-duplication Evaluation Toolkit. Center for Disease Control and Prevention, 2002."}],"container-title":["Journal of the American Medical Informatics Association"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/jamia\/article-pdf\/21\/1\/97\/17376250\/21-1-97.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,30]],"date-time":"2025-04-30T11:19:30Z","timestamp":1746011970000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/jamia\/article-lookup\/doi\/10.1136\/amiajnl-2013-001744"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,1]]},"references-count":33,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2014,1,1]]},"published-print":{"date-parts":[[2014,1]]}},"alternative-id":["10.1136\/amiajnl-2013-001744"],"URL":"https:\/\/doi.org\/10.1136\/amiajnl-2013-001744","relation":{},"ISSN":["1067-5027","1527-974X"],"issn-type":[{"value":"1067-5027","type":"print"},{"value":"1527-974X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,1]]}}}