{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,27]],"date-time":"2025-06-27T15:47:48Z","timestamp":1751039268381,"version":"3.40.4"},"reference-count":20,"publisher":"Oxford University Press (OUP)","license":[{"start":{"date-parts":[[2016,12,5]],"date-time":"2016-12-05T00:00:00Z","timestamp":1480896000000},"content-version":"vor","delay-in-days":1069,"URL":"http:\/\/creativecommons.org\/licenses\/by\/3.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,1,1]]},"DOI":"10.1093\/database\/bat086","type":"journal-article","created":{"date-parts":[[2014,1,17]],"date-time":"2014-01-17T03:40:35Z","timestamp":1389930035000},"source":"Crossref","is-referenced-by-count":24,"title":["Rule-based deduplication of article records from bibliographic databases"],"prefix":"10.1093","volume":"2014","author":[{"given":"Yu","family":"Jiang","sequence":"first","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]},{"given":"Can","family":"Lin","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]},{"given":"Weiyi","family":"Meng","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]},{"given":"Clement","family":"Yu","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]},{"given":"Aaron M.","family":"Cohen","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]},{"given":"Neil R.","family":"Smalheiser","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Binghamton University, Binghamton, NY 13902, USA, 2Department of Computer Science, University of Illinois at Chicago, Chicago, IL 60612, USA, 3Department of Medical Informatics and Clinical Epidemiology, Oregon Health & Science University, Portland, OR 97239, USA and 4Department of Psychiatry and Psychiatric Institute, University of Illinois at Chicago, Chicago, IL 60612, USA"}]}],"member":"286","published-online":{"date-parts":[[2014,1,16]]},"reference":[{"key":"key\n\t\t\t\t20180618202348_bat086-B1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1109\/TKDE.2007.250581","article-title":"Duplicate record detection: a survey","volume":"19","author":"Elmagarmid","year":"2007","journal-title":"IEEE Trans. Know. Data Eng."},{"key":"key\n\t\t\t\t20180618202348_bat086-B2","doi-asserted-by":"crossref","first-page":"1246","DOI":"10.1093\/ije\/31.6.1246","article-title":"Probabilistic record linkage and a method to calculate the positive predictive value","volume":"31","author":"Blakely","year":"2002","journal-title":"Int. J. Epidemiol."},{"key":"key\n\t\t\t\t20180618202348_bat086-B3","first-page":"1425","article-title":"Identity uncertainty and citation matching","volume-title":"Proceedings of 16th Annual Advances in Neural Information Processing Systems (NIPS 2002)","author":"Pasula","year":"2003"},{"key":"key\n\t\t\t\t20180618202348_bat086-B4","first-page":"407","article-title":"Reasoning about record matching rules","volume-title":"The 35th International Conference on Very Large Data Bases (VLDB), Lyon, France","author":"Fan","year":"2009"},{"key":"key\n\t\t\t\t20180618202348_bat086-B5","doi-asserted-by":"crossref","first-page":"954","DOI":"10.1126\/science.130.3381.954","article-title":"Automatic linkage of vital records","volume":"130","author":"Newcombe","year":"1959","journal-title":"Science"},{"key":"key\n\t\t\t\t20180618202348_bat086-B6","doi-asserted-by":"crossref","first-page":"1183","DOI":"10.1080\/01621459.1969.10501049","article-title":"A theory for record linkage","volume":"64","author":"Fellegi","year":"1969","journal-title":"J. Am. Stat. Soc."},{"key":"key\n\t\t\t\t20180618202348_bat086-B7","article-title":"Deduplication and group detection using links","volume-title":"ACM SIGKDD Workshop on Link Analysis and Group Detection (LinkKDD-04), Seattle, WA","author":"Bhattacharya","year":"2004"},{"key":"key\n\t\t\t\t20180618202348_bat086-B8","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1145\/1008694.1008697","article-title":"Iterative record linkage for cleaning and integration","volume-title":"ACM SIGMOD Workshop on Research Issues in DataMining and Knowledge Discovery (DMKD), Paris, France","author":"Bhattacharya","year":"2004"},{"key":"key\n\t\t\t\t20180618202348_bat086-B9","first-page":"39","article-title":"Adaptive duplicate detection using learnable string similarity measures","volume-title":"ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC","author":"Bilenko","year":"2003"},{"key":"key\n\t\t\t\t20180618202348_bat086-B10","first-page":"269","article-title":"Interactive deduplication using active learning","volume-title":"ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Edmonton, Alberta","author":"Sarawagi","year":"2002"},{"key":"key\n\t\t\t\t20180618202348_bat086-B11","doi-asserted-by":"crossref","first-page":"706","DOI":"10.1016\/j.ipm.2011.01.009","article-title":"An unsupervised heuristic-based approach for bibliographic metadata deduplication","volume":"47","author":"Borges","year":"2011","journal-title":"Inf. Process. Manag."},{"key":"key\n\t\t\t\t20180618202348_bat086-B12","doi-asserted-by":"crossref","first-page":"1065","DOI":"10.1145\/1401890.1402020","article-title":"Febrl: an open source data cleaning, deduplication and record linkage system with a graphical user interface","volume-title":"Proceedings of the 14th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, Las Vegas, NV","author":"Christen","year":"2008"},{"key":"key\n\t\t\t\t20180618202348_bat086-B13","first-page":"440","article-title":"FRIL: a tool for comparative record linkage","volume":"2008","author":"Jurczyk","year":"2008","journal-title":"Proc. AMIA Symp."},{"key":"key\n\t\t\t\t20180618202348_bat086-B14","article-title":"Design and implementation of Metta, a metasearch engine for biomedical literature intended for systematic reviewers","author":"Smalheiser","year":"2013","journal-title":"Health Information Science and Systems"},{"key":"key\n\t\t\t\t20180618202348_bat086-B15","doi-asserted-by":"crossref","first-page":"e71838","DOI":"10.1371\/journal.pone.0071838","article-title":"Find duplicates among the PubMed, EMBASE, and Cochrane library databases in systematic reviews","volume":"8","author":"Qi","year":"2013","journal-title":"PLoS One"},{"key":"key\n\t\t\t\t20180618202348_bat086-B16","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1023\/A:1009761603038","article-title":"Real-world data is dirty: data cleansing and the merge\/purge problem","volume":"2","author":"Hernandez","year":"1998","journal-title":"Data Min. Knowl. Discov."},{"key":"key\n\t\t\t\t20180618202348_bat086-B17","doi-asserted-by":"crossref","first-page":"169","DOI":"10.1145\/347090.347123","article-title":"Efficient clustering of high dimensional data sets with application to reference matching","volume-title":"Proceedings of the 6th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, Boston, MA","author":"McCallum","year":"2000"},{"key":"key\n\t\t\t\t20180618202348_bat086-B18","first-page":"1067","article-title":"Efficient spectral neighborhood blocking for entity resolution","volume-title":"IEEE International Conference on Data Engineering (ICDE), Hannover, Germany","author":"Shu","year":"2011"},{"key":"key\n\t\t\t\t20180618202348_bat086-B19","volume-title":"Introduction to Algorithms","author":"Corman","year":"2009","edition":"3rd"},{"key":"key\n\t\t\t\t20180618202348_bat086-B20","first-page":"451","article-title":"A simple algorithm for identifying abbreviation definitions in biomedical text","volume":"4","author":"Schwartz","year":"2003","journal-title":"Pac. Symp. Biocomput."}],"container-title":["Database"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/database\/article-pdf\/doi\/10.1093\/database\/bat086\/17471098\/bat086.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,1]],"date-time":"2025-05-01T15:45:38Z","timestamp":1746114338000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/database\/article\/doi\/10.1093\/database\/bat086\/2633762"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,1,1]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1093\/database\/bat086","relation":{},"ISSN":["1758-0463"],"issn-type":[{"type":"electronic","value":"1758-0463"}],"subject":[],"published-other":{"date-parts":[[2014]]},"published":{"date-parts":[[2014,1,1]]}}}