{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T20:48:50Z","timestamp":1770583730182,"version":"3.49.0"},"reference-count":33,"publisher":"Oxford University Press (OUP)","issue":"1","content-domain":{"domain":["bmj.com"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2013,1]]},"DOI":"10.1136\/amiajnl-2012-001020","type":"journal-article","created":{"date-parts":[[2012,9,5]],"date-time":"2012-09-05T04:56:48Z","timestamp":1346821008000},"page":"77-83","update-policy":"https:\/\/doi.org\/10.1136\/crossmarkpolicy","source":"Crossref","is-referenced-by-count":56,"title":["BoB, a best-of-breed automated text de-identification system for VHA clinical documents"],"prefix":"10.1093","volume":"20","author":[{"given":"Oscar","family":"Ferr\u00e1ndez","sequence":"first","affiliation":[]},{"given":"Brett R","family":"South","sequence":"additional","affiliation":[]},{"given":"Shuying","family":"Shen","sequence":"additional","affiliation":[]},{"given":"F Jeffrey","family":"Friedlin","sequence":"additional","affiliation":[]},{"given":"Matthew H","family":"Samore","sequence":"additional","affiliation":[]},{"given":"St\u00e9phane M","family":"Meystre","sequence":"additional","affiliation":[]}],"member":"286","published-online":{"date-parts":[[2012,9,4]]},"reference":[{"key":"key\n\t\t\t\t20170522084138_b1","doi-asserted-by":"crossref","first-page":"70","DOI":"10.1186\/1471-2288-10-70","article-title":"Automatic de-identification of textual documents in the electronic health record: a review of recent research","volume":"10","author":"Meystre","year":"2010","journal-title":"BMC Med Res Methodol"},{"key":"key\n\t\t\t\t20170522084138_b2","unstructured":"Dixon P . Medical identity theft: the information crime that can kill you. 2006. http:\/\/www.worldprivacyforum.org\/pdf\/wpf_medicalidtheft2006.pdf (accessed April 2012)."},{"key":"key\n\t\t\t\t20170522084138_b3","article-title":"Health information privacy (HIPAA) notices have improved public's confidence that their medical information is being handled properly","author":"Harris Interactive","year":"2005"},{"key":"key\n\t\t\t\t20170522084138_b4","article-title":"45 C.F.R. \u00a7 46 Protection of Human Subjects","author":"GPO US","year":"2008"},{"key":"key\n\t\t\t\t20170522084138_b5","article-title":"45 C.F.R. \u00a7 164 Security and Privacy","author":"GPO US","year":"2008"},{"key":"key\n\t\t\t\t20170522084138_b6","doi-asserted-by":"crossref","first-page":"550","DOI":"10.1197\/jamia.M2444","article-title":"Evaluating the state-of-the-art in automatic de-identification","volume":"14","author":"Uzuner","year":"2007","journal-title":"J Am Med Inform Assoc"},{"key":"key\n\t\t\t\t20170522084138_b7","doi-asserted-by":"crossref","first-page":"601","DOI":"10.1197\/jamia.M2702","article-title":"A software tool for removing patient identifying information from clinical documents","volume":"15","author":"Friedlin","year":"2008","journal-title":"J Am Med Inform Assoc"},{"key":"key\n\t\t\t\t20170522084138_b8","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1186\/1472-6947-8-32","article-title":"Automated de-identification of free-text medical records","volume":"8","author":"Neamatullah","year":"2008","journal-title":"BMC Med Inform Decis Mak"},{"key":"key\n\t\t\t\t20170522084138_b9","doi-asserted-by":"crossref","first-page":"12","DOI":"10.1186\/1472-6947-6-12","article-title":"Development and evaluation of an open source software tool for deidentification of pathology reports","volume":"6","author":"Beckwith","year":"2006","journal-title":"BMC Med Inform Decis Mak"},{"key":"key\n\t\t\t\t20170522084138_b10","doi-asserted-by":"crossref","first-page":"176","DOI":"10.1309\/E6K33GBPE5C27FYU","article-title":"Evaluation of a deidentification (De-Id) software engine to share pathology reports and clinical documents for research","volume":"121","author":"Gupta","year":"2004","journal-title":"Am J Clin Pathol"},{"key":"key\n\t\t\t\t20170522084138_b11","doi-asserted-by":"crossref","first-page":"849","DOI":"10.1016\/j.ijmedinf.2010.09.007","article-title":"The MITRE identification scrubber toolkit: design, training, and assessment","volume":"79","author":"Aberdeen","year":"2010","journal-title":"Inter J Med Inform"},{"key":"key\n\t\t\t\t20170522084138_b12","doi-asserted-by":"crossref","first-page":"1441","DOI":"10.1016\/j.datak.2009.07.006","article-title":"An integrated framework for de-identifying unstructured medical data","volume":"68","author":"Gardner","year":"2009","journal-title":"Data Knowl Eng"},{"key":"key\n\t\t\t\t20170522084138_b13","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1016\/j.artmed.2007.10.001","article-title":"A de-identifier for medical discharge summaries","volume":"42","author":"Uzuner","year":"2008","journal-title":"Artif Intell Med"},{"key":"key\n\t\t\t\t20170522084138_b14","doi-asserted-by":"crossref","first-page":"574","DOI":"10.1197\/jamia.M2441","article-title":"State-of-the-art anonymization of medical records using an iterative machine learning framework","volume":"14","author":"Szarvas","year":"2007","journal-title":"J Am Med Inform Assoc"},{"key":"key\n\t\t\t\t20170522084138_b15","article-title":"Identifying Personal Health Information using support vector machines training sub-system testing sub-system The Preprocessing sub-system","author":"Guo","year":"2006"},{"key":"key\n\t\t\t\t20170522084138_b16","first-page":"466","article-title":"Message understanding conference-6: a brief history","author":"Grishman","year":"1996"},{"key":"key\n\t\t\t\t20170522084138_b17","doi-asserted-by":"crossref","DOI":"10.1186\/1471-2105-12-S3-S2","article-title":"A system for de-identifying medical message board text","volume":"12","author":"Benton","year":"2011","journal-title":"BMC Bioinformatics"},{"key":"key\n\t\t\t\t20170522084138_b18","doi-asserted-by":"crossref","first-page":"564","DOI":"10.1197\/jamia.M2435","article-title":"Rapidly retargetable approaches to de-identification in medical records","volume":"14","author":"Wellner","year":"2007","journal-title":"J Am Med Inform Assoc"},{"key":"key\n\t\t\t\t20170522084138_b19","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1186\/1471-2288-12-109","article-title":"Evaluating current automatic de-identification methods with Veteran's health administration clinical documents","volume":"12","author":"Ferr\u00e1ndez","year":"2012","journal-title":"BMC Med Res Methodol"},{"key":"key\n\t\t\t\t20170522084138_b20","doi-asserted-by":"crossref","first-page":"e19","DOI":"10.1016\/j.ijmedinf.2009.04.005","article-title":"Developing a standard for de-identifying electronic patient records written in Swedish: precision, recall and F-measure in a manual and computerized annotation trial","volume":"78","author":"Velupillai","year":"2009","journal-title":"Int J Med Inform"},{"key":"key\n\t\t\t\t20170522084138_b21","author":"Apache UIMA","year":"2008"},{"key":"key\n\t\t\t\t20170522084138_b22","author":"LVG (Lexical Variant Generation)","year":"2011"},{"key":"key\n\t\t\t\t20170522084138_b23","doi-asserted-by":"crossref","first-page":"507","DOI":"10.1136\/jamia.2009.001560","article-title":"Mayo clinical Text Analysis and Knowledge Extraction System (cTAKES): architecture, component evaluation and applications","volume":"17","author":"Savova","year":"2010","journal-title":"J Am Med Inform Assoc"},{"key":"key\n\t\t\t\t20170522084138_b24","unstructured":"Baldridge J Morton M Bierner G . OpenNLP Maxent Package in Java. 2005. http:\/\/opennlp.apache.org\/ (accessed Apr 2012)."},{"key":"key\n\t\t\t\t20170522084138_b25","unstructured":"The Apache Lucene project. http:\/\/lucene.apache.org\/ (accessed Apr 2012)."},{"key":"key\n\t\t\t\t20170522084138_b26","first-page":"142","article-title":"Introduction to the CoNLL-2003 shared task: language-independent named entity recognition","volume-title":"Proceedings of the Seventh Conference on Natural language Learning","author":"Tjong Kim Sang","year":"2003"},{"key":"key\n\t\t\t\t20170522084138_b27","first-page":"837","article-title":"The Automatic Content Extraction (ACE) program\u2014tasks, data, and evaluation. Evaluation","volume-title":"Proceedings of The International Conference on Language Resources and Evaluation","author":"Doddington","year":"2004"},{"key":"key\n\t\t\t\t20170522084138_b28","first-page":"363","article-title":"Incorporating non-local information into information extraction systems by Gibbs sampling","volume-title":"Proceedings of the 43rd Annual Meeting on Association for Computational Linguistics","author":"Finkel","year":"2005"},{"key":"key\n\t\t\t\t20170522084138_b29","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1961189.1961199","article-title":"LIBSVM: a library for support vector machines","volume":"2","author":"Chang","year":"2011","journal-title":"ACM Trans Intell Syst Technol"},{"key":"key\n\t\t\t\t20170522084138_b30","first-page":"1871","article-title":"LIBLINEAR: a library for large linear classification","volume":"9","author":"Fan","year":"2008","journal-title":"J Mach Lear Res"},{"key":"key\n\t\t\t\t20170522084138_b31","volume-title":"Information retrieval","author":"van Rijsbergen","year":"1979"},{"key":"key\n\t\t\t\t20170522084138_b32","first-page":"72","article-title":"Measuring risk and information preservation: toward new metrics for de-identification of clinical texts","volume-title":"Proceedings of the Second Louhi Workshop on Text and Data Mining of Health Documents","author":"Hirschman","year":"2010"},{"key":"key\n\t\t\t\t20170522084138_b33","doi-asserted-by":"crossref","first-page":"159","DOI":"10.1136\/jamia.2009.002212","article-title":"Effects of personal identifier resynthesis on clinical text de-identification","volume":"17","author":"Yeniterzi","year":"2010","journal-title":"J Am Med Inform Assoc"}],"container-title":["Journal of the American Medical Informatics Association"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/jamia\/article-pdf\/20\/1\/77\/17375119\/20-1-77.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,8,23]],"date-time":"2017-08-23T06:29:21Z","timestamp":1503469761000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/jamia\/article-lookup\/doi\/10.1136\/amiajnl-2012-001020"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,9,4]]},"references-count":33,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2012,9,4]]},"published-print":{"date-parts":[[2013,1]]}},"URL":"https:\/\/doi.org\/10.1136\/amiajnl-2012-001020","relation":{},"ISSN":["1527-974X","1067-5027"],"issn-type":[{"value":"1527-974X","type":"electronic"},{"value":"1067-5027","type":"print"}],"subject":[],"published":{"date-parts":[[2012,9,4]]}}}