{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T00:38:07Z","timestamp":1773707887681,"version":"3.50.1"},"update-to":[{"DOI":"10.1371\/journal.pcbi.1006106","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2018,5,8]],"date-time":"2018-05-08T00:00:00Z","timestamp":1525737600000}}],"reference-count":28,"publisher":"Public Library of Science (PLoS)","issue":"4","license":[{"start":{"date-parts":[[2018,4,26]],"date-time":"2018-04-26T00:00:00Z","timestamp":1524700800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000025","name":"National Institute of Mental Health","doi-asserted-by":"publisher","award":["1P50MH094267"],"award-info":[{"award-number":["1P50MH094267"]}],"id":[{"id":"10.13039\/100000025","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000050","name":"National Heart, Lung, and Blood Institute","doi-asserted-by":"publisher","award":["R01HL122712"],"award-info":[{"award-number":["R01HL122712"]}],"id":[{"id":"10.13039\/100000050","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000185","name":"Defense Advanced Research Projects Agency","doi-asserted-by":"publisher","award":["W911NF1410333"],"award-info":[{"award-number":["W911NF1410333"]}],"id":[{"id":"10.13039\/100000185","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1006106","type":"journal-article","created":{"date-parts":[[2018,4,26]],"date-time":"2018-04-26T17:49:30Z","timestamp":1524764970000},"page":"e1006106","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":26,"title":["RIDDLE: Race and ethnicity Imputation from Disease history with Deep LEarning"],"prefix":"10.1371","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8966-529X","authenticated-orcid":true,"given":"Ji-Sung","family":"Kim","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7108-3574","authenticated-orcid":true,"given":"Xin","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6959-7405","authenticated-orcid":true,"given":"Andrey","family":"Rzhetsky","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"340","published-online":{"date-parts":[[2018,4,26]]},"reference":[{"issue":"6","key":"ref1","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1038\/nrg3208","article-title":"Mining electronic health records: towards better research applications and clinical care","volume":"13","author":"PB Jensen","year":"2012","journal-title":"Nature Reviews Genetics"},{"issue":"8","key":"ref2","doi-asserted-by":"crossref","first-page":"618","DOI":"10.1056\/NEJM199902253400806","article-title":"The effect of race and sex on physicians\u2019 recommendations for cardiac catheterization","volume":"340","author":"KA Schulman","year":"1999","journal-title":"New England Journal of Medicine"},{"issue":"12","key":"ref3","doi-asserted-by":"crossref","first-page":"1170","DOI":"10.1056\/NEJMsb025007","article-title":"The importance of race and ethnic background in biomedical research and clinical practice","volume":"348","author":"EG Burchard","year":"2003","journal-title":"The New England Journal of Medicine"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"b2393","DOI":"10.1136\/bmj.b2393","article-title":"Multiple imputation for missing data in epidemiological and clinical research: potential and pitfalls","volume":"338","author":"JA Sterne","year":"2009","journal-title":"BMJ"},{"key":"ref5","unstructured":"WHO; 2010. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"http:\/\/www.who.int\/classifications\/icd\/en\/\" xlink:type=\"simple\">http:\/\/www.who.int\/classifications\/icd\/en\/<\/ext-link>."},{"issue":"5p1","key":"ref6","doi-asserted-by":"crossref","first-page":"1722","DOI":"10.1111\/j.1475-6773.2008.00854.x","article-title":"A New Method for Estimating Race\/Ethnicity and Associated Disparities Where Administrative Records Lack Self-Reported Race\/Ethnicity","volume":"43","author":"MN Elliott","year":"2008","journal-title":"Health Services Research"},{"issue":"4","key":"ref7","doi-asserted-by":"crossref","first-page":"946","DOI":"10.1111\/1475-6773.12295","article-title":"Imputing missing race\/ethnicity in pediatric electronic health records: reducing bias with use of US census location and surname data","volume":"50","author":"RW Grundmeier","year":"2015","journal-title":"Health Services Research"},{"issue":"3","key":"ref8","doi-asserted-by":"crossref","first-page":"404","DOI":"10.1016\/j.jss.2005.02.026","article-title":"Categorical missing data imputation for software cost estimation by multinomial logistic regression","volume":"79","author":"P Sentas","year":"2006","journal-title":"Journal of Systems and Software"},{"issue":"7553","key":"ref9","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","article-title":"Deep learning","volume":"521","author":"Y LeCun","year":"2015","journal-title":"Nature"},{"key":"ref10","unstructured":"Shrikumar A, Greenside P, Kundaje A. Learning important features through propagating activation differences. arXiv preprint arXiv:170402685. 2017;."},{"issue":"12","key":"ref11","doi-asserted-by":"crossref","first-page":"2219","DOI":"10.2105\/AJPH.2016.303471","article-title":"Neighborhood Disadvantage, Poor Social Conditions, and Cardiovascular Disease Incidence Among African American Adults in the Jackson Heart Study","volume":"106","author":"S Barber","year":"2016","journal-title":"Am J Public Health"},{"issue":"3","key":"ref12","doi-asserted-by":"crossref","first-page":"295","DOI":"10.18865\/ed.25.3.295","article-title":"Racial Composition Over the Life Course: Examining Separate and Unequal Environments and the Risk for Heart Disease for African American Men","volume":"25","author":"KL Gilbert","year":"2015","journal-title":"Ethn Dis"},{"issue":"3","key":"ref13","doi-asserted-by":"crossref","first-page":"165","DOI":"10.2165\/11631520-000000000-00000","article-title":"Epidemiology and management of hypertension in the hispanic population","volume":"12","author":"NJ Guzman","year":"2012","journal-title":"American Journal of Cardiovascular Drugs"},{"issue":"6","key":"ref14","doi-asserted-by":"crossref","first-page":"319","DOI":"10.1097\/01.olq.0000240342.12960.73","article-title":"The efficacy of behavioral interventions in reducing HIV risk sex behaviors and incident sexually transmitted disease in black and Hispanic sexually transmitted disease clinic patients in the United States: a meta-analytic review","volume":"34","author":"N Crepaz","year":"2007","journal-title":"Sexually Transmitted Diseases"},{"issue":"5","key":"ref15","doi-asserted-by":"crossref","first-page":"511","DOI":"10.1016\/S0895-4356(99)00208-5","article-title":"Diabetes mellitus, coronary heart disease incidence, and death from all causes in African American and European American women: The NHANES I epidemiologic follow-up study","volume":"53","author":"RF Gillum","year":"2000","journal-title":"J Clin Epidemiol"},{"issue":"4","key":"ref16","doi-asserted-by":"crossref","first-page":"996","DOI":"10.1353\/hpu.0.0204","article-title":"The impact of acculturation on utilization of HIV prevention services and access to care among an at-risk Hispanic population","volume":"20","author":"JJ Kinsler","year":"2009","journal-title":"Journal of Health Care for the Poor and Underserved"},{"issue":"49","key":"ref17","first-page":"1155","article-title":"Incidence of sickle cell trait\u2013United States, 2010","volume":"63","author":"J Ojodu","year":"2014","journal-title":"MMWR Morb Mortal Wkly Rep"},{"issue":"8","key":"ref18","doi-asserted-by":"crossref","first-page":"756","DOI":"10.1093\/aje\/152.8.756","article-title":"Racial differences in reported Lyme disease incidence","volume":"152","author":"AD Fix","year":"2000","journal-title":"American Journal of Epidemiology"},{"issue":"8","key":"ref19","doi-asserted-by":"crossref","first-page":"1803","DOI":"10.1377\/hlthaff.2011.0746","article-title":"Differences in life expectancy due to race and educational differences are widening, and many may not catch up","volume":"31","author":"SJ Olshansky","year":"2012","journal-title":"Health Affairs"},{"issue":"11","key":"ref20","doi-asserted-by":"crossref","first-page":"1629","DOI":"10.1016\/S0277-9536(00)00273-2","article-title":"Trends in healthy life expectancy in the United States, 1970\u20131990: gender, racial, and educational differences","volume":"52","author":"EM Crimmins","year":"2001","journal-title":"Social science & medicine"},{"key":"ref21","unstructured":"Calandrino JA, Kilzer A, Narayanan A, Felten EW, Shmatikov V. \u201cYou Might Also Like:\u201d Privacy Risks of Collaborative Filtering. In: Security and Privacy (SP), 2011 IEEE Symposium on. IEEE; 2011. p. 231\u2013246."},{"key":"ref22","unstructured":"Chollet F. Keras; 2015. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"https:\/\/keras.io\/\" xlink:type=\"simple\">https:\/\/keras.io\/<\/ext-link>."},{"key":"ref23","unstructured":"Abadi M, Agarwal A, Barham P, Brevdo E, Chen Z, Citro C, et al. Tensorflow: Large-scale machine learning on heterogeneous distributed systems. arXiv preprint arXiv:160304467. 2016;."},{"key":"ref24","first-page":"437","article-title":"Neural Networks: Tricks of the Trade","author":"Y Bengio","year":"2012"},{"issue":"1","key":"ref25","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"N Srivastava","year":"2014","journal-title":"Journal of Machine Learning Research"},{"key":"ref26","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J. Delving deep into rectifiers: Surpassing human-level performance on imagenet classification. In: Proceedings of the IEEE international conference on computer vision; 2015. p. 1026\u20131034.","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref27","unstructured":"Kingma D, Ba J. Adam: A method for stochastic optimization. arXiv preprint arXiv:14126980. 2014;."},{"key":"ref28","unstructured":"Chen T, Guestrin C. XGBoost: A Scalable Tree Boosting System. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. KDD\u201916. New York, NY, USA: ACM; 2016. p. 785\u2013794. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"http:\/\/doi.acm.org\/10.1145\/2939672.2939785\" xlink:type=\"simple\">http:\/\/doi.acm.org\/10.1145\/2939672.2939785<\/ext-link>."}],"updated-by":[{"DOI":"10.1371\/journal.pcbi.1006106","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2018,5,8]],"date-time":"2018-05-08T00:00:00Z","timestamp":1525737600000}}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/dx.plos.org\/10.1371\/journal.pcbi.1006106","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T09:17:01Z","timestamp":1604222221000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1006106"}},"subtitle":[],"editor":[{"given":"Jean-Philippe","family":"Vert","sequence":"first","affiliation":[],"role":[{"role":"editor","vocabulary":"crossref"}]}],"short-title":[],"issued":{"date-parts":[[2018,4,26]]},"references-count":28,"journal-issue":{"issue":"4","published-online":{"date-parts":[[2018,4,26]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1006106","relation":{"new_version":[{"id-type":"doi","id":"10.1371\/journal.pcbi.1006106","asserted-by":"object"}]},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,4,26]]}}}