{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T01:54:27Z","timestamp":1774403667917,"version":"3.50.1"},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2020,8,3]],"date-time":"2020-08-03T00:00:00Z","timestamp":1596412800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,8,3]],"date-time":"2020-08-03T00:00:00Z","timestamp":1596412800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100006537","name":"Vanderbilt University","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006537","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Healthc Inform Res"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s41666-020-00077-1","type":"journal-article","created":{"date-parts":[[2020,8,3]],"date-time":"2020-08-03T16:06:08Z","timestamp":1596470768000},"page":"383-394","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":152,"title":["Predicting Missing Values in Medical Data Via XGBoost Regression"],"prefix":"10.1007","volume":"4","author":[{"given":"Xinmeng","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Chao","family":"Yan","sequence":"additional","affiliation":[]},{"given":"Cheng","family":"Gao","sequence":"additional","affiliation":[]},{"given":"Bradley A.","family":"Malin","sequence":"additional","affiliation":[]},{"given":"You","family":"Chen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,8,3]]},"reference":[{"key":"77_CR1","doi-asserted-by":"crossref","unstructured":"Evans RS (2016) Electronic health records: then, now, and in the future. International Medical Informatics Association (IMIA) 1:S48\u2013S61","DOI":"10.15265\/IYS-2016-s006"},{"key":"77_CR2","doi-asserted-by":"crossref","unstructured":"Richesson RL, Horvath MM, Rusincovitch SA (2014) Clinical research informatics and electronic health record data. International Medical Informatics Association (IMIA) 23(1):215\u2013223","DOI":"10.15265\/IY-2014-0009"},{"key":"77_CR3","doi-asserted-by":"crossref","unstructured":"K\u00f6pcke F, Trinczek B, Majeed RW, Schreiweis B, Wenk J, Leusch T, Ganslandt T, Ohmann C, Bergh B, R\u00f6hrig R, Dugas M, Prokosch HU (2013) Evaluation of data completeness in the electronic health record for the purpose of patient recruitment into clinical trials: a retrospective analysis of element presence. BioMed Central (BMC) 13(1):37","DOI":"10.1186\/1472-6947-13-37"},{"key":"77_CR4","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.jbi.2017.03.009","volume":"68","author":"Z Hu","year":"2017","unstructured":"Hu Z, Melton GB, Arsoniadis EG, Wang Y, Kwaan MR, Simon GJ (2017) Strategies for handling missing clinical data for automated surgical site infection detection from the electronic health record. J Biomed Inform 68:112\u2013120","journal-title":"J Biomed Inform"},{"key":"77_CR5","doi-asserted-by":"crossref","unstructured":"Beaulieu-Jones BK, Moore JH (2017) Missing data imputation in the electronic health record using deeply learned autoencoders. In Proceedings of the Pacific Symposium on Biocomputing. 207\u2013218","DOI":"10.1142\/9789813207813_0021"},{"key":"77_CR6","doi-asserted-by":"publisher","first-page":"1134","DOI":"10.1093\/jamia\/ocx071","volume":"24","author":"GM Weber","year":"2017","unstructured":"Weber GM, Adams WG, Bernstam EV, Bickel JP, Fox KP, Marsolo K, Raghavan VA, Turchin A, Zhou X, Murphy SN, Mandl KD (2017) Biases introduced by filtering electronic health records for patients with \u201ccomplete data.\u201d. J Am Med Inform Assoc 24:1134\u20131141","journal-title":"J Am Med Inform Assoc"},{"key":"77_CR7","doi-asserted-by":"publisher","DOI":"10.2196\/medinform.8960","volume":"6","author":"BK Beaulieu-Jones","year":"2018","unstructured":"Beaulieu-Jones BK, Lavage DR, Snyder JW, Moore JH, Pendergrass SA, Bauer CR (2018) Characterizing and managing missing structured data in electronic health records: data analysis. JMIR Med Inform 6:e11","journal-title":"JMIR Med Inform"},{"key":"77_CR8","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1016\/j.jbi.2014.03.016","volume":"51","author":"R Pivovarov","year":"2014","unstructured":"Pivovarov R, Albers DJ, Sepulveda JL, Elhadad N (2014) Identifying and mitigating biases in EHR laboratory tests. J Biomed Inform 51:24\u201334","journal-title":"J Biomed Inform"},{"issue":"8","key":"77_CR9","doi-asserted-by":"publisher","first-page":"e002847","DOI":"10.1136\/bmjopen-2013-002847","volume":"3","author":"AK Waljee","year":"2013","unstructured":"Waljee AK, Mukherjee A, Singal AG, Zhang Y, Warren J, Balis U, Marrero J, Zhu J, Higgins PDR (2013) Comparison of imputation methods for missing laboratory data in medicine. BMJ Open 3(8):e002847","journal-title":"BMJ Open"},{"issue":"3","key":"77_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v045.i03","volume":"45","author":"SV Buuren","year":"2011","unstructured":"Buuren SV, Groothuis-Oudshoorn K (2011) MICE: multivariate imputation by chained equations in R. J Stat Softw 45(3):1\u201368","journal-title":"J Stat Softw"},{"key":"77_CR11","doi-asserted-by":"publisher","first-page":"645","DOI":"10.1093\/jamia\/ocx133","volume":"25","author":"Y Luo","year":"2017","unstructured":"Luo Y, Szolovits P, Dighe AS et al (2017) 3D-MICE: integration of cross-sectional and longitudinal imputation for multi-analyte longitudinal clinical data. J Am Med Inform Assoc 25:645\u2013653","journal-title":"J Am Med Inform Assoc"},{"key":"77_CR12","doi-asserted-by":"publisher","first-page":"160035","DOI":"10.1038\/sdata.2016.35","volume":"3","author":"AEW Johnson","year":"2016","unstructured":"Johnson AEW, Pollard TJ, Shen L, Lehman L, Feng M, Ghassemi M, Moody B, Szolovits P, Celi LA, Mark RG (2016) MIMIC-III, a freely accessible critical care database. Scientific Data 3:160035","journal-title":"Scientific Data"},{"issue":"3","key":"77_CR13","doi-asserted-by":"publisher","first-page":"1035","DOI":"10.13063\/2327-9214.1035","volume":"1","author":"BJ Wells","year":"2013","unstructured":"Wells BJ, Chagin KM, Nowacki AS, Kattan MW (2013) Strategies for handling missing data in electronic health record derived data. EGEMS. 1(3):1035","journal-title":"EGEMS."},{"issue":"1","key":"77_CR14","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1016\/j.artmed.2013.01.003","volume":"58","author":"F Cismondi","year":"2013","unstructured":"Cismondi F, Fialho AS, Vieira SM, Reti SR, Sousa JMC, Finkelstein SN (2013) Missing data in medical databases: impute, delete or classify. Artif Intell Med 58(1):63\u201372","journal-title":"Artif Intell Med"},{"issue":"18","key":"77_CR15","doi-asserted-by":"publisher","first-page":"1966","DOI":"10.1001\/jama.2015.15281","volume":"314","author":"P Li","year":"2015","unstructured":"Li P, Stuart EA, Allison DB (2015) Multiple imputation: a flexible tool for handling missing data. JAMA. 314(18):1966\u20131967","journal-title":"JAMA."},{"issue":"10","key":"77_CR16","doi-asserted-by":"publisher","first-page":"1087","DOI":"10.1016\/j.jclinepi.2006.01.014","volume":"59","author":"AR Donders","year":"2006","unstructured":"Donders AR, Van Der Heijden GJ, Stijnen T et al (2006) A gentle introduction to imputation of missing values. J Clin Epidemiol 59(10):1087\u20131091","journal-title":"J Clin Epidemiol"},{"issue":"1","key":"77_CR17","first-page":"1000224","volume":"6","author":"P Schmitt","year":"2015","unstructured":"Schmitt P, Mandel J, Guedj M (2015) A comparison of six methods for missing data imputation. Journal of Biometrics & Biostatistics 6(1):1000224","journal-title":"Journal of Biometrics & Biostatistics"},{"issue":"1","key":"77_CR18","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1186\/1471-2288-6-57","volume":"6","author":"FM Shrive","year":"2006","unstructured":"Shrive FM, Stuart H, Quan H, Ghali WA (2006) Dealing with missing data in a multi-question de- pression scale: a comparison of imputation methods. BMC Med Res Methodol 6(1):57","journal-title":"BMC Med Res Methodol"},{"key":"77_CR19","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1093\/bioinformatics\/17.6.520","volume":"17","author":"O Troyanskaya","year":"2001","unstructured":"Troyanskaya O, Cantor M, Sherlock G, Hastie T, Tibshirani R, Botstein D, Altman R (2001) Missing value estimation methods for DNA microarrays. Bioinformatics. 17:520\u2013525","journal-title":"Bioinformatics."},{"issue":"1","key":"77_CR20","doi-asserted-by":"publisher","first-page":"21689","DOI":"10.1038\/srep21689","volume":"6","author":"Y Deng","year":"2016","unstructured":"Deng Y, Chang C, Ido MS, Long Q (2016) Multiple imputation for general missing data patterns in the presence of high-dimensional data. Sci Rep 6(1):21689","journal-title":"Sci Rep"},{"issue":"3","key":"77_CR21","doi-asserted-by":"publisher","first-page":"911","DOI":"10.1111\/j.1541-0420.2008.01155.x","volume":"65","author":"G Zhang","year":"2009","unstructured":"Zhang G, Little R (2009) Extensions of the penalized spline of propensity prediction method of imputation. Biometrics. 65(3):911\u2013918","journal-title":"Biometrics."},{"issue":"6","key":"77_CR22","doi-asserted-by":"publisher","first-page":"7787","DOI":"10.1093\/ajcp\/aqw064","volume":"145","author":"Y Luo","year":"2016","unstructured":"Luo Y, Szolovits P, Dighe AS, Baron JM (2016) Using machine learning to predict laboratory test results. American Journal of Clinical Pathology 145(6):7787\u20137788","journal-title":"American Journal of Clinical Pathology"},{"issue":"3","key":"77_CR23","first-page":"949","volume":"149","author":"R Little","year":"2004","unstructured":"Little R, An H (2004) Robust likelihood-based analysis of multivariate data with missing values. Stat Sin 149(3):949\u2013968","journal-title":"Stat Sin"},{"issue":"6","key":"77_CR24","doi-asserted-by":"publisher","first-page":"681","DOI":"10.1002\/(SICI)1097-0258(19990330)18:6<681::AID-SIM71>3.0.CO;2-R","volume":"18","author":"SV Buuren","year":"1999","unstructured":"Buuren SV, Boshuizen HC, Knook DL (1999) Multiple imputation of missing blood pressure covariates in survival analysis. Stat Med 18(6):681\u2013694","journal-title":"Stat Med"},{"key":"77_CR25","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1093\/bioinformatics\/btr597","volume":"28","author":"DJ Stekhoven","year":"2012","unstructured":"Stekhoven DJ, B\u00fchlmann P (2012) MissForest - non-parametric missing value imputation for mixed-type data. Bioinformatics 28:112\u2013118","journal-title":"Bioinformatics"},{"issue":"6","key":"77_CR26","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1002\/sam.11348","volume":"10","author":"F Tang","year":"2017","unstructured":"Tang F, Ishwaran H (2017) Random forest missing data algorithms. Stat Anal Data Min 10(6):363\u2013377","journal-title":"Stat Anal Data Min"},{"key":"77_CR27","first-page":"3367","volume":"16","author":"T Hastie","year":"2015","unstructured":"Hastie T, Mazumder R, Lee JD, Zadeh R (2015) Matrix completion and low-rank SVD via fast alternating least squares. J Mach Learn Res 16:3367\u20133402","journal-title":"J Mach Learn Res"},{"issue":"80","key":"77_CR28","first-page":"2287","volume":"11","author":"R Mazumder","year":"2010","unstructured":"Mazumder R, Hastie T, Tibshirani R (2010) Spectral regularization algorithms for learning large incomplete matrices. J Mach Learn Res 11(80):2287\u20132322","journal-title":"J Mach Learn Res"},{"key":"77_CR29","doi-asserted-by":"crossref","unstructured":"Liao Z, Lu X, Yang T, Wang H (2009) Missing data imputation: a fuzzy K-means clustering algorithm over sliding window. In Proceedings of the 6th International Conference on Fuzzy Systems and Knowledge Discovery. 133\u2013137","DOI":"10.1109\/FSKD.2009.407"},{"key":"77_CR30","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) XGBoost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"77_CR31","unstructured":"PythonAPIReference. https:\/\/xgboost.readthedocs.io\/en\/latest\/python\/pythonapi.html. Accessed Aug 9 2019"}],"container-title":["Journal of Healthcare Informatics Research"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41666-020-00077-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41666-020-00077-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41666-020-00077-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,8,2]],"date-time":"2021-08-02T23:13:28Z","timestamp":1627946008000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41666-020-00077-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,8,3]]},"references-count":31,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["77"],"URL":"https:\/\/doi.org\/10.1007\/s41666-020-00077-1","relation":{},"ISSN":["2509-4971","2509-498X"],"issn-type":[{"value":"2509-4971","type":"print"},{"value":"2509-498X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,8,3]]},"assertion":[{"value":"3 September 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 May 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 July 2020","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 August 2020","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}},{"value":"Source code at .","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code Availability"}}]}}