{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T18:47:25Z","timestamp":1771699645793,"version":"3.50.1"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2020,7,25]],"date-time":"2020-07-25T00:00:00Z","timestamp":1595635200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,7,25]],"date-time":"2020-07-25T00:00:00Z","timestamp":1595635200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"publisher","award":["2019M661077"],"award-info":[{"award-number":["2019M661077"]}],"id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["IIS-1717084"],"award-info":[{"award-number":["IIS-1717084"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61433008"],"award-info":[{"award-number":["61433008"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2020,11]]},"DOI":"10.1007\/s10618-020-00706-8","type":"journal-article","created":{"date-parts":[[2020,7,25]],"date-time":"2020-07-25T10:02:26Z","timestamp":1595671346000},"page":"1859-1897","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":27,"title":["MIDIA: exploring denoising autoencoders for missing data imputation"],"prefix":"10.1007","volume":"34","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6473-9523","authenticated-orcid":false,"given":"Qian","family":"Ma","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wang-Chien","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tao-Yang","family":"Fu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yu","family":"Gu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ge","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,7,25]]},"reference":[{"issue":"2","key":"706_CR1","doi-asserted-by":"crossref","first-page":"253","DOI":"10.1093\/bib\/bbp059","volume":"11","author":"T Aittokallio","year":"2010","unstructured":"Aittokallio T (2010) Dealing with missing values in large-scale studies: microarray data imputation and beyond. Brief Bioinform 11(2):253\u2013264","journal-title":"Brief Bioinform"},{"key":"706_CR2","doi-asserted-by":"crossref","unstructured":"Anagnostopoulos C, Triantafillou P (2014) Scaling out big data missing value imputations: pythia vs. godzilla. In: Proceedings of ACM international conference on knowledge discovery and data mining, pp 651\u2013660","DOI":"10.1145\/2623330.2623615"},{"issue":"1","key":"706_CR3","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1111\/j.1751-5823.2010.00103.x","volume":"78","author":"RR Andridge","year":"2010","unstructured":"Andridge RR, Little RJA (2010) A review of hot deck imputation for survey non-response. Int Stat Rev 78(1):40\u201364","journal-title":"Int Stat Rev"},{"issue":"11","key":"706_CR4","doi-asserted-by":"crossref","first-page":"2140","DOI":"10.1080\/00949655.2015.1104683","volume":"86","author":"V Audigier","year":"2016","unstructured":"Audigier V, Husson F, Josse J (2016) Multiple imputation for continuous variables using a bayesian principal component analysis. J Stat Comput Simul 86(11):2140\u20132156","journal-title":"J Stat Comput Simul"},{"key":"706_CR5","unstructured":"Baldi P (2012) Autoencoders, unsupervised learning, and deep architectures. In: Proceedings of ICML workshop on unsupervised and transfer learning, pp 37\u201350"},{"key":"706_CR6","unstructured":"Bergstra J, Desjardins G, Lamblin P, Bengio Y (2009) Quadratic polynomials learn better image features. Technical report, p 1337"},{"issue":"1","key":"706_CR7","first-page":"7133","volume":"18","author":"D Bertsimas","year":"2017","unstructured":"Bertsimas D, Pawlowski C, Zhuo YD (2017) From predictive methods to missing data imputation: an optimization approach. J Mach Learn Res 18(1):7133\u20137171","journal-title":"J Mach Learn Res"},{"key":"706_CR8","doi-asserted-by":"crossref","unstructured":"Borovicka T, Jirina-Jr M, Kordik P, Jirina M (2012) Selecting representative data sets. In: Advances in data mining knowledge discovery and applications, pp 43\u201370","DOI":"10.5772\/50787"},{"key":"706_CR9","doi-asserted-by":"crossref","unstructured":"Bottou L (2010) Large-scale machine learning with stochastic gradient descent. In: Proceedings of COMPSTAT\u20192010, pp 177\u2013186","DOI":"10.1007\/978-3-7908-2604-3_16"},{"issue":"1","key":"706_CR10","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","volume":"39","author":"AP Dempster","year":"1977","unstructured":"Dempster AP, Laird NM, Rubin DB (1977) Maximum likelihood from incomplete data via the em algorithm. J R Stat Soc Ser B (Methodol) 39(1):1\u201338","journal-title":"J R Stat Soc Ser B (Methodol)"},{"key":"706_CR11","doi-asserted-by":"crossref","unstructured":"Dong X, Gabrilovich E, Heitz G et al (2014) Knowledge vault: a web-scale approach to probabilistic knowledge fusion. In: Proceedings of ACM international conference on knowledge discovery and data mining, pp 601\u2013610","DOI":"10.1145\/2623330.2623623"},{"issue":"1","key":"706_CR12","doi-asserted-by":"crossref","first-page":"12","DOI":"10.1007\/s41019-019-00115-y","volume":"5","author":"Z Gharibshah","year":"2020","unstructured":"Gharibshah Z, Zhu XQ, Hainline A, Conway M (2020) Deep learning for user interest and response prediction in online display advertising. Data Sci Eng 5(1):12\u201326","journal-title":"Data Sci Eng"},{"key":"706_CR13","unstructured":"Glorot X, Bengio Y (2010) Understanding the difficulty of training deep feedforward neural networks. In: Proceedings of international conference on artificial intelligence and statistics, pp 249\u2013256"},{"key":"706_CR14","unstructured":"Glorot X, Bordes A, Bengio Y (2011) Deep sparse rectifier neural networks. In: Proceedings of international conference on artificial intelligence and statistics, pp 315\u2013323"},{"key":"706_CR15","doi-asserted-by":"crossref","unstructured":"Han J, Moraga C (1995) The influence of the sigmoid function parameters on the speed of backpropagation learning. In: Proceedings of international workshop on artificial neural networks, pp 195\u2013201","DOI":"10.1007\/3-540-59497-3_175"},{"issue":"8","key":"706_CR16","first-page":"45","volume":"2","author":"YK Jain","year":"2011","unstructured":"Jain YK, Bhandare SK (2011) Min max normalization based data perturbation method for privacy protection. Int J Comput Commun Technol 2(8):45\u201350","journal-title":"Int J Comput Commun Technol"},{"key":"706_CR17","doi-asserted-by":"crossref","unstructured":"Jing XY, Qi FM, Wu F, Xu BW (2016) Missing data imputation based on low-rank recovery and semi-supervised regression for software effort estimation. In: Proceedings of IEEE\/ACM international conference on software engineering, pp 607\u2013618","DOI":"10.1145\/2884781.2884827"},{"key":"706_CR18","doi-asserted-by":"crossref","unstructured":"Joenssen DW, Bankhofer U (2012) Hot deck methods for imputing missing data\u2014the effects of limiting donor usage. In: International workshop on machine learning and data mining in pattern recognition, pp 63\u201375","DOI":"10.1007\/978-3-642-31537-4_6"},{"issue":"7713","key":"706_CR19","first-page":"157","volume":"339","author":"ACS Jonathan","year":"2009","unstructured":"Jonathan ACS, White IR, Carlin JB, Spratt M, Royston P, Kenward MG, Wood AM, Carpenter JR (2009) Multiple imputation for missing data in epidemiological and clinical research: potential and pitfalls. BMJ Br Med J 339(7713):157\u2013160","journal-title":"BMJ Br Med J"},{"key":"706_CR20","doi-asserted-by":"crossref","first-page":"160","DOI":"10.1186\/1471-2105-5-160","volume":"5","author":"KY Kim","year":"2004","unstructured":"Kim KY, Kim BJ, Yi GS (2004) Reuse of imputed data in microarray analysis increases imputation efficiency. BMC Bioinform 5:160","journal-title":"BMC Bioinform"},{"issue":"2","key":"706_CR21","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1093\/bioinformatics\/bth499","volume":"21","author":"H Kim","year":"2005","unstructured":"Kim H, Golub GH, Park H (2005) Missing value estimation for DNA microarray gene expression data: local least squares imputation. Bioinformatics 21(2):187\u2013198","journal-title":"Bioinformatics"},{"issue":"4","key":"706_CR22","doi-asserted-by":"crossref","first-page":"491","DOI":"10.1109\/TKDE.2005.66","volume":"17","author":"H Liu","year":"2005","unstructured":"Liu H, Yu L (2005) Toward integrating feature selection algorithms for classification and clustering. IEEE Trans Knowl Discov Eng 17(4):491\u2013502","journal-title":"IEEE Trans Knowl Discov Eng"},{"key":"706_CR23","unstructured":"Lovedeep G, Wang K (2017) Multiple imputation using deep denoising autoencoders. CoRR arXiv:1705.02737"},{"key":"706_CR24","unstructured":"Magnani M (2004) Techniques for dealing with missing data in knowledge discovery tasks. Obtido 15(01):2007. http:\/\/magnanim.web.cs.unibo.it\/index.html"},{"issue":"1","key":"706_CR25","doi-asserted-by":"crossref","first-page":"24","DOI":"10.1080\/02664763.2016.1158246","volume":"44","author":"D McNeish","year":"2017","unstructured":"McNeish D (2017) Missing data methods for arbitrary missingness with small samples. J Appl Stat 44(1):24\u201339","journal-title":"J Appl Stat"},{"key":"706_CR26","unstructured":"Nair V, Hinton GE (2010) Rectified linear units improve restricted Boltzmann machines. In: Proceedings of international conference on international conference on machine learning, pp 807\u2013814"},{"issue":"2","key":"706_CR27","doi-asserted-by":"crossref","first-page":"2794","DOI":"10.1016\/j.eswa.2008.01.059","volume":"36","author":"Y Qin","year":"2009","unstructured":"Qin Y, Zhang S, Zhu X et al (2009) POP algorithm: Kernel-based imputation to treat missing values in knowledge discovery from databases. Expert Syst Appl 36(2):2794\u20132804","journal-title":"Expert Syst Appl"},{"issue":"1","key":"706_CR28","first-page":"85","volume":"27","author":"TE Raghunathan","year":"2001","unstructured":"Raghunathan TE, Lepkowski JM, Hoewyk JV, Solenberger P (2001) A multivariate technique for multiply imputing missing values using a sequence of regression models. Survey Methodol 27(1):85\u201396","journal-title":"Survey Methodol"},{"key":"706_CR29","unstructured":"Rahman G, Islam Z (2011) A decision tree-based missing value imputation technique for data pre-processing. In: Proceedings of Australasian data mining conference, pp 41\u201350"},{"key":"706_CR30","volume-title":"Collins concise dictionary","author":"JM Sinclair","year":"2001","unstructured":"Sinclair JM, Wilkes GA, Krebs WA (2001) Collins concise dictionary. HarperCollins, New York"},{"issue":"4","key":"706_CR31","doi-asserted-by":"crossref","first-page":"427","DOI":"10.1016\/j.ipm.2009.03.002","volume":"45","author":"M Sokolova","year":"2009","unstructured":"Sokolova M, Lapalme G (2009) A systematic analysis of performance measures for classification tasks. Inf Process Manag 45(4):427\u2013437","journal-title":"Inf Process Manag"},{"issue":"6","key":"706_CR32","doi-asserted-by":"crossref","first-page":"520","DOI":"10.1093\/bioinformatics\/17.6.520","volume":"17","author":"OG Troyanskaya","year":"2001","unstructured":"Troyanskaya OG, Cantor MN, Sherlock G et al (2001) Missing value estimation methods for DNA microarrays. Bioinformatics 17(6):520\u2013525","journal-title":"Bioinformatics"},{"issue":"5\u20136","key":"706_CR33","doi-asserted-by":"crossref","first-page":"320","DOI":"10.1016\/j.compbiolchem.2007.07.001","volume":"31","author":"S Verboven","year":"2007","unstructured":"Verboven S, Branden KV, Goos P (2007) Sequential imputation for missing values. Comput Biol Chem 31(5\u20136):320\u2013327","journal-title":"Comput Biol Chem"},{"key":"706_CR34","doi-asserted-by":"crossref","unstructured":"Vincent P, Larochelle H, Bengio Y, Manzagol PA (2008) Extracting and composing robust features with denoising autoencoders. In: Proceedings of international conference on machine learning, pp 1096\u20131103","DOI":"10.1145\/1390156.1390294"},{"issue":"12","key":"706_CR35","first-page":"3371","volume":"11","author":"P Vincent","year":"2010","unstructured":"Vincent P, Larochelle H, Lajoie I, Bengio Y, Manzagol PA (2010) Stacked denoising autoencoders: learning useful representations in a deep network with a local denoising criterion. J Mach Learn Res 11(12):3371\u20133408","journal-title":"J Mach Learn Res"},{"issue":"2","key":"706_CR36","doi-asserted-by":"crossref","first-page":"750","DOI":"10.1016\/j.snb.2007.09.060","volume":"129","author":"SD Vito","year":"2008","unstructured":"Vito SD, Massera E, Piga M et al (2008) On field calibration of an electronic nose for benzene estimation in an urban pollution monitoring scenario. Sens Actuators B Chem 129(2):750\u2013757","journal-title":"Sens Actuators B Chem"},{"issue":"3","key":"706_CR37","doi-asserted-by":"crossref","first-page":"563","DOI":"10.1111\/1467-9469.00306","volume":"29","author":"QH Wang","year":"2002","unstructured":"Wang QH, Rao JNK (2002a) Empirical likelihood-based inference in linear models with missing data. Scand J Stat 29(3):563\u2013576","journal-title":"Scand J Stat"},{"issue":"3","key":"706_CR38","doi-asserted-by":"publisher","first-page":"896","DOI":"10.1214\/aos\/1028674845","volume":"30","author":"QH Wang","year":"2002","unstructured":"Wang QH, Rao JNK (2002b) Empirical likelihood-based inference under imputation for missing response data. Ann Stat 30(3):896\u2013924","journal-title":"Ann Stat"},{"key":"706_CR39","first-page":"1","volume-title":"Multiple imputation for missing data: concepts and new development","author":"YC Yuan","year":"2010","unstructured":"Yuan YC (2010) Multiple imputation for missing data: concepts and new development, vol 49. SAS Institute Inc, Rockville, pp 1\u201311"},{"issue":"1","key":"706_CR40","first-page":"32","volume":"9","author":"S Zhang","year":"2008","unstructured":"Zhang S (2008) Parimputation: from imputation and null-imputation to partially imputation. IEEE Intell Inform Bull 9(1):32\u201338","journal-title":"IEEE Intell Inform Bull"},{"issue":"5","key":"706_CR41","doi-asserted-by":"crossref","first-page":"414","DOI":"10.1109\/LSP.2009.2016451","volume":"16","author":"Y Zhang","year":"2009","unstructured":"Zhang Y, Liu YC (2009) Data imputation using least squares support vector machines in urban arterial streets. IEEE Signal Process Lett 16(5):414\u2013417","journal-title":"IEEE Signal Process Lett"},{"key":"706_CR42","doi-asserted-by":"crossref","unstructured":"Zhang CQ, Zhu XF, Zhang JL, Qin YS, Zhang SC (2007) GBKII: an imputation method for missing values. In: Proceedings of Pacific-Asia conference on knowledge discovery and data mining, pp 1080\u20131087","DOI":"10.1007\/978-3-540-71701-0_122"},{"issue":"10","key":"706_CR43","doi-asserted-by":"crossref","first-page":"1112","DOI":"10.1016\/j.compbiomed.2008.08.006","volume":"38","author":"X Zhang","year":"2008","unstructured":"Zhang X, Song X, Wang H et al (2008) Sequential local least squares imputation estimating missing value of microarray data. Comput Biol Med 38(10):1112\u20131120","journal-title":"Comput Biol Med"},{"issue":"4","key":"706_CR44","doi-asserted-by":"crossref","first-page":"745","DOI":"10.1016\/S0165-1684(02)00469-3","volume":"83","author":"XB Zhou","year":"2003","unstructured":"Zhou XB, Wang XD, Dougherty ER (2003) Construction of genomic networks using mutual-information clustering and reversible-jump markov-chain-monte-carlo predictor design. Signal Process 83(4):745\u2013761","journal-title":"Signal Process"},{"issue":"1","key":"706_CR45","doi-asserted-by":"crossref","first-page":"110","DOI":"10.1109\/TKDE.2010.99","volume":"23","author":"X Zhu","year":"2011","unstructured":"Zhu X, Zhang S, Jin Z et al (2011) Missing value estimation for mixed-attribute data sets. IEEE Trans Knowl Data Eng 23(1):110\u2013121","journal-title":"IEEE Trans Knowl Data Eng"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-020-00706-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10618-020-00706-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-020-00706-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,10]],"date-time":"2024-08-10T19:57:31Z","timestamp":1723319851000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10618-020-00706-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7,25]]},"references-count":45,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2020,11]]}},"alternative-id":["706"],"URL":"https:\/\/doi.org\/10.1007\/s10618-020-00706-8","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"value":"1384-5810","type":"print"},{"value":"1573-756X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7,25]]},"assertion":[{"value":"16 August 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 July 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 July 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}