{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T09:43:30Z","timestamp":1775209410182,"version":"3.50.1"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T00:00:00Z","timestamp":1736208000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T00:00:00Z","timestamp":1736208000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Netw Model Anal Health Inform Bioinforma"],"DOI":"10.1007\/s13721-024-00496-9","type":"journal-article","created":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T20:38:54Z","timestamp":1736282334000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["A ClusteredRF Approach to Data Imputation in Healthcare for Enhanced Data Integrity"],"prefix":"10.1007","volume":"14","author":[{"given":"Subhashish","family":"Nayak","sequence":"first","affiliation":[]},{"given":"Pabitra Mohan","family":"Khilar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,1,7]]},"reference":[{"key":"496_CR1","doi-asserted-by":"publisher","DOI":"10.1177\/09622802211047346","author":"L Beesley","year":"2021","unstructured":"Beesley L, Bondarenko I, Elliott M, Kurian A, Katz S, Taylor J (2021) Multiple imputation with missing data indicators. Stat Methods Med Res. https:\/\/doi.org\/10.1177\/09622802211047346","journal-title":"Stat Methods Med Res"},{"issue":"3","key":"496_CR2","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1016\/j.patcog.2018.05.030","volume":"83","author":"Y Chen","year":"2018","unstructured":"Chen Y, Tang S, Bouguila N, Wang C, Du J, Li H (2018) A fast clustering algorithm based on pruning unnecessary distance computations in dbscan for high-dimensional data. Pattern Recog 83(3):375\u2013387","journal-title":"Pattern Recog"},{"key":"496_CR3","doi-asserted-by":"publisher","first-page":"11781","DOI":"10.1007\/s00500-021-05947-3","volume":"25","author":"C-H Cheng","year":"2021","unstructured":"Cheng C-H, Huang S-F (2021) A novel clustering-based purity and distance imputation for handling medical data with missing values. Soft Comput 25:11781\u201311801","journal-title":"Soft Comput"},{"key":"496_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2020.103824","author":"C-H Cheng","year":"2020","unstructured":"Cheng C-H, Chang J-R, Huang H-H (2020) A novel weighted distance threshold method for handling medical missing values. Comput Biol Med. https:\/\/doi.org\/10.1016\/j.compbiomed.2020.103824","journal-title":"Comput Biol Med"},{"key":"496_CR5","doi-asserted-by":"crossref","unstructured":"de campos, D. A., Bernardes, J., Garrido, A., de s\u00e1, J. M., and Pereira-leite, L. (2000) Sisporto 2.0: A program for automated analysis of cardiotocograms. J Mater-Fetal Med. 9(5):311\u2013318","DOI":"10.1002\/1520-6661(200009\/10)9:5<311::AID-MFM12>3.3.CO;2-0"},{"key":"496_CR6","doi-asserted-by":"publisher","first-page":"418","DOI":"10.1016\/j.ins.2021.04.076","volume":"571","author":"T Dinh","year":"2021","unstructured":"Dinh T, Huynh V-N, Sriboonchitta S (2021) Clustering mixed numerical and categorical data with missing values. Inf Sci 571:418\u2013442","journal-title":"Inf Sci"},{"key":"496_CR7","unstructured":"[Fedesoriano] Fedesoriano 2021. Heart failure prediction dataset. https:\/\/archive.ics.uci.edu\/ml\/machine-learning-databases\/ heart-disease\/. [Accessed 10 Jan 2023]."},{"issue":"6","key":"496_CR8","doi-asserted-by":"publisher","first-page":"488","DOI":"10.1002\/nur.20100","volume":"28","author":"SM Fox-Wasylyshyn","year":"2005","unstructured":"Fox-Wasylyshyn SM, El-Masri MM (2005) Handling missing data in self-report measures. Res Nurs Health 28(6):488\u2013495","journal-title":"Res Nurs Health"},{"key":"496_CR9","doi-asserted-by":"publisher","DOI":"10.24432\/C5FK5P","volume-title":"Dermatology","author":"NG Ilter","year":"1998","unstructured":"Ilter NG, H (1998) Dermatology. Open Data Commons, License. https:\/\/doi.org\/10.24432\/C5FK5P"},{"issue":"4","key":"496_CR10","first-page":"1889","volume":"34","author":"N Karmitsa","year":"2022","unstructured":"Karmitsa N, Taheri S, Bagirov A, M\u00e4kinen P (2022) Missing value imputation via clusterwise linear regression. IEEE Trans Knowl Data Eng 34(4):1889\u20131901","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"1","key":"496_CR11","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-020-00313-w","volume":"7","author":"SI Khan","year":"2020","unstructured":"Khan SI, Hoque ASML (2020) Sice: an improved missing data imputation technique. J Big Data 7(1):1\u201321","journal-title":"J Big Data"},{"issue":"5","key":"496_CR12","doi-asserted-by":"publisher","first-page":"1396","DOI":"10.1109\/TFUZZ.2021.3058643","volume":"30","author":"D Li","year":"2021","unstructured":"Li D, Zhang H, Li T, Bouras A, Yu X, Wang T (2021) Hybrid missing value imputation algorithms using fuzzy c-means and vaguely quantified rough set. IEEE Trans Fuzzy Syst 30(5):1396\u20131408","journal-title":"IEEE Trans Fuzzy Syst"},{"key":"496_CR13","doi-asserted-by":"publisher","DOI":"10.24432\/C59C74","author":"M Little","year":"2008","unstructured":"Little M (2008) Parkinsons. UCI Mach Learn Reposit. https:\/\/doi.org\/10.24432\/C59C74","journal-title":"UCI Mach Learn Reposit"},{"key":"496_CR14","first-page":"49","volume-title":"Advances in healthcare information systems and administration","author":"S Nayak","year":"2024","unstructured":"Nayak S, Khilar PM (2024) Data imputation in healthcare applications. Advances in healthcare information systems and administration. IGI Global, USA, pp 49\u201367"},{"key":"496_CR15","doi-asserted-by":"crossref","unstructured":"Nayak S, Dash S, Khilar P (2024) A Multi-Step Fuzzy C-Means Approach for Accurate Data Imputation. In: Healthcare IEEE International Conference on Computer Vision and Machine Intelligence (CVMI). pp 1\u20136","DOI":"10.1109\/CVMI61877.2024.10782293"},{"issue":"6","key":"496_CR16","doi-asserted-by":"publisher","first-page":"2419","DOI":"10.1007\/s10115-019-01427-1","volume":"62","author":"S Nikfalazar","year":"2020","unstructured":"Nikfalazar S, Yeh C-H, Bedingfield S, Khorshidi HA (2020) Missing data imputation using decision trees and fuzzy clustering with iterative learning. Knowl Inf Syst 62(6):2419\u20132437","journal-title":"Knowl Inf Syst"},{"key":"496_CR17","unstructured":"Nowak, R. (2011). Lecture 16: Minimum variance unbiased (mvub) estimators. https:\/\/nowak.ece.wisc.edu\/ece830\/ece830_ lecture16.pdf."},{"key":"496_CR18","doi-asserted-by":"publisher","first-page":"157","DOI":"10.2147\/CLEP.S129785","volume":"9","author":"A Pedersen","year":"2017","unstructured":"Pedersen A, Mikkelsen E, Cronin-Fenton D, Kristensen N, Pham T, Pedersen L, Petersen I (2017) Missing data and multiple imputation in clinical epidemiological research. Clin Epidemiol 9:157\u2013166","journal-title":"Clin Epidemiol"},{"key":"496_CR19","doi-asserted-by":"publisher","first-page":"10033","DOI":"10.1007\/s00521-019-04535-9","volume":"32","author":"P Raja","year":"2020","unstructured":"Raja P, Sasirekha K, Thangavel K (2020) A novel fuzzy rough clustering parameter-based missing value imputation. Neural Comput Appl 32:10033\u201310050","journal-title":"Neural Comput Appl"},{"issue":"1","key":"496_CR20","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1007\/s41066-023-00446-2","volume":"9","author":"K Savita","year":"2024","unstructured":"Savita K, N., and Siwch, A (2024) Fuzzy clustering based on distance metric under intuitionistic fuzzy environment. Granular Comput 9(1):20","journal-title":"Granular Comput"},{"key":"496_CR21","doi-asserted-by":"publisher","first-page":"855","DOI":"10.1007\/s11047-018-9700-3","volume":"17","author":"A Skowron","year":"2018","unstructured":"Skowron A, Dutta S (2018) Rough sets: past, present, and future. Nat Comput 17:855\u2013876","journal-title":"Nat Comput"},{"key":"496_CR22","volume-title":"Using the adap learning algorithm to forcast the onset of diabetes mellitus Proceed - Annual symposium on computer applications in medical care","author":"J Smith","year":"1988","unstructured":"Smith J, Everhart J, Dickson W, Knowler W, Johannes R (1988) Using the adap learning algorithm to forcast the onset of diabetes mellitus Proceed - Annual symposium on computer applications in medical care. American Medical Informatics Association, USA"},{"key":"496_CR23","first-page":"159","volume-title":"Proceed of 4th International Conf on Recent Trends in Machine Learning, IoT, Smart Cities and Applications","author":"KM Varma","year":"2024","unstructured":"Varma KM, Nayak S, Khilar PM (2024) Imice: An improved missing data imputation using machine learning. In: Gunjan VK, Zurada JM (eds) Proceed of 4th International Conf on Recent Trends in Machine Learning, IoT, Smart Cities and Applications. Springer Nature Singapore, Singapore, pp 159\u2013167"},{"key":"496_CR24","doi-asserted-by":"publisher","first-page":"102243","DOI":"10.1016\/j.datak.2023.102243","volume":"150","author":"H Vijayan","year":"2024","unstructured":"Vijayan H, Subramaniam M, Sathiyasekar K (2024) A-mkmc: An effective adaptive-based multilevel k-means clustering with optimal centroid selection using hybrid heuristic approach for handling the incomplete data. Data Knowl Eng 150:102243","journal-title":"Data Knowl Eng"},{"key":"496_CR25","unstructured":"Wikipedia (n.d.). Mean squared error - proof of variance and bias relationship. https:\/\/en.wikipedia.org\/wiki\/Mean_squared_ error#Proof_of_variance_and_bias_relationship."},{"key":"496_CR26","doi-asserted-by":"publisher","first-page":"566","DOI":"10.1016\/j.neucom.2020.10.114","volume":"452","author":"J Xie","year":"2021","unstructured":"Xie J, Wu R, Wang H, Chen H, Xu X, Kong Y, Zhang W (2021) Prediction of cardiovascular diseases using weight learning based on density information. Neurocomputing 452:566\u2013575","journal-title":"Neurocomputing"},{"issue":"3","key":"496_CR27","doi-asserted-by":"publisher","first-page":"183","DOI":"10.26599\/BDMA.2021.9020001","volume":"4","author":"Z Xue","year":"2021","unstructured":"Xue Z, Wang H (2021) Effective density-based clustering algorithms for incomplete data. Big Data Mining Anal 4(3):183\u2013194","journal-title":"Big Data Mining Anal"},{"issue":"3","key":"496_CR28","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1016\/j.compeleceng.2017.11.030","volume":"66","author":"U Yelipe","year":"2018","unstructured":"Yelipe U, Porika S, Golla M (2018) An efficient approach for imputation and classification of medical data values using class-based clustering of medical records. Comput Electr Eng 66(3):487\u2013504","journal-title":"Comput Electr Eng"},{"key":"496_CR29","first-page":"128","volume":"1","author":"S Zhang","year":"2008","unstructured":"Zhang S, Zhang J, Zhu X, Qin Y, Zhang C (2008) Missing value imputation based on data clustering. Trans Comput Sci 1:128\u2013138","journal-title":"Trans Comput Sci"},{"key":"496_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2023.120065","volume":"659","author":"Z Zhang","year":"2024","unstructured":"Zhang Z, Yan X, Zhang L, Lai X, Lu W (2024) Fuzzy neuron modeling of incomplete data for missing value imputation. Inf Sci 659:120065","journal-title":"Inf Sci"}],"container-title":["Network Modeling Analysis in Health Informatics and Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13721-024-00496-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13721-024-00496-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13721-024-00496-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T21:20:12Z","timestamp":1736284812000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13721-024-00496-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,7]]},"references-count":30,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["496"],"URL":"https:\/\/doi.org\/10.1007\/s13721-024-00496-9","relation":{},"ISSN":["2192-6670"],"issn-type":[{"value":"2192-6670","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,1,7]]},"assertion":[{"value":"9 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 November 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 December 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 January 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"5"}}