{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T06:05:11Z","timestamp":1750831511051,"version":"3.28.0"},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T00:00:00Z","timestamp":1731974400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T00:00:00Z","timestamp":1731974400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"DOI":"10.1186\/s40537-024-01009-1","type":"journal-article","created":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T09:12:22Z","timestamp":1732007542000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["The application of adaptive group LASSO imputation method with missing values in personal income compositional data"],"prefix":"10.1186","volume":"11","author":[{"given":"Ying","family":"Tian","sequence":"first","affiliation":[]},{"given":"Majid Khan Majahar","family":"Ali","sequence":"additional","affiliation":[]},{"given":"Lili","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,19]]},"reference":[{"key":"1009_CR1","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1146\/annurev-statistics-042720-124436","volume":"8","author":"M Greenacre","year":"2021","unstructured":"Greenacre M. Compositional data analysis. Annu Rev Stat Appl. 2021;8:271\u201399.","journal-title":"Annu Rev Stat Appl"},{"issue":"3","key":"1009_CR2","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1023\/A:1007529726302","volume":"32","author":"J Aitchison","year":"2000","unstructured":"Aitchison J, Barcelo-Vidal C, Mart\u0131n-Fernandez JA, Pawlowsky-Glahn V. Logratio analysis and compositional distance. Math Geol. 2000;32(3):271\u20135.","journal-title":"Math Geol"},{"key":"1009_CR3","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1023\/A:1023818214614","volume":"35","author":"JJ Egozcue","year":"2003","unstructured":"Egozcue JJ, Pawlowsky-Glahn V, Mateu-Figueras G, Barcel\u00f3-Vidal C. Isometric log-ratio transformations for compositional data analysis. Math Geol. 2003;35:279\u2013300.","journal-title":"Math Geol"},{"issue":"1","key":"1009_CR4","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/s40537-021-00553-4","volume":"9","author":"KM Batko","year":"2022","unstructured":"Batko KM, \u015al\u0119zak A. The use of big data analytics in healthcare. J Big Data. 2022;9(1):3.","journal-title":"J Big Data"},{"key":"1009_CR5","volume-title":"Advances in compositional data analysis","author":"K Hron","year":"2014","unstructured":"Hron K. Advances in compositional data analysis. Statistics Reference Online: Wiley StatsRef; 2014."},{"issue":"2","key":"1009_CR6","doi-asserted-by":"publisher","first-page":"365","DOI":"10.33096\/ilkom.v15i2.1561.365-372","volume":"15","author":"I As\u2019ad","year":"2023","unstructured":"As\u2019ad I, Asis MA, Hariani Mat\u2019ang Pakka MH, Mursalim R. K-nearest neighbors analysis for public sentiment towards implementation of booster vaccines in Indonesia. ILKOM Jurnal Ilmiah. 2023;15(2):365\u201372.","journal-title":"ILKOM Jurnal Ilmiah"},{"key":"1009_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12982-017-0062-6","volume":"14","author":"CD Nguyen","year":"2017","unstructured":"Nguyen CD, Carlin JB, Lee KJ. Model checking in multiple imputation: an overview and case study. Emerg Themes Epidemiol. 2017;14:1\u201312.","journal-title":"Emerg Themes Epidemiol"},{"key":"1009_CR8","first-page":"2","volume":"4","author":"Z Zhang","year":"2016","unstructured":"Zhang Z. Multiple imputation with multivariate imputation by chained equation (MICE) package. Ann Trans Med. 2016;4:2.","journal-title":"Ann Trans Med"},{"issue":"4","key":"1009_CR9","doi-asserted-by":"publisher","first-page":"1090","DOI":"10.1007\/s42952-022-00177-1","volume":"51","author":"H Han","year":"2022","unstructured":"Han H, Yu K. Partial linear regression of compositional data. J Korean Statist Soc. 2022;51(4):1090\u2013116.","journal-title":"J Korean Statist Soc"},{"key":"1009_CR10","doi-asserted-by":"publisher","first-page":"2419","DOI":"10.1007\/s10115-019-01427-1","volume":"62","author":"S Nikfalazar","year":"2020","unstructured":"Nikfalazar S, Yeh CH, Bedingfield S, Khorshidi HA. Missing data imputation using decision trees and fuzzy clustering with iterative learning. Knowl Inf Syst. 2020;62:2419\u201337.","journal-title":"Knowl Inf Syst"},{"key":"1009_CR11","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-019-3110-0","volume":"20","author":"M Kokla","year":"2019","unstructured":"Kokla M, Virtanen J, Kolehmainen M, Paananen J, Hanhineva K. Random forest-based imputation outperforms other methods for imputing LC-MS metabolomics data: a comparative study. BMC Bioinformatics. 2019;20:1\u201311.","journal-title":"BMC Bioinformatics"},{"issue":"5","key":"1009_CR12","doi-asserted-by":"publisher","first-page":"414","DOI":"10.1109\/LSP.2009.2016451","volume":"16","author":"Y Zhang","year":"2009","unstructured":"Zhang Y, Liu Y. Data imputation using least squares support vector machines in urban arterial streets. IEEE Signal Process Lett. 2009;16(5):414\u20137.","journal-title":"IEEE Signal Process Lett"},{"issue":"3","key":"1009_CR13","doi-asserted-by":"publisher","first-page":"860","DOI":"10.1007\/s10489-019-01560-y","volume":"50","author":"J Lin","year":"2000","unstructured":"Lin J, Li N, Alam MA, Ma Y. Data-driven missing data imputation in cluster monitoring system based on deep neural network. Appl Intell. 2000;50(3):860\u201377.","journal-title":"Appl Intell"},{"issue":"10","key":"1009_CR14","doi-asserted-by":"publisher","first-page":"2467","DOI":"10.1002\/sim.8915","volume":"40","author":"F Noghrehchi","year":"2021","unstructured":"Noghrehchi F, Stoklosa J, Penev S, Warton DI. Selecting the model for multiple imputation of missing data: just use an IC! Stat Med. 2021;40(10):2467\u201397.","journal-title":"Stat Med"},{"issue":"3","key":"1009_CR15","doi-asserted-by":"publisher","first-page":"795","DOI":"10.56899\/153.03.05","volume":"153","author":"T Ritthewa","year":"2024","unstructured":"Ritthewa T, Samart K. Performance of different imputation methods in logistic regression with multicollinearity. Philippine J Sci. 2024;153(3):795\u2013804.","journal-title":"Philippine J Sci"},{"key":"1009_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.artmed.2021.102214","volume":"123","author":"G Nagarajan","year":"2022","unstructured":"Nagarajan G, Babu LD. Missing data imputation on biomedical data using deeply learned clustering and L2 regularized regression based on symmetric uncertainty. Artif Intell Med. 2022;123: 102214.","journal-title":"Artif Intell Med"},{"key":"1009_CR17","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1007\/978-981-10-8055-5_3","volume-title":"Computational Intelligence in Data Mining: Proceedings of the International Conference on CIDM 2017","author":"K Lavanya","year":"2019","unstructured":"Lavanya K, Reddy LSS, Eswara RB. A study of high-dimensional data imputation using additive LASSO regression model. In: Himansu Sekhar B, Janmenjoy N, Bighnaraj N, Ajith A, editors. Computational Intelligence in Data Mining: Proceedings of the International Conference on CIDM 2017. Singapore: Springer Singapore; 2019. p. 19\u201330."},{"issue":"4","key":"1009_CR18","doi-asserted-by":"publisher","first-page":"570","DOI":"10.29207\/resti.v6i4.4173","volume":"6","author":"A Fadlil","year":"2022","unstructured":"Fadlil A, Herman PMD. K nearest neighbor imputation performance on missing value data graduate user satisfaction. Jurnal RESTI (Rekayasa Sistem dan Teknologi Informasi). 2022;6(4):570\u20136.","journal-title":"Jurnal RESTI (Rekayasa Sistem dan Teknologi Informasi)."},{"issue":"3","key":"1009_CR19","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1007\/s11749-019-00670-6","volume":"28","author":"JJ Egozcue","year":"2019","unstructured":"Egozcue JJ, Pawlowsky-Glahn V. Compositional data: the sample space and its structure. TEST. 2019;28(3):599\u2013638.","journal-title":"TEST"},{"issue":"1","key":"1009_CR20","doi-asserted-by":"publisher","first-page":"663","DOI":"10.1038\/s41598-017-19120-0","volume":"8","author":"R Wei","year":"2018","unstructured":"Wei R, Wang J, Su M, Jia E, Chen S, Chen T, Ni Y. Missing value imputation approach for mass spectrometry-based metabolomics data. Sci Rep. 2018;8(1):663.","journal-title":"Sci Rep"},{"issue":"5\u20136","key":"1009_CR21","doi-asserted-by":"publisher","first-page":"684","DOI":"10.1016\/j.neunet.2005.06.025","volume":"18","author":"K Pelckmans","year":"2005","unstructured":"Pelckmans K, De Brabanter J, Suykens JA, De Moor B. Handling missing values in support vector machine classifiers. Neural Netw. 2005;18(5\u20136):684\u201392.","journal-title":"Neural Netw"},{"key":"1009_CR22","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1186\/s12874-020-01080-1","volume":"20","author":"S Hong","year":"2020","unstructured":"Hong S, Lynn HS. Accuracy of random-forest-based imputation of missing data in the presence of non-normality, non-linearity, and interaction. BMC Med Res Methodol. 2020;20:199.","journal-title":"BMC Med Res Methodol"},{"issue":"2","key":"1009_CR23","doi-asserted-by":"publisher","first-page":"514","DOI":"10.17969\/jimfp.v7i2.19896","volume":"7","author":"R Mardisa","year":"2022","unstructured":"Mardisa R, Siregar K, Nasution IS. Klasifikasi Kualitas Fisik Kopi Beras Arabika menggunakan Pengolahan citra dengan Metode K-Nearest Neighbor (K-NN). Jurnal Ilmiah Mahasiswa Pertanian. 2022;7(2):514\u201322.","journal-title":"Jurnal Ilmiah Mahasiswa Pertanian"},{"issue":"760","key":"1009_CR24","first-page":"1","volume":"24","author":"K Jeong","year":"2024","unstructured":"Jeong K, Kim S, Kang MG. Multispectral demosaicing based on iterative-linear-regression model for estimating pseudo-panchromatic image. Sensors. 2024;24(760):1\u201319.","journal-title":"Sensors"},{"key":"1009_CR25","doi-asserted-by":"publisher","first-page":"461","DOI":"10.1007\/s13762-022-04013-1","volume":"20","author":"E Yap\u0131c\u0131","year":"2022","unstructured":"Yap\u0131c\u0131 E, Akg\u00fcn H, \u00d6zkan K, G\u00fcnkaya Z, \u00d6zkan A, Banar M. Prediction of gas product yield from packaging waste pyrolysis: support vector and Gaussian process regression models. Int J Environ Sci Technol. 2022;20:461\u201376.","journal-title":"Int J Environ Sci Technol"},{"key":"1009_CR26","doi-asserted-by":"publisher","DOI":"10.1007\/s41133-020-00032-0","author":"K Shah","year":"2020","unstructured":"Shah K, Patel H, Sanghvi D, Shah M. A comparative analysis of logistic regression random forest and KNN Models for the text classification. Augmented Human Res. 2020. https:\/\/doi.org\/10.1007\/s41133-020-00032-0.","journal-title":"Augmented Human Res"},{"issue":"9","key":"1009_CR27","doi-asserted-by":"publisher","first-page":"2647","DOI":"10.1177\/0962280220908613","volume":"29","author":"L Yu","year":"2020","unstructured":"Yu L, Liu L, Peace KE. Regression multiple imputation for missing data analysis. Stat Methods Med Res. 2020;29(9):2647\u201364.","journal-title":"Stat Methods Med Res"},{"issue":"6","key":"1009_CR28","doi-asserted-by":"publisher","first-page":"1042","DOI":"10.1002\/sim.9315","volume":"41","author":"Y Yamaguchi","year":"2022","unstructured":"Yamaguchi Y, Yoshida S, Misumi T, Maruo K. Multiple imputation for longitudinal data using Bayesian lasso imputation model. Stat Med. 2022;41(6):1042\u201358.","journal-title":"Stat Med"},{"issue":"1","key":"1009_CR29","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1111\/j.1467-9868.2005.00532.x","volume":"68","author":"M Yuan","year":"2006","unstructured":"Yuan M, Lin Y. Model selection and estimation in regression with grouped variables. J Roy Stat Soc. 2006;68(1):49\u201367.","journal-title":"J Roy Stat Soc"},{"issue":"12","key":"1009_CR30","doi-asserted-by":"publisher","first-page":"5277","DOI":"10.1016\/j.csda.2008.05.006","volume":"52","author":"HS Wang","year":"2008","unstructured":"Wang HS, Leng CL. A note on adaptive group lasso. Comput Statist Data Anal. 2008;52(12):5277\u201386.","journal-title":"Comput Statist Data Anal"},{"key":"1009_CR31","first-page":"107","volume":"57","author":"LJ Xi","year":"2023","unstructured":"Xi LJ, Guo ZY, Yang XK, Ping ZG. Application of LASSO and its extended method in variable selection of regression analysis. Chinese J Prev Med. 2023;57:107\u201311.","journal-title":"Chinese J Prev Med"},{"key":"1009_CR32","doi-asserted-by":"publisher","first-page":"48","DOI":"10.5808\/gi.22075","volume":"20","author":"M Song","year":"2022","unstructured":"Song M, Lee M, Park T, Park M. MP-LASSO chart: a multi-level polar chart for visualizing group LASSO analysis of genomic data. Gen Inform. 2022;20:48.","journal-title":"Gen Inform"},{"key":"1009_CR33","unstructured":"Ferrers NM. An elementary treatise on trilinear co-ordinates: the method of reciprocal Polars, and the theory of projections. Macmillan and Company. 1876."},{"issue":"04","key":"1009_CR34","first-page":"396","volume":"33","author":"KP Cui","year":"2018","unstructured":"Cui KP, Zhao Q. Adaptive Group Lasso Algorithm for Logistic Models. J Shandong Normal Univ (Natural Science Edition). 2018;33(04):396\u2013400.","journal-title":"J Shandong Normal Univ (Natural Science Edition)"},{"issue":"12","key":"1009_CR35","doi-asserted-by":"publisher","first-page":"3095","DOI":"10.1016\/j.csda.2009.11.023","volume":"54","author":"K Hron","year":"2010","unstructured":"Hron K, Templ M, Filzmoser P. Imputation of missing values for compositional data using classical and robust methods. Comput Stat Data Anal. 2010;54(12):3095\u2013107.","journal-title":"Comput Stat Data Anal"},{"issue":"6","key":"1009_CR36","first-page":"10","volume":"3","author":"A Bin Khamis","year":"2018","unstructured":"Bin Khamis A, Yee PH. A hybrid model of artificial neural network and genetic algorithm in forecasting gold price. Euro J Eng Technol Res. 2018;3(6):10\u20134.","journal-title":"Euro J Eng Technol Res"},{"issue":"4","key":"1009_CR37","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1037\/1082-989X.6.4.317","volume":"6","author":"S Sinharay","year":"2001","unstructured":"Sinharay S, Stern HS, Russell D. The use of multiple imputation for the analysis of missing data. Psychol methods. 2001;6(4):317.","journal-title":"Psychol methods"},{"key":"1009_CR38","volume-title":"Statistical analysis with missing data","author":"RJ Little","year":"2019","unstructured":"Little RJ, Rubin DB. Statistical analysis with missing data. New Jersey: John Wiley & Sons; 2019."},{"key":"1009_CR39","first-page":"1","volume":"2024","author":"P Brimos","year":"2024","unstructured":"Brimos P, Seregkos P, Karamanou A, Kalampokis E, Tarabanis KA. Deep learning missing value imputation on traffic data using self-attention and GAN-based methods. Panhellenic Conf Electr Telecommun (PACET). 2024;2024:1\u20134.","journal-title":"Panhellenic Conf Electr Telecommun (PACET)"},{"key":"1009_CR40","doi-asserted-by":"publisher","first-page":"521","DOI":"10.3390\/e25030521","volume":"25","author":"P Buczak","year":"2023","unstructured":"Buczak P, Chen JJ, Pauly M. Analyzing the effect of imputation on classification performance under MCAR and MAR missing mechanisms. Entropy. 2023;25:521.","journal-title":"Entropy"},{"key":"1009_CR41","first-page":"1","volume":"2022","author":"K Psychogyios","year":"2022","unstructured":"Psychogyios K, Ilias L, Askounis DT. Comparison of missing data imputation methods using the Framingham heart study dataset. IEEE-EMBS Int Conf Biomed Health Inform (BHI). 2022;2022:1\u20135.","journal-title":"IEEE-EMBS Int Conf Biomed Health Inform (BHI)"},{"key":"1009_CR42","doi-asserted-by":"publisher","DOI":"10.1155\/2018\/2935248","author":"Q Shang","year":"2018","unstructured":"Shang Q, Yang Z, Gao S, Tan D. An imputation method for missing traffic data based on FCM optimized by PSO-SVR. J Adv Trans. 2018. https:\/\/doi.org\/10.1155\/2018\/2935248.","journal-title":"J Adv Trans"},{"key":"1009_CR43","doi-asserted-by":"publisher","DOI":"10.7717\/peerj-cs.619","author":"KM Fouad","year":"2021","unstructured":"Fouad KM, Ismail MM, Azar AT, Arafa MM. Advanced methods for missing values imputation based on similarity learning. PeerJ Comput Sci. 2021. https:\/\/doi.org\/10.7717\/peerj-cs.619.","journal-title":"PeerJ Comput Sci"},{"key":"1009_CR44","doi-asserted-by":"publisher","first-page":"1082","DOI":"10.11113\/mjfas.v20n1.3034","volume":"19","author":"Y Tian","year":"2023","unstructured":"Tian Y, Majahar Ali MK, Pei Shan F, Wu L, Mohd Jamaludin SZ. Application of imputation method for compositional data with missing values based on adaptive LASSO model: the composition of employment industry in Taiyuan. China Malays J Fundam Appl. 2023;19:1082\u201398.","journal-title":"China Malays J Fundam Appl"},{"issue":"3","key":"1009_CR45","doi-asserted-by":"publisher","first-page":"627","DOI":"10.1080\/10618600.2014.938812","volume":"24","author":"M Lim","year":"2015","unstructured":"Lim M, Hastie T. Learning interactions via hierarchical group-lasso regularization. J Comput Graph Stat. 2015;24(3):627\u201354.","journal-title":"J Comput Graph Stat"},{"key":"1009_CR46","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1007\/s11004-007-9141-5","volume":"40","author":"P Filzmoser","year":"2008","unstructured":"Filzmoser P, Hron K. Outlier detection for compositional data using robust methods. Math Geosci. 2008;40:233\u201348.","journal-title":"Math Geosci"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-024-01009-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s40537-024-01009-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-024-01009-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T11:25:50Z","timestamp":1732015550000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-024-01009-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,19]]},"references-count":46,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2024,12]]}},"alternative-id":["1009"],"URL":"https:\/\/doi.org\/10.1186\/s40537-024-01009-1","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,19]]},"assertion":[{"value":"11 September 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 October 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 November 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"166"}}