{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T14:57:23Z","timestamp":1774277843558,"version":"3.50.1"},"reference-count":77,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T00:00:00Z","timestamp":1774224000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T00:00:00Z","timestamp":1774224000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100007831","name":"University of Tabriz","doi-asserted-by":"publisher","award":["S\/2354"],"award-info":[{"award-number":["S\/2354"]}],"id":[{"id":"10.13039\/501100007831","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2026,12]]},"DOI":"10.1007\/s41060-026-01061-5","type":"journal-article","created":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T13:01:48Z","timestamp":1774270908000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Toward a taxonomy and empirical benchmark of bagging methods for imbalanced classification"],"prefix":"10.1007","volume":"22","author":[{"given":"Yousef","family":"Abdi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohammad","family":"Asadpour","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yousef","family":"Seyfari","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,3,23]]},"reference":[{"issue":"6","key":"1061_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10462-024-10759-6","volume":"57","author":"W Chen","year":"2024","unstructured":"Chen, W., Yang, K., Yu, Z., Shi, Y., Chen, C.L.: A survey on imbalanced learning: latest research, applications and future directions. Artif. Intell. Rev. 57(6), 1\u201351 (2024)","journal-title":"Artif. Intell. Rev."},{"key":"1061_CR2","doi-asserted-by":"crossref","unstructured":"Gao, X., Xie, D., Zhang, Y., Wang, Z., Chen, C., He, C., & Zhang, W.:. A comprehensive survey on imbalanced data learning. arXiv preprint arXiv:2502.08960 (2025)","DOI":"10.1007\/s11704-025-50274-7"},{"key":"1061_CR3","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/s10462-024-10759-6","volume":"58","author":"W Chen","year":"2024","unstructured":"Chen, W., Yang, K., Yu, Z., et al.: A survey on imbalanced learning: latest research, applications and future directions. Artif. Intell. Rev. 58, 137 (2024)","journal-title":"Artif. Intell. Rev."},{"key":"1061_CR4","unstructured":"Liu, Z., Wei, P., Wei, Z., Yu, B., Jiang, J., Cao, W., Bian, J., & Chang, Y.: Towards inter-class and intra-class imbalance in class-imbalanced learning. arXiv. https:\/\/arxiv.org\/abs\/2111.12791(2021)"},{"key":"1061_CR5","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1186\/s40537-025-01119-4","volume":"12","author":"M Carvalho","year":"2025","unstructured":"Carvalho, M., Pinho, A.J., Br\u00e1s, S.: Resampling approaches to handle class imbalance: a review from a data perspective. J. Big Data 12, 71 (2025)","journal-title":"J. Big Data"},{"key":"1061_CR6","unstructured":"Twomey, D.: Novel algorithm-level approaches for class-imbalanced machine learning (Doctoral dissertation, University College London). UCL Discovery (2023) https:\/\/discovery.ucl.ac.uk\/id\/eprint\/10167331."},{"key":"1061_CR7","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1007\/s42452-024-06274-6","volume":"6","author":"H Kaur","year":"2024","unstructured":"Kaur, H., Kaur, T., Bhardwaj, V., Kumar, M.: An ensemble deep learning model for classification of students as weak and strong learners via multiparametric analysis. Discov. Appl. Sci. 6, 595 (2024)","journal-title":"Discov. Appl. Sci."},{"key":"1061_CR8","doi-asserted-by":"publisher","first-page":"99129","DOI":"10.1109\/ACCESS.2022.3207287","volume":"10","author":"ID Mienye","year":"2022","unstructured":"Mienye, I.D., Sun, Y.: A survey of ensemble learning: concepts, algorithms, applications, and prospects. IEEE Access 10, 99129\u201399149 (2022)","journal-title":"IEEE Access"},{"key":"1061_CR9","doi-asserted-by":"publisher","DOI":"10.34028\/iajit\/17\/4\/10","author":"G T\u00fcys\u00fczo\u011flu","year":"2020","unstructured":"T\u00fcys\u00fczo\u011flu, G., Birant, D.: Enhanced bagging (eBagging): a novel approach for ensemble learning. Int. Arab J. Inf. Technol. (2020). https:\/\/doi.org\/10.34028\/iajit\/17\/4\/10","journal-title":"Int. Arab J. Inf. Technol."},{"issue":"2","key":"1061_CR10","first-page":"905","volume":"15","author":"R Qui","year":"2024","unstructured":"Qui, R., et al.: Func-Bagging: an ensemble learning strategy for improving the performance of heterogeneous anomaly detection models. Appl. Sci. 15(2), 905 (2024)","journal-title":"Appl. Sci."},{"issue":"2","key":"1061_CR11","first-page":"67","volume":"15","author":"G Rekha","year":"2019","unstructured":"Rekha, G., Tyagi, A.K., Krishna Reddy, V.: Solving class imbalance problem using bagging, boosting techniques, with and without using noise filtering method. Int. J. Hybrid Intell. Syst. 15(2), 67\u201376 (2019)","journal-title":"Int. J. Hybrid Intell. Syst."},{"key":"1061_CR12","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Goyal, P., Girshick, R., He, K., & Doll\u00e1r, P.: Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"issue":"12","key":"1061_CR13","doi-asserted-by":"publisher","first-page":"3358","DOI":"10.1016\/j.patcog.2007.04.009","volume":"40","author":"Y Sun","year":"2007","unstructured":"Sun, Y., Kamel, M.S., Wong, A.K.C., Wang, Y.: Cost-sensitive boosting for classification of imbalanced data. Pattern Recognit. 40(12), 3358\u20133378 (2007)","journal-title":"Pattern Recognit."},{"key":"1061_CR14","doi-asserted-by":"crossref","unstructured":"Chen, T., & Guestrin, C.: XGBoost: A scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (KDD), 785\u2013794 (2016)","DOI":"10.1145\/2939672.2939785"},{"key":"1061_CR15","unstructured":"Ke, G., Meng, Q., Finley, T., Wang, T., Chen, W., Ma, W., & Liu, T.-Y.: LightGBM: a highly efficient gradient boosting decision tree. Advances in Neural Information Processing Systems (NeurIPS), 30 (2017)"},{"key":"1061_CR16","unstructured":"Prokhorenkova, L., Gusev, G., Vorobev, A., Dorogush, A.V., & Gulin, A.: CatBoost: Unbiased boosting with categorical features. Advances in Neural Information Processing Systems (NeurIPS), 31 (2018)"},{"key":"1061_CR17","doi-asserted-by":"crossref","unstructured":"Rawat, U., & Rawat, B.: A comprehensive study of boosting algorithms for class imbalance dataset. In: International Conference on Smart Systems and Wireless Communication, pp. 269\u2013282. Springer Nature Singapore, Singapore (2024)","DOI":"10.1007\/978-981-96-1348-9_21"},{"issue":"6","key":"1061_CR18","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/s10462-024-10759-6","volume":"57","author":"W Chen","year":"2024","unstructured":"Chen, W., Yang, K., Yu, Z., Shi, Y., Chen, C.P.: A survey on imbalanced learning: latest research, applications and future directions. Artif. Intell. Rev. 57(6), 137 (2024)","journal-title":"Artif. Intell. Rev."},{"issue":"4","key":"1061_CR19","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1109\/TSMCC.2011.2161285","volume":"42","author":"M Galar","year":"2011","unstructured":"Galar, M., Fernandez, A., Barrenechea, E., Bustince, H., Herrera, F.: A review on ensembles for the class imbalance problem: bagging-, boosting-, and hybrid-based approaches. IEEE Trans. Syst. Man Cybern. Part C Appl. Rev. 42(4), 463\u2013484 (2011)","journal-title":"IEEE Trans. Syst. Man Cybern. Part C Appl. Rev."},{"issue":"12","key":"1061_CR20","doi-asserted-by":"publisher","first-page":"368","DOI":"10.1007\/s10462-025-11357-w","volume":"58","author":"M Fachrie","year":"2025","unstructured":"Fachrie, M., Musdholifah, A., Pulungan, R.: Effectiveness of data resampling and ensemble learning in multiclass imbalance learning. Artif. Intell. Rev. 58(12), 368 (2025)","journal-title":"Artif. Intell. Rev."},{"key":"1061_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-020-00349-y","volume":"7","author":"J Tanha","year":"2020","unstructured":"Tanha, J., Abdi, Y., Samadi, N., Razzaghi, N., Asadpour, M.: Boosting methods for multi-class imbalanced data classification: an experimental review. J. Big Data 7, 1\u201347 (2020)","journal-title":"J. Big Data"},{"key":"1061_CR22","doi-asserted-by":"crossref","unstructured":"Gosain, A., Gupta, A., & Singh, D.: Hybrid data-level techniques for class imbalance problem. In: International Conference on Innovative Computing and Communications: Proceedings of ICICC 2020, Vol. 1, pp. 1131\u20131141. Springer Singapore, Singapore (2020).","DOI":"10.1007\/978-981-15-5113-0_95"},{"issue":"1","key":"1061_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10618-021-00790-4","volume":"36","author":"G Petrides","year":"2022","unstructured":"Petrides, G., Verbeke, W.: Cost-sensitive ensemble learning: a unifying framework. Data Min. Knowl. Discov. 36(1), 1\u201328 (2022)","journal-title":"Data Min. Knowl. Discov."},{"key":"1061_CR24","unstructured":"Horna, D., Lango, M., & Stefanowski, J.: Deep similarity learning loss functions in data transformation for class imbalance. In: Fifth International Workshop on Learning with Imbalanced Domains: Theory and Applications, pp. 1\u201315. PMLR (2024)"},{"issue":"1","key":"1061_CR25","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1186\/s12911-022-01821-w","volume":"22","author":"L Liu","year":"2022","unstructured":"Liu, L., Wu, X., Li, S., Li, Y., Tan, S., Bai, Y.: Solving the class imbalance problem using ensemble algorithm: application of screening for aortic dissection. BMC Med. Inform. Decis. Mak. 22(1), 82 (2022)","journal-title":"BMC Med. Inform. Decis. Mak."},{"issue":"6","key":"1061_CR26","doi-asserted-by":"publisher","first-page":"2883","DOI":"10.1007\/s00521-023-09180-x","volume":"36","author":"H Ding","year":"2024","unstructured":"Ding, H., Sun, Y., Huang, N., Cui, X.: VGAN-BL: imbalanced data classification based on generative adversarial network and biased loss. Neural Comput. Appl. 36(6), 2883\u20132899 (2024)","journal-title":"Neural Comput. Appl."},{"key":"1061_CR27","doi-asserted-by":"publisher","first-page":"113005","DOI":"10.1016\/j.eswa.2019.113005","volume":"142","author":"HG Zefrehi","year":"2020","unstructured":"Zefrehi, H.G., Alt\u0131n\u00e7ay, H.: Imbalance learning using heterogeneous ensembles. Expert Syst. Appl. 142, 113005 (2020)","journal-title":"Expert Syst. Appl."},{"key":"1061_CR28","unstructured":"Esteves, V. M. S.: Techniques to deal with imbalanced data in multi-class problems: a review of existing methods. PQDT-Global (2020)"},{"key":"1061_CR29","doi-asserted-by":"publisher","DOI":"10.1109\/tkde.2025.3528719","author":"T Zhu","year":"2025","unstructured":"Zhu, T., Hu, X., Liu, X., Zhu, E., Zhu, X., Xu, H.: Dynamic ensemble framework for imbalanced data classification. IEEE Trans. Knowl. Data Eng. (2025). https:\/\/doi.org\/10.1109\/tkde.2025.3528719","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"1061_CR30","doi-asserted-by":"publisher","first-page":"250","DOI":"10.1016\/j.comcom.2022.07.034","volume":"194","author":"J Jiang","year":"2022","unstructured":"Jiang, J., Liu, F., Liu, Y., Tang, Q., Wang, B., Zhong, G., Wang, W.: A dynamic ensemble algorithm for anomaly detection in IoT imbalanced data streams. Comput. Commun. 194, 250\u2013257 (2022)","journal-title":"Comput. Commun."},{"key":"1061_CR31","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1016\/j.ins.2020.12.023","volume":"554","author":"Z Chen","year":"2021","unstructured":"Chen, Z., Duan, J., Kang, L., Qiu, G.: A hybrid data-level ensemble to enable learning from highly imbalanced dataset. Inf. Sci. 554, 157\u2013176 (2021)","journal-title":"Inf. Sci."},{"key":"1061_CR32","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/s10462-024-10759-6","volume":"57","author":"W Chen","year":"2024","unstructured":"Chen, W., Yang, K., Yu, Z., Shi, Y., Chen, C.L.P.: A survey on imbalanced learning: latest research, applications and future directions. Artif. Intell. Rev. 57, 137 (2024)","journal-title":"Artif. Intell. Rev."},{"key":"1061_CR33","doi-asserted-by":"publisher","first-page":"123832","DOI":"10.1016\/j.eswa.2024.123832","volume":"249","author":"Z Jiang","year":"2024","unstructured":"Jiang, Z., Lu, Y., Zhao, L., Zhan, Y., Mao, Q.: A post-processing framework for class-imbalanced learning in a transductive setting. Expert Syst. Appl. 249, 123832 (2024)","journal-title":"Expert Syst. Appl."},{"key":"1061_CR34","doi-asserted-by":"publisher","first-page":"119733","DOI":"10.1016\/j.eswa.2023.119733","volume":"221","author":"Z Jiang","year":"2023","unstructured":"Jiang, Z., Zhao, L., Lu, Y., Zhan, Y., Mao, Q.: A semi-supervised resampling method for class-imbalanced learning. Expert Syst. Appl. 221, 119733 (2023)","journal-title":"Expert Syst. Appl."},{"issue":"9","key":"1061_CR35","doi-asserted-by":"publisher","first-page":"e13377","DOI":"10.1111\/exsy.13377","volume":"40","author":"Z Jiang","year":"2023","unstructured":"Jiang, Z., Zhao, L., Zhan, Y.: A boosted co-training method for class-imbalanced learning. Expert. Syst. 40(9), e13377 (2023)","journal-title":"Expert. Syst."},{"key":"1061_CR36","unstructured":"Ai, Q., Wang, P., He, L., Wen, L., Pan, L., & Xu, Z.: Generative oversampling for imbalanced data via majority-guided VAE. In: International Conference on Artificial Intelligence and Statistics, pp. 3315\u20133330. PMLR (2023)"},{"key":"1061_CR37","doi-asserted-by":"crossref","unstructured":"Roth, K., Pemula, L., Zepeda, J., Sch\u00f6lkopf, B., Brox, T., & Gehler, P.: Towards total recall in industrial anomaly detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14318\u201314328 (2022)","DOI":"10.1109\/CVPR52688.2022.01392"},{"key":"1061_CR38","doi-asserted-by":"crossref","unstructured":"Harine Rajashree, R., & Hariharan, M.: A study on ensemble methods for classification. In: Machine Learning, Deep Learning and Computational Intelligence for Wireless Communication: Proceedings of MDCWC 2020, pp. 127\u2013136. Springer Singapore (2021)","DOI":"10.1007\/978-981-16-0289-4_10"},{"key":"1061_CR39","doi-asserted-by":"crossref","unstructured":"Newaz, A., Mohosheu, M.S., Al Noman, M.A., & Jabid, T.: iBRF: improved balanced random forest classifier. In: 2024 35th Conference of Open Innovations Association (FRUCT), pp. 501\u2013508. IEEE (2024)","DOI":"10.23919\/FRUCT61870.2024.10516372"},{"issue":"2","key":"1061_CR40","first-page":"539","volume":"39","author":"XY Liu","year":"2008","unstructured":"Liu, X.Y., Wu, J., Zhou, Z.H.: Exploratory undersampling for class-imbalance learning. IEEE Trans. Syst. Man Cybern. Part B (Cybern.) 39(2), 539\u2013550 (2008)","journal-title":"IEEE Trans. Syst. Man Cybern. Part B (Cybern.)"},{"issue":"1","key":"1061_CR41","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GE Batista","year":"2004","unstructured":"Batista, G.E., Prati, R.C., Monard, M.C.: A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explor. Newsl. 6(1), 20\u201329 (2004)","journal-title":"ACM SIGKDD Explor. Newsl."},{"key":"1061_CR42","doi-asserted-by":"crossref","unstructured":"Pinto, F., Soares, C., & Mendes-Moreira, J.: An empirical methodology to analyze the behavior of bagging. In: Advanced Data Mining and Applications: 10th International onference, ADMA 2014, Guilin, China. Proceedings 10, pp. 199\u2013212. Springer International Publishing (2014)","DOI":"10.1007\/978-3-319-14717-8_16"},{"issue":"5\u20136","key":"1061_CR43","doi-asserted-by":"publisher","first-page":"412","DOI":"10.1002\/sam.10061","volume":"2","author":"S Hido","year":"2009","unstructured":"Hido, S., Kashima, H., Takahashi, Y.: Roughly balanced bagging for imbalanced data. Stat. Anal. Data Min. 2(5\u20136), 412\u2013426 (2009)","journal-title":"Stat. Anal. Data Min."},{"key":"1061_CR44","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1007\/s10844-017-0446-7","volume":"50","author":"M Lango","year":"2018","unstructured":"Lango, M., Stefanowski, J.: Multi-class and feature selection extensions of roughly balanced bagging for imbalanced data. J. Intell. Inf. Syst. 50, 97\u2013127 (2018)","journal-title":"J. Intell. Inf. Syst."},{"key":"1061_CR45","doi-asserted-by":"crossref","unstructured":"Li, C.: Classifying imbalanced data using a bagging ensemble variation (BEV). In: Proceedings of the 45th Annual Southeast Regional Conference, pp. 203\u2013208 (2007).","DOI":"10.1145\/1233341.1233378"},{"key":"1061_CR46","doi-asserted-by":"crossref","unstructured":"Zhu, X.: Lazy bagging for classifying imbalanced data. In: Seventh IEEE International Conference on Data Mining (ICDM 2007), pp. 763\u2013768. IEEE (2007)","DOI":"10.1109\/ICDM.2007.95"},{"key":"1061_CR47","doi-asserted-by":"publisher","first-page":"105434","DOI":"10.1016\/j.knosys.2019.105434","volume":"193","author":"JJ Rodriguez","year":"2020","unstructured":"Rodriguez, J.J., Diez-Pastor, J.F., Arnaiz-Gonzalez, A., Kuncheva, L.I.: Random balance ensembles for multiclass imbalance learning. Knowl. Based Syst. 193, 105434 (2020)","journal-title":"Knowl. Based Syst."},{"key":"1061_CR48","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1016\/j.neucom.2014.07.064","volume":"150","author":"J B\u0142aszczy\u0144ski","year":"2015","unstructured":"B\u0142aszczy\u0144ski, J., Stefanowski, J.: Neighbourhood sampling in bagging for imbalanced data. Neurocomputing 150, 529\u2013542 (2015)","journal-title":"Neurocomputing"},{"key":"1061_CR49","doi-asserted-by":"publisher","first-page":"330","DOI":"10.1016\/j.neucom.2017.08.035","volume":"275","author":"G Collell","year":"2018","unstructured":"Collell, G., Prelec, D., Patil, K.R.: A simple plug-in bagging ensemble based on threshold-moving for classifying binary and multiclass imbalanced data. Neurocomputing 275, 330\u2013340 (2018)","journal-title":"Neurocomputing"},{"key":"1061_CR50","doi-asserted-by":"publisher","first-page":"863","DOI":"10.1613\/jair.1.11192","volume":"61","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez, A., Garcia, S., Herrera, F., Chawla, N.V.: SMOTE for learning from imbalanced data: progress and challenges, marking the 15-year anniversary. J. Artif. Intell. Res. 61, 863\u2013905 (2018)","journal-title":"J. Artif. Intell. Res."},{"key":"1061_CR51","doi-asserted-by":"crossref","unstructured":"He, H., Bai, Y., Garcia, E.A., & Li, S.: ADASYN: Adaptive synthetic sampling approach for imbalanced learning. In: 2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence), pp. 1322\u20131328. IEEE (2008)","DOI":"10.1109\/IJCNN.2008.4633969"},{"key":"1061_CR52","doi-asserted-by":"crossref","unstructured":"Ahmed, S., Mahbub, A., Rayhan, F., Jani, R., Shatabda, S., & Farid, D.M.: Hybrid methods for class imbalance learning employing bagging with sampling techniques. In: 2017 2nd International Conference on Computational Systems and Information Technology for Sustainable Solution (CSITSS), pp. 1\u20135. IEEE (2017)","DOI":"10.1109\/CSITSS.2017.8447799"},{"key":"1061_CR53","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.neucom.2014.06.021","volume":"143","author":"Y Qian","year":"2014","unstructured":"Qian, Y., Liang, Y., Li, M., Feng, G., Shi, X.: A resampling ensemble algorithm for classification of imbalance problems. Neurocomputing 143, 57\u201367 (2014)","journal-title":"Neurocomputing"},{"key":"1061_CR54","doi-asserted-by":"crossref","unstructured":"Wang, S., & Yao, X.: Diversity analysis on imbalanced data sets by using ensemble models. In: 2009 IEEE Symposium on Computational Intelligence and Data Mining, pp. 324\u2013331. IEEE (2009)","DOI":"10.1109\/CIDM.2009.4938667"},{"issue":"118","key":"1061_CR55","first-page":"1","volume":"23","author":"H Hang","year":"2022","unstructured":"Hang, H., Cai, Y., Yang, H., Lin, Z.: Under-bagging nearest neighbors for imbalanced classification. J. Mach. Learn. Res. 23(118), 1\u201363 (2022)","journal-title":"J. Mach. Learn. Res."},{"key":"1061_CR56","doi-asserted-by":"crossref","unstructured":"Boukir, S., & Feng, W.: Boundary bagging to address training data issues in ensemble classification. In: 2020 25th International Conference on Pattern Recognition (ICPR), pp. 9975\u20139981. IEEE (2021)","DOI":"10.1109\/ICPR48806.2021.9413055"},{"key":"1061_CR57","doi-asserted-by":"crossref","unstructured":"Kapp, M. N., Sabourin, R., & Maupin, P.: An empirical study on diversity measures and margin theory for ensembles of classifiers. In: 2007 10th International Conference on Information Fusion, pp. 1\u20138. IEEE (2007)","DOI":"10.1109\/ICIF.2007.4408144"},{"key":"1061_CR58","doi-asserted-by":"publisher","DOI":"10.1155\/2017\/1827016","author":"Q Wang","year":"2017","unstructured":"Wang, Q., Luo, Z., Huang, J., Feng, Y., Liu, Z.: A novel ensemble method for imbalanced data learning: bagging of extrapolation-SMOTE SVM. Comput. Intell. Neurosci. (2017). https:\/\/doi.org\/10.1155\/2017\/1827016","journal-title":"Comput. Intell. Neurosci."},{"key":"1061_CR59","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1007\/s11704-016-5306-z","volume":"12","author":"B Sun","year":"2018","unstructured":"Sun, B., Chen, H., Wang, J., Xie, H.: Evolutionary under-sampling based bagging ensemble method for imbalanced data classification. Front. Comput. Sci. 12, 331\u2013350 (2018)","journal-title":"Front. Comput. Sci."},{"key":"1061_CR60","doi-asserted-by":"publisher","first-page":"280","DOI":"10.1016\/j.patrec.2020.03.016","volume":"133","author":"C Huang","year":"2020","unstructured":"Huang, C., Huang, X., Fang, Y., Xu, J., Qu, Y., Zhai, P., Li, J.: Sample imbalance disease classification model based on association rule feature selection. Pattern Recognit. Lett. 133, 280\u2013286 (2020)","journal-title":"Pattern Recognit. Lett."},{"key":"1061_CR61","doi-asserted-by":"publisher","first-page":"915","DOI":"10.1007\/s11590-015-0934-z","volume":"11","author":"T Razzaghi","year":"2017","unstructured":"Razzaghi, T., Xanthopoulos, P., \u015eeref, O.: Constraint relaxation, cost-sensitive learning and bagging for imbalanced classification problems with outliers. Optim. Lett. 11, 915\u2013928 (2017)","journal-title":"Optim. Lett."},{"key":"1061_CR62","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1023\/A:1018054314350","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman, L.: Bagging predictors. Mach. Learn. 24, 123\u2013140 (1996)","journal-title":"Mach. Learn."},{"issue":"1","key":"1061_CR63","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1007\/s00357-021-09397-2","volume":"39","author":"A Plaia","year":"2022","unstructured":"Plaia, A., Buscemi, S., F\u00fcrnkranz, J., Menc\u00eda, E.L.: Comparing boosting and bagging for decision trees of rankings. J. Classif. 39(1), 78\u201399 (2022)","journal-title":"J. Classif."},{"issue":"2","key":"1061_CR64","first-page":"121","volume":"3","author":"K Machov\u00e1","year":"2006","unstructured":"Machov\u00e1, K., Barcak, F., Bedn\u00e1r, P.: A bagging method using decision trees in the role of base classifiers. Acta Polytech. Hung. 3(2), 121\u2013132 (2006)","journal-title":"Acta Polytech. Hung."},{"issue":"3","key":"1061_CR65","doi-asserted-by":"publisher","first-page":"2259","DOI":"10.1007\/s10115-024-02281-6","volume":"67","author":"X Li","year":"2025","unstructured":"Li, X., Liu, Q.: A hybrid sampling algorithm for imbalanced and class-overlap data based on natural neighbors and density estimation. Knowl. Inf. Syst. 67(3), 2259\u20132290 (2025)","journal-title":"Knowl. Inf. Syst."},{"key":"1061_CR66","doi-asserted-by":"publisher","first-page":"1373","DOI":"10.1613\/jair.1.12125","volume":"70","author":"C Northcutt","year":"2021","unstructured":"Northcutt, C., Jiang, L., Chuang, I.: Confident learning: estimating uncertainty in dataset labels. J. Artif. Intell. Res. 70, 1373\u20131411 (2021)","journal-title":"J. Artif. Intell. Res."},{"key":"1061_CR67","unstructured":"Grandini, M., Bagli, E., & Visani, G.: Metrics for multi-class classification: an overview. arXiv preprint arXiv:2008.05756 (2020)"},{"key":"1061_CR68","doi-asserted-by":"crossref","unstructured":"Song, Y., Zhang, J., Yan, H., & Li, Q.: Multi-class imbalanced learning with one-versus-one decomposition: an empirical study. In: Cloud Computing and Security: 4th International Conference, ICCCS 2018, Haikou, China, Part III 4, pp. 617\u2013628. Springer International Publishing (2018)","DOI":"10.1007\/978-3-030-00012-7_56"},{"key":"1061_CR69","doi-asserted-by":"crossref","unstructured":"Sun Y, Kamel MS, Wang Y.: Boosting for learning multiple classes with imbalanced class distribution. In: Sixth International Conference on Data Mining (ICDM'06), pp. 592\u2013602 (2006)","DOI":"10.1109\/ICDM.2006.29"},{"key":"1061_CR70","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0118432","author":"T Saito","year":"2015","unstructured":"Saito, T., Rehmsmeier, M.: The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets. PLoS One (2015). https:\/\/doi.org\/10.1371\/journal.pone.0118432","journal-title":"PLoS One"},{"issue":"11","key":"1061_CR71","doi-asserted-by":"publisher","first-page":"7747","DOI":"10.1109\/TPAMI.2021.3101125","volume":"44","author":"Z Yang","year":"2021","unstructured":"Yang, Z., Xu, Q., Bao, S., Cao, X., Huang, Q.: Learning with multiclass AUC: theory and algorithms. IEEE Trans. Pattern Anal. Mach. Intell. 44(11), 7747\u20137763 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1061_CR72","doi-asserted-by":"crossref","unstructured":"Halimu, C., Kasem, A., Newaz, S.S.: Empirical comparison of area under ROC curve (AUC) and mathew correlation coefficient (MCC) for evaluating machine learning algorithms on imbalanced datasets for binary classification. In: Proceedings of the 3rd International Conference on Machine Learning and Soft Computing, pp. 1\u20136 (2019)","DOI":"10.1145\/3310986.3311023"},{"issue":"16","key":"1061_CR73","doi-asserted-by":"publisher","first-page":"10213","DOI":"10.3390\/ijerph191610213","volume":"19","author":"B Wi\u0119ckowska","year":"2022","unstructured":"Wi\u0119ckowska, B., Kubiak, K.B., J\u00f3\u017awiak, P., Moryson, W., Stawi\u0144ska-Witoszy\u0144ska, B.: Cohen\u2019s kappa coefficient as a measure to assess classification improvement following the addition of a new marker to a regression model. Int. J. Environ. Res. Public Health 19(16), 10213 (2022)","journal-title":"Int. J. Environ. Res. Public Health"},{"issue":"10","key":"1061_CR74","doi-asserted-by":"publisher","first-page":"2636","DOI":"10.1080\/03610918.2014.931971","volume":"44","author":"DG Pereira","year":"2015","unstructured":"Pereira, D.G., Afonso, A., Medeiros, F.M.: Overview of Friedman\u2019s test and post-hoc analysis. Commun. Stat. - Simul. Comput. 44(10), 2636\u20132653 (2015)","journal-title":"Commun. Stat. - Simul. Comput."},{"key":"1061_CR75","first-page":"1","volume":"7","author":"J Dem\u0161ar","year":"2006","unstructured":"Dem\u0161ar, J.: Statistical comparisons of classifiers over multiple data sets. J. Mach. Learn. Res. 7, 1\u201330 (2006)","journal-title":"J. Mach. Learn. Res."},{"key":"1061_CR76","doi-asserted-by":"crossref","unstructured":"Ling, C. X., Yang, Q., Wang, J., & Zhang, S.: Decision trees with minimal costs. In: Proceedings of the Twenty-First International Conference on Machine Learning, p. 69. (2004)","DOI":"10.1145\/1015330.1015369"},{"issue":"1-12","key":"1061_CR77","first-page":"24","volume":"110","author":"C Chen","year":"2004","unstructured":"Chen, C., Liaw, A., Breiman, L.: Using random forest to learn imbalanced data. Univ. Calif. Berkeley 110(1\u201312), 24 (2004)","journal-title":"Univ. Calif. Berkeley"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-026-01061-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-026-01061-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-026-01061-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T14:03:50Z","timestamp":1774274630000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-026-01061-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,23]]},"references-count":77,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,12]]}},"alternative-id":["1061"],"URL":"https:\/\/doi.org\/10.1007\/s41060-026-01061-5","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"value":"2364-415X","type":"print"},{"value":"2364-4168","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3,23]]},"assertion":[{"value":"21 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 February 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 March 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interest"}}],"article-number":"114"}}