{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,25]],"date-time":"2026-06-25T05:45:12Z","timestamp":1782366312223,"version":"3.54.5"},"reference-count":136,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T00:00:00Z","timestamp":1742688000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T00:00:00Z","timestamp":1742688000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["B\/UI62\/10541\/2022"],"award-info":[{"award-number":["B\/UI62\/10541\/2022"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"DOI":"10.1186\/s40537-025-01119-4","type":"journal-article","created":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T14:20:47Z","timestamp":1742739647000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":95,"title":["Resampling approaches to handle class imbalance: a review from a data perspective"],"prefix":"10.1186","volume":"12","author":[{"given":"Miguel","family":"Carvalho","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Armando J.","family":"Pinho","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Susana","family":"Br\u00e1s","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,3,23]]},"reference":[{"issue":"2","key":"1119_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2907070","volume":"49","author":"P Branco","year":"2016","unstructured":"Branco P, Torgo L, Ribeiro RP. A survey of predictive modeling on imbalanced domains. ACM Comput Surv. 2016;49(2):1\u201356. https:\/\/doi.org\/10.1145\/2907070.","journal-title":"ACM Comput Surv"},{"key":"1119_CR2","doi-asserted-by":"publisher","first-page":"170668","DOI":"10.1109\/ACCESS.2019.2955086","volume":"7","author":"K Cheng","year":"2019","unstructured":"Cheng K, Zhang C, Yu H, Yang X, Zou H, Gao S. Grouped SMOTE with noise filtering mechanism for classifying imbalanced data. IEEE Access. 2019;7:170668\u201381. https:\/\/doi.org\/10.1109\/ACCESS.2019.2955086.","journal-title":"IEEE Access"},{"key":"1119_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.ins.2018.06.056","volume":"465","author":"F Last","year":"2017","unstructured":"Last F, Douzas G, Bacao F. Oversampling for imbalanced learning based on K-means and SMOTE. Inf Sci. 2017;465:1\u201320. https:\/\/doi.org\/10.1016\/j.ins.2018.06.056.","journal-title":"Inf Sci"},{"key":"1119_CR4","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-98074-4_5","volume-title":"Data level preprocessing methods","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati RC, Krawczyk B, Herrera F. Data level preprocessing methods. Cham: Springer; 2018."},{"key":"1119_CR5","doi-asserted-by":"publisher","first-page":"6207","DOI":"10.1007\/s10462-022-10150-3","volume":"55","author":"MS Santos","year":"2022","unstructured":"Santos MS, et al. On the joint-effect of class imbalance and overlap: a critical review. Artif Intell Rev. 2022;55:6207.","journal-title":"Artif Intell Rev"},{"key":"1119_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2023.110415","volume":"143","author":"S Rezvani","year":"2023","unstructured":"Rezvani S, Wang X. A broad review on class imbalance learning techniques. Appl Soft Comput. 2023;143: 110415. https:\/\/doi.org\/10.1016\/j.asoc.2023.110415.","journal-title":"Appl Soft Comput"},{"key":"1119_CR7","doi-asserted-by":"publisher","DOI":"10.1002\/eng2.12298","author":"S Susan","year":"2021","unstructured":"Susan S. \u201cThe balancing trick: optimized sampling of imbalanced datasets\u2014a brief survey of the recent state of the art. Eng Rep. 2021. https:\/\/doi.org\/10.1002\/eng2.12298.","journal-title":"Eng Rep."},{"issue":"1","key":"1119_CR8","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1007\/s10115-022-01772-8","volume":"65","author":"V Werner","year":"2023","unstructured":"Werner V, et al. Imbalanced data preprocessing techniques for machine learning\u202f: a systematic mapping study. Knowl Inf Syst. 2023;65(1):31\u201357. https:\/\/doi.org\/10.1007\/s10115-022-01772-8.","journal-title":"Knowl Inf Syst"},{"key":"1119_CR9","doi-asserted-by":"publisher","unstructured":"Pradipta GA. SMOTE for handling imbalanced data problem\u202f: a review. In: 2021 Sixth Int. Conf. Informatics Comput. 1\u20138. https:\/\/doi.org\/10.1109\/ICIC54025.2021.9632912.","DOI":"10.1109\/ICIC54025.2021.9632912"},{"key":"1119_CR10","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/s10462-024-10759-6","volume":"57","author":"W Chen","year":"2024","unstructured":"Chen W, Yang K, Yu Z, Shi Y, Chen CLP. A survey on imbalanced learning\u202f: latest research, applications and future directions. Artif Intell Rev. 2024;57:123.","journal-title":"Artif Intell Rev"},{"key":"1119_CR11","doi-asserted-by":"publisher","unstructured":"Basha SJ, Madala SR, Vivek K, Kumar ES, Ammannamma T. A review on imbalanced data classification techniques. In: 2022 Int. Conf. Adv. Comput. Technol. Appl. ICACTA 2022, 2022, https:\/\/doi.org\/10.1109\/ICACTA54488.2022.9753392.","DOI":"10.1109\/ICACTA54488.2022.9753392"},{"key":"1119_CR12","doi-asserted-by":"publisher","unstructured":"Sauber-Cole R, Khoshgoftaar TM. The use of generative adversarial networks to alleviate class imbalance in tabular data: a survey. J Big Data. 2022;9(1). https:\/\/doi.org\/10.1186\/s40537-022-00648-6.","DOI":"10.1186\/s40537-022-00648-6"},{"key":"1119_CR13","first-page":"2020","volume-title":"Foundations of data imbalance and solutions for a data democracy","author":"A Kulkarni","year":"2020","unstructured":"Kulkarni A, Chong D, Batarseh FA. Foundations of data imbalance and solutions for a data democracy. Amsterdam: Elsevier Inc.; 2020. p. 2020."},{"key":"1119_CR14","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.ins.2020.12.006","volume":"553","author":"VH Barella","year":"2021","unstructured":"Barella VH, Garcia LPF, de Souto MCP, Lorena AC, de Carvalho ACPLF. Assessing the data complexity of imbalanced datasets. Inf Sci (Ny). 2021;553:83\u2013109. https:\/\/doi.org\/10.1016\/j.ins.2020.12.006.","journal-title":"Inf Sci (Ny)"},{"issue":"3","key":"1119_CR15","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1007\/s10844-015-0368-1","volume":"46","author":"K Napierala","year":"2016","unstructured":"Napierala K, Stefanowski J. Types of minority class examples and their influence on learning classifiers from imbalanced data. J Intell Inf Syst. 2016;46(3):563\u201397. https:\/\/doi.org\/10.1007\/s10844-015-0368-1.","journal-title":"J Intell Inf Syst"},{"key":"1119_CR16","doi-asserted-by":"publisher","first-page":"228","DOI":"10.1016\/j.inffus.2022.08.017","volume":"89","author":"MS Santos","year":"2023","unstructured":"Santos MS, Abreu PH, Japkowicz N, Fern\u00e1ndez A, Santos J. A unifying view of class overlap and imbalance: key concepts, multi-view panorama, and open avenues for research. Inf Fusion. 2023;89:228\u201353. https:\/\/doi.org\/10.1016\/j.inffus.2022.08.017.","journal-title":"Inf Fusion"},{"issue":"4","key":"1119_CR17","doi-asserted-by":"publisher","first-page":"394","DOI":"10.1002\/sam.11463","volume":"13","author":"D Singh","year":"2020","unstructured":"Singh D, Gosain A, Saha A. Weighted k-nearest neighbor based data complexity metrics for imbalanced datasets. Stat Anal Data Min. 2020;13(4):394\u2013404. https:\/\/doi.org\/10.1002\/sam.11463.","journal-title":"Stat Anal Data Min"},{"issue":"9","key":"1119_CR18","doi-asserted-by":"publisher","first-page":"3525","DOI":"10.1109\/TNNLS.2019.2944962","volume":"31","author":"Y Lu","year":"2020","unstructured":"Lu Y, Cheung YM, Tang YY. Bayes imbalance impact index: a measure of class imbalanced data set for classification problem. IEEE Trans Neural Netw Learn Syst. 2020;31(9):3525\u201339. https:\/\/doi.org\/10.1109\/TNNLS.2019.2944962.","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"issue":"7","key":"1119_CR19","doi-asserted-by":"publisher","first-page":"1961","DOI":"10.1007\/s10115-021-01577-1","volume":"63","author":"JD Pascual-Triana","year":"2021","unstructured":"Pascual-Triana JD, Charte D, Andr\u00e9sArroyo M, Fern\u00e1ndez A, Herrera F. Revisiting data complexity metrics based on morphology for overlap and imbalance: snapshot, new overlap number of balls metrics and singular problems prospect. Knowl Inf Syst. 2021;63(7):1961\u201389. https:\/\/doi.org\/10.1007\/s10115-021-01577-1.","journal-title":"Knowl Inf Syst"},{"issue":"2","key":"1119_CR20","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1109\/TEVC.2023.3257230","volume":"28","author":"W Pei","year":"2024","unstructured":"Pei W, Xue B, Member S, Zhang M, Shang L. A survey on unbalanced classification\u202f: how can evolutionary computation help\u202f? IEEE Trans Evol Comput. 2024;28(2):353\u201373. https:\/\/doi.org\/10.1109\/TEVC.2023.3257230.","journal-title":"IEEE Trans Evol Comput"},{"key":"1119_CR21","doi-asserted-by":"publisher","first-page":"63243","DOI":"10.1007\/s11042-023-17864-8","volume":"83","author":"A Kumar","year":"2024","unstructured":"Kumar A, Singh D, Shankar R. Class overlap handling methods in imbalanced domain\u202f: A comprehensive survey. MultiMed Tools Appl. 2024;83:63243\u201390. https:\/\/doi.org\/10.1007\/s11042-023-17864-8.","journal-title":"MultiMed Tools Appl"},{"key":"1119_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2019\/5901087","volume":"2019","author":"A Onan","year":"2019","unstructured":"Onan A. Consensus clustering-based undersampling approach to imbalanced learning. Sci Progr. 2019;2019:1\u201314. https:\/\/doi.org\/10.1155\/2019\/5901087.","journal-title":"Sci Progr"},{"key":"1119_CR23","doi-asserted-by":"publisher","first-page":"59069","DOI":"10.1109\/ACCESS.2020.2983003","volume":"8","author":"AS Tarawneh","year":"2020","unstructured":"Tarawneh AS, Hassanat ABA, Almohammadi K, Chetverikov D, Bellinger C. SMOTEFUNA: synthetic minority over-sampling technique based on furthest neighbour algorithm. IEEE Access. 2020;8:59069\u201382. https:\/\/doi.org\/10.1109\/ACCESS.2020.2983003.","journal-title":"IEEE Access"},{"issue":"June","key":"1119_CR24","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP. SMOTE: synthetic minority over-sampling technique. J Artif Intell Res. 2002;16(June):321\u201357. https:\/\/doi.org\/10.1613\/jair.953.","journal-title":"J Artif Intell Res"},{"key":"1119_CR25","doi-asserted-by":"publisher","first-page":"863","DOI":"10.1613\/jair.1.11192","volume":"61","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Herrera F, Chawla NV. SMOTE for learning from imbalanced data: progress and challenges, marking the 15-year anniversary. J Artif Intell Res. 2018;61:863\u2013905. https:\/\/doi.org\/10.1613\/jair.1.11192.","journal-title":"J Artif Intell Res"},{"key":"1119_CR26","doi-asserted-by":"publisher","first-page":"124863","DOI":"10.1016\/j.eswa.2024.124863","volume":"256","author":"J Wainer","year":"2024","unstructured":"Wainer J. An empirical evaluation of imbalanced data strategies from a practitioner \u2019 s point of view. Expert Syst Appl. 2024;256:124863. https:\/\/doi.org\/10.1016\/j.eswa.2024.124863.","journal-title":"Expert Syst Appl"},{"key":"1119_CR27","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, et al. Scikit-learn: machine learning in Python. J Mach Learn Res. 2011;12:2825\u201330.","journal-title":"J Mach Learn Res"},{"key":"1119_CR28","doi-asserted-by":"publisher","first-page":"878","DOI":"10.1007\/11538059_91","volume":"3644","author":"H Han","year":"2005","unstructured":"Han H, Wang WY, Mao BH. Borderline-SMOTE: a new over-sampling method in imbalanced data sets learning. Lect Notes Comput Sci. 2005;3644:878\u201387. https:\/\/doi.org\/10.1007\/11538059_91.","journal-title":"Lect Notes Comput Sci"},{"issue":"1","key":"1119_CR29","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1504\/ijkesdp.2011.039875","volume":"3","author":"HM Nguyen","year":"2011","unstructured":"Nguyen HM, Cooper EW, Kamei K. Borderline over-sampling for imbalanced data classification. Int J Knowl Eng Soft Data Paradig. 2011;3(1):4. https:\/\/doi.org\/10.1504\/ijkesdp.2011.039875.","journal-title":"Int J Knowl Eng Soft Data Paradig"},{"key":"1119_CR30","doi-asserted-by":"publisher","unstructured":"He H, Bai Y, Garcia EA, Li S. ADASYN: adaptive synthetic sampling approach for imbalanced learning. Proc Int Jt Conf Neural Netw. 2008; 1322\u20131328. https:\/\/doi.org\/10.1109\/IJCNN.2008.4633969.","DOI":"10.1109\/IJCNN.2008.4633969"},{"key":"1119_CR31","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1007\/978-3-642-01307-2_43","volume":"5476","author":"C Bunkhumpornpat","year":"2009","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C. Safe-level-SMOTE: safe-level-synthetic minority over-sampling technique for handling the class imbalanced problem. Lect Notes Comput Sci. 2009;5476:475\u201382. https:\/\/doi.org\/10.1007\/978-3-642-01307-2_43.","journal-title":"Lect Notes Comput Sci"},{"issue":"2","key":"1119_CR32","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1109\/TKDE.2012.232","volume":"26","author":"S Barua","year":"2014","unstructured":"Barua S, Islam MM, Yao X, Murase K. MWMOTE\u2014majority weighted minority oversampling technique for imbalanced data set learning. IEEE Trans Knowl Data Eng. 2014;26(2):405\u201325. https:\/\/doi.org\/10.1109\/TKDE.2012.232.","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"3","key":"1119_CR33","doi-asserted-by":"publisher","first-page":"664","DOI":"10.1007\/s10489-011-0287-y","volume":"36","author":"C Bunkhumpornpat","year":"2012","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C. DBSMOTE: density-based synthetic minority over-sampling technique. Appl Intell. 2012;36(3):664\u201384. https:\/\/doi.org\/10.1007\/s10489-011-0287-y.","journal-title":"Appl Intell"},{"key":"1119_CR34","doi-asserted-by":"publisher","DOI":"10.1016\/j.ibmed.2020.100023","volume":"3","author":"VPK Turlapati","year":"2020","unstructured":"Turlapati VPK, Prusty MR. Outlier-SMOTE: a refined oversampling technique for improved detection of COVID-19. Intell Med. 2020;3: 100023. https:\/\/doi.org\/10.1016\/j.ibmed.2020.100023.","journal-title":"Intell Med"},{"issue":"1","key":"1119_CR35","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s13755-020-00112-w","volume":"8","author":"M Naseriparsa","year":"2020","unstructured":"Naseriparsa M, Al-Shammari A, Sheng M, Zhang Y, Zhou R. RSMOTE: improving classification performance over imbalanced medical datasets. Heal Inf Sci Syst. 2020;8(1):1\u201313. https:\/\/doi.org\/10.1007\/s13755-020-00112-w.","journal-title":"Heal Inf Sci Syst"},{"key":"1119_CR36","doi-asserted-by":"publisher","unstructured":"MacIejewski T, Stefanowski J. Local neighbourhood extension of SMOTE for mining imbalanced data. In: IEEE SSCI 2011 Symp. Ser. Comput. Intell. - CIDM 2011 2011 IEEE Symp. Comput. Intell. Data Min., pp. 104\u2013111, 2011. https:\/\/doi.org\/10.1109\/CIDM.2011.5949434.","DOI":"10.1109\/CIDM.2011.5949434"},{"key":"1119_CR37","doi-asserted-by":"publisher","first-page":"184","DOI":"10.1016\/j.ins.2014.08.051","volume":"291","author":"JA S\u00e1ez","year":"2015","unstructured":"S\u00e1ez JA, Luengo J, Stefanowski J, Herrera F. SMOTE-IPF: addressing the noisy and borderline examples problem in imbalanced classification by a re-sampling method with filtering. Inf Sci (Ny). 2015;291:184\u2013203. https:\/\/doi.org\/10.1016\/j.ins.2014.08.051.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR38","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1016\/j.neucom.2020.02.081","volume":"399","author":"X Ye","year":"2020","unstructured":"Ye X, Li H, Imakura A, Sakurai T. An oversampling framework for imbalanced classification based on Laplacian eigenmaps. Neurocomputing. 2020;399:107\u201316. https:\/\/doi.org\/10.1016\/j.neucom.2020.02.081.","journal-title":"Neurocomputing"},{"key":"1119_CR39","doi-asserted-by":"publisher","unstructured":"Cieslak DA, Chawla NV, Striegel A. Combating imbalance in network intrusion datasets. In: 2006 IEEE Int. Conf. Granul. Comput., pp. 732\u2013737, 2006, https:\/\/doi.org\/10.1109\/grc.2006.1635905.","DOI":"10.1109\/grc.2006.1635905"},{"issue":"3","key":"1119_CR40","doi-asserted-by":"publisher","first-page":"841","DOI":"10.1007\/s10115-019-01380-z","volume":"62","author":"C Bellinger","year":"2020","unstructured":"Bellinger C, Sharma S, Japkowicz N, Za\u00efane OR. Framework for extreme imbalance classification: SWIM\u2014sampling with the majority class. Knowl Inf Syst. 2020;62(3):841\u201366. https:\/\/doi.org\/10.1007\/s10115-019-01380-z.","journal-title":"Knowl Inf Syst"},{"issue":"2","key":"1119_CR41","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3390\/sym13020194","volume":"13","author":"Z Jiang","year":"2021","unstructured":"Jiang Z, Pan T, Zhang C, Yang J. A new oversampling method based on the classification contribution degree. Symmetry (Basel). 2021;13(2):1\u201313. https:\/\/doi.org\/10.3390\/sym13020194.","journal-title":"Symmetry (Basel)"},{"key":"1119_CR42","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1016\/j.ins.2017.04.046","volume":"408","author":"WA Rivera","year":"2017","unstructured":"Rivera WA. Noise reduction a priori synthetic over-sampling for class imbalanced data sets. Inf Sci (Ny). 2017;408:146\u201361. https:\/\/doi.org\/10.1016\/j.ins.2017.04.046.","journal-title":"Inf Sci (Ny)"},{"issue":"2","key":"1119_CR43","doi-asserted-by":"publisher","first-page":"667","DOI":"10.1109\/TKDE.2020.2985965","volume":"34","author":"Y Xie","year":"2022","unstructured":"Xie Y, Qiu M, Zhang H, Peng L, Chen Z. Gaussian distribution based oversampling for imbalanced data classification. IEEE Trans Knowl Data Eng. 2022;34(2):667\u201379. https:\/\/doi.org\/10.1109\/TKDE.2020.2985965.","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1119_CR44","doi-asserted-by":"publisher","first-page":"74763","DOI":"10.1109\/ACCESS.2021.3080316","volume":"9","author":"GA Pradipta","year":"2021","unstructured":"Pradipta GA, Wardoyo R, Musdholifah A, Sanjaya INH. Radius-SMOTE: a new oversampling technique of minority samples based on radius distance for learning from imbalanced data. IEEE Access. 2021;9:74763\u201377. https:\/\/doi.org\/10.1109\/ACCESS.2021.3080316.","journal-title":"IEEE Access"},{"issue":"1","key":"1119_CR45","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GEAPA Batista","year":"2004","unstructured":"Batista GEAPA, Prati RC, Monard MC. A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explor Newsl. 2004;6(1):20\u20139. https:\/\/doi.org\/10.1145\/1007730.1007735.","journal-title":"ACM SIGKDD Explor Newsl"},{"key":"1119_CR46","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2021.108511","volume":"124","author":"S Maldonado","year":"2022","unstructured":"Maldonado S, Vairetti C, Fernandez A, Herrera F. FW-SMOTE: a feature-weighted oversampling approach for imbalanced classification. Pattern Recognit. 2022;124: 108511. https:\/\/doi.org\/10.1016\/j.patcog.2021.108511.","journal-title":"Pattern Recognit"},{"issue":"4","key":"1119_CR47","doi-asserted-by":"publisher","first-page":"995","DOI":"10.1016\/j.eswa.2012.08.014","volume":"40","author":"P Luukka","year":"2013","unstructured":"Luukka P, Kurama O. Similarity classifier with ordered weighted averaging operators. Expert Syst Appl. 2013;40(4):995\u20131002. https:\/\/doi.org\/10.1016\/j.eswa.2012.08.014.","journal-title":"Expert Syst Appl"},{"issue":"5","key":"1119_CR48","doi-asserted-by":"publisher","first-page":"565","DOI":"10.14456\/sjst-psu.2017.70","volume":"39","author":"W Siriseriwan","year":"2017","unstructured":"Siriseriwan W, Sinapiromsaran K. Adaptive neighbor synthetic minority oversampling technique under 1NN outcast handling. Songklanakarin J Sci Technol. 2017;39(5):565\u201376. https:\/\/doi.org\/10.14456\/sjst-psu.2017.70.","journal-title":"Songklanakarin J Sci Technol"},{"issue":"1","key":"1119_CR49","first-page":"234","volume":"43","author":"W Siriseriwan","year":"2016","unstructured":"Siriseriwan W, Sinapiromsaran K. The effective redistribution for imbalance dataset: relocating safe-eevel SMOTE with minority outcast handling. Chiang Mai J Sci. 2016;43(1):234\u201346.","journal-title":"Chiang Mai J Sci"},{"key":"1119_CR50","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1016\/j.neucom.2018.04.089","volume":"343","author":"M Koziarski","year":"2019","unstructured":"Koziarski M, Krawczyk B, Wo\u017aniak M. Radial-Based oversampling for noisy imbalanced data classification. Neurocomputing. 2019;343:19\u201333. https:\/\/doi.org\/10.1016\/j.neucom.2018.04.089.","journal-title":"Neurocomputing"},{"issue":"4","key":"1119_CR51","doi-asserted-by":"publisher","first-page":"347","DOI":"10.1007\/s13748-012-0027-5","volume":"1","author":"V Garc\u00eda","year":"2012","unstructured":"Garc\u00eda V, S\u00e1nchez JS, Mart\u00edn-F\u00e9lez R, Mollineda RA. Surrounding neighborhood-based SMOTE for learning from imbalanced data sets. Prog Artif Intell. 2012;1(4):347\u201362. https:\/\/doi.org\/10.1007\/s13748-012-0027-5.","journal-title":"Prog Artif Intell"},{"issue":"2","key":"1119_CR52","doi-asserted-by":"publisher","first-page":"423","DOI":"10.24507\/ijicic.15.02.423","volume":"15","author":"T Fahrudin","year":"2019","unstructured":"Fahrudin T, Buliali JL, Fatichah C. Enhancing the performance of smote algorithm by using attribute weighting scheme and new selective sampling method for imbalanced data set. Int J Innov Comput Inf Control. 2019;15(2):423\u201344. https:\/\/doi.org\/10.24507\/ijicic.15.02.423.","journal-title":"Int J Innov Comput Inf Control"},{"key":"1119_CR53","doi-asserted-by":"publisher","first-page":"277","DOI":"10.1007\/11574798_11","volume-title":"Analogy-based reasoning in classifier construction","author":"A Wojna","year":"2005","unstructured":"Wojna A. Analogy-based reasoning in classifier construction. Berlin: Springer; 2005. p. 277\u2013374. https:\/\/doi.org\/10.1007\/11574798_11."},{"key":"1119_CR54","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1016\/j.ins.2019.06.007","volume":"501","author":"G Douzas","year":"2019","unstructured":"Douzas G, Bacao F. Geometric SMOTE a geometrically enhanced drop-in replacement for SMOTE. Inf Sci (Ny). 2019;501:118\u201335. https:\/\/doi.org\/10.1016\/j.ins.2019.06.007.","journal-title":"Inf Sci (Ny)"},{"issue":"6","key":"1119_CR55","doi-asserted-by":"publisher","first-page":"3413","DOI":"10.1016\/j.jksuci.2021.01.014","volume":"34","author":"NU Asniar","year":"2022","unstructured":"Asniar NU, Maulidevi, and K. Surendro,. SMOTE-LOF for noise identification in imbalanced data classification. J King Saud Univ Comput Inf Sci. 2022;34(6):3413\u201323. https:\/\/doi.org\/10.1016\/j.jksuci.2021.01.014.","journal-title":"J King Saud Univ Comput Inf Sci"},{"issue":"2","key":"1119_CR56","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1145\/335191.335388","volume":"29","author":"MM Breuniq","year":"2000","unstructured":"Breuniq MM, Kriegel HP, Ng RT, Sander J. LOF: Identifying density-based local outliers. SIGMOD Rec (ACM Spec Interes Gr Manag Data). 2000;29(2):93\u2013104. https:\/\/doi.org\/10.1145\/335191.335388.","journal-title":"SIGMOD Rec (ACM Spec. Interes. Gr. Manag. Data)."},{"issue":"3","key":"1119_CR57","doi-asserted-by":"publisher","first-page":"1394","DOI":"10.1007\/s10489-020-01852-8","volume":"51","author":"H Guan","year":"2021","unstructured":"Guan H, Zhang Y, Xian M, Cheng HD, Tang X. SMOTE-WENN: solving class imbalance and small sample problems by oversampling and distance scaling. Appl Intell. 2021;51(3):1394\u2013409. https:\/\/doi.org\/10.1007\/s10489-020-01852-8.","journal-title":"Appl Intell"},{"key":"1119_CR58","unstructured":"Batista GE, Bazzan ALC, Monard M-C, Batista GEAPA, Monard MC. Balancing training data for automated annotation of keywords: a case study. Missing data imputation View project Automatic Genetic Generation of Fuzzy Classification Systems. View project Balancing Training Data for Automated Annotation of Keywords: a Cas. 2003. Available: https:\/\/www.researchgate.net\/publication\/221322870."},{"key":"1119_CR59","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.ins.2019.08.062","volume":"509","author":"P Vuttipittayamongkol","year":"2020","unstructured":"Vuttipittayamongkol P, Elyan E. Neighbourhood-based undersampling approach for handling imbalanced and overlapped data. Inf Sci (Ny). 2020;509:47\u201370. https:\/\/doi.org\/10.1016\/j.ins.2019.08.062.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR60","doi-asserted-by":"publisher","first-page":"438","DOI":"10.1016\/j.ins.2021.03.041","volume":"565","author":"J Li","year":"2021","unstructured":"Li J, Zhu Q, Wu Q, Fan Z. A novel oversampling technique for class-imbalanced learning based on SMOTE and natural neighbors. Inf Sci (Ny). 2021;565:438\u201355. https:\/\/doi.org\/10.1016\/j.ins.2021.03.041.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR61","doi-asserted-by":"publisher","DOI":"10.1155\/2019\/3526539","author":"W Xie","year":"2019","unstructured":"Xie W, Liang G, Dong Z, Tan B, Zhang B. An improved oversampling algorithm based on the samples\u2019 selection strategy for classifying imbalanced data\u201d. Math Probl Eng. 2019. https:\/\/doi.org\/10.1155\/2019\/3526539.","journal-title":"Math Probl Eng"},{"issue":"2","key":"1119_CR62","doi-asserted-by":"publisher","DOI":"10.1088\/1742-6596\/1237\/2\/022052","volume":"1237","author":"L Zhang","year":"2019","unstructured":"Zhang L, Tan B, Liu T, Sun X. Classification study for the imbalanced data based on biased-SVM and the modified over-sampling algorithm. J Phys Conf Ser. 2019;1237(2): 022052. https:\/\/doi.org\/10.1088\/1742-6596\/1237\/2\/022052.","journal-title":"J Phys Conf Ser"},{"issue":"2","key":"1119_CR63","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1142\/S0218194019500074","volume":"29","author":"S Guo","year":"2019","unstructured":"Guo S, Chen R, Li H, Zhang T, Liu Y. Identify severity bug report with distribution imbalance by CR-SMOTE and ELM. Int J Softw Eng Knowl Eng. 2019;29(2):139\u201375. https:\/\/doi.org\/10.1142\/S0218194019500074.","journal-title":"Int J Softw Eng Knowl Eng"},{"key":"1119_CR64","doi-asserted-by":"publisher","first-page":"420","DOI":"10.1016\/j.procs.2020.08.043","volume":"176","author":"T Sasada","year":"2020","unstructured":"Sasada T, Liu Z, Baba T, Hatano K, Kimura Y. A resampling method for imbalanced datasets considering noise and overlap. Procedia Comput Sci. 2020;176:420\u20139. https:\/\/doi.org\/10.1016\/j.procs.2020.08.043.","journal-title":"Procedia Comput Sci"},{"issue":"3","key":"1119_CR65","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TIT.1968.1054155","volume":"14","author":"PE Hart","year":"1968","unstructured":"Hart PE. The condensed nearest neighbor rule. IEEE Trans Inf Theory. 1968;14(3):515\u20136. https:\/\/doi.org\/10.1109\/TIT.1968.1054155.","journal-title":"IEEE Trans Inf Theory"},{"issue":"2","key":"1119_CR66","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1007\/s10994-020-05913-4","volume":"110","author":"S Bej","year":"2021","unstructured":"Bej S, Davtyan N, Wolfien M, Nassar M, Wolkenhauer O. LoRAS: an oversampling approach for imbalanced datasets. Mach Learn. 2021;110(2):279\u2013301. https:\/\/doi.org\/10.1007\/s10994-020-05913-4.","journal-title":"Mach Learn"},{"issue":"4","key":"1119_CR67","doi-asserted-by":"publisher","first-page":"391","DOI":"10.17791\/jcs.2017.18.4.391","volume":"18","author":"Y Suh","year":"2017","unstructured":"Suh Y, Yu J, Mo J, Song L, Kim C. A comparison of oversampling methods on imbalanced topic classification of Korean news articles. J Cogn Sci (Seoul). 2017;18(4):391\u2013437. https:\/\/doi.org\/10.17791\/jcs.2017.18.4.391.","journal-title":"J Cogn Sci (Seoul)"},{"key":"1119_CR68","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2019.105662","volume":"83","author":"G Kov\u00e1cs","year":"2019","unstructured":"Kov\u00e1cs G. An empirical comparison and evaluation of minority oversampling techniques on a large number of imbalanced datasets. Appl Soft Comput J. 2019;83: 105662. https:\/\/doi.org\/10.1016\/j.asoc.2019.105662.","journal-title":"Appl Soft Comput J."},{"key":"1119_CR69","doi-asserted-by":"publisher","unstructured":"Gazzah S, Ben Amara NE. New oversampling approaches based on polynomial fitting for imbalanced data sets. In: DAS 2008 - Proc. 8th IAPR Int. Work. Doc. Anal. Syst., pp. 677\u2013684, 2008, https:\/\/doi.org\/10.1109\/DAS.2008.74.","DOI":"10.1109\/DAS.2008.74"},{"key":"1119_CR70","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1007\/978-3-642-37456-2_27","volume":"7819","author":"S Barua","year":"2013","unstructured":"Barua S, Islam MM, Murase K. ProWSyn: proximity weighted synthetic oversampling technique for imbalanced data set learning. Lect Notes Comput Sci. 2013;7819:317\u201328. https:\/\/doi.org\/10.1007\/978-3-642-37456-2_27.","journal-title":"Lect Notes Comput Sci"},{"issue":"8","key":"1119_CR71","doi-asserted-by":"publisher","first-page":"2050043","DOI":"10.1142\/S0129065720500434","volume":"30","author":"P Vuttipittayamongkol","year":"2020","unstructured":"Vuttipittayamongkol P, Elyan E. Improved overlap-based undersampling for imbalanced dataset classification with application to epilepsy and Parkinson\u2019s disease. Int J Neural Syst. 2020;30(8):2050043. https:\/\/doi.org\/10.1142\/S0129065720500434.","journal-title":"Int J Neural Syst"},{"key":"1119_CR72","doi-asserted-by":"publisher","unstructured":"Yan S, Te Kao H, Ferrara E. Fair class balancing: enhancing model fairness without observing sensitive attributes. Int Conf Inf Knowl Manag Proc. pp. 1715\u20131724, 2020, https:\/\/doi.org\/10.1145\/3340531.3411980.","DOI":"10.1145\/3340531.3411980"},{"key":"1119_CR73","doi-asserted-by":"publisher","DOI":"10.1007\/s44248-024-00007-1","author":"D Dablain","year":"2024","unstructured":"Dablain D, Krawczyk B, Chawla N. Towards a holistic view of bias in machine learning: bridging algorithmic fairness and imbalanced learning. Discov Data. 2024. https:\/\/doi.org\/10.1007\/s44248-024-00007-1.","journal-title":"Discov Data"},{"issue":"7","key":"1119_CR74","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3616865","volume":"56","author":"S Caton","year":"2024","unstructured":"Caton S, Haas C. Fairness in machine learning: a survey. ACM Comput Surv. 2024;56(7):1\u201338. https:\/\/doi.org\/10.1145\/3616865.","journal-title":"ACM Comput Surv"},{"key":"1119_CR75","unstructured":"Kubat M. Addressing the curse of imbalanced training sets: one-sided selection. In: Fourteenth Int. Conf. Mach. Learn. 2000."},{"key":"1119_CR76","first-page":"769","volume":"6","author":"I Tomek","year":"1976","unstructured":"Tomek I. Tomek link: two modifications of CNN. IEEE Trans Syst Man Cybern. 1976;6:769\u201372.","journal-title":"IEEE Trans Syst Man Cybern"},{"key":"1119_CR77","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1007\/3-540-48229-6_9","volume":"2101","author":"J Laurikkala","year":"2001","unstructured":"Laurikkala J. Improving identification of difficult small classes by balancing class distribution. Lect Notes Comput Sci. 2001;2101:63\u20136. https:\/\/doi.org\/10.1007\/3-540-48229-6_9.","journal-title":"Lect Notes Comput Sci"},{"key":"1119_CR78","unstructured":"Zhang J, Mani I. kNN approach to unbalanced data distributions: a case study involving information extraction."},{"issue":"2","key":"1119_CR79","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1007\/s10994-013-5422-z","volume":"95","author":"MR Smith","year":"2014","unstructured":"Smith MR, Martinez T, Giraud-Carrier C. An instance level analysis of data complexity. Mach Learn. 2014;95(2):225\u201356. https:\/\/doi.org\/10.1007\/s10994-013-5422-z.","journal-title":"Mach Learn"},{"key":"1119_CR80","unstructured":"Peterson A, Martinez T. Estimating the potential for combining learning models. 2005."},{"key":"1119_CR81","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/j.ins.2017.05.008","volume":"409\u2013410","author":"WC Lin","year":"2017","unstructured":"Lin WC, Tsai CF, Hu YH, Jhang JS. Clustering-based undersampling in class-imbalanced data. Inf Sci (Ny). 2017;409\u2013410:17\u201326. https:\/\/doi.org\/10.1016\/j.ins.2017.05.008.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR82","unstructured":"A. Accepted. Overlap-based undersampling for improving imbalanced data classification . Year: overlap-based undersampling for improving imbalanced data classification. 2019; 0\u20138."},{"key":"1119_CR83","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107262","volume":"102","author":"M Koziarski","year":"2020","unstructured":"Koziarski M. Radial-based undersampling for imbalanced data classification. Pattern Recognit. 2020;102: 107262. https:\/\/doi.org\/10.1016\/j.patcog.2020.107262.","journal-title":"Pattern Recognit"},{"issue":"4","key":"1119_CR84","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1109\/TSMCC.2011.2161285","volume":"42","author":"M Galar","year":"2012","unstructured":"Galar M, Fernandez A, Barrenechea E, Bustince H, Herrera F. \u201cA review on ensembles for the class imbalance problem: bagging-, boosting-, and hybrid-based approaches. IEEE Trans Syst Man Cybern Part C Appl Rev. 2012;42(4):463\u201384. https:\/\/doi.org\/10.1109\/TSMCC.2011.2161285.","journal-title":"IEEE Trans Syst Man Cybern Part C Appl Rev"},{"key":"1119_CR85","doi-asserted-by":"publisher","first-page":"2019","DOI":"10.1109\/IJCNN.2019.8852415","volume":"1\u20138","author":"F Zhang","year":"2019","unstructured":"Zhang F, Liu G, Li Z, Yan C, Jiang C. GMM-based undersampling and its application for credit card fraud detection. Proc Int J Conf Neural Netw. 2019;1\u20138:2019. https:\/\/doi.org\/10.1109\/IJCNN.2019.8852415.","journal-title":"Proc Int J Conf Neural Netw"},{"key":"1119_CR86","doi-asserted-by":"publisher","first-page":"2019","DOI":"10.1109\/ICMLC48188.2019.8949290","volume":"1\u20138","author":"J Zhang","year":"2019","unstructured":"Zhang J, Wang T, Ng WWY, Zhang S, Nugent CD. Undersampling near decision boundary for imbalance problems. Proc Int Conf Mach Learn Cybern. 2019;1\u20138:2019. https:\/\/doi.org\/10.1109\/ICMLC48188.2019.8949290.","journal-title":"Proc Int Conf Mach Learn Cybern"},{"issue":"1","key":"1119_CR87","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","volume":"13","author":"TM Cover","year":"1967","unstructured":"Cover TM, Hart PE. Nearest neighbor pattern classification. IEEE Trans Inf Theory. 1967;13(1):21\u20137. https:\/\/doi.org\/10.1109\/TIT.1967.1053964.","journal-title":"IEEE Trans Inf Theory"},{"key":"1119_CR88","doi-asserted-by":"publisher","unstructured":"Wang S, Yao X. Diversity analysis on imbalanced data sets by using ensemble models. In: 2009 IEEE Symp. Comput. Intell. Data Mining, CIDM 2009 - Proc, pp. 324\u2013331, 2009, https:\/\/doi.org\/10.1109\/CIDM.2009.4938667.","DOI":"10.1109\/CIDM.2009.4938667"},{"issue":"1","key":"1119_CR89","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1109\/TSMCA.2009.2029559","volume":"40","author":"C Seiffert","year":"2010","unstructured":"Seiffert C, Khoshgoftaar TM, Van Hulse J, Napolitano A. RUSBoost: a hybrid approach to alleviating class imbalance. IEEE Trans Syst Man Cybern Part A Syst Human. 2010;40(1):185\u201397. https:\/\/doi.org\/10.1109\/TSMCA.2009.2029559.","journal-title":"IEEE Trans Syst Man Cybern Part A Syst Human."},{"issue":"2","key":"1119_CR90","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1080\/09540091.2018.1560394","volume":"31","author":"D Devi","year":"2019","unstructured":"Devi D, Biswas SK, Purkayastha B. Learning in presence of class imbalance and class overlapping by using one-class SVM and undersampling technique. Conn Sci. 2019;31(2):105\u201342. https:\/\/doi.org\/10.1080\/09540091.2018.1560394.","journal-title":"Conn Sci"},{"key":"1119_CR91","doi-asserted-by":"publisher","first-page":"375","DOI":"10.12785\/amis\/071L50","volume":"7","author":"Z Yang","year":"2013","unstructured":"Yang Z, Gao D. Classification for imbalanced and overlapping classes using outlier detection and sampling techniques. Appl Math Inf Sci. 2013;7:375\u201381. https:\/\/doi.org\/10.12785\/amis\/071L50.","journal-title":"Appl Math Inf Sci."},{"key":"1119_CR92","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1109\/TKDE.2006.17","volume":"18","author":"Z-H Zhou","year":"2006","unstructured":"Zhou Z-H, Liu X-Y. Training cost-sensitive neural networks with methods addressing the class imbalance problem. Knowl Data Eng IEEE Trans. 2006;18:63\u201377. https:\/\/doi.org\/10.1109\/TKDE.2006.17.","journal-title":"Knowl Data Eng IEEE Trans"},{"key":"1119_CR93","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1007\/978-3-540-24674-9_24","volume":"3025","author":"SB Kotsiantis","year":"2004","unstructured":"Kotsiantis SB, Pintelas PE. A cost sensitive technique for ordinal classification problems. Lect Notes Artif Intell (Subser Lect Notes Comput Sci. 2004;3025:220\u20139. https:\/\/doi.org\/10.1007\/978-3-540-24674-9_24.","journal-title":"Lect Notes Artif Intell (Subser Lect Notes Comput Sci."},{"key":"1119_CR94","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.106689","volume":"213","author":"X Xie","year":"2021","unstructured":"Xie X, Liu H, Zeng S, Lin L, Li W. A novel progressively undersampling method based on the density peaks sequence for imbalanced data. Knowl Based Syst. 2021;213: 106689. https:\/\/doi.org\/10.1016\/j.knosys.2020.106689.","journal-title":"Knowl Based Syst"},{"key":"1119_CR95","doi-asserted-by":"publisher","unstructured":"Peng M et al. Trainable undersampling for class-imbalance learning. In: 33rd AAAI Conf. Artif. Intell. AAAI 2019, 31st Innov. Appl. Artif. Intell. Conf. IAAI 2019 9th AAAI Symp. Educ. Adv. Artif. Intell. EAAI 2019, pp. 4707\u20134714, 2019, https:\/\/doi.org\/10.1609\/aaai.v33i01.33014707.","DOI":"10.1609\/aaai.v33i01.33014707"},{"key":"1119_CR96","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2020.103465","volume":"107","author":"Z Xu","year":"2020","unstructured":"Xu Z, Shen D, Nie T, Kou Y. A hybrid sampling algorithm combining M-SMOTE and ENN based on random forest for medical imbalanced data. J Biomed Inform. 2020;107: 103465. https:\/\/doi.org\/10.1016\/j.jbi.2020.103465.","journal-title":"J Biomed Inform"},{"issue":"4","key":"1119_CR97","doi-asserted-by":"publisher","first-page":"727","DOI":"10.1515\/amcs-2017-0050","volume":"27","author":"M Koziarski","year":"2017","unstructured":"Koziarski M, Wozniak M. CCR: a combined cleaning and resampling algorithm for imbalanced data classification. Int J Appl Math Comput Sci. 2017;27(4):727\u201336. https:\/\/doi.org\/10.1515\/amcs-2017-0050.","journal-title":"Int J Appl Math Comput Sci"},{"issue":"4","key":"1119_CR98","doi-asserted-by":"publisher","first-page":"229","DOI":"10.5391\/IJFIS.2017.17.4.229","volume":"17","author":"H Lee","year":"2017","unstructured":"Lee H, Kim J, Kim S. Gaussian-based SMOTE algorithm for solving skewed class distributions. Int J Fuzzy Log Intell Syst. 2017;17(4):229\u201334. https:\/\/doi.org\/10.5391\/IJFIS.2017.17.4.229.","journal-title":"Int J Fuzzy Log Intell Syst"},{"issue":"September","key":"1119_CR99","doi-asserted-by":"publisher","first-page":"2021","DOI":"10.1016\/j.eswa.2020.114035","volume":"164","author":"B Mirzaei","year":"2020","unstructured":"Mirzaei B, Nikpour B, Nezamabadi-pour H. CDBH: a clustering and density-based hybrid approach for imbalanced data classification. Expert Syst Appl. 2020;164(September):2021. https:\/\/doi.org\/10.1016\/j.eswa.2020.114035.","journal-title":"Expert Syst Appl"},{"issue":"1","key":"1119_CR100","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1016\/j.eswa.2012.07.021","volume":"40","author":"ME Celebi","year":"2013","unstructured":"Celebi ME, Kingravi HA, Vela PA. A comparative study of efficient initialization methods for the k-means clustering algorithm. Expert Syst Appl. 2013;40(1):200\u201310. https:\/\/doi.org\/10.1016\/j.eswa.2012.07.021.","journal-title":"Expert Syst Appl"},{"issue":"2","key":"1119_CR101","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1007\/s10115-011-0465-6","volume":"33","author":"E Ramentol","year":"2012","unstructured":"Ramentol E, Caballero Y, Bello R, Herrera F. SMOTE-RSB*: a hybrid preprocessing approach based on oversampling and undersampling for high imbalanced data-sets using SMOTE and rough sets theory. Knowl Inf Syst. 2012;33(2):245\u201365. https:\/\/doi.org\/10.1007\/s10115-011-0465-6.","journal-title":"Knowl Inf Syst"},{"issue":"3","key":"1119_CR102","doi-asserted-by":"publisher","first-page":"275","DOI":"10.1162\/evco.2009.17.3.275","volume":"17","author":"S Garc\u00eda","year":"2009","unstructured":"Garc\u00eda S, Herrera F. Evolutionary undersampling for classification with imbalanced datasets: proposals and taxonomy. Evol Comput. 2009;17(3):275\u2013306. https:\/\/doi.org\/10.1162\/evco.2009.17.3.275.","journal-title":"Evol Comput"},{"issue":"1","key":"1119_CR103","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1016\/j.artmed.2005.03.002","volume":"37","author":"G Cohen","year":"2006","unstructured":"Cohen G, Hilario M, Sax H, Hugonnet S, Geissbuhler A. Learning from imbalanced data in surveillance of nosocomial infection. Artif Intell Med. 2006;37(1):7\u201318. https:\/\/doi.org\/10.1016\/j.artmed.2005.03.002.","journal-title":"Artif Intell Med"},{"key":"1119_CR104","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1016\/j.ins.2018.04.068","volume":"454\u2013455","author":"GY Wong","year":"2018","unstructured":"Wong GY, Leung FHF, Ling SH. A hybrid evolutionary preprocessing method for imbalanced datasets. Inf Sci (Ny). 2018;454\u2013455:161\u201377. https:\/\/doi.org\/10.1016\/j.ins.2018.04.068.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR105","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.ins.2022.02.038","volume":"595","author":"A Zhang","year":"2022","unstructured":"Zhang A, Yu H, Huan Z, Yang X, Zheng S, Gao S. SMOTE-RkNN: a hybrid re-sampling method based on SMOTE and reverse k-nearest neighbors. Inf Sci (Ny). 2022;595:70\u201388. https:\/\/doi.org\/10.1016\/j.ins.2022.02.038.","journal-title":"Inf Sci (Ny)"},{"key":"1119_CR106","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1016\/j.asoc.2019.02.028","volume":"78","author":"S Susan","year":"2019","unstructured":"Susan S, Kumar A. SSO Maj-SMOTE-SSO Min: three-step intelligent pruning of majority and minority samples for learning from imbalanced datasets. Appl Soft Comput J. 2019;78:141\u20139. https:\/\/doi.org\/10.1016\/j.asoc.2019.02.028.","journal-title":"Appl Soft Comput J"},{"key":"1119_CR107","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.105818","volume":"196","author":"M Li","year":"2020","unstructured":"Li M, Xiong A, Wang L, Deng S, Ye J. ACO resampling: enhancing the performance of oversampling methods for class imbalance classification. Knowl Based Syst. 2020;196: 105818. https:\/\/doi.org\/10.1016\/j.knosys.2020.105818.","journal-title":"Knowl Based Syst"},{"issue":"4","key":"1119_CR108","doi-asserted-by":"publisher","first-page":"3205","DOI":"10.1007\/s13369-019-04336-1","volume":"45","author":"H Al","year":"2020","unstructured":"Al H, Islam M, \u00d6yk\u00fc E, Mehtap A, Uluk\u00f6k K. HCAB-SMOTE: a hybrid clustered affinitive borderline SMOTE approach for imbalanced data binary classification. Arab J Sci Eng. 2020;45(4):3205\u201322. https:\/\/doi.org\/10.1007\/s13369-019-04336-1.","journal-title":"Arab J Sci Eng"},{"key":"1119_CR109","doi-asserted-by":"publisher","unstructured":"Koziarski M. CSMOUTE: combined synthetic oversampling and undersampling technique for imbalanced data classification. Proc Int J Conf Neural Netw. 2021; https:\/\/doi.org\/10.1109\/IJCNN52387.2021.9533415.","DOI":"10.1109\/IJCNN52387.2021.9533415"},{"key":"1119_CR110","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.neucom.2020.08.060","volume":"417","author":"Y Zhu","year":"2020","unstructured":"Zhu Y, Yan Y, Zhang Y, Zhang Y. EHSO: evolutionary hybrid sampling in overlapping scenarios for imbalanced learning. Neurocomputing. 2020;417:333\u201346. https:\/\/doi.org\/10.1016\/j.neucom.2020.08.060.","journal-title":"Neurocomputing"},{"issue":"6","key":"1119_CR111","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s42979-021-00815-1","volume":"2","author":"IH Sarker","year":"2021","unstructured":"Sarker IH. Deep learning: a comprehensive overview on techniques, taxonomy, applications and research directions. SN Comput Sci. 2021;2(6):1\u201320. https:\/\/doi.org\/10.1007\/s42979-021-00815-1.","journal-title":"SN Comput Sci"},{"key":"1119_CR112","unstructured":"Shiri FM, Mohamed R, Perumal T, Mustapha N. A comprehensive overview and comparative analysis on deep learning models. pp. 1\u201361."},{"key":"1119_CR113","doi-asserted-by":"publisher","first-page":"2600","DOI":"10.3906\/elk-2101-133","volume":"29","author":"OO Abayomi-alli","year":"2021","unstructured":"Abayomi-alli OO, Maskeliunas R. Malignant skin melanoma detection using image augmentation by oversamplingin nonlinear lower-dimensional embedding manifold. Turk J Electr Eng Comput Sci. 2021;29:2600. https:\/\/doi.org\/10.3906\/elk-2101-133.","journal-title":"Turk J Electr Eng Comput Sci"},{"key":"1119_CR114","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107315","volume":"177","author":"H Zhang","year":"2020","unstructured":"Zhang H, Huang L, Wu CQ, Li Z. An effective convolutional neural network based on SMOTE and Gaussian mixture model for intrusion detection in imbalanced dataset. Comput Netw. 2020;177: 107315. https:\/\/doi.org\/10.1016\/j.comnet.2020.107315.","journal-title":"Comput Netw"},{"key":"1119_CR115","doi-asserted-by":"publisher","first-page":"10611","DOI":"10.1007\/s11227-023-05073-x","volume":"79","author":"A Abdelkhalek","year":"2023","unstructured":"Abdelkhalek A, Mashaly M. Addressing the class imbalance problem in network intrusion detection systems using data resampling and deep learning. J Supercomput. 2023;79:10611.","journal-title":"J Supercomput"},{"key":"1119_CR116","volume-title":"Dynamic network anomaly detection system by using deep learning techniques","author":"P Lin","year":"2019","unstructured":"Lin P, Ye K, Xu C. Dynamic network anomaly detection system by using deep learning techniques, vol. 1. Cham: Springer International Publishing; 2019."},{"issue":"February","key":"1119_CR117","doi-asserted-by":"publisher","first-page":"30628","DOI":"10.1109\/ACCESS.2023.3262020","volume":"11","author":"ID Mienye","year":"2023","unstructured":"Mienye ID, Sun Y, Member S. A deep learning ensemble with data resampling for credit card fraud detection. IEEE Access. 2023;11(February):30628\u201338. https:\/\/doi.org\/10.1109\/ACCESS.2023.3262020.","journal-title":"IEEE Access"},{"key":"1119_CR118","doi-asserted-by":"publisher","first-page":"47491","DOI":"10.1109\/ACCESS.2021.3068316","volume":"9","author":"YU Chen","year":"2021","unstructured":"Chen YU, Chang RUI, Guo J. Effects of data augmentation method borderline-SMOTE on emotion recognition of EEG signals based on convolutional neural network. IEEE Access. 2021;9:47491\u2013502. https:\/\/doi.org\/10.1109\/ACCESS.2021.3068316.","journal-title":"IEEE Access."},{"key":"1119_CR119","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2022.106142","volume":"150","author":"H Mohan","year":"2022","unstructured":"Mohan H, Chatterjee K, Dashkevych S. The prediction of cardiac abnormality and enhancement in minority class accuracy from imbalanced ECG signals using modified deep neural network models. Comput Biol Med. 2022;150: 106142. https:\/\/doi.org\/10.1016\/j.compbiomed.2022.106142.","journal-title":"Comput Biol Med"},{"key":"1119_CR120","doi-asserted-by":"publisher","DOI":"10.1186\/s12911-022-01775-z","author":"S Sadeghi","year":"2022","unstructured":"Sadeghi S, Khalili D, Ramezankhani A, Mansournia MA. Diabetes mellitus risk prediction in the presence of class imbalance using flexible machine learning methods. BMC Med Inform Decis Mak. 2022. https:\/\/doi.org\/10.1186\/s12911-022-01775-z.","journal-title":"BMC Med Inform Decis Mak"},{"key":"1119_CR121","doi-asserted-by":"crossref","unstructured":"Alani AA, Cosma G. classifying imbalanced multi-modal sensor data for human activity recognition in a smart home using deep learning. 2020.","DOI":"10.1109\/IJCNN48605.2020.9207697"},{"issue":"9","key":"1119_CR122","doi-asserted-by":"publisher","first-page":"6390","DOI":"10.1109\/TNNLS.2021.3136503","volume":"34","author":"D Dablain","year":"2023","unstructured":"Dablain D, Krawczyk B, Chawla NV. DeepSMOTE: fusing deep learning and SMOTE for imbalanced data. IEEE Trans Neural Netw Learn Syst. 2023;34(9):6390\u2013404. https:\/\/doi.org\/10.1109\/TNNLS.2021.3136503.","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"1119_CR123","unstructured":"Varona I, Madera J, Mart\u00ednez L\u00f3pez Y, Hern\u00e1ndez-Nieto JC, SMOTE-Cov: a new over-sampling method based on the Covariance Matrix. 2019."},{"key":"1119_CR124","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2019.113026","volume":"158","author":"V Garc\u00eda","year":"2020","unstructured":"Garc\u00eda V, S\u00e1nchez JS, Marqu\u00e9s AI, Florencia R, Rivera G. Understanding the apparent superiority of over-sampling through an analysis of local information for class-imbalanced data. Expert Syst Appl. 2020;158: 113026. https:\/\/doi.org\/10.1016\/j.eswa.2019.113026.","journal-title":"Expert Syst Appl"},{"key":"1119_CR125","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.115589","volume":"185","author":"ARS Parmezan","year":"2021","unstructured":"Parmezan ARS, Lee HD, Spola\u00f4r N, Wu FC. Automatic recommendation of feature selection algorithms based on dataset characteristics. Expert Syst Appl. 2021;185: 115589. https:\/\/doi.org\/10.1016\/j.eswa.2021.115589.","journal-title":"Expert Syst Appl"},{"issue":"18","key":"1119_CR126","doi-asserted-by":"publisher","first-page":"8546","DOI":"10.3390\/app11188546","volume":"11","author":"MS Kraiem","year":"2021","unstructured":"Kraiem MS, S\u00e1nchez-Hern\u00e1ndez F, Moreno-Garc\u00eda MN. \u201cSelecting the suitable resampling strategy for imbalanced data classification regarding dataset properties. An approach based on association models. Appl Sci. 2021;11(18):8546. https:\/\/doi.org\/10.3390\/app11188546.","journal-title":"Appl Sci"},{"issue":"1","key":"1119_CR127","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1007\/s10115-013-0700-4","volume":"42","author":"J Luengo","year":"2015","unstructured":"Luengo J, Herrera F. An automatic extraction method of the domains of competence for learning classifiers using data complexity measures. Knowl Inf Syst. 2015;42(1):147\u201380. https:\/\/doi.org\/10.1007\/s10115-013-0700-4.","journal-title":"Knowl Inf Syst"},{"key":"1119_CR128","unstructured":"Costa AJ, Santos MS, Soares C, Abreu PH. Analysis of imbalance strategies recommendation using a meta-learning approach. 2020."},{"key":"1119_CR129","first-page":"1","volume":"21","author":"E Alcoba\u00e7a","year":"2020","unstructured":"Alcoba\u00e7a E, Siqueira F, Rivolli A, Garcia LPF, Oliva JT, de Carvalho ACPLF. MFE: towards reproducible meta-feature extraction. J Mach Learn Res. 2020;21:1\u20135.","journal-title":"J Mach Learn Res"},{"key":"1119_CR130","doi-asserted-by":"publisher","unstructured":"Tang S, Chen SP. The generation mechanism of synthetic minority class examples. In: 5th Int. Conf. Inf. Technol. Appl. Biomed. ITAB 2008 conjunction with 2nd Int. Symp. Summer Sch. Biomed. Heal. Eng. IS3BHE 2008, no. September, pp. 444\u2013447, 2008, https:\/\/doi.org\/10.1109\/ITAB.2008.4570642.","DOI":"10.1109\/ITAB.2008.4570642"},{"key":"1119_CR131","doi-asserted-by":"publisher","unstructured":"De Morais RFAB, Miranda PBC, Silva RMA. A meta-learning method to select under-sampling algorithms for imbalanced data sets. In: Proc. 2016 5th Brazilian Conf. Intell. Syst. BRACIS 2016, pp. 385\u2013390, 2017. https:\/\/doi.org\/10.1109\/BRACIS.2016.076.","DOI":"10.1109\/BRACIS.2016.076"},{"key":"1119_CR132","doi-asserted-by":"publisher","first-page":"204","DOI":"10.1016\/j.amc.2018.12.020","volume":"351","author":"X Zhang","year":"2019","unstructured":"Zhang X, Li R, Zhang B, Yang Y, Guo J, Ji X. An instance-based learning recommendation algorithm of imbalance handling methods. Appl Math Comput. 2019;351:204\u201318. https:\/\/doi.org\/10.1016\/j.amc.2018.12.020.","journal-title":"Appl Math Comput"},{"key":"1119_CR133","unstructured":"Freund Y, Schapire RE. Experiments with a new boosting algorithm. In: Proc. 13th Int. Conf. Mach. Learn., pp. 148\u2013156, 1996, 10.1.1.133.1040."},{"key":"1119_CR134","doi-asserted-by":"publisher","unstructured":"Domingos P. MetaCost. 1999; 155\u2013164. https:\/\/doi.org\/10.1145\/312129.312220.","DOI":"10.1145\/312129.312220"},{"key":"1119_CR135","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1007\/978-3-540-39804-2_12","volume":"2838","author":"NV Chawla","year":"2003","unstructured":"Chawla NV, Lazarevic A, Hall LO, Bowyer KW. SMOTEBoost: improving prediction of the minority class in boosting. Lect Notes Artif Intell. 2003;2838:107\u201319. https:\/\/doi.org\/10.1007\/978-3-540-39804-2_12.","journal-title":"Lect Notes Artif Intell."},{"issue":"3","key":"1119_CR136","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1109\/34.990132","volume":"24","author":"TK Ho","year":"2002","unstructured":"Ho TK, Basu M. Complexity measures of supervised classification problems. IEEE Trans Pattern Anal Mach Intell. 2002;24(3):289\u2013300. https:\/\/doi.org\/10.1109\/34.990132.","journal-title":"IEEE Trans Pattern Anal Mach Intell"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01119-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s40537-025-01119-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01119-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T14:20:58Z","timestamp":1742739658000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-025-01119-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,23]]},"references-count":136,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["1119"],"URL":"https:\/\/doi.org\/10.1186\/s40537-025-01119-4","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,23]]},"assertion":[{"value":"25 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 February 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 March 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"71"}}