{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T02:02:28Z","timestamp":1778896948322,"version":"3.51.4"},"reference-count":153,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2022,3,24]],"date-time":"2022-03-24T00:00:00Z","timestamp":1648080000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,3,24]],"date-time":"2022-03-24T00:00:00Z","timestamp":1648080000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2022,12]]},"DOI":"10.1007\/s10462-022-10150-3","type":"journal-article","created":{"date-parts":[[2022,3,25]],"date-time":"2022-03-25T10:34:41Z","timestamp":1648204481000},"page":"6207-6275","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":88,"title":["On the joint-effect of class imbalance and overlap: a critical review"],"prefix":"10.1007","volume":"55","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5912-963X","authenticated-orcid":false,"given":"Miriam Seoane","family":"Santos","sequence":"first","affiliation":[]},{"given":"Pedro Henriques","family":"Abreu","sequence":"additional","affiliation":[]},{"given":"Nathalie","family":"Japkowicz","sequence":"additional","affiliation":[]},{"given":"Alberto","family":"Fern\u00e1ndez","sequence":"additional","affiliation":[]},{"given":"Carlos","family":"Soares","sequence":"additional","affiliation":[]},{"given":"Szymon","family":"Wilk","sequence":"additional","affiliation":[]},{"given":"Jo\u00e3o","family":"Santos","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,3,24]]},"reference":[{"issue":"1","key":"10150_CR1","doi-asserted-by":"publisher","first-page":"238","DOI":"10.1109\/TKDE.2015.2458858","volume":"28","author":"L Abdi","year":"2015","unstructured":"Abdi L, Hashemi S (2015) To combat multi-class imbalanced problems by means of over-sampling techniques. IEEE Trans Knowl Data Eng 28(1):238\u2013251","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"10150_CR2","doi-asserted-by":"crossref","unstructured":"Akbani R, Kwek S, Japkowicz N (2004) Applying support vector machines to imbalanced datasets. In: European conference on machine learning. Springer, pp 39\u201350","DOI":"10.1007\/978-3-540-30115-8_7"},{"issue":"4","key":"10150_CR3","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1016\/j.patrec.2012.09.003","volume":"34","author":"R Alejo","year":"2013","unstructured":"Alejo R, Valdovinos RM, Garc\u00eda V, Pacheco-Sanchez JH (2013) A hybrid method to face class overlap and class imbalance on neural networks and multi-class scenarios. Pattern Recogn Lett 34(4):380\u2013388","journal-title":"Pattern Recogn Lett"},{"issue":"3","key":"10150_CR4","doi-asserted-by":"publisher","first-page":"194","DOI":"10.1002\/sam.11228","volume":"7","author":"N Anwar","year":"2014","unstructured":"Anwar N, Jones G, Ganesh S (2014) Measurement of data complexity for classification problems with unbalanced data. Stat Anal Data Min ASA Data Sci J 7(3):194\u2013211","journal-title":"Stat Anal Data Min ASA Data Sci J"},{"issue":"1","key":"10150_CR5","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1007\/s10044-014-0446-y","volume":"19","author":"G Armano","year":"2016","unstructured":"Armano G, Tamponi E (2016) Experimenting multiresolution analysis for identifying regions of different classification complexity. Pattern Anal Appl 19(1):129\u2013137","journal-title":"Pattern Anal Appl"},{"issue":"3","key":"10150_CR6","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1007\/s10044-003-0192-z","volume":"6","author":"R Barandela","year":"2003","unstructured":"Barandela R, Valdovinos RM, S\u00e1nchez JS (2003) New applications of ensembles of classifiers. Pattern Anal Appl 6(3):245\u2013256","journal-title":"Pattern Anal Appl"},{"key":"10150_CR7","unstructured":"Barella VH, Costa EP, Carvalho A, Pl F (2014) Clusteross: a new undersampling method for imbalanced learning. In: Proceedings of the 3th Brazilian conference on intelligent systems. Academic Press"},{"key":"10150_CR8","doi-asserted-by":"crossref","unstructured":"Barella VH, Garcia LP, de\u00a0Souto MP, Lorena AC, de\u00a0Carvalho A (2018) Data complexity measures for imbalanced classification tasks. In: 2018 international joint conference on neural networks (IJCNN). IEEE, pp 1\u20138","DOI":"10.1109\/IJCNN.2018.8489661"},{"key":"10150_CR9","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.ins.2020.12.006","volume":"553","author":"VH Barella","year":"2021","unstructured":"Barella VH, Garcia LP, de Souto MC, Lorena AC, de Carvalho AC (2021) Assessing the data complexity of imbalanced datasets. Inf Sci 553:83\u2013109","journal-title":"Inf Sci"},{"issue":"2","key":"10150_CR10","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1109\/TKDE.2012.232","volume":"26","author":"S Barua","year":"2014","unstructured":"Barua S, Islam M, Yao X, Murase K (2014) Mwmote-majority weighted minority oversampling technique for imbalanced data set learning. IEEE Trans Knowl Data Eng 26(2):405\u2013425","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"1","key":"10150_CR11","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GE Batista","year":"2004","unstructured":"Batista GE, Prati RC, Monard MC (2004) A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explor Newsl 6(1):20\u201329","journal-title":"ACM SIGKDD Explor Newsl"},{"issue":"3","key":"10150_CR12","doi-asserted-by":"publisher","first-page":"558","DOI":"10.1109\/TFUZZ.2010.2042721","volume":"18","author":"R Batuwita","year":"2010","unstructured":"Batuwita R, Palade V (2010) Fsvm-cil: fuzzy support vector machines for class imbalance learning. IEEE Trans Fuzzy Syst 18(3):558\u2013571","journal-title":"IEEE Trans Fuzzy Syst"},{"key":"10150_CR13","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1016\/j.knosys.2018.05.037","volume":"158","author":"J Bi","year":"2018","unstructured":"Bi J, Zhang C (2018) An empirical comparison on state-of-the-art multi-class imbalance learning algorithms and a new diversified ensemble learning scheme. Knowl Based Syst 158:81\u201393","journal-title":"Knowl Based Syst"},{"issue":"2","key":"10150_CR14","doi-asserted-by":"publisher","first-page":"381","DOI":"10.1007\/s10044-016-0583-6","volume":"21","author":"Z Borsos","year":"2018","unstructured":"Borsos Z, Lemnaru C, Potolea R (2018) Dealing with overlap and imbalance: a new metric and approach. Pattern Anal Appl 21(2):381\u2013395","journal-title":"Pattern Anal Appl"},{"issue":"2","key":"10150_CR15","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/BF00058655","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L (1996) Bagging predictors. Mach Learn 24(2):123\u2013140","journal-title":"Mach Learn"},{"issue":"3","key":"10150_CR16","doi-asserted-by":"publisher","first-page":"827","DOI":"10.1007\/s10115-016-0957-5","volume":"50","author":"C Bunkhumpornpat","year":"2017","unstructured":"Bunkhumpornpat C, Sinapiromsaran K (2017) Dbmute: density-based majority under-sampling technique. Knowl Inf Syst 50(3):827\u2013850","journal-title":"Knowl Inf Syst"},{"key":"10150_CR17","doi-asserted-by":"crossref","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C (2009) Safe-level-smote: safe-level-synthetic minority over-sampling technique for handling the class imbalanced problem. In: Pacific-Asia conference on knowledge discovery and data mining. Springer, pp 475\u2013482","DOI":"10.1007\/978-3-642-01307-2_43"},{"key":"10150_CR18","doi-asserted-by":"crossref","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C (2011) Mute: majority under-sampling technique. In: 2011 8th international conference on information, communications and signal processing. IEEE, pp 1\u20134","DOI":"10.1109\/ICICS.2011.6173603"},{"issue":"3","key":"10150_CR19","doi-asserted-by":"publisher","first-page":"664","DOI":"10.1007\/s10489-011-0287-y","volume":"36","author":"C Bunkhumpornpat","year":"2012","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C (2012) Dbsmote: density-based synthetic minority over-sampling technique. Appl Intell 36(3):664\u2013684","journal-title":"Appl Intell"},{"issue":"12","key":"10150_CR20","doi-asserted-by":"publisher","first-page":"2809","DOI":"10.1109\/TKDE.2013.37","volume":"25","author":"H Cao","year":"2013","unstructured":"Cao H, Li XL, Woon DYK, Ng SK (2013) Integrated oversampling for imbalanced time series classification. IEEE Trans Knowl Data Eng 25(12):2809\u20132822","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"10150_CR21","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"key":"10150_CR22","doi-asserted-by":"crossref","unstructured":"Chawla NV, Lazarevic A, Hall LO, Bowyer KW (2003) Smoteboost: improving prediction of the minority class in boosting. In: European conference on principles of data mining and knowledge discovery. Springer, pp 107\u2013119","DOI":"10.1007\/978-3-540-39804-2_12"},{"key":"10150_CR24","unstructured":"Chen S (2017) An improved synthetic minority over-sampling technique for imbalanced data set learning. Degree thesis of Department of Information Engineering, National Tsing Hua University, pp 1\u201359"},{"issue":"10","key":"10150_CR25","doi-asserted-by":"publisher","first-page":"1624","DOI":"10.1109\/TNN.2010.2066988","volume":"21","author":"S Chen","year":"2010","unstructured":"Chen S, He H, Garcia EA (2010) Ramoboost: ranked minority oversampling in boosting. IEEE Trans Neural Netw 21(10):1624\u20131642","journal-title":"IEEE Trans Neural Netw"},{"issue":"1","key":"10150_CR23","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1007\/s11219-016-9342-6","volume":"26","author":"L Chen","year":"2018","unstructured":"Chen L, Fang B, Shang Z, Tang Y (2018) Tackling class overlap and imbalance problems in software defect prediction. Softw Qual J 26(1):97\u2013125","journal-title":"Softw Qual J"},{"key":"10150_CR26","doi-asserted-by":"crossref","unstructured":"Chen X, Zhang L, Wei X, Lu X (2021) An effective method using clustering-based adaptive decomposition and editing-based diversified oversamping for multi-class imbalanced datasets. Appl Intell 51(4):1918\u20131933","DOI":"10.1007\/s10489-020-01883-1"},{"key":"10150_CR27","doi-asserted-by":"crossref","unstructured":"Cieslak DA, Chawla NV, Striegel A (2006) Combating imbalance in network intrusion datasets. In: GrC, Citeseer, pp 732\u2013737","DOI":"10.1109\/GRC.2006.1635905"},{"issue":"1","key":"10150_CR28","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1016\/j.artmed.2005.03.002","volume":"37","author":"G Cohen","year":"2006","unstructured":"Cohen G, Hilario M, Sax H, Hugonnet S, Geissbuhler A (2006) Learning from imbalanced data in surveillance of nosocomial infection. Artif Intell Med 37(1):7\u201318","journal-title":"Artif Intell Med"},{"key":"10150_CR29","doi-asserted-by":"crossref","unstructured":"Correia A, Soares C, Jorge A (2019) Dataset morphing to analyze the performance of collaborative filtering. In: International conference on discovery science. Springer, pp 29\u201339","DOI":"10.1007\/978-3-030-33778-0_3"},{"key":"10150_CR30","unstructured":"Costa AJ, Santos MS, Soares C, Abreu PH (2020) Analysis of imbalance strategies recommendation using a meta-learning approach. In: 7th ICML workshop on automated machine learning (AutoML-ICML2020), pp 1\u201310"},{"key":"10150_CR31","unstructured":"Cummins L (2013) Combining and choosing case base maintenance algorithms. PhD thesis, University College Cork"},{"key":"10150_CR32","doi-asserted-by":"crossref","unstructured":"Das B, Krishnan NC, Cook DJ (2014a) Handling imbalanced and overlapping classes in smart environments prompting dataset. In: Data mining for service. Springer, pp 199\u2013219","DOI":"10.1007\/978-3-642-45252-9_12"},{"issue":"1","key":"10150_CR33","doi-asserted-by":"publisher","first-page":"222","DOI":"10.1109\/TKDE.2014.2324567","volume":"27","author":"B Das","year":"2014","unstructured":"Das B, Krishnan NC, Cook DJ (2014b) Racog and wracog: two probabilistic oversampling techniques. IEEE Trans Knowl Data Eng 27(1):222\u2013234","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"10150_CR34","doi-asserted-by":"publisher","first-page":"674","DOI":"10.1016\/j.patcog.2018.03.008","volume":"81","author":"S Das","year":"2018","unstructured":"Das S, Datta S, Chaudhuri B (2018) Handling data irregularities in classification: foundations, trends, and future challenges. Pattern Recogn 81:674\u2013693","journal-title":"Pattern Recogn"},{"key":"10150_CR96","doi-asserted-by":"crossref","unstructured":"de\u00a0Melo VV, Lorena AC (2018) Using complexity measures to evolve synthetic classification datasets. In: 2018 International joint conference on neural networks (IJCNN). IEEE, pp 1\u20138","DOI":"10.1109\/IJCNN.2018.8489645"},{"issue":"2","key":"10150_CR35","doi-asserted-by":"publisher","first-page":"182","DOI":"10.1109\/4235.996017","volume":"6","author":"K Deb","year":"2002","unstructured":"Deb K, Pratap A, Agarwal S, Meyarivan T (2002) A fast and elitist multiobjective genetic algorithm: Nsga-ii. IEEE Trans Evol Comput 6(2):182\u2013197","journal-title":"IEEE Trans Evol Comput"},{"key":"10150_CR36","doi-asserted-by":"crossref","unstructured":"Denil M, Trappenberg T (2010) Overlap versus imbalance. In: Canadian conference on artificial intelligence. Springer, pp 220\u2013231","DOI":"10.1007\/978-3-642-13059-5_22"},{"key":"10150_CR37","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1016\/j.ins.2019.06.007","volume":"501","author":"G Douzas","year":"2019","unstructured":"Douzas G, Bacao F (2019) Geometric smote a geometrically enhanced drop-in replacement for smote. Inf Sci 501:118\u2013135","journal-title":"Inf Sci"},{"key":"10150_CR38","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.ins.2018.06.056","volume":"465","author":"G Douzas","year":"2018","unstructured":"Douzas G, Bacao F, Last F (2018) Improving imbalanced learning through a heuristic oversampling method based on k-means and smote. Inf Sci 465:1\u201320","journal-title":"Inf Sci"},{"key":"10150_CR39","doi-asserted-by":"crossref","unstructured":"Eshelman LJ (1991) The chc adaptive search algorithm: How to have safe search when engaging in nontraditional genetic recombination. In: Foundations of genetic algorithms, vol\u00a01. Elsevier, pp 265\u2013283","DOI":"10.1016\/B978-0-08-050684-5.50020-3"},{"key":"10150_CR40","first-page":"226","volume":"96","author":"M Ester","year":"1996","unstructured":"Ester M, Kriegel HP, Sander J, Xu X et al (1996) A density-based algorithm for discovering clusters in large spatial databases with noise. Kdd 96:226\u2013231","journal-title":"Kdd"},{"key":"10150_CR41","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.knosys.2016.09.032","volume":"115","author":"Q Fan","year":"2017","unstructured":"Fan Q, Wang Z, Li D, Gao D, Zha H (2017) Entropy-based fuzzy support vector machine for imbalanced datasets. Knowl Based Syst 115:87\u201399","journal-title":"Knowl Based Syst"},{"key":"10150_CR42","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1016\/j.ins.2019.04.052","volume":"494","author":"ER Fernandes","year":"2019","unstructured":"Fernandes ER, de Carvalho AC (2019) Evolutionary inversion of class distribution in overlapping areas for multi-class imbalanced learning. Inf Sci 494:141\u2013154","journal-title":"Inf Sci"},{"key":"10150_CR43","first-page":"253","volume-title":"Data Intrinsic Characteristics","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati R, Krawczyk B, Herrera F (2018a) Data Intrinsic Characteristics. Springer, Cham, pp 253\u2013277"},{"key":"10150_CR44","first-page":"147","volume-title":"Ensemble Learning","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati R, Krawczyk B, Herrera F (2018b) Ensemble Learning. Springer, Cham, pp 147\u2013196"},{"key":"10150_CR45","doi-asserted-by":"crossref","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati RC, Krawczyk B, Herrera F (2018c) Dimensionality reduction for imbalanced learning. In: Learning from imbalanced data sets. Springer, pp 227\u2013251","DOI":"10.1007\/978-3-319-98074-4_9"},{"key":"10150_CR46","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-98074-4","volume-title":"Learning From Imbalanced Data Sets","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati RC, Krawczyk B, Herrera F (2018d) Learning From Imbalanced Data Sets, vol 11. Springer, Berlin"},{"key":"10150_CR47","doi-asserted-by":"publisher","first-page":"863","DOI":"10.1613\/jair.1.11192","volume":"61","author":"A Fern\u00e1ndez","year":"2018","unstructured":"Fern\u00e1ndez A, Garcia S, Herrera F, Chawla NV (2018e) Smote for learning from imbalanced data: progress and challenges, marking the 15-year anniversary. J Artif Intell Res 61:863\u2013905","journal-title":"J Artif Intell Res"},{"key":"10150_CR48","doi-asserted-by":"crossref","unstructured":"Fran\u00e7a TR, Miranda PB, Prud\u00eancio RB, Lorenaz AC, Nascimento AC (2020) A many-objective optimization approach for complexity-based data set generation. In: 2020 IEEE congress on evolutionary computation (CEC). IEEE, pp 1\u20138","DOI":"10.1109\/CEC48606.2020.9185543"},{"issue":"1","key":"10150_CR49","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y Freund","year":"1997","unstructured":"Freund Y, Schapire RE (1997) A decision-theoretic generalization of on-line learning and an application to boosting. J Comput Syst Sci 55(1):119\u2013139","journal-title":"J Comput Syst Sci"},{"issue":"2","key":"10150_CR50","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1214\/aos\/1016218223","volume":"28","author":"J Friedman","year":"2000","unstructured":"Friedman J, Hastie T, Tibshirani R et al (2000) Additive logistic regression: a statistical view of boosting (with discussion and a rejoinder by the authors). Ann Stat 28(2):337\u2013407","journal-title":"Ann Stat"},{"key":"10150_CR51","doi-asserted-by":"publisher","first-page":"103906","DOI":"10.1016\/j.chemolab.2019.103906","volume":"196","author":"GH Fu","year":"2020","unstructured":"Fu GH, Wu YJ, Zong MJ, Yi LZ (2020) Feature selection and classification by minimizing overlap degree for class-imbalanced data in metabolomics. Chemom Intell Lab Syst 196:103906","journal-title":"Chemom Intell Lab Syst"},{"issue":"12","key":"10150_CR52","doi-asserted-by":"publisher","first-page":"3412","DOI":"10.1016\/j.patcog.2013.04.018","volume":"46","author":"M Galar","year":"2013","unstructured":"Galar M, Fern\u00e1ndez A, Barrenechea E, Bustince H, Herrera F (2013) Dynamic classifier selection for one-vs-one strategy: avoiding non-competent classifiers. Pattern Recogn 46(12):3412\u20133424","journal-title":"Pattern Recogn"},{"issue":"1","key":"10150_CR53","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1016\/j.patcog.2014.07.023","volume":"48","author":"M Galar","year":"2015","unstructured":"Galar M, Fern\u00e1ndez A, Barrenechea E, Herrera F (2015) Drcw-ovo: distance-based relative competence weighting combination for one-vs-one strategy in multi-class problems. Pattern Recogn 48(1):28\u201342","journal-title":"Pattern Recogn"},{"issue":"3","key":"10150_CR54","doi-asserted-by":"publisher","first-page":"275","DOI":"10.1162\/evco.2009.17.3.275","volume":"17","author":"S Garc\u00eda","year":"2009","unstructured":"Garc\u00eda S, Herrera F (2009) Evolutionary undersampling for classification with imbalanced datasets: proposals and taxonomy. Evol Comput 17(3):275\u2013306","journal-title":"Evol Comput"},{"key":"10150_CR55","doi-asserted-by":"crossref","unstructured":"Garc\u00eda V, Alejo R, S\u00e1nchez J, Sotoca J, Mollineda R (2006) Combined effects of class imbalance and class overlap on instance-based classification. In: International conference on intelligent data engineering and automated learning. Springer, pp 371\u2013378","DOI":"10.1007\/11875581_45"},{"key":"10150_CR56","doi-asserted-by":"crossref","unstructured":"Garc\u00eda V, Mollineda R, S\u00e1nchez J, Alejo R, Sotoca J (2007a) When overlapping unexpectedly alters the class imbalance effects. In: Iberian conference on pattern recognition and image analysis. Springer, pp 499\u2013506","DOI":"10.1007\/978-3-540-72849-8_63"},{"key":"10150_CR57","doi-asserted-by":"crossref","unstructured":"Garc\u00eda V, S\u00e1nchez J, Mollineda R (2007b) An empirical study of the behavior of classifiers on imbalanced and overlapped data sets. In: Iberoamerican congress on pattern recognition. Springer, pp 397\u2013406","DOI":"10.1007\/978-3-540-76725-1_42"},{"issue":"3\u20134","key":"10150_CR58","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1007\/s10044-007-0087-5","volume":"11","author":"V Garc\u00eda","year":"2008","unstructured":"Garc\u00eda V, Mollineda R, S\u00e1nchez J (2008) On the k-nn performance in a challenging scenario of imbalance and overlapping. Pattern Anal Appl 11(3\u20134):269\u2013280","journal-title":"Pattern Anal Appl"},{"key":"10150_CR59","doi-asserted-by":"publisher","first-page":"113026","DOI":"10.1016\/j.eswa.2019.113026","volume":"158","author":"V Garc\u00eda","year":"2020","unstructured":"Garc\u00eda V, S\u00e1nchez J, Marqu\u00e9s A, Florencia R, Rivera G (2020) Understanding the apparent superiority of over-sampling through an analysis of local information for class-imbalanced data. Expert Syst Appl 158:113026","journal-title":"Expert Syst Appl"},{"key":"10150_CR60","unstructured":"Greene J (2001) Feature subset selection using thornton\u2019s separability index and its applicability to a number of sparse proximity-based classifiers. In: Proceedings of annual symposium of the pattern recognition association of South Africa"},{"issue":"15","key":"10150_CR61","doi-asserted-by":"publisher","first-page":"5164","DOI":"10.3390\/app10155164","volume":"10","author":"A Guzm\u00e1n-Ponce","year":"2020","unstructured":"Guzm\u00e1n-Ponce A, Valdovinos RM, S\u00e1nchez JS, Marcial-Romero JR (2020) A new under-sampling method to face class overlap and imbalance. Appl Sci 10(15):5164","journal-title":"Appl Sci"},{"key":"10150_CR62","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1016\/j.eswa.2016.12.035","volume":"73","author":"G Haixiang","year":"2017","unstructured":"Haixiang G, Yijing L, Shang J, Mingyun G, Yuanyue H, Bing G (2017) Learning from class-imbalanced data: review of methods and applications. Expert Syst Appl 73:220\u2013239","journal-title":"Expert Syst Appl"},{"key":"10150_CR63","doi-asserted-by":"crossref","unstructured":"Han H, Wang WY, Mao BH (2005) Borderline-smote: a new over-sampling method in imbalanced data sets learning. In: International conference on intelligent computing. Springer, pp 878\u2013887","DOI":"10.1007\/11538059_91"},{"issue":"3","key":"10150_CR64","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TIT.1968.1054155","volume":"14","author":"P Hart","year":"1968","unstructured":"Hart P (1968) The condensed nearest neighbor rule (corresp.). IEEE Trans Inf Theory 14(3):515\u2013516","journal-title":"IEEE Trans Inf Theory"},{"key":"10150_CR65","unstructured":"He H, Bai Y, Garcia E, Li S (2008) Adasyn: adaptive synthetic sampling approach for imbalanced learning. In: IEEE international joint conference on neural networks, 2008. IJCNN 2008. (IEEE World Congress on Computational Intelligence). IEEE, pp 1322\u20131328"},{"issue":"3","key":"10150_CR66","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1109\/34.990132","volume":"24","author":"T Ho","year":"2002","unstructured":"Ho T, Basu M (2002) Complexity measures of supervised classification problems. IEEE Trans Pattern Anal Mach Intell 24(3):289\u2013300","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"9","key":"10150_CR67","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1109\/34.232073","volume":"15","author":"DP Huttenlocher","year":"1993","unstructured":"Huttenlocher DP, Klanderman GA, Rucklidge WJ (1993) Comparing images using the hausdorff distance. IEEE Trans Pattern Anal Mach Intell 15(9):850\u2013863","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"1","key":"10150_CR68","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1109\/34.824819","volume":"22","author":"A Jain","year":"2000","unstructured":"Jain A, Duin R, Mao J (2000) Statistical pattern recognition: a review. IEEE Trans Pattern Anal Mach Intell 22(1):4\u201337","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10150_CR69","doi-asserted-by":"crossref","unstructured":"Japkowicz N (2001) Concept-learning in the presence of between-class and within-class imbalances. In: Conference of the Canadian society for computational studies of intelligence. Springer, pp 67\u201377","DOI":"10.1007\/3-540-45153-6_7"},{"issue":"1","key":"10150_CR70","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1145\/1007730.1007737","volume":"6","author":"T Jo","year":"2004","unstructured":"Jo T, Japkowicz N (2004) Class imbalances versus small disjuncts. ACM SIGKDD Explor Newsl 6(1):40\u201349","journal-title":"ACM SIGKDD Explor Newsl"},{"key":"10150_CR71","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1016\/j.neucom.2014.08.006","volume":"149","author":"S Kang","year":"2015","unstructured":"Kang S, Cho S, Kang P (2015) Constructing a multi-class classifier using one-against-one approach with different binary classifiers. Neurocomputing 149:677\u2013682","journal-title":"Neurocomputing"},{"issue":"4","key":"10150_CR72","first-page":"1","volume":"52","author":"H Kaur","year":"2019","unstructured":"Kaur H, Pannu HS, Malhi AK (2019) A systematic review on imbalanced data challenges in machine learning: applications and solutions. ACM Comput Surv (CSUR) 52(4):1\u201336","journal-title":"ACM Comput Surv (CSUR)"},{"key":"10150_CR73","doi-asserted-by":"publisher","first-page":"105662","DOI":"10.1016\/j.asoc.2019.105662","volume":"83","author":"G Kov\u00e1cs","year":"2019","unstructured":"Kov\u00e1cs G (2019) An empirical comparison and evaluation of minority oversampling techniques on a large number of imbalanced datasets. Appl Soft Comput 83:105662","journal-title":"Appl Soft Comput"},{"issue":"4","key":"10150_CR74","doi-asserted-by":"publisher","first-page":"727","DOI":"10.1515\/amcs-2017-0050","volume":"27","author":"M Koziarski","year":"2017","unstructured":"Koziarski M, Wozniak M (2017) Ccr: a combined cleaning and resampling algorithm for imbalanced data classification. Int J Appl Math Comput Sci 27(4):727\u2013736","journal-title":"Int J Appl Math Comput Sci"},{"key":"10150_CR75","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1016\/j.neucom.2018.04.089","volume":"343","author":"M Koziarski","year":"2019","unstructured":"Koziarski M, Krawczyk B, Wozniak M (2019) Radial-based oversampling for noisy imbalanced data classification. Neurocomputing 343:19\u201333","journal-title":"Neurocomputing"},{"issue":"4","key":"10150_CR76","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1007\/s13748-016-0094-0","volume":"5","author":"B Krawczyk","year":"2016","unstructured":"Krawczyk B (2016) Learning from imbalanced data: open challenges and future directions. Progr. Artif. Intell. 5(4):221\u2013232","journal-title":"Progr. Artif. Intell."},{"key":"10150_CR77","first-page":"179","volume":"97","author":"M Kubat","year":"1997","unstructured":"Kubat M, Matwin S et al (1997) Addressing the curse of imbalanced training sets: one-sided selection. Icml Citeseer 97:179\u2013186","journal-title":"Icml Citeseer"},{"key":"10150_CR78","doi-asserted-by":"crossref","unstructured":"Lango M, Brzezinski D, Firlik S, Stefanowski J (2017) Discovering minority sub-clusters and local difficulty factors from imbalanced data. In: International conference on discovery science. Springer, pp 324\u2013339","DOI":"10.1007\/978-3-319-67786-6_23"},{"key":"10150_CR79","unstructured":"Lango M, Brzezinski D, Stefanowski J (2018) Imweights: classifying imbalanced data using local and neighborhood information. In: Second international workshop on learning with imbalanced domains: theory and applications, PMLR, pp 95\u2013109"},{"key":"10150_CR80","doi-asserted-by":"crossref","unstructured":"Laurikkala J (2001) Improving identification of difficult small classes by balancing class distribution. In: Conference on artificial intelligence in medicine in Europe. Springer, pp 63\u201366","DOI":"10.1007\/3-540-48229-6_9"},{"key":"10150_CR81","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1016\/j.eswa.2018.01.008","volume":"98","author":"HK Lee","year":"2018","unstructured":"Lee HK, Kim SB (2018) An overlap-sensitive margin classifier for imbalanced and overlapping data. Expert Syst Appl 98:72\u201383","journal-title":"Expert Syst Appl"},{"issue":"2","key":"10150_CR82","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1109\/TKDE.2014.2327034","volume":"27","author":"E Leyva","year":"2014","unstructured":"Leyva E, Gonz\u00e1lez A, Perez R (2014) A set of complexity measures designed for applying meta-learning to instance selection. IEEE Trans Knowl Data Eng 27(2):354\u2013367","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"10150_CR83","doi-asserted-by":"publisher","first-page":"100564","DOI":"10.1016\/j.swevo.2019.100564","volume":"50","author":"KS Li","year":"2019","unstructured":"Li KS, Wang HR, Liu KH (2019) A novel error-correcting output codes algorithm based on genetic programming. Swarm Evol Comput 50:100564","journal-title":"Swarm Evol Comput"},{"issue":"2","key":"10150_CR84","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/s10032-008-0069-1","volume":"11","author":"C Liu","year":"2008","unstructured":"Liu C (2008) Partial discriminative training for classification of overlapping classes in document analysis. IJDAR 11(2):53","journal-title":"IJDAR"},{"issue":"2","key":"10150_CR85","first-page":"539","volume":"39","author":"XY Liu","year":"2008","unstructured":"Liu XY, Wu J, Zhou ZH (2008) Exploratory undersampling for class-imbalance learning. IEEE Trans Syst Man Cybern Part B (Cybern) 39(2):539\u2013550","journal-title":"IEEE Trans Syst Man Cybern Part B (Cybern)"},{"key":"10150_CR86","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1016\/j.ins.2013.07.007","volume":"250","author":"V L\u00f3pez","year":"2013","unstructured":"L\u00f3pez V, Fern\u00e1ndez A, Garc\u00eda S, Palade V, Herrera F (2013) An insight into classification with imbalanced data: empirical results and current trends on using data intrinsic characteristics. Inf Sci 250:113\u2013141","journal-title":"Inf Sci"},{"issue":"1","key":"10150_CR87","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1016\/j.neucom.2011.03.054","volume":"75","author":"AC Lorena","year":"2012","unstructured":"Lorena AC, Costa IG, Spola\u00f4r N, De Souto MC (2012) Analysis of complexity indices for classification problems: cancer gene expression data. Neurocomputing 75(1):33\u201342","journal-title":"Neurocomputing"},{"issue":"5","key":"10150_CR88","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3347711","volume":"52","author":"AC Lorena","year":"2019","unstructured":"Lorena AC, Garcia LP, Lehmann J, Souto MC, Ho TK (2019) How complex is your classification problem? A survey on measuring classification complexity. ACM Comput Surv (CSUR) 52(5):1\u201334","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"10","key":"10150_CR89","doi-asserted-by":"publisher","first-page":"1909","DOI":"10.1007\/s00500-010-0625-8","volume":"15","author":"J Luengo","year":"2011","unstructured":"Luengo J, Fern\u00e1ndez A, Garc\u00eda S, Herrera F (2011) Addressing data complexity for imbalanced data sets: analysis of smote-based oversampling and evolutionary undersampling. Soft Comput 15(10):1909\u20131936","journal-title":"Soft Comput"},{"key":"10150_CR90","doi-asserted-by":"publisher","DOI":"10.1201\/b10331","volume-title":"Clustering in Bioinformatics and Drug Discovery","author":"J MacCuish","year":"2010","unstructured":"MacCuish J, MacCuish N (2010) Clustering in Bioinformatics and Drug Discovery. CRC Press, London"},{"key":"10150_CR91","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1016\/j.ins.2013.08.059","volume":"261","author":"N Maci\u00e0","year":"2014","unstructured":"Maci\u00e0 N, Bernad\u00f3-Mansilla E (2014) Towards uci+: a mindful repository design. Inf Sci 261:237\u2013262","journal-title":"Inf Sci"},{"issue":"4","key":"10150_CR92","doi-asserted-by":"publisher","first-page":"629","DOI":"10.1109\/3477.938265","volume":"31","author":"W Malina","year":"2001","unstructured":"Malina W (2001) Two-parameter fisher criterion. IEEE Trans Syst Man Cybern Part B (Cybern) 31(4):629\u2013636","journal-title":"IEEE Trans Syst Man Cybern Part B (Cybern)"},{"key":"10150_CR93","unstructured":"Mani I, Zhang I (2003) knn approach to unbalanced data distributions: a case study involving information extraction. In: Proceedings of workshop on learning from imbalanced datasets, ICML United States, vol 126"},{"issue":"1","key":"10150_CR94","first-page":"6504","volume":"17","author":"A Manukyan","year":"2016","unstructured":"Manukyan A, Ceyhan E (2016) Classification of imbalanced data with a geometric digraph family. J Mach Learn Res 17(1):6504\u20136543","journal-title":"J Mach Learn Res"},{"key":"10150_CR95","first-page":"216","volume":"5","author":"S Massie","year":"2005","unstructured":"Massie S, Craw S, Wiratunga N (2005) Complexity-guided case discovery for case based reasoning. AAAI 5:216\u2013221","journal-title":"AAAI"},{"issue":"6","key":"10150_CR97","doi-asserted-by":"publisher","first-page":"822","DOI":"10.1109\/TSE.2012.83","volume":"39","author":"T Menzies","year":"2012","unstructured":"Menzies T, Butcher A, Cok D, Marcus A, Layman L, Shull F, Turhan B, Zimmermann T (2012) Local versus global lessons for defect prediction and effort estimation. IEEE Trans Softw Eng 39(6):822\u2013834","journal-title":"IEEE Trans Softw Eng"},{"key":"10150_CR98","doi-asserted-by":"crossref","unstructured":"Mercier M, Santos M, Abreu P, Soares C, Soares J, Santos J (2018) Analysing the footprint of classifiers in overlapped and imbalanced contexts. In: International symposium on intelligent data analysis. Springer, pp 200\u2013212","DOI":"10.1007\/978-3-030-01768-2_17"},{"issue":"1","key":"10150_CR99","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1007\/s10994-017-5629-5","volume":"107","author":"MA Mu\u00f1oz","year":"2018","unstructured":"Mu\u00f1oz MA, Villanova L, Baatar D, Smith-Miles K (2018) Instance spaces for machine learning classification. Mach Learn 107(1):109\u2013147","journal-title":"Mach Learn"},{"issue":"3","key":"10150_CR100","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1007\/s10844-015-0368-1","volume":"46","author":"K Napierala","year":"2016","unstructured":"Napierala K, Stefanowski J (2016) Types of minority class examples and their influence on learning classifiers from imbalanced data. J Intell Inf Syst 46(3):563\u2013597","journal-title":"J Intell Inf Syst"},{"key":"10150_CR101","doi-asserted-by":"crossref","unstructured":"Napiera\u0142a K, Stefanowski J, Wilk S (2010) Learning from imbalanced data in presence of noisy and borderline examples. In: International conference on rough sets and current trends in computing. Springer, pp 158\u2013167","DOI":"10.1007\/978-3-642-13529-3_18"},{"key":"10150_CR102","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1016\/j.eswa.2015.10.031","volume":"46","author":"I Nekooeimehr","year":"2016","unstructured":"Nekooeimehr I, Lai-Yuen SK (2016) Adaptive semi-unsupervised weighted oversampling (a-suwo) for imbalanced datasets. Expert Syst Appl 46:405\u2013416","journal-title":"Expert Syst Appl"},{"issue":"2","key":"10150_CR103","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1016\/j.compbiomed.2010.12.006","volume":"41","author":"S Oh","year":"2011","unstructured":"Oh S (2011) A new dataset evaluation method based on category overlap. Comput Biol Med 41(2):115\u2013122","journal-title":"Comput Biol Med"},{"key":"10150_CR104","first-page":"1","volume":"196","author":"A Orriols-Puig","year":"2010","unstructured":"Orriols-Puig A, Macia N, Ho TK (2010) Documentation for the data complexity library in c++. Universitat Ramon Llull, La Salle 196:1\u201340","journal-title":"Universitat Ramon Llull, La Salle"},{"issue":"7","key":"10150_CR105","doi-asserted-by":"publisher","first-page":"1961","DOI":"10.1007\/s10115-021-01577-1","volume":"63","author":"JD Pascual-Triana","year":"2021","unstructured":"Pascual-Triana JD, Charte D, Andr\u00e9s Arroyo M, Fern\u00e1ndez A, Herrera F (2021) Revisiting data complexity metrics based on morphology for overlap and imbalance: snapshot, new overlap number of balls metrics and singular problems prospect. Knowl Inf Syst 63(7):1961\u20131989","journal-title":"Knowl Inf Syst"},{"key":"10150_CR106","doi-asserted-by":"crossref","unstructured":"Prati RGB, Monard M (2004) Class imbalances versus class overlapping: an analysis of a learning system behavior. In: Mexican international conference on artificial intelligence. Springer, pp 312\u2013321","DOI":"10.1007\/978-3-540-24694-7_32"},{"key":"10150_CR107","unstructured":"Rivolli A, Garcia LP, Soares C, Vanschoren J, de\u00a0Carvalho AC (2018) Characterizing classification datasets: a study of meta-features for meta-learning. arXiv:180810406"},{"key":"10150_CR108","doi-asserted-by":"publisher","first-page":"184","DOI":"10.1016\/j.ins.2014.08.051","volume":"291","author":"J S\u00e1ez","year":"2015","unstructured":"S\u00e1ez J, Luengo J, Stefanowski J, Herrera F (2015) Smote-ipf: addressing the noisy and borderline examples problem in imbalanced classification by a re-sampling method with filtering. Inf Sci 291:184\u2013203","journal-title":"Inf Sci"},{"key":"10150_CR109","doi-asserted-by":"publisher","first-page":"83396","DOI":"10.1109\/ACCESS.2019.2925300","volume":"7","author":"JA S\u00e1ez","year":"2019","unstructured":"S\u00e1ez JA, Galar M, Krawczyk B (2019) Addressing the overlapping data problem in classification using the one-vs-one decomposition strategy. IEEE Access 7:83396\u201383411","journal-title":"IEEE Access"},{"key":"10150_CR110","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/j.jbi.2015.09.012","volume":"58","author":"M Santos","year":"2015","unstructured":"Santos M, Abreu P, Garc\u00eda-Laencina P, Sim\u00e3o A, Carvalho A (2015) A new cluster-based oversampling method for improving survival prediction of hepatocellular carcinoma patients. J Biomed Inform 58:49\u201359","journal-title":"J Biomed Inform"},{"issue":"3","key":"10150_CR111","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1109\/MCI.2018.2866730","volume":"13","author":"M Santos","year":"2018","unstructured":"Santos M, Soares J, Abreu P, Ara\u00fajo H, Santos J (2018) Cross-validation for imbalanced datasets: avoiding overoptimistic and overfitting approaches. IEEE Comput Intell Mag 13(3):59\u201376","journal-title":"IEEE Comput Intell Mag"},{"issue":"10","key":"10150_CR112","first-page":"449","volume":"12","author":"B Santoso","year":"2018","unstructured":"Santoso B, Wijayanto H, Notodiputro KA, Sartono B (2018) K-neighbor over-sampling with cleaning data: a new approach to improve classification performance in data sets with class imbalance. Appl Math Sci 12(10):449\u2013460","journal-title":"Appl Math Sci"},{"issue":"1","key":"10150_CR113","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1109\/TSMCA.2009.2029559","volume":"40","author":"C Seiffert","year":"2009","unstructured":"Seiffert C, Khoshgoftaar TM, Van Hulse J, Napolitano A (2009) Rusboost: a hybrid approach to alleviating class imbalance. IEEE Trans Syst Man, Cybern Part A Syst Hum 40(1):185\u2013197","journal-title":"IEEE Trans Syst Man, Cybern Part A Syst Hum"},{"key":"10150_CR114","doi-asserted-by":"publisher","first-page":"120","DOI":"10.1016\/j.jbi.2018.09.004","volume":"86","author":"G Selvaraj","year":"2018","unstructured":"Selvaraj G, Kaliamurthi S, Kaushik A, Khan A, Wei Y, Cho W, Gu K, Wei D (2018) Identification of target gene and prognostic evaluation for lung adenocarcinoma using gene expression meta-analysis, network analysis and neural network algorithms. J Biomed Inform 86:120\u2013134","journal-title":"J Biomed Inform"},{"key":"10150_CR115","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1016\/j.ins.2016.08.077","volume":"384","author":"S Shilaskar","year":"2017","unstructured":"Shilaskar S, Ghatol A, Chatur P (2017) Medical decision support system for extremely imbalanced datasets. Inf Sci 384:205\u2013219","journal-title":"Inf Sci"},{"issue":"12","key":"10150_CR117","doi-asserted-by":"publisher","first-page":"1534","DOI":"10.1109\/TPAMI.2003.1251146","volume":"25","author":"S Singh","year":"2003","unstructured":"Singh S (2003a) Multiresolution estimates of classification complexity. IEEE Trans Pattern Anal Mach Intell 25(12):1534\u20131539","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"2","key":"10150_CR118","doi-asserted-by":"publisher","first-page":"134","DOI":"10.1007\/s10044-002-0186-2","volume":"6","author":"S Singh","year":"2003","unstructured":"Singh S (2003b) Prism-a novel framework for pattern recognition. Pattern Anal Appl 6(2):134\u2013149","journal-title":"Pattern Anal Appl"},{"issue":"4","key":"10150_CR116","doi-asserted-by":"publisher","first-page":"394","DOI":"10.1002\/sam.11463","volume":"13","author":"D Singh","year":"2020","unstructured":"Singh D, Gosain A, Saha A (2020) Weighted k-nearest neighbor based data complexity metrics for imbalanced datasets. Stat Anal Data Min ASA Data Sci J 13(4):394\u2013404","journal-title":"Stat Anal Data Min ASA Data Sci J"},{"key":"10150_CR119","doi-asserted-by":"crossref","unstructured":"Slowik A, Kwasnicka H (2020) Evolutionary algorithms and their applications to engineering problems. Neural Comput Appl 32(16):12363\u201312379","DOI":"10.1007\/s00521-020-04832-8"},{"issue":"2","key":"10150_CR120","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1007\/s10994-013-5422-z","volume":"95","author":"MR Smith","year":"2014","unstructured":"Smith MR, Martinez T, Giraud-Carrier C (2014) An instance level analysis of data complexity. Mach Learn 95(2):225\u2013256","journal-title":"Mach Learn"},{"key":"10150_CR121","unstructured":"Sotoca JM, Sanchez J, Mollineda RA (2005) A review of data complexity measures and their applicability to pattern classification problems. Actas del III Taller Nacional de Mineria de Datos y Aprendizaje TAMIDA, pp 77\u201383"},{"issue":"29","key":"10150_CR122","first-page":"31","volume":"10","author":"JM Sotoca","year":"2006","unstructured":"Sotoca JM, Mollineda RA, S\u00e1nchez JS (2006) A meta-learning framework for pattern classication by means of data complexity measures. Inteligencia Artificial Revista Iberoamericana de Inteligencia Artificial 10(29):31\u201338","journal-title":"Inteligencia Artificial Revista Iberoamericana de Inteligencia Artificial"},{"issue":"3","key":"10150_CR123","doi-asserted-by":"publisher","first-page":"205","DOI":"10.18178\/ijmlc.2016.6.3.599","volume":"6","author":"RA Sowah","year":"2016","unstructured":"Sowah RA, Agebure MA, Mills GA, Koumadi KM, Fiawoo SY (2016) New cluster undersampling technique for class imbalance learning. Int J Mach Learn Comput 6(3):205","journal-title":"Int J Mach Learn Comput"},{"key":"10150_CR124","doi-asserted-by":"crossref","unstructured":"Stefanowski J (2013) Overlapping, rare examples and class decomposition in learning classifiers from imbalanced data. In: Emerging paradigms in machine learning. Springer, pp 277\u2013306","DOI":"10.1007\/978-3-642-28699-5_11"},{"key":"10150_CR125","doi-asserted-by":"crossref","unstructured":"Stefanowski J (2016) Dealing with data difficulty factors while learning from imbalanced data. In: Challenges in computational statistics and data mining. Springer, pp 333\u2013363","DOI":"10.1007\/978-3-319-18781-5_17"},{"key":"10150_CR126","doi-asserted-by":"crossref","unstructured":"Stefanowski J, Wilk S (2008) Selective pre-processing of imbalanced data for improving classification performance. In: International conference on data warehousing and knowledge discovery. Springer, pp 283\u2013292","DOI":"10.1007\/978-3-540-85836-2_27"},{"issue":"11","key":"10150_CR128","doi-asserted-by":"publisher","first-page":"1787","DOI":"10.1093\/ietisy\/e90-d.11.1787","volume":"90","author":"Y Tang","year":"2007","unstructured":"Tang Y, Gao J (2007) Improved classification for problem involving overlapping patterns. IEICE Trans Inf Syst 90(11):1787\u20131795","journal-title":"IEICE Trans Inf Syst"},{"key":"10150_CR127","unstructured":"Tang W, Mao K, Mak LO, Ng GW (2010) Classification for overlapping classes using optimized overlapping region detection and soft decision. In: 2010 13th international conference on information fusion. IEEE, pp 1\u20138"},{"key":"10150_CR129","doi-asserted-by":"crossref","unstructured":"Thornton C (1998) Separability is a learner\u2019s best friend. In: 4th Neural computation and psychology workshop, London, 9\u201311 April 1997. Springer, pp 40\u201346","DOI":"10.1007\/978-1-4471-1546-5_4"},{"key":"10150_CR130","first-page":"769","volume":"6","author":"I Tomek","year":"1976","unstructured":"Tomek I (1976) Two modifications of cnn. IEEE Trans Syst Man Commun 6:769\u2013772","journal-title":"IEEE Trans Syst Man Commun"},{"key":"10150_CR131","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1016\/j.neucom.2014.10.007","volume":"152","author":"P Vorraboot","year":"2015","unstructured":"Vorraboot P, Rasmequan S, Chinnasarn K, Lursinsap C (2015) Improving classification rate constrained to imbalanced data between overlapped and non-overlapped regions by hybrid algorithms. Neurocomputing 152:429\u2013443","journal-title":"Neurocomputing"},{"key":"10150_CR132","doi-asserted-by":"crossref","unstructured":"Vuttipittayamongkol P, Elyan E (2020a) Improved overlap-based undersampling for imbalanced dataset classification with application to epilepsy and Parkinson\u2019s disease. Int J Neural Syst 30(08):2050043","DOI":"10.1142\/S0129065720500434"},{"key":"10150_CR133","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.ins.2019.08.062","volume":"509","author":"P Vuttipittayamongkol","year":"2020","unstructured":"Vuttipittayamongkol P, Elyan E (2020b) Neighbourhood-based undersampling approach for handling imbalanced and overlapped data. Inf Sci 509:47\u201370.","journal-title":"Inf Sci"},{"key":"10150_CR134","doi-asserted-by":"crossref","unstructured":"Vuttipittayamongkol P, Elyan E, Petrovski A, Jayne C (2018) Overlap-based undersampling for improving imbalanced data classification. In: International conference on intelligent data engineering and automated learning. Springer, pp 689\u2013697","DOI":"10.1007\/978-3-030-03493-1_72"},{"key":"10150_CR135","doi-asserted-by":"crossref","unstructured":"Vuttipittayamongkol P, Elyan E, Petrovski A (2020) On the class overlap problem in imbalanced data classification. Knowl Based Syst 106631","DOI":"10.1016\/j.knosys.2020.106631"},{"key":"10150_CR136","unstructured":"Van\u00a0der Walt CM, Barnard E (2007) Measures for the characterisation of pattern-recognition data sets. In: 18th Annual symposium of the pattern recognition association of South Africa"},{"key":"10150_CR137","unstructured":"Van\u00a0der Walt CM, et\u00a0al. (2008) Data measures that characterise classification problems. PhD thesis, University of Pretoria"},{"issue":"1","key":"10150_CR138","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10115-009-0198-y","volume":"25","author":"BX Wang","year":"2010","unstructured":"Wang BX, Japkowicz N (2010) Boosting support vector machines for imbalanced data sets. Knowl Inf Syst 25(1):1\u201320","journal-title":"Knowl Inf Syst"},{"key":"10150_CR139","doi-asserted-by":"crossref","unstructured":"Wang S, Yao X (2009) Diversity analysis on imbalanced data sets by using ensemble models. In: 2009 IEEE symposium on computational intelligence and data mining. IEEE, pp 324\u2013331","DOI":"10.1109\/CIDM.2009.4938667"},{"issue":"2","key":"10150_CR140","doi-asserted-by":"publisher","first-page":"434","DOI":"10.1109\/TR.2013.2259203","volume":"62","author":"S Wang","year":"2013","unstructured":"Wang S, Yao X (2013) Using class imbalance learning for software defect prediction. IEEE Trans Reliab 62(2):434\u2013443","journal-title":"IEEE Trans Reliab"},{"key":"10150_CR141","doi-asserted-by":"publisher","first-page":"106116","DOI":"10.1016\/j.knosys.2020.106116","volume":"203","author":"J Wei","year":"2020","unstructured":"Wei J, Huang H, Yao L, Hu Y, Fan Q, Huang D (2020a) Ia-suwo: an improving adaptive semi-unsupervised weighted oversampling for imbalanced classification problems. Knowl Based Syst 203:106116","journal-title":"Knowl Based Syst"},{"key":"10150_CR142","doi-asserted-by":"publisher","first-page":"113504","DOI":"10.1016\/j.eswa.2020.113504","volume":"158","author":"J Wei","year":"2020","unstructured":"Wei J, Huang H, Yao L, Hu Y, Fan Q, Huang D (2020b) Ni-mwmote: an improving noise-immunity majority weighted minority oversampling technique for imbalanced classification problems. Expert Syst Appl 158:113504","journal-title":"Expert Syst Appl"},{"key":"10150_CR143","doi-asserted-by":"crossref","unstructured":"Weng CG, Poon J (2006) A data complexity analysis on imbalanced datasets and an alternative imbalance recovering strategy. In: 2006 IEEE\/WIC\/ACM international conference on web intelligence (WI 2006 main conference proceedings) (WI\u201906). IEEE, pp 270\u2013276","DOI":"10.1109\/WI.2006.9"},{"key":"10150_CR144","doi-asserted-by":"publisher","first-page":"408","DOI":"10.1109\/TSMC.1972.4309137","volume":"3","author":"DL Wilson","year":"1972","unstructured":"Wilson DL (1972) Asymptotic properties of nearest neighbor rules using edited data. IEEE Trans Syst Man Cybern 3:408\u2013421","journal-title":"IEEE Trans Syst Man Cybern"},{"issue":"2","key":"10150_CR145","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1515\/fcds-2017-0007","volume":"42","author":"S Wojciechowski","year":"2017","unstructured":"Wojciechowski S, Wilk S (2017) Difficulty factors and preprocessing in imbalanced data sets: an experimental study on artificial data. Found Comput Decis Sci 42(2):149\u2013176","journal-title":"Found Comput Decis Sci"},{"key":"10150_CR146","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/j.inffus.2013.04.006","volume":"16","author":"M Wozniak","year":"2014","unstructured":"Wozniak M, Grana M, Corchado E (2014) A survey of multiple classifier systems as hybrid systems. Inf Fusion 16:3\u201317","journal-title":"Inf Fusion"},{"key":"10150_CR147","doi-asserted-by":"crossref","unstructured":"Xiong H, Wu J, Liu L (2010) classification with classoverlapping: a systematic study. In: Proceedings of the 1st international conference on E-Business intelligence (ICEBI2010). Atlantis Press","DOI":"10.2991\/icebi.2010.43"},{"key":"10150_CR148","doi-asserted-by":"publisher","first-page":"23537","DOI":"10.1109\/ACCESS.2019.2899467","volume":"7","author":"Y Yan","year":"2019","unstructured":"Yan Y, Liu R, Ding Z, Du X, Chen J, Zhang Y (2019) A parameter-free cleaning method for smote in imbalanced classification. IEEE Access 7:23537\u201323548","journal-title":"IEEE Access"},{"issue":"3","key":"10150_CR149","doi-asserted-by":"publisher","first-page":"5718","DOI":"10.1016\/j.eswa.2008.06.108","volume":"36","author":"SJ Yen","year":"2009","unstructured":"Yen SJ, Lee YS (2009) Cluster-based under-sampling approaches for imbalanced data distributions. Expert Syst Appl 36(3):5718\u20135727","journal-title":"Expert Syst Appl"},{"key":"10150_CR150","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1016\/j.patrec.2017.01.014","volume":"88","author":"C Zhu","year":"2017","unstructured":"Zhu C, Wang Z (2017) Entropy-based matrix learning machine for imbalanced data sets. Pattern Recogn Lett 88:72\u201380","journal-title":"Pattern Recogn Lett"},{"key":"10150_CR151","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1016\/j.patcog.2017.07.024","volume":"72","author":"T Zhu","year":"2017","unstructured":"Zhu T, Lin Y, Liu Y (2017) Synthetic minority oversampling technique for multiclass imbalance problems. Pattern Recogn 72:327\u2013340","journal-title":"Pattern Recogn"},{"key":"10150_CR152","doi-asserted-by":"publisher","first-page":"104826","DOI":"10.1016\/j.knosys.2019.06.034","volume":"187","author":"T Zhu","year":"2020","unstructured":"Zhu T, Lin Y, Liu Y (2020a) Improving interpolation-based oversampling for imbalanced data learning. Knowl-Based Syst 187:104826","journal-title":"Knowl-Based Syst"},{"key":"10150_CR153","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.neucom.2020.08.060","volume":"417","author":"Y Zhu","year":"2020","unstructured":"Zhu Y, Yan Y, Zhang Y, Zhang Y (2020b) Ehso: evolutionary hybrid sampling in overlapping scenarios for imbalanced learning. Neurocomputing 417:333\u2013346","journal-title":"Neurocomputing"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-022-10150-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-022-10150-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-022-10150-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,12]],"date-time":"2022-11-12T04:34:56Z","timestamp":1668227696000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-022-10150-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,3,24]]},"references-count":153,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2022,12]]}},"alternative-id":["10150"],"URL":"https:\/\/doi.org\/10.1007\/s10462-022-10150-3","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,3,24]]},"assertion":[{"value":"24 March 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":".","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code availability"}}]}}