{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T06:16:02Z","timestamp":1763705762080,"version":"3.45.0"},"reference-count":78,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T00:00:00Z","timestamp":1759104000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T00:00:00Z","timestamp":1759104000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s10115-025-02593-1","type":"journal-article","created":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:48:10Z","timestamp":1759135690000},"page":"12299-12333","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Proportional clustering-based undersampling for imbalanced data classification"],"prefix":"10.1007","volume":"67","author":[{"given":"Chengshuo","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Zhanrong","family":"Shi","sequence":"additional","affiliation":[]},{"given":"Wangwei","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Zhao","family":"Jin","sequence":"additional","affiliation":[]},{"given":"Shuo","family":"Feng","sequence":"additional","affiliation":[]},{"given":"Mingliang","family":"Xu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,29]]},"reference":[{"key":"2593_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2024.111376","volume":"154","author":"L Jia","year":"2024","unstructured":"Jia L, Wang Z, Sun P, Xu Z (2024) R-wdls: an efficient security region oversampling technique based on data distribution. Appl Soft Comput 154:111376","journal-title":"Appl Soft Comput"},{"key":"2593_CR2","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121084","volume":"235","author":"S Feng","year":"2024","unstructured":"Feng S, Keung J, Xiao Y, Zhang P, Yu X, Cao X (2024) Improving the undersampling technique by optimizing the termination condition for software defect prediction. Expert Syst Appl 235:121084","journal-title":"Expert Syst Appl"},{"key":"2593_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.123328","volume":"249","author":"Z Sun","year":"2024","unstructured":"Sun Z, Ying W, Zhang W, Gong S (2024) Undersampling method based on minority class density for imbalanced data. Expert Syst Appl 249:123328","journal-title":"Expert Syst Appl"},{"key":"2593_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109953","volume":"145","author":"Z Teng","year":"2024","unstructured":"Teng Z, Cao P, Huang M, Gao Z, Wang X (2024) Multi-label borderline oversampling technique. Pattern Recogn 145:109953","journal-title":"Pattern Recogn"},{"key":"2593_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.123149","volume":"246","author":"C Vairetti","year":"2024","unstructured":"Vairetti C, Assadi JL, Maldonado S (2024) Efficient hybrid oversampling and intelligent undersampling for imbalanced big data classification. Expert Syst Appl 246:123149","journal-title":"Expert Syst Appl"},{"key":"2593_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2024.111774","volume":"161","author":"F Wang","year":"2024","unstructured":"Wang F, Zheng M, Hu X, Li H, Wang T, Chen F (2024) Fiao: feature information aggregation oversampling for imbalanced data classification. Appl Soft Comput 161:111774","journal-title":"Appl Soft Comput"},{"key":"2593_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.123987","volume":"251","author":"J Wang","year":"2024","unstructured":"Wang J, Wei J, Huang H, Wen L, Yuan Y, Chen H, Wu R, Wu J (2024) Imwmote: a novel oversampling technique for fault diagnosis in heterogeneous imbalanced data. Expert Syst Appl 251:123987","journal-title":"Expert Syst Appl"},{"key":"2593_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2024.120351","volume":"665","author":"L Bai","year":"2024","unstructured":"Bai L, Ju T, Wang H, Lei M, Pan X (2024) Two-step ensemble under-sampling algorithm for massive imbalanced data classification. Inf Sci 665:120351","journal-title":"Inf Sci"},{"key":"2593_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2024.120263","volume":"662","author":"Y Xie","year":"2024","unstructured":"Xie Y, Huang X, Qin F, Li F, Ding X (2024) A majority affiliation based under-sampling method for class imbalance problem. Inf Sci 662:120263","journal-title":"Inf Sci"},{"key":"2593_CR10","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109721","volume":"143","author":"P Soltanzadeh","year":"2023","unstructured":"Soltanzadeh P, Feizi-Derakhshi MR, Hashemzadeh M (2023) Addressing the class-imbalance and class-overlap problems by a metaheuristic-based under-sampling approach. Pattern Recogn 143:109721","journal-title":"Pattern Recogn"},{"key":"2593_CR11","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2020.106432","volume":"129","author":"S Feng","year":"2021","unstructured":"Feng S, Keung J, Yu X, Xiao Y, Bennin KE, Kabir MA, Zhang M (2021) Coste: complexity-based oversampling technique to alleviate the class imbalance problem in software defect prediction. Inf Softw Technol 129:106432","journal-title":"Inf Softw Technol"},{"key":"2593_CR12","doi-asserted-by":"publisher","first-page":"371","DOI":"10.1016\/j.ins.2022.11.108","volume":"621","author":"T Li","year":"2023","unstructured":"Li T, Wang Y, Liu L, Chen L, Chen CP (2023) Subspace-based minority oversampling for imbalance classification. Inf Sci 621:371\u2013388","journal-title":"Inf Sci"},{"key":"2593_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2024.120724","volume":"674","author":"L Akritidis","year":"2024","unstructured":"Akritidis L, Bozanis P (2024) A clustering-based resampling technique with cluster structure analysis for software defect detection in imbalanced datasets. Inf Sci 674:120724","journal-title":"Inf Sci"},{"key":"2593_CR14","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2024.111612","volume":"292","author":"Y Liu","year":"2024","unstructured":"Liu Y, Du G, Yin C, Zhang H, Wang J (2024) Clustering-based incremental learning for imbalanced data classification. Knowl-Based Syst 292:111612","journal-title":"Knowl-Based Syst"},{"key":"2593_CR15","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2024.111659","volume":"159","author":"X Yuan","year":"2024","unstructured":"Yuan X, Sun C, Chen S (2024) A clustering-based adaptive undersampling ensemble method for highly unbalanced data classification. Appl Soft Comput 159:111659","journal-title":"Appl Soft Comput"},{"key":"2593_CR16","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.ins.2018.10.029","volume":"477","author":"C-F Tsai","year":"2019","unstructured":"Tsai C-F, Lin W-C, Hu Y-H, Yao G-T (2019) Under-sampling class imbalanced datasets by combining clustering analysis and instance selection. Inf Sci 477:47\u201354","journal-title":"Inf Sci"},{"key":"2593_CR17","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/j.ins.2017.05.008","volume":"409","author":"W-C Lin","year":"2017","unstructured":"Lin W-C, Tsai C-F, Hu Y-H, Jhang J-S (2017) Clustering-based undersampling in class-imbalanced data. Inf Sci 409:17\u201326","journal-title":"Inf Sci"},{"issue":"3","key":"2593_CR18","doi-asserted-by":"publisher","first-page":"10785","DOI":"10.48084\/etasr.5844","volume":"13","author":"RM Mathew","year":"2023","unstructured":"Mathew RM, Gunasundari R (2023) A cluster-based undersampling technique for multiclass skewed datasets. Eng Technol Appl Sci Res 13(3):10785\u201310790","journal-title":"Eng Technol Appl Sci Res"},{"key":"2593_CR19","doi-asserted-by":"publisher","first-page":"885","DOI":"10.1007\/s10044-015-0458-2","volume":"19","author":"V Vigneron","year":"2016","unstructured":"Vigneron V, Chen H (2016) A multi-scale seriation algorithm for clustering sparse imbalanced data: application to spike sorting. Pattern Anal Appl 19:885\u2013903","journal-title":"Pattern Anal Appl"},{"key":"2593_CR20","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2024.112196","volume":"300","author":"MK Paul","year":"2024","unstructured":"Paul MK, Pal B, Sattar AS, Siddique AMR, Hasan MAM (2024) Carbo: clustering and rotation based oversampling for class imbalance learning. Knowl-Based Syst 300:112196","journal-title":"Knowl-Based Syst"},{"key":"2593_CR21","volume":"8","author":"Q Zhou","year":"2023","unstructured":"Zhou Q, Sun B (2023) Adaptive k-means clustering based under-sampling methods to solve the class imbalance problem. Data Inf Manag 8:100064","journal-title":"Data Inf Manag"},{"key":"2593_CR22","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/j.simpat.2015.03.007","volume":"54","author":"R Duwairi","year":"2015","unstructured":"Duwairi R, Abu-Rahmeh M (2015) A novel approach for initializing the spherical k-means clustering algorithm. Simul Model Pract Theory 54:49\u201363","journal-title":"Simul Model Pract Theory"},{"key":"2593_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2019.105763","volume":"84","author":"H Xie","year":"2019","unstructured":"Xie H, Zhang L, Lim CP, Yu Y, Liu C, Liu H, Walters J (2019) Improving k-means clustering with enhanced firefly algorithms. Appl Soft Comput 84:105763","journal-title":"Appl Soft Comput"},{"key":"2593_CR24","doi-asserted-by":"crossref","unstructured":"Kaur P, Gosain A (2018) Comparing the behavior of oversampling and undersampling approach of class imbalance learning by combining class imbalance problem with noise. In: ICT Based Innovations: Proceedings of CSI 2015, pp. 23\u201330 . Springer","DOI":"10.1007\/978-981-10-6602-3_3"},{"issue":"5","key":"2593_CR25","doi-asserted-by":"publisher","first-page":"603","DOI":"10.1109\/34.1000236","volume":"24","author":"D Comaniciu","year":"2002","unstructured":"Comaniciu D, Meer P (2002) Mean shift: a robust approach toward feature space analysis. IEEE Trans Pattern Anal Mach Intell 24(5):603\u2013619","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2593_CR26","unstructured":"Ester M, Kriegel H-P, Sander J, Xu X, et al.(1996) A density-based algorithm for discovering clusters in large spatial databases with noise. In: Kdd, vol. 96, pp. 226\u2013231"},{"issue":"3","key":"2593_CR27","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1007\/BF02289588","volume":"32","author":"SC Johnson","year":"1967","unstructured":"Johnson SC (1967) Hierarchical clustering schemes. Psychometrika 32(3):241\u2013254","journal-title":"Psychometrika"},{"key":"2593_CR28","doi-asserted-by":"publisher","first-page":"341","DOI":"10.1023\/A:1008202821328","volume":"11","author":"R Storn","year":"1997","unstructured":"Storn R, Price K (1997) Differential evolution-a simple and efficient heuristic for global optimization over continuous spaces. J Global Optim 11:341\u2013359","journal-title":"J Global Optim"},{"key":"2593_CR29","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"key":"2593_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.119735","volume":"221","author":"Q Dai","year":"2023","unstructured":"Dai Q, Liu J, Shi Y (2023) Class-overlap undersampling based on schur decomposition for class-imbalance problems. Expert Syst Appl 221:119735","journal-title":"Expert Syst Appl"},{"key":"2593_CR31","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.114301","volume":"168","author":"A Guzm\u00e1n-Ponce","year":"2021","unstructured":"Guzm\u00e1n-Ponce A, S\u00e1nchez JS, Valdovinos RM, Marcial-Romero JR (2021) Dbig-us: a two-stage under-sampling algorithm to face the class imbalance problem. Expert Syst Appl 168:114301","journal-title":"Expert Syst Appl"},{"key":"2593_CR32","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12864-019-6413-7","volume":"21","author":"D Chicco","year":"2020","unstructured":"Chicco D, Jurman G (2020) The advantages of the matthews correlation coefficient (mcc) over f1 score and accuracy in binary classification evaluation. BMC Genomics 21:1\u201313","journal-title":"BMC Genomics"},{"key":"2593_CR33","unstructured":"Drummond C, Holte RC, et al. (2003) C4. 5, class imbalance, and cost sensitivity: why under-sampling beats over-sampling. In: Workshop on Learning from Imbalanced Datasets II, vol. 11"},{"key":"2593_CR34","doi-asserted-by":"crossref","unstructured":"Han H, Wang W-Y, Mao B-H(2005) Borderline-smote: a new over-sampling method in imbalanced data sets learning. In: International Conference on Intelligent Computing, pp. 878\u2013887 . Springer","DOI":"10.1007\/11538059_91"},{"key":"2593_CR35","doi-asserted-by":"crossref","unstructured":"He H, Bai Y, Garcia EA, Li S (2008) Adasyn: Adaptive synthetic sampling approach for imbalanced learning. In: 2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence), pp. 1322\u20131328 . IEEE","DOI":"10.1109\/IJCNN.2008.4633969"},{"key":"2593_CR36","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1016\/j.neucom.2014.07.064","volume":"150","author":"J B\u0142aszczy\u0144ski","year":"2015","unstructured":"B\u0142aszczy\u0144ski J, Stefanowski J (2015) Neighbourhood sampling in bagging for imbalanced data. Neurocomputing 150:529\u2013542","journal-title":"Neurocomputing"},{"issue":"3","key":"2593_CR37","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TIT.1968.1054155","volume":"14","author":"P Hart","year":"1968","unstructured":"Hart P (1968) The condensed nearest neighbor rule (corresp.). IEEE Trans Inf Theory 14(3):515\u2013516","journal-title":"IEEE Trans Inf Theory"},{"key":"2593_CR38","unstructured":"Tomek I (1976) An experiment with the edited nearest-nieghbor rule"},{"key":"2593_CR39","doi-asserted-by":"publisher","first-page":"408","DOI":"10.1109\/TSMC.1972.4309137","volume":"3","author":"DL Wilson","year":"1972","unstructured":"Wilson DL (1972) Asymptotic properties of nearest neighbor rules using edited data. IEEE Trans Syst Man Cybern 3:408\u2013421","journal-title":"IEEE Trans Syst Man Cybern"},{"key":"2593_CR40","unstructured":"Kubat M, Matwin S (1997) Addressing the curse of imbalanced data sets: One-sided sampling. In: Proceedings of the Fourteenth International Conference on Machine Learning, pp. 179\u2013186"},{"key":"2593_CR41","doi-asserted-by":"crossref","unstructured":"Laurikkala J (2001) Improving identification of difficult small classes by balancing class distribution. In: Artificial Intelligence in Medicine: 8th Conference on Artificial Intelligence in Medicine in Europe, AIME 2001 Cascais, Portugal, July 1\u20134, 2001, Proceedings 8, pp. 63\u201366 . Springer","DOI":"10.1007\/3-540-48229-6_9"},{"key":"2593_CR42","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1007\/s10994-013-5422-z","volume":"95","author":"MR Smith","year":"2014","unstructured":"Smith MR, Martinez T, Giraud-Carrier C (2014) An instance level analysis of data complexity. Mach Learn 95:225\u2013256","journal-title":"Mach Learn"},{"key":"2593_CR43","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107056","volume":"223","author":"J Li","year":"2021","unstructured":"Li J, Zhu Q, Wu Q, Zhang Z, Gong Y, He Z, Zhu F (2021) Smote-nan-de: addressing the noisy and borderline examples problem in imbalanced classification by natural neighbors and differential evolution. Knowl-Based Syst 223:107056","journal-title":"Knowl-Based Syst"},{"key":"2593_CR44","doi-asserted-by":"crossref","unstructured":"Yoon K, Kwek S (2005) An unsupervised learning approach to resolving the data imbalanced issue in supervised learning problems in functional genomics. In: Fifth International Conference on Hybrid Intelligent Systems (HIS\u201905), p. 6 . IEEE","DOI":"10.1109\/ICHIS.2005.23"},{"key":"2593_CR45","doi-asserted-by":"publisher","first-page":"731","DOI":"10.1007\/978-3-540-37256-1_89","volume":"344","author":"S Yen","year":"2006","unstructured":"Yen S, Lee Y (2006) Under-sampling approaches for improving prediction of the minority class in an imbalanced dataset. Lecture Notes Control Inform Sci 344:731","journal-title":"Lecture Notes Control Inform Sci"},{"issue":"6","key":"2593_CR46","doi-asserted-by":"publisher","first-page":"66","DOI":"10.9790\/0661-1266673","volume":"12","author":"MR Longadge","year":"2013","unstructured":"Longadge MR, Dongre MSS, Malik L (2013) Multi-cluster based approach for skewed data in data mining. J Comput Eng (IOSR-JCE) 12(6):66\u201373","journal-title":"J Comput Eng (IOSR-JCE)"},{"key":"2593_CR47","unstructured":"Rahman MM, Davis D (2013) Cluster based under-sampling for unbalanced cardiovascular data. In: Proceedings of the World Congress on Engineering, vol. 3, pp. 3\u20135"},{"key":"2593_CR48","unstructured":"Barella VH, Costa EP, Carvalho A, Pl F (2014) Clusteross: a new undersampling method for imbalanced learning. In: Proc. of 3th Brazilian Conference on Intelligent Systems. Academic Press, pp. 1\u20136"},{"key":"2593_CR49","doi-asserted-by":"crossref","unstructured":"Sobhani P, Viktor H, Matwin S (2014) Learning from imbalanced data using ensemble methods and cluster-based undersampling. In: International Workshop on New Frontiers in Mining Complex Patterns, pp. 69\u201383 . Springer","DOI":"10.1007\/978-3-319-17876-9_5"},{"key":"2593_CR50","doi-asserted-by":"crossref","unstructured":"Chennuru VK, Timmappareddy SR (2017) Mahalcusfilter: a hybrid undersampling method to improve the minority classification rate of imbalanced datasets. In: Mining Intelligence and Knowledge Exploration: 5th International Conference, MIKE 2017, Hyderabad, India, December 13\u201315, 2017, Proceedings 5, pp. 43\u201353 . Springer","DOI":"10.1007\/978-3-319-71928-3_5"},{"key":"2593_CR51","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1016\/j.neucom.2017.03.011","volume":"243","author":"N Ofek","year":"2017","unstructured":"Ofek N, Rokach L, Stern R, Shabtai A (2017) Fast-cbus: a fast clustering-based undersampling method for addressing the class imbalance problem. Neurocomputing 243:88\u2013102","journal-title":"Neurocomputing"},{"issue":"3","key":"2593_CR52","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"AK Jain","year":"1999","unstructured":"Jain AK, Murty MN, Flynn PJ (1999) Data clustering: a review. ACM Comput Surv (CSUR) 31(3):264\u2013323","journal-title":"ACM Comput Surv (CSUR)"},{"issue":"1","key":"2593_CR53","first-page":"100","volume":"28","author":"JA Hartigan","year":"1979","unstructured":"Hartigan JA, Wong MA (1979) Algorithm as 136: a k-means clustering algorithm. J R Stat Soc series c (appl stat) 28(1):100\u2013108","journal-title":"J R Stat Soc series c (appl stat)"},{"key":"2593_CR54","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109404","volume":"139","author":"H Hu","year":"2023","unstructured":"Hu H, Liu J, Zhang X, Fang M (2023) An effective and adaptable k-means algorithm for big data cluster analysis. Pattern Recogn 139:109404","journal-title":"Pattern Recogn"},{"key":"2593_CR55","doi-asserted-by":"publisher","first-page":"178","DOI":"10.1016\/j.ins.2022.11.139","volume":"622","author":"AM Ikotun","year":"2023","unstructured":"Ikotun AM, Ezugwu AE, Abualigah L, Abuhaija B, Heming J (2023) K-means clustering algorithms: a comprehensive review, variants analysis, and advances in the era of big data. Inf Sci 622:178\u2013210","journal-title":"Inf Sci"},{"issue":"2","key":"2593_CR56","first-page":"539","volume":"39","author":"X-Y Liu","year":"2008","unstructured":"Liu X-Y, Wu J, Zhou Z-H (2008) Exploratory undersampling for class-imbalance learning. IEEE Trans Syst Man Cybern Part B (Cybern) 39(2):539\u2013550","journal-title":"IEEE Trans Syst Man Cybern Part B (Cybern)"},{"issue":"6","key":"2593_CR57","doi-asserted-by":"publisher","first-page":"757","DOI":"10.1109\/TSE.2012.70","volume":"39","author":"Y Kamei","year":"2012","unstructured":"Kamei Y, Shihab E, Adams B, Hassan AE, Mockus A, Sinha A, Ubayashi N (2012) A large-scale empirical study of just-in-time quality assurance. IEEE Trans Software Eng 39(6):757\u2013773","journal-title":"IEEE Trans Software Eng"},{"issue":"1","key":"2593_CR58","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1109\/TR.2019.2931559","volume":"69","author":"X Yu","year":"2019","unstructured":"Yu X, Liu J, Keung JW, Li Q, Bennin KE, Xu Z, Wang J, Cui X (2019) Improving ranking-oriented defect prediction using a cost-sensitive ranking svm. IEEE Trans Reliab 69(1):139\u2013153","journal-title":"IEEE Trans Reliab"},{"issue":"1","key":"2593_CR59","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1109\/TR.2014.2370891","volume":"64","author":"X Yang","year":"2014","unstructured":"Yang X, Tang K, Yao X (2014) A learning-to-rank approach to software defect prediction. IEEE Trans Reliab 64(1):234\u2013246","journal-title":"IEEE Trans Reliab"},{"issue":"12","key":"2593_CR60","doi-asserted-by":"publisher","first-page":"1253","DOI":"10.1109\/TSE.2018.2836442","volume":"45","author":"Q Song","year":"2018","unstructured":"Song Q, Guo Y, Shepperd M (2018) A comprehensive investigation of the role of imbalanced learning for software defect prediction. IEEE Trans Softw Eng 45(12):1253\u20131269","journal-title":"IEEE Trans Softw Eng"},{"key":"2593_CR61","first-page":"255","volume":"17","author":"J Derrac","year":"2015","unstructured":"Derrac J, Garcia S, Sanchez L, Herrera F (2015) Keel data-mining software tool: data set repository, integration of algorithms and experimental analysis framework. J Mult Valued Logic Soft Comput 17:255\u2013287","journal-title":"J Mult Valued Logic Soft Comput"},{"issue":"9","key":"2593_CR62","doi-asserted-by":"publisher","first-page":"1208","DOI":"10.1109\/TSE.2013.11","volume":"39","author":"M Shepperd","year":"2013","unstructured":"Shepperd M, Song Q, Sun Z, Mair C (2013) Data quality: some comments on the nasa software defect datasets. IEEE Trans Softw Eng 39(9):1208\u20131215","journal-title":"IEEE Trans Softw Eng"},{"key":"2593_CR63","doi-asserted-by":"crossref","unstructured":"Wu R, Zhang H, Kim S, Cheung S-C (2011) Relink: recovering links between bugs and changes. In: Proceedings of the 19th ACM SIGSOFT Symposium and the 13th European Conference on Foundations of Software Engineering, pp. 15\u201325","DOI":"10.1145\/2025113.2025120"},{"key":"2593_CR64","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V et al (2011) Scikit-learn: machine learning in python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"2593_CR65","doi-asserted-by":"crossref","unstructured":"Rey D, Neuh\u00e4user M (2011) Wilcoxon-signed-rank test. International encyclopedia of statistical science, 1658\u20131659","DOI":"10.1007\/978-3-642-04898-2_616"},{"issue":"2","key":"2593_CR66","doi-asserted-by":"publisher","first-page":"545","DOI":"10.11144\/Javeriana.upsy10-2.cdcp","volume":"10","author":"G Macbeth","year":"2011","unstructured":"Macbeth G, Razumiejczyk E, Ledesma RD (2011) Cliff\u2019s delta calculator: a non-parametric effect size program for two groups of observations. Universitas Psychologica 10(2):545\u2013555","journal-title":"Universitas Psychologica"},{"issue":"11\u201312","key":"2593_CR67","doi-asserted-by":"publisher","first-page":"1073","DOI":"10.1016\/j.infsof.2007.02.015","volume":"49","author":"VB Kampenes","year":"2007","unstructured":"Kampenes VB, Dyb\u00e5 T, Hannay JE, Sj\u00f8berg DI (2007) A systematic review of effect size in software engineering experiments. Inf Softw Technol 49(11\u201312):1073\u20131086","journal-title":"Inf Softw Technol"},{"issue":"11","key":"2593_CR68","doi-asserted-by":"publisher","first-page":"1091","DOI":"10.1109\/TSE.2017.2748129","volume":"43","author":"S Herbold","year":"2017","unstructured":"Herbold S (2017) Comments on scottknottesd in response to \u201can empirical comparison of model validation techniques for defect prediction models\u2019\u2019. IEEE Trans Softw Eng 43(11):1091\u20131094","journal-title":"IEEE Trans Softw Eng"},{"key":"2593_CR69","doi-asserted-by":"crossref","unstructured":"Feng S, Keung J, Liu J, Xiao Y, Yu X, Zhang M (2021) Roct: Radius-based class overlap cleaning technique to alleviate the class overlap problem in software defect prediction. In: 2021 IEEE 45th Annual Computers, Software, and Applications Conference (COMPSAC), pp. 228\u2013237 . IEEE","DOI":"10.1109\/COMPSAC51774.2021.00041"},{"issue":"1","key":"2593_CR70","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1002\/(SICI)1097-4571(199401)45:1<12::AID-ASI2>3.0.CO;2-L","volume":"45","author":"M Buckland","year":"1994","unstructured":"Buckland M, Gey F (1994) The relationship between recall and precision. J Am Soc Inf Sci 45(1):12\u201319","journal-title":"J Am Soc Inf Sci"},{"issue":"15","key":"2593_CR71","doi-asserted-by":"publisher","first-page":"3213","DOI":"10.3390\/electronics12153213","volume":"12","author":"L Yin","year":"2023","unstructured":"Yin L, Hu H, Li K, Zheng G, Qu Y, Chen H (2023) Improvement of dbscan algorithm based on k-dist graph for adaptive determining parameters. Electronics 12(15):3213","journal-title":"Electronics"},{"key":"2593_CR72","doi-asserted-by":"crossref","unstructured":"Kennedy J, Eberhart R (1995) Particle swarm optimization. In: Proceedings of ICNN\u201995-international Conference on Neural Networks, vol. 4, pp. 1942\u20131948 . IEEE","DOI":"10.1109\/ICNN.1995.488968"},{"key":"2593_CR73","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.advengsoft.2013.12.007","volume":"69","author":"S Mirjalili","year":"2014","unstructured":"Mirjalili S, Mirjalili SM, Lewis A (2014) Grey wolf optimizer. Adv Eng Softw 69:46\u201361","journal-title":"Adv Eng Softw"},{"key":"2593_CR74","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1016\/j.advengsoft.2016.01.008","volume":"95","author":"S Mirjalili","year":"2016","unstructured":"Mirjalili S, Lewis A (2016) The whale optimization algorithm. Adv Eng Softw 95:51\u201367","journal-title":"Adv Eng Softw"},{"issue":"2","key":"2593_CR75","doi-asserted-by":"publisher","first-page":"2321","DOI":"10.1109\/TSG.2023.3305326","volume":"15","author":"Z Chen","year":"2024","unstructured":"Chen Z, Wang J, Han Q (2024) Receding-horizon chiller operation planning via collaborative neurodynamic optimization. IEEE Trans Smart Grid 15(2):2321\u20132331","journal-title":"IEEE Trans Smart Grid"},{"issue":"3","key":"2593_CR76","doi-asserted-by":"publisher","first-page":"2186","DOI":"10.1109\/TAP.2019.2938703","volume":"68","author":"X Li","year":"2019","unstructured":"Li X, Luk KM (2019) The grey wolf optimizer and its applications in electromagnetics. IEEE Trans Antennas Propag 68(3):2186\u20132197","journal-title":"IEEE Trans Antennas Propag"},{"key":"2593_CR77","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.113917","volume":"166","author":"MH Nadimi-Shahraki","year":"2021","unstructured":"Nadimi-Shahraki MH, Taghian S, Mirjalili S (2021) An improved grey wolf optimizer for solving engineering problems. Expert Syst Appl 166:113917","journal-title":"Expert Syst Appl"},{"key":"2593_CR78","doi-asserted-by":"publisher","DOI":"10.1016\/j.enconman.2020.113661","volume":"228","author":"Y Song","year":"2021","unstructured":"Song Y, Wu D, Deng W, Gao X-Z, Li T, Zhang B, Li Y (2021) Mppcede: multi-population parallel co-evolutionary differential evolution for parameter optimization. Energy Convers Manage 228:113661","journal-title":"Energy Convers Manage"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-025-02593-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10115-025-02593-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-025-02593-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T06:03:16Z","timestamp":1763704996000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10115-025-02593-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,29]]},"references-count":78,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["2593"],"URL":"https:\/\/doi.org\/10.1007\/s10115-025-02593-1","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"type":"print","value":"0219-1377"},{"type":"electronic","value":"0219-3116"}],"subject":[],"published":{"date-parts":[[2025,9,29]]},"assertion":[{"value":"20 February 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 July 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 September 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 September 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no Conflict of interest relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to participate"}},{"value":"Not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}]}}