{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T09:09:34Z","timestamp":1778663374434,"version":"3.51.4"},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T00:00:00Z","timestamp":1778630400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T00:00:00Z","timestamp":1778630400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Innovations Syst Softw Eng"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s11334-026-00638-4","type":"journal-article","created":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T08:15:29Z","timestamp":1778660129000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Evaluating the indispensable aspect of data \u0131mbalance in software fault prediction with feature selection and variants of machine learning and ensemble techniques"],"prefix":"10.1007","volume":"22","author":[{"given":"Kulamala Vinod","family":"Kumar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Durga Prasad","family":"Mohapatra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lov","family":"Kumar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,5,13]]},"reference":[{"key":"638_CR1","doi-asserted-by":"crossref","unstructured":"Ahmed MR, Ali AM, Ahmed N, Zamal MFB and Shamrat FMJM (2021) The impact of software fault prediction in real-world application: an automated approach for software engineering. In: Proceedings of 2020 the 6th international conference on computing and data engineering, 247\u2013251","DOI":"10.1145\/3379247.3379278"},{"key":"638_CR2","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2022.107886","volume":"100","author":"I Batool","year":"2022","unstructured":"Batool I, Khan TA (2022) Software fault prediction using data mining, machine learning and deep learning techniques: a systematic literature review. Comput Electr Eng 100:107886","journal-title":"Comput Electr Eng"},{"key":"638_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.114595","volume":"172","author":"AK Pandey","year":"2021","unstructured":"Pandey AK, Mishra RB, Tripathi AK (2021) Machine learning based methods for software fault prediction: a survey. Expert Syst Appl 172:114595","journal-title":"Expert Syst Appl"},{"key":"638_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2020.106287","volume":"122","author":"N Li","year":"2022","unstructured":"Li N, Shepperd M, Guo Y (2022) A systematic review of unsupervised learning techniques for software defect prediction. Inf Softw Technol 122:106287","journal-title":"Inf Softw Technol"},{"issue":"2","key":"638_CR5","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1007\/s11334-021-00390-x","volume":"18","author":"M Mangla","year":"2022","unstructured":"Mangla M, Sharma N, Mohanty SN (2022) A sequential ensemble model for software fault prediction. Innov Syst Softw Eng 18(2):301\u2013308","journal-title":"Innov Syst Softw Eng"},{"issue":"2","key":"638_CR6","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1007\/s10462-017-9563-5","volume":"51","author":"SS Rathore","year":"2019","unstructured":"Rathore SS, Kumar S (2019) A study on software fault prediction techniques. Artif Intell Rev 51(2):255\u2013327","journal-title":"Artif Intell Rev"},{"key":"638_CR7","doi-asserted-by":"publisher","first-page":"693","DOI":"10.4018\/978-1-7998-9158-1.ch036","volume-title":"Research anthology on usage and development of open source software","author":"W Rhmann","year":"2021","unstructured":"Rhmann W, Ansari GA (2021) Ensemble techniques-based software fault prediction in an open-source project. Research anthology on usage and development of open source software. IGI Global, pp 693\u2013709"},{"key":"638_CR8","unstructured":"Sahu SP, Reddy BR, Mukherjee D, Shyamla DM, Verma BS (2021) A hybrid approach to software fault prediction using genetic programming and ensemble learning methods. Int J Syst Assurance Eng Manag 1\u201315"},{"key":"638_CR9","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1007\/978-981-10-5547-8_56","volume-title":"Smart computing and informatics","author":"D Sharma","year":"2018","unstructured":"Sharma D, Chandra P (2018) Software fault prediction using machine learning techniques. Smart computing and informatics. Springer, pp 541\u2013549"},{"issue":"1","key":"638_CR10","first-page":"37","volume":"11","author":"D Sharma","year":"2019","unstructured":"Sharma D, Chandra P (2019) A comparative analysis of soft computing techniques in software fault prediction model development. Int J Inf Technol 11(1):37\u201346","journal-title":"Int J Inf Technol"},{"issue":"2","key":"638_CR11","doi-asserted-by":"publisher","DOI":"10.3390\/sym11020212","volume":"11","author":"LH Son","year":"2019","unstructured":"Son LH, Pritam N, Khari M, Kumar R, Phuong PTM, Thong PH (2019) Empirical study of software defect prediction: a systematic mapping. Symmetry Basel 11(2):212","journal-title":"Symmetry Basel"},{"issue":"1","key":"638_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10515-021-00311-z","volume":"29","author":"A Balaram","year":"2022","unstructured":"Balaram A, Vasundra S (2022) Prediction of software fault-prone classes using ensemble random forest with adaptive synthetic sampling algorithm. Autom Softw Eng 29(1):1\u201321","journal-title":"Autom Softw Eng"},{"issue":"2","key":"638_CR13","doi-asserted-by":"publisher","first-page":"515","DOI":"10.2298\/CSIS180312039B","volume":"16","author":"E Borandag","year":"2019","unstructured":"Borandag E, Ozcift A, Kilinc D, Yucalar F (2019) Majority vote feature selection algorithm in software fault prediction. Comput Sci Inf Syst 16(2):515\u2013539","journal-title":"Comput Sci Inf Syst"},{"issue":"6","key":"638_CR14","first-page":"2185","volume":"13","author":"S Goyal","year":"2021","unstructured":"Goyal S, Bhatia PK (2021) Software fault prediction using lion optimization algorithm. Int J Inf Technol 13(6):2185\u20132190","journal-title":"Int J Inf Technol"},{"issue":"27","key":"638_CR15","first-page":"42","volume":"122","author":"H Turabieh","year":"2019","unstructured":"Turabieh H, Mafarja M, Li X (2019) Iterated feature selection algorithms with layered recurrent neural network for software fault prediction. Expert Syst Appl 122(27):42","journal-title":"Expert Syst Appl"},{"key":"638_CR16","doi-asserted-by":"crossref","unstructured":"Tran HD, Thi My Hanh LE, Binh NT (2019) Combining feature selection, feature learning and ensemble learning for software fault prediction. In: 2019 11th International Conference on Knowledge and Systems Engineering (KSE), pages 1\u20138. IEEE","DOI":"10.1109\/KSE.2019.8919292"},{"key":"638_CR17","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2021.111026","volume":"180","author":"K Zhu","year":"2021","unstructured":"Zhu K, Ying S, Zhang N, Zhu D (2021) Software defect prediction based on enhanced metaheuristic feature selection optimization and a hybrid deep neural network. J Syst Softw 180:111026","journal-title":"J Syst Softw"},{"key":"638_CR18","doi-asserted-by":"crossref","unstructured":"Abaei G, Tah WZ, Toh ZJW, Hor ESJ (2022) Improving software fault prediction in imbalanced datasets using the under-sampling approach: In: 2022 11th International Conference on Software and Computer Applications, 41\u201347","DOI":"10.1145\/3524304.3524310"},{"key":"638_CR19","doi-asserted-by":"crossref","unstructured":"Agrawal A, Menzies T (2018) Is better data better than better data miners?: on the benefits of tuning smote for defect prediction: In: ACM Proceedings of the 40th International Conference on Software engineering, 1050\u20131061","DOI":"10.1145\/3180155.3180197"},{"key":"638_CR20","doi-asserted-by":"publisher","DOI":"10.1109\/TR.2022.3158949","author":"SS Rathore","year":"2022","unstructured":"Rathore SS, Chouhary SS, Jain DK, Vachhani AG (2022) Generative oversampling methods for handling imbalanced data in software fault prediction. IEEE Trans Reliab. https:\/\/doi.org\/10.1109\/TR.2022.3158949","journal-title":"IEEE Trans Reliab"},{"issue":"12","key":"638_CR21","doi-asserted-by":"publisher","first-page":"1253","DOI":"10.1109\/TSE.2018.2836442","volume":"45","author":"Q Song","year":"2019","unstructured":"Song Q, Guo Y, Shepperd M (2019) A comprehensive investigation of the role of imbalanced learning for software defect prediction. IEEE Trans Softw Eng 45(12):1253\u20131269","journal-title":"IEEE Trans Softw Eng"},{"key":"638_CR22","doi-asserted-by":"crossref","unstructured":"Nam J, Kim S (2015) CLAMI: Defect Prediction on Unlabeled Datasets (T):30th IEEE\/ACM International Conference on Automated Software Engineering (ASE), Lincoln, NE, USA, 452\u2013463","DOI":"10.1109\/ASE.2015.56"},{"key":"638_CR23","doi-asserted-by":"crossref","unstructured":"Kumar L,\u00a0Sureka A (2018) Feature selection techniques to counter class imbalance problem for aging related bug prediction:\u00a0aging related bug prediction. ISEC '18: Proceedings of the 11th Innovations in Software Engineering Conference, 2:1\u00a0\u2013\u00a011","DOI":"10.1145\/3172871.3172872"},{"key":"638_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2021.106662","volume":"139","author":"S Feng","year":"2021","unstructured":"Feng S, Keung J, Yu X, Xiao Y, Zhang M (2021) Investigation on the stability of SMOTE-based oversampling techniques in software defect prediction. Inf Softw Technol 139:106662","journal-title":"Inf Softw Technol"},{"key":"638_CR25","doi-asserted-by":"publisher","first-page":"16896","DOI":"10.1109\/ACCESS.2025.3532250","volume":"13","author":"SR Goyal","year":"2025","unstructured":"Goyal SR (2025) Current trends in class imbalance learning for software defect prediction. IEEE Access 13:16896\u201317917","journal-title":"IEEE Access"},{"key":"638_CR26","doi-asserted-by":"publisher","first-page":"1815","DOI":"10.1016\/j.procs.2023.01.159","volume":"218","author":"S Pandey","year":"2023","unstructured":"Pandey S, Kumar K (2023) Software fault prediction for imbalanced data: a survey on recent developments. Procedia Comput Sci 218:1815\u20131824","journal-title":"Procedia Comput Sci"},{"issue":"3","key":"638_CR27","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1007\/s11334-022-00457-3","volume":"19","author":"TR Benala","year":"2023","unstructured":"Benala TR, Tantati K (2023) Efficiency of oversampling methods for enhancing software defect prediction by using imbalanced data. Innov Syst Softw Eng 19(3):247\u2013263","journal-title":"Innov Syst Softw Eng"}],"container-title":["Innovations in Systems and Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11334-026-00638-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11334-026-00638-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11334-026-00638-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T08:15:38Z","timestamp":1778660138000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11334-026-00638-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,5,13]]},"references-count":27,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["638"],"URL":"https:\/\/doi.org\/10.1007\/s11334-026-00638-4","relation":{},"ISSN":["1614-5046","1614-5054"],"issn-type":[{"value":"1614-5046","type":"print"},{"value":"1614-5054","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,5,13]]},"assertion":[{"value":"19 May 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 April 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 May 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"11"}}