{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,9]],"date-time":"2026-04-09T00:29:30Z","timestamp":1775694570804,"version":"3.50.1"},"reference-count":111,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2025,5,16]],"date-time":"2025-05-16T00:00:00Z","timestamp":1747353600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,5,16]],"date-time":"2025-05-16T00:00:00Z","timestamp":1747353600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62202350"],"award-info":[{"award-number":["62202350"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"the Start-up Grant from Wuhan University of Technology","award":["104-40120693"],"award-info":[{"award-number":["104-40120693"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Autom Softw Eng"],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1007\/s10515-025-00524-6","type":"journal-article","created":{"date-parts":[[2025,5,15]],"date-time":"2025-05-15T21:30:59Z","timestamp":1747344659000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["The impact of feature selection and feature reduction techniques for code smell detection: A comprehensive empirical study"],"prefix":"10.1007","volume":"32","author":[{"given":"Zexian","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lin","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuang","family":"Yin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenhua","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shan","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haoxuan","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fuyang","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,16]]},"reference":[{"issue":"4","key":"524_CR1","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1002\/wics.101","volume":"2","author":"H Abdi","year":"2010","unstructured":"Abdi, H., Williams, L.J.: Principal component analysis. Wiley. Interdiscip. Rev. Comp. stat. 2(4), 433\u2013459 (2010)","journal-title":"Wiley. Interdiscip. Rev. Comp. stat."},{"issue":"7","key":"524_CR2","doi-asserted-by":"crossref","first-page":"1159","DOI":"10.1080\/09720510.2020.1799576","volume":"23","author":"M Agnihotri","year":"2020","unstructured":"Agnihotri, M., Chug, A.: Application of machine learning algorithms for code smell prediction using object-oriented software metrics. JSMS 23(7), 1159\u20131171 (2020)","journal-title":"JSMS"},{"issue":"1","key":"524_CR3","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1016\/j.patrec.2004.08.015","volume":"26","author":"A Ahmad","year":"2005","unstructured":"Ahmad, A., Dey, L.: A feature selection technique for classificatory analysis. Patt. Recognit. Lett. 26(1), 43\u201356 (2005)","journal-title":"Patt. Recognit. Lett."},{"key":"524_CR4","doi-asserted-by":"crossref","DOI":"10.1016\/j.infsof.2021.106648","volume":"138","author":"A Alazba","year":"2021","unstructured":"Alazba, A., Aljamaan, H.: Code smell detection using feature selection and stacking ensemble: An empirical investigation. Inf. Softw. Technol. 138, 106648 (2021)","journal-title":"Inf. Softw. Technol."},{"issue":"1","key":"524_CR5","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1007\/s10515-024-00429-w","volume":"31","author":"A Alazba","year":"2024","unstructured":"Alazba, A., Aljamaan, H., Alshayeb, M.: Automated detection of class diagram smells using self-supervised learning. Automated Software Engineering 31(1), 29 (2024)","journal-title":"Automated Software Engineering"},{"key":"524_CR6","doi-asserted-by":"crossref","unstructured":"Aljamaan, H.: Voting heterogeneous ensemble for code smell detection. In: 2021 20th IEEE international conference on machine learning and applications, pp. 897\u2013902 (2021)","DOI":"10.1109\/ICMLA52953.2021.00148"},{"key":"524_CR7","first-page":"1069","volume":"27","author":"K Alkharabsheh","year":"2019","unstructured":"Alkharabsheh, K., Crespo, Y., Manso, E., Taboada, J.A.: Software design smell detection: a systematic mapping study. SQJ 27, 1069\u20131148 (2019)","journal-title":"SQJ"},{"key":"524_CR8","doi-asserted-by":"crossref","unstructured":"Alkharabsheh, K., et al.: A comparison of machine learning algorithms on design smell detection using balanced and imbalanced dataset: A study of god class. Inf. Softw. Technol. 143, 106736 (2022)","DOI":"10.1016\/j.infsof.2021.106736"},{"issue":"1","key":"524_CR9","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1007\/s10586-024-04724-9","volume":"28","author":"K Alkharabsheh","year":"2025","unstructured":"Alkharabsheh, K., Alawadi, S., Crespo, Y., Taboada, J.A.: Exploring the role of project status information in effective code smell detection. Clust. Comput. 28(1), 29 (2025)","journal-title":"Clust. Comput."},{"key":"524_CR10","doi-asserted-by":"crossref","unstructured":"Amorim, L., Costa, E., Antunes, N., al., F.: Experience report: Evaluating the effectiveness of decision trees for detecting code smells. In: ISSRE 2015, pp. 261\u2013269. IEEE (2015)","DOI":"10.1109\/ISSRE.2015.7381819"},{"key":"524_CR11","doi-asserted-by":"crossref","DOI":"10.1016\/j.cosrev.2021.100378","volume":"40","author":"F Anowar","year":"2021","unstructured":"Anowar, F., Sadaoui, S., Selim, B.: Conceptual and empirical comparison of dimensionality reduction algorithms (pca, kpca, lda, mds, svd, lle, isomap, le, ica, t-sne). Comput. Sci. Rev. 40, 100378 (2021)","journal-title":"Comput. Sci. Rev."},{"key":"524_CR12","doi-asserted-by":"crossref","unstructured":"Arcelli\u00a0Fontana, F., M\u00e4ntyl\u00e4, M.V., al., Z.: Comparing and experimenting machine learning techniques for code smell detection. Empir. Softw. Eng. 21(3), 1143\u20131191 (2016)","DOI":"10.1007\/s10664-015-9378-4"},{"key":"524_CR13","doi-asserted-by":"crossref","unstructured":"Azeem, M.I., Palomba, F., al.: Machine learning techniques for code smell detection: A systematic literature review and meta-analysis. Inf. Softw. Technol. 108, 115\u2013138 (2019)","DOI":"10.1016\/j.infsof.2018.12.009"},{"issue":"3","key":"524_CR14","first-page":"419","volume":"54","author":"MI Azeem","year":"2024","unstructured":"Azeem, M.I., Shafiq, S., Mashkoor, A., Egyed, A.: Code smells in pull requests: An exploratory study. SPE 54(3), 419\u2013436 (2024)","journal-title":"SPE"},{"key":"524_CR15","unstructured":"Bergstra, J., Bengio, Y.: Random search for hyper-parameter optimization. J. Mach. Learn. Res. 13(2) (2012)"},{"key":"524_CR16","doi-asserted-by":"crossref","unstructured":"Bertolino, A.: Software testing research: Achievements, challenges, dreams. In: Future of software engineering, pp. 85\u2013103. IEEE (2007)","DOI":"10.1109\/FOSE.2007.25"},{"key":"524_CR17","doi-asserted-by":"crossref","unstructured":"Boutaib, S., Elarbi, M., Bechikh, S., Palomba, F., Said, L.B.: A possibilistic evolutionary approach to handle the uncertainty of software metrics thresholds in code smells detection. In: 2021 IEEE 21st international conference on software quality, reliability and security, pp. 574\u2013585. IEEE (2021)","DOI":"10.1109\/QRS54544.2021.00068"},{"key":"524_CR18","doi-asserted-by":"crossref","unstructured":"Bryton, S., Abreu, F.B., Monteiro, M.: Reducing subjectivity in code smells detection: Experimenting with the long method. In: 2010 7th international conference on the quality of information and communications technology, pp. 337\u2013342. IEEE, (2010)","DOI":"10.1109\/QUATIC.2010.60"},{"key":"524_CR19","doi-asserted-by":"crossref","unstructured":"Carroll, J.D., Arabie, P.: Multidimensional scaling. Measurement, judgment and decision making, 179\u2013250 (1998)","DOI":"10.1016\/B978-012099975-0.50005-1"},{"key":"524_CR20","doi-asserted-by":"crossref","unstructured":"Charalampidou, S., Ampatzoglou, A., Avgeriou, P.: Size and cohesion metrics as indicators of the long method bad smell: An empirical study. In: Proceedings of the 11th international conference on predictive models and data analytics in software engineering, pp. 1\u201310 (2015)","DOI":"10.1145\/2810146.2810155"},{"issue":"1","key":"524_CR21","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1049\/sfw2.12006","volume":"15","author":"X Chen","year":"2021","unstructured":"Chen, X., Yuan, Z., Cui, Z., Zhang, D., Ju, X.: Empirical studies on the impact of filter-based ranking feature selection on security vulnerability prediction. IET Software 15(1), 75\u201389 (2021)","journal-title":"IET Software"},{"key":"524_CR22","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s10515-021-00297-8","volume":"28","author":"M Chouchane","year":"2021","unstructured":"Chouchane, M., Soui, M., Ghedira, K.: The impact of the code smells of the presentation layer on the diffuseness of aesthetic defects of android apps. Autom. Softw. Eng. 28, 1\u201329 (2021)","journal-title":"Autom. Softw. Eng."},{"key":"524_CR23","unstructured":"Cover, T.M., Thomas, J.A.: Elements of information theory (1991)"},{"issue":"1","key":"524_CR24","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","volume":"13","author":"T Cover","year":"1967","unstructured":"Cover, T., Hart, P.: Nearest neighbor pattern classification. IEEE Trans. Inf. Theory 13(1), 21\u201327 (1967)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"524_CR25","unstructured":"Cristianini, N., Shawe-Taylor, J., et\u00a0al.: An introduction to support vector machines. Cambridge University (2000)"},{"key":"524_CR26","doi-asserted-by":"crossref","unstructured":"Dash, M., Liu, H., Motoda, H.: Consistency based feature selection. In: Pacific-Asia Conference on Knowledge Discovery and Data Mining, pp. 98\u2013109. Springer (2000)","DOI":"10.1007\/3-540-45571-X_12"},{"key":"524_CR27","doi-asserted-by":"crossref","unstructured":"De\u00a0Stefano, M., Pecorelli, F., Palomba, F., De\u00a0Lucia, A.: Comparing within-and cross-project machine learning algorithms for code smell detection. In: Proceedings of the 5th international workshop on machine learning techniques for software quality evolution, pp. 1\u20136 (2021)","DOI":"10.1145\/3472674.3473978"},{"key":"524_CR28","doi-asserted-by":"crossref","unstructured":"Dewangan, S., Rao, R.S.: Code smell detection using classification approaches. ICMIB 2021 431, 257 (2022)","DOI":"10.1007\/978-981-19-0901-6_25"},{"key":"524_CR29","doi-asserted-by":"crossref","first-page":"162869","DOI":"10.1109\/ACCESS.2021.3133810","volume":"9","author":"S Dewangan","year":"2021","unstructured":"Dewangan, S., Rao, R.S., Mishra, A., Gupta, M.: A novel approach for code smell detection: an empirical study. IEEE Access 9, 162869\u2013162883 (2021)","journal-title":"IEEE Access"},{"key":"524_CR30","doi-asserted-by":"crossref","unstructured":"Dewangan, S., et al.: Severity classification of code smells using machine-learning methods. SN Comput. Sci. 4(5), 564 (2023)","DOI":"10.1007\/s42979-023-01979-8"},{"key":"524_CR31","doi-asserted-by":"crossref","unstructured":"Di\u00a0Nucci, D., Palomba, F., Tamburri, D.A., Serebrenik, A., De\u00a0Lucia, A.: Detecting code smells using machine learning techniques: are we there yet? In: 2018 IEEE 25th international conference on software analysis, evolution and reengineering, pp. 612\u2013621. IEEE (2018)","DOI":"10.1109\/SANER.2018.8330266"},{"issue":"7","key":"524_CR32","doi-asserted-by":"crossref","first-page":"1895","DOI":"10.1162\/089976698300017197","volume":"10","author":"TG Dietterich","year":"1998","unstructured":"Dietterich, T.G.: Approximate statistical tests for comparing supervised classification learning algorithms. Neural Comput. 10(7), 1895\u20131923 (1998)","journal-title":"Neural Comput."},{"key":"524_CR33","doi-asserted-by":"crossref","unstructured":"Fong, S., Liang, J., Wong, R., Ghanavati, M.: A novel feature selection by clustering coefficients of variations. In: 9th international conference on digital information management, pp. 205\u2013213. IEEE (2014)","DOI":"10.1109\/ICDIM.2014.6991429"},{"key":"524_CR34","doi-asserted-by":"crossref","unstructured":"Fontana, F.A., Zanoni, M., Marino, A., M\u00e4ntyl\u00e4, M.V.: Code smell detection: Towards a machine learning-based approach. In: 2013 IEEE international conference on software maintenance, pp. 396\u2013399 (2013)","DOI":"10.1109\/ICSM.2013.56"},{"key":"524_CR35","doi-asserted-by":"crossref","unstructured":"Fontana, F.A., Zanoni, M.: Code smell severity classification using machine learning techniques. Knowl.-Based Syst. 128, 43\u201358 (2017)","DOI":"10.1016\/j.knosys.2017.04.014"},{"key":"524_CR36","doi-asserted-by":"crossref","unstructured":"Ghotra, B., McIntosh, S., Hassan, A.E.: A large-scale study of the impact of feature selection techniques on defect classification models. In: 2017 IEEE\/ACM 14th international conference on mining software repositories (MSR), pp. 146\u2013157. IEEE (2017)","DOI":"10.1109\/MSR.2017.18"},{"key":"524_CR37","doi-asserted-by":"crossref","unstructured":"Gong, L., Jiang, S., Wang, R., Jiang, L.: Empirical evaluation of the impact of class overlap on software defect prediction. In: 2019 34th IEEE\/ACM international conference on automated software engineering (ASE), pp. 698\u2013709. IEEE (2019)","DOI":"10.1109\/ASE.2019.00071"},{"key":"524_CR38","unstructured":"Gu, Q., Li, Z., Han, J.: Generalized fisher score for feature selection. (2012). arXiv preprint arXiv:1202.3725"},{"key":"524_CR39","first-page":"1063","volume":"28","author":"T Guggulothu","year":"2020","unstructured":"Guggulothu, T., Moiz, S.A.: Code smell detection using multi-label classification approach. SQJ 28, 1063\u20131086 (2020)","journal-title":"SQJ"},{"key":"524_CR40","doi-asserted-by":"crossref","unstructured":"Gupta, H., Kulkarni, T.G., Kumar, L., Neti, L.B.M., Krishna, A.: An empirical study on predictability of software code smell using deep learning models. In: International conference on advanced information networking and applications, pp. 120\u2013132. Springer (2021)","DOI":"10.1007\/978-3-030-75075-6_10"},{"key":"524_CR41","unstructured":"Guyon, I., Elisseeff, A.: An introduction to variable and feature selection. J. Mach. Learn. Res. 3(Mar), 1157\u20131182 (2003)"},{"issue":"1","key":"524_CR42","doi-asserted-by":"crossref","first-page":"389","DOI":"10.1023\/A:1012487302797","volume":"46","author":"I Guyon","year":"2002","unstructured":"Guyon, I., et al.: Gene selection for cancer classification using support vector machines. Mach. Learn. 46(1), 389\u2013422 (2002)","journal-title":"Mach. Learn."},{"key":"524_CR43","unstructured":"Hall, M.A.: Correlation-based feature selection for discrete and numeric class machine learning. In: Proceedings of the 17th international conference on machine learning, pp. 359\u2013366 (2000)"},{"issue":"3","key":"524_CR44","doi-asserted-by":"crossref","first-page":"863","DOI":"10.1016\/j.patcog.2006.07.009","volume":"40","author":"H Hoffmann","year":"2007","unstructured":"Hoffmann, H.: Kernel pca for novelty detection. Patt. Recognit. 40(3), 863\u2013874 (2007)","journal-title":"Patt. Recognit."},{"issue":"1","key":"524_CR45","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1023\/A:1022631118932","volume":"11","author":"RC Holte","year":"1993","unstructured":"Holte, R.C.: Very simple classification rules perform well on most commonly used datasets. Mach. Learn. 11(1), 63\u201390 (1993)","journal-title":"Mach. Learn."},{"key":"524_CR46","doi-asserted-by":"crossref","unstructured":"Hozano, M., Antunes, N., Fonseca, B., Costa, E.: Evaluating the accuracy of machine learning algorithms on detecting code smells for different developers. In: ICEIS (2), pp. 474\u2013482 (2017)","DOI":"10.5220\/0006338804740482"},{"key":"524_CR47","doi-asserted-by":"crossref","DOI":"10.1016\/j.jss.2024.111968","volume":"210","author":"Z Huang","year":"2024","unstructured":"Huang, Z., Yu, H., Fan, G., Shao, Z., Zhou, Z., Li, M.: On the effectiveness of developer features in code smell prioritization: A replication study. J. Syst. Softw. 210, 111968 (2024)","journal-title":"J. Syst. Softw."},{"key":"524_CR48","doi-asserted-by":"crossref","unstructured":"Jain, S., Saha, A.: Improving performance by genetically optimizing support vector machine to detect code smells. In: Proceedings of the international conference on smart data intelligence (2021a)","DOI":"10.2139\/ssrn.3852580"},{"key":"524_CR49","doi-asserted-by":"crossref","unstructured":"Jain, S., Saha, A.: Improving performance with hybrid feature selection and ensemble machine learning techniques for code smell detection. SCP 212, 102713 (2021b)","DOI":"10.1016\/j.scico.2021.102713"},{"issue":"1","key":"524_CR50","doi-asserted-by":"crossref","first-page":"609","DOI":"10.1007\/s12065-020-00536-z","volume":"15","author":"S Jain","year":"2022","unstructured":"Jain, S., Saha, A.: Rank-based univariate feature selection methods on machine learning classifiers for code smell detection. Evol. Intel. 15(1), 609\u2013638 (2022)","journal-title":"Evol. Intel."},{"key":"524_CR51","doi-asserted-by":"crossref","DOI":"10.1016\/j.scico.2024.103140","volume":"237","author":"S Jain","year":"2024","unstructured":"Jain, S., Saha, A.: Improving and comparing performance of machine learning classifiers optimized by swarm intelligent algorithms for code smell detection. Sci. Comput. Program. 237, 103140 (2024)","journal-title":"Sci. Comput. Program."},{"key":"524_CR52","doi-asserted-by":"crossref","unstructured":"Kannan, S.S., Ramaraj, N.: A novel hybrid feature selection via symmetrical uncertainty ranking based local memetic search algorithm. Knowl.-Based Syst. 23(6), 580\u2013585 (2010)","DOI":"10.1016\/j.knosys.2010.03.016"},{"key":"524_CR53","doi-asserted-by":"crossref","first-page":"8695","DOI":"10.1109\/ACCESS.2021.3049823","volume":"9","author":"I Kaur","year":"2021","unstructured":"Kaur, I., Kaur, A.: A novel four-way approach designed with ensemble feature selection for code smell detection. IEEE Access 9, 8695\u20138707 (2021)","journal-title":"IEEE Access"},{"issue":"3","key":"524_CR54","doi-asserted-by":"crossref","first-page":"1725","DOI":"10.11591\/ijeecs.v26.i3.pp1725-1735","volume":"26","author":"NAA Khleel","year":"2022","unstructured":"Khleel, N.A.A., Neh\u00e9z, K.: Deep convolutional neural network model for bad code smells detection based on oversampling method. IJEECS 26(3), 1725\u20131735 (2022)","journal-title":"IJEECS"},{"issue":"3","key":"524_CR55","first-page":"402","volume":"9","author":"NAA Khleel","year":"2023","unstructured":"Khleel, N.A.A., Neh\u00e9z, K.: Detection of code smells using machine learning techniques combined with data-balancing methods. Int. J. Adv. Intel. Inf. 9(3), 402\u2013417 (2023)","journal-title":"Int. J. Adv. Intel. Inf."},{"key":"524_CR56","doi-asserted-by":"crossref","unstructured":"Khomh, F., Vaucher, S., Gu\u00e9h\u00e9neuc, Y.G., Sahraoui, H.: A bayesian approach for the detection of code and design smells. In: 2009 9th international conference on quality software, pp. 305\u2013314. IEEE (2009)","DOI":"10.1109\/QSIC.2009.47"},{"issue":"4","key":"524_CR57","doi-asserted-by":"crossref","first-page":"559","DOI":"10.1016\/j.jss.2010.11.921","volume":"84","author":"F Khomh","year":"2011","unstructured":"Khomh, F., Vaucher, S., Gueheneuc, Y.G., Sahraoui, H.: Bdtex: A gqm-based bayesian approach for the detection of antipatterns. J. Syst. Softw. 84(4), 559\u2013572 (2011)","journal-title":"J. Syst. Softw."},{"key":"524_CR58","doi-asserted-by":"crossref","first-page":"1925","DOI":"10.1007\/s10664-018-9679-5","volume":"24","author":"M Kondo","year":"2019","unstructured":"Kondo, M., Bezemer, C.P., Kamei, Y., Hassan, A.E., Mizuno, O.: The impact of feature reduction techniques on defect prediction models. Empir. Softw. Eng. 24, 1925\u20131963 (2019)","journal-title":"Empir. Softw. Eng."},{"key":"524_CR59","doi-asserted-by":"crossref","unstructured":"Kononenko, I.: Estimating attributes: Analysis and extensions of relief. In: European conference on machine learning, pp. 171\u2013182. Springer (1994)","DOI":"10.1007\/3-540-57868-4_57"},{"key":"524_CR60","doi-asserted-by":"crossref","unstructured":"Kova\u010devi\u0107, A., Slivka, J., al.: Automatic detection of long method and god class code smells through neural source code embeddings. Expert Syst. Appl. 204, 117607 (2022)","DOI":"10.1016\/j.eswa.2022.117607"},{"issue":"4","key":"524_CR61","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1016\/j.entcs.2005.02.059","volume":"141","author":"J Kreimer","year":"2005","unstructured":"Kreimer, J.: Adaptive detection of design flaws. Electronic Notes in Theoretical Computer Science 141(4), 117\u2013136 (2005)","journal-title":"Electronic Notes in Theoretical Computer Science"},{"key":"524_CR62","doi-asserted-by":"crossref","unstructured":"Li, F., Lu, W., Keung, J.W., Yu, X., Gong, L., Li, J.: The impact of feature selection techniques on effort-aware defect prediction: An empirical study. IET Software 17(2), 168\u2013193 (2023a)","DOI":"10.1049\/sfw2.12099"},{"key":"524_CR63","doi-asserted-by":"crossref","unstructured":"Li, F., Zou, K., Keung, J.W., Yu, X., Feng, S., Xiao, Y.: On the relative value of imbalanced learning for code smell detection. Softw. Pract. Exper. 53(10), 1902\u20131927 (2023b)","DOI":"10.1002\/spe.3235"},{"issue":"3","key":"524_CR64","first-page":"18","volume":"2","author":"A Liaw","year":"2002","unstructured":"Liaw, A., Wiener, M., et al.: Classification and regression by randomforest. R news 2(3), 18\u201322 (2002)","journal-title":"R news"},{"key":"524_CR65","unstructured":"Liu, H., Setiono, R.: Chi2: Feature selection and discretization of numeric attributes. In: Proceedings of 7th IEEE international conference on tools with artificial intelligence, pp. 388\u2013391. IEEE (1995)"},{"key":"524_CR66","doi-asserted-by":"crossref","unstructured":"Liu, H., Xu, Z., Zou, Y.: Deep learning based feature envy detection. In: Proceedings of the 33rd ACM\/IEEE International Conference on Autom. Softw. Eng., pp. 385\u2013396 (2018)","DOI":"10.1145\/3238147.3238166"},{"key":"524_CR67","unstructured":"Liu, H., Jin, J., Xu, Z., Zou, Y., Bu, Y., Zhang, L.: Deep learning based code smell detection. IEEE Trans. Softw. Eng. 47(9), 1811\u20131837 (2019)"},{"key":"524_CR68","doi-asserted-by":"crossref","unstructured":"Liu, B., Liu, H., al.: Deep learning based feature envy detection boosted by real-world examples. In: ESEC\/FSE, pp. 908\u2013920 (2023)","DOI":"10.1145\/3611643.3616353"},{"key":"524_CR69","volume":"249","author":"L Liu","year":"2024","unstructured":"Liu, L., Lin, G., Zhu, L., Yang, Z., Song, P., Wang, X., Hu, W.: Revisiting code smell severity prioritization using learning to rank techniques. Expert Syst. Appl. 249, 123483 (2024)","journal-title":"Expert Syst. Appl."},{"key":"524_CR70","unstructured":"Maaten, L., Hinton, G.: Visualizing data using t-sne. J. Mach. Learn. Res. 9(11) (2008)"},{"key":"524_CR71","doi-asserted-by":"crossref","unstructured":"Maiga, A., Ali, N., Bhattacharya, N., Sabane, A., Gu\u00e9h\u00e9neuc, Y.G., Aimeur, E.: Smurf: A svm-based incremental anti-pattern detection approach. In: 2012 19th working conference on reverse engineering, pp. 466\u2013475. IEEE (2012)","DOI":"10.1109\/WCRE.2012.56"},{"issue":"6","key":"524_CR72","doi-asserted-by":"crossref","first-page":"3473","DOI":"10.1007\/s10586-023-04144-1","volume":"26","author":"R Malhotra","year":"2023","unstructured":"Malhotra, R., Jain, B., Kessentini, M.: Examining deep learning\u2019s capability to spot code smells: A systematic literature review. Clust. Comput. 26(6), 3473\u20133501 (2023)","journal-title":"Clust. Comput."},{"key":"524_CR73","doi-asserted-by":"crossref","unstructured":"Maneerat, N., Muenchaisri, P.: Bad-smell prediction from software design model using machine learning techniques. In: JCSSE 2011, pp. 331\u2013336. IEEE (2011)","DOI":"10.1109\/JCSSE.2011.5930143"},{"issue":"6","key":"524_CR74","doi-asserted-by":"crossref","first-page":"1428","DOI":"10.1007\/s11390-020-0323-7","volume":"35","author":"MY Mhawish","year":"2020","unstructured":"Mhawish, M.Y., Gupta, M.: Predicting code smells and analysis of predictions: using machine learning techniques and software metrics. J. Comput. Sci. Technol. 35(6), 1428\u20131445 (2020)","journal-title":"J. Comput. Sci. Technol."},{"issue":"6","key":"524_CR75","doi-asserted-by":"crossref","first-page":"275","DOI":"10.1002\/cem.873","volume":"18","author":"AJ Myles","year":"2004","unstructured":"Myles, A.J., et al.: An introduction to decision tree modeling. J. Chemometr. J. Chemometr. Soc. 18(6), 275\u2013285 (2004)","journal-title":"J. Chemometr. J. Chemometr. Soc."},{"key":"524_CR76","doi-asserted-by":"crossref","unstructured":"Nunes, H.G., Santana, A., Figueiredo, E., Costa, H.: Tuning code smell prediction models: A replication study. In: Proceedings of the 32nd IEEE\/ACM international conference on program comprehension, pp. 316\u2013327 (2024)","DOI":"10.1145\/3643916.3644436"},{"key":"524_CR77","first-page":"323","volume":"23","author":"A Ouni","year":"2015","unstructured":"Ouni, A., Kessentini, M., Bechikh, S., Sahraoui, H.: Prioritizing code-smells correction tasks using chemical reaction optimization. SQJ 23, 323\u2013361 (2015)","journal-title":"SQJ"},{"key":"524_CR78","doi-asserted-by":"crossref","unstructured":"Patnaik, A., Padhy, N.: A hybrid approach to identify code smell using machine learning algorithms. Int. J. Open Sourc. Softw. Process. 12(2), 21\u201335 (2021a)","DOI":"10.4018\/IJOSSP.2021040102"},{"key":"524_CR79","doi-asserted-by":"crossref","unstructured":"Patnaik, A., Padhy, N.: Does code complexity affect the quality of real-time projects? detection of code smell on software projects using machine learning algorithms. In: DSMLAI, pp. 178\u2013185 (2021b)","DOI":"10.1145\/3484824.3484911"},{"key":"524_CR80","doi-asserted-by":"crossref","unstructured":"Pecorelli, F., Di Nucci, D., De Roover, C., De Lucia, A.: A large empirical assessment of the role of data balancing in machine-learning-based code smell detection. J. Syst. Softw. 169, 110693 (2020a)","DOI":"10.1016\/j.jss.2020.110693"},{"key":"524_CR81","doi-asserted-by":"crossref","unstructured":"Pecorelli, F., Palomba, F., Khomh, F., De\u00a0Lucia, A.: Developer-driven code smell prioritization. In: Proceedings of the 17th international conference on mining software repositories, pp. 220\u2013231 (2020b)","DOI":"10.1145\/3379597.3387457"},{"issue":"1","key":"524_CR82","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1080\/00220670209598786","volume":"96","author":"CYJ Peng","year":"2002","unstructured":"Peng, C.Y.J., Lee, K.L., Ingersoll, G.M.: An introduction to logistic regression analysis and reporting. J. Educ. Res. 96(1), 3\u201314 (2002)","journal-title":"J. Educ. Res."},{"key":"524_CR83","doi-asserted-by":"crossref","unstructured":"Puja, R.S., Fatema, T., Akhter, N., Khatun, A.: Prediction of code smell from source code: A hybrid approach. In: 2023 international conference on information and communication technology for sustainable development (ICICT4SD), pp. 315\u2013319. IEEE (2023)","DOI":"10.1109\/ICICT4SD59951.2023.10303449"},{"key":"524_CR84","unstructured":"Quinlan, J.R.: C 4.5: Programs for machine learning. Morgan Kaufmann Ser. Mach. Learn. (1993)"},{"issue":"9","key":"524_CR85","first-page":"1560","volume":"48","author":"MM Rahman","year":"2018","unstructured":"Rahman, M.M., Riyadh, R.R., Khaled, S.M., Satter, A., Rahman, M.R.: Mmruc3: A recommendation approach of move method refactoring using coupling, cohesion, and contextual similarity to enhance software design. SPE 48(9), 1560\u20131587 (2018)","journal-title":"SPE"},{"issue":"1","key":"524_CR86","doi-asserted-by":"crossref","first-page":"16245","DOI":"10.1038\/s41598-023-43380-8","volume":"13","author":"RS Rao","year":"2023","unstructured":"Rao, R.S., Dewangan, S., Mishra, A., Gupta, M.: A study of dealing class imbalance problem with machine learning methods for code smell severity detection using pca-based feature selection technique. Sci. Rep. 13(1), 16245 (2023)","journal-title":"Sci. Rep."},{"issue":"6062","key":"524_CR87","doi-asserted-by":"crossref","first-page":"1518","DOI":"10.1126\/science.1205438","volume":"334","author":"DN Reshef","year":"2011","unstructured":"Reshef, D.N., et al.: Detecting novel associations in large data sets. Sci. 334(6062), 1518\u20131524 (2011)","journal-title":"Sci."},{"key":"524_CR88","unstructured":"Rish, I., et\u00a0al.: An empirical study of the naive bayes classifier. In: IJCAI 2001 workshop on empirical methods in artificial intelligence, vol. 3, pp. 41\u201346 (2001)"},{"key":"524_CR89","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1023\/A:1025667309714","volume":"53","author":"M Robnik-\u0160ikonja","year":"2003","unstructured":"Robnik-\u0160ikonja, M., Kononenko, I.: Theoretical and empirical analysis of relieff and rrelieff. Mach. Learn. 53, 23\u201369 (2003)","journal-title":"Mach. Learn."},{"issue":"5500","key":"524_CR90","doi-asserted-by":"crossref","first-page":"2323","DOI":"10.1126\/science.290.5500.2323","volume":"290","author":"ST Roweis","year":"2000","unstructured":"Roweis, S.T., Saul, L.K.: Nonlinear dimensionality reduction by locally linear embedding. Sci. 290(5500), 2323\u20132326 (2000)","journal-title":"Sci."},{"key":"524_CR91","doi-asserted-by":"crossref","DOI":"10.1016\/j.jss.2021.110936","volume":"176","author":"T Sharma","year":"2021","unstructured":"Sharma, T., Efstathiou, V., Louridas, P., Spinellis, D.: Code smell detection by deep direct-learning and transfer-learning. J. Syst. Softw. 176, 110936 (2021)","journal-title":"J. Syst. Softw."},{"key":"524_CR92","doi-asserted-by":"crossref","unstructured":"Shen, L., Liu, W., Chen, X., Gu, Q., Liu, X.: Improving machine learning-based code smell detection via hyper-parameter optimization. In: 2020 27th Asia-pacific software engineering conference, pp. 276\u2013285. IEEE (2020)","DOI":"10.1109\/APSEC51365.2020.00036"},{"key":"524_CR93","unstructured":"Singh, Y., Chauhan, A.S.: Neural networks in data mining. J. Theor. Appl. Inf. Technol. 5(1) (2009)"},{"issue":"7","key":"524_CR94","first-page":"1079","volume":"49","author":"BL Sousa","year":"2019","unstructured":"Sousa, B.L., Bigonha, M.A., Ferreira, K.A.: An exploratory study on cooccurrence of design patterns and bad smells using software metrics. SPE 49(7), 1079\u20131113 (2019)","journal-title":"SPE"},{"issue":"1","key":"524_CR95","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1109\/TSE.2016.2584050","volume":"43","author":"C Tantithamthavorn","year":"2016","unstructured":"Tantithamthavorn, C., McIntosh, S., Hassan, A.E., Matsumoto, K.: An empirical comparison of model validation techniques for defect prediction models. IEEE Trans. Softw. Eng. 43(1), 1\u201318 (2016)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"524_CR96","doi-asserted-by":"crossref","unstructured":"Tenenbaum, J.B., Silva, V.d., Langford, J.C.: A global geometric framework for nonlinear dimensionality reduction. Sci. 290(5500), 2319\u20132323 (2000)","DOI":"10.1126\/science.290.5500.2319"},{"key":"524_CR97","volume":"153","author":"CF Tsai","year":"2024","unstructured":"Tsai, C.F., Chen, K.C., Lin, W.C.: Feature selection and its combination with data over-sampling for multi-class imbalanced datasets. Appl. Soft Comput. 153, 111267 (2024)","journal-title":"Appl. Soft Comput."},{"key":"524_CR98","doi-asserted-by":"crossref","unstructured":"Uch\u00f4a, A., Barbosa, C., Coutinho, D., Oizumi, W., Assun\u00e7ao, W.K., Vergilio, S.R., Pereira, J.A., Oliveira, A., Garcia, A.: Predicting design impactful changes in modern code review: A large-scale empirical study. In: 2021 IEEE\/ACM 18th international conference on mining software repositories, pp. 471\u2013482. IEEE (2021)","DOI":"10.1109\/MSR52588.2021.00059"},{"key":"524_CR99","doi-asserted-by":"crossref","unstructured":"Vaucher, S., Khomh, F., Moha, N., Gu\u00e9h\u00e9neuc, Y.G.: Tracking design smells: Lessons from a study of god classes. In: 2009 16th Working Conference on Reverse Engineering, pp. 145\u2013154. IEEE, (2009)","DOI":"10.1109\/WCRE.2009.23"},{"key":"524_CR100","doi-asserted-by":"crossref","unstructured":"Wang, H., Khoshgoftaar, T.M., Gao, K.: A comparative study of filter-based feature ranking techniques. In: 2010 IEEE international conference on information reuse & integration, pp. 43\u201348. IEEE (2010)","DOI":"10.1109\/IRI.2010.5558966"},{"key":"524_CR101","doi-asserted-by":"crossref","unstructured":"Xu, Z., Liu, J., Yang, Z., An, G., Jia, X.: The impact of feature selection on defect prediction performance: An empirical comparison. In: 2016 IEEE 27th international symposium on software reliability engineering (ISSRE), pp. 309\u2013320. IEEE, (2016)","DOI":"10.1109\/ISSRE.2016.13"},{"key":"524_CR102","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2024.109527","volume":"139","author":"PS Yadav","year":"2025","unstructured":"Yadav, P.S., Rao, R.S., Mishra, A., Gupta, M.: Ensemble methods with feature selection and data balancing for improved code smells classification performance. Eng. Appl. Artif. Intell. 139, 109527 (2025)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"524_CR103","doi-asserted-by":"crossref","unstructured":"Yu, X., Liu, J., Yang, Z., Jia, X., Ling, Q., Ye, S.: Learning from imbalanced data for predicting the number of software defects. In: 2017 IEEE 28th international symposium on software reliability engineering (ISSRE), pp. 78\u201389. IEEE (2017)","DOI":"10.1109\/ISSRE.2017.18"},{"key":"524_CR104","doi-asserted-by":"crossref","first-page":"3461","DOI":"10.1007\/s00500-018-3093-1","volume":"22","author":"X Yu","year":"2018","unstructured":"Yu, X., Wu, M., Jian, Y., Bennin, K.E., Fu, M., Ma, C.: Cross-company defect prediction via semi-supervised clustering-based data filtering and mstra-based transfer learning. Soft Comput. 22, 3461\u20133472 (2018)","journal-title":"Soft Comput."},{"key":"524_CR105","doi-asserted-by":"crossref","unstructured":"Yu, X., Bennin, K.E., Liu, J., Keung, J.W., Yin, X., Xu, Z.: An empirical study of learning to rank techniques for effort-aware defect prediction. In: 2019 IEEE 26th international conference on software analysis, evolution and reengineering (SANER), pp. 298\u2013309. IEEE (2019)","DOI":"10.1109\/SANER.2019.8668033"},{"key":"524_CR106","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Lei, Y., Yan, M., Yu, Y., Chen, J., Wang, S., Mao, X.: Reentrancy vulnerability detection and localization: A deep learning based two-phase approach. In: Proceedings of the 37th IEEE\/ACM international conference on automated software engineering, pp. 1\u201313 (2022)","DOI":"10.1145\/3551349.3560428"},{"issue":"1","key":"524_CR107","doi-asserted-by":"crossref","first-page":"22","DOI":"10.1109\/TLA.2024.10375735","volume":"22","author":"D Zhang","year":"2023","unstructured":"Zhang, D., Song, S., Zhang, Y., Liu, H., Shen, G.: Code smell detection research based on pre-training and stacking models. IEEE Lat. Am. Trans. 22(1), 22\u201330 (2023)","journal-title":"IEEE Lat. Am. Trans."},{"key":"524_CR108","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Yin, S., Zhu, L., Gao, S., Chen, H., Hu, W., Li, F.: On the relative value of feature selection techniques for code smell detection. https:\/\/conf.researchr.org\/details\/apsec-2024\/apsec-2024-technical-track\/34\/On-the-Relative-Value-of-Feature-Selection-Techniques-for-Code-Smell-Detection (2024a)","DOI":"10.1109\/APSEC65559.2024.00038"},{"key":"524_CR109","doi-asserted-by":"crossref","unstructured":"Zhang, F., Zhang, Z., Keung, J.W., Tang, X., Yang, Z., Yu, X., Hu, W.: Data preparation for deep learning based code smell detection: A systematic literature review. JSS, 112131 (2024b)","DOI":"10.1016\/j.jss.2024.112131"},{"key":"524_CR110","doi-asserted-by":"crossref","DOI":"10.1016\/j.infsof.2021.106652","volume":"139","author":"K Zhao","year":"2021","unstructured":"Zhao, K., Xu, Z., Yan, M., Zhang, T., Yang, D., Li, W.: A comprehensive investigation of the impact of feature selection techniques on crashing fault residence prediction models. Inf. Softw. Technol. 139, 106652 (2021)","journal-title":"Inf. Softw. Technol."},{"issue":"1","key":"524_CR111","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3183339","volume":"27","author":"Y Zhou","year":"2018","unstructured":"Zhou, Y., Yang, Y., Lu, H., Chen, L., Li, Y., Zhao, Y., Qian, J., Xu, B.: How far we have progressed in the journey? an examination of cross-project defect prediction. ACM Trans. Softw. Eng. Methodol. 27(1), 1\u201351 (2018)","journal-title":"ACM Trans. Softw. Eng. Methodol."}],"container-title":["Automated Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-025-00524-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10515-025-00524-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-025-00524-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,10]],"date-time":"2025-09-10T13:56:52Z","timestamp":1757512612000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10515-025-00524-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,16]]},"references-count":111,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["524"],"URL":"https:\/\/doi.org\/10.1007\/s10515-025-00524-6","relation":{},"ISSN":["0928-8910","1573-7535"],"issn-type":[{"value":"0928-8910","type":"print"},{"value":"1573-7535","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,16]]},"assertion":[{"value":"15 January 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 April 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 May 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"50"}}