{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T06:29:37Z","timestamp":1763620177535,"version":"3.40.3"},"publisher-location":"Cham","reference-count":75,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319259628"},{"type":"electronic","value":"9783319259642"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-25964-2_3","type":"book-chapter","created":{"date-parts":[[2016,1,14]],"date-time":"2016-01-14T08:24:44Z","timestamp":1452759884000},"page":"33-58","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["Towards Benchmarking Feature Subset Selection Methods for Software Fault Prediction"],"prefix":"10.1007","author":[{"given":"Wasif","family":"Afzal","sequence":"first","affiliation":[]},{"given":"Richard","family":"Torkar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,1,15]]},"reference":[{"issue":"3","key":"3_CR1","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1023\/A:1024424811345","volume":"8","author":"TM Khoshgoftaar","year":"2004","unstructured":"Khoshgoftaar, T.M., Seliya, N.: Fault prediction modeling for software quality estimation: Comparing commonly used techniques. Empirical Softw. Eng. 8(3), 255\u2013283 (2004)","journal-title":"Empirical Softw. Eng."},{"issue":"4","key":"3_CR2","doi-asserted-by":"publisher","first-page":"7346","DOI":"10.1016\/j.eswa.2008.10.027","volume":"36","author":"C Catal","year":"2009","unstructured":"Catal, C., Diri, B.: A systematic review of software fault prediction studies. Expert Syst. Appl. 36(4), 7346\u20137354 (2009)","journal-title":"Expert Syst. Appl."},{"unstructured":"Hall, T., Beecham, S., Bowes, D., Gray, D., Counsell, S.: A systematic review of fault prediction performance in software engineering. IEEE Trans. Softw. Eng. (99) (2011)","key":"3_CR3"},{"issue":"4","key":"3_CR4","doi-asserted-by":"publisher","first-page":"485","DOI":"10.1109\/TSE.2008.35","volume":"34","author":"S Lessmann","year":"2008","unstructured":"Lessmann, S., Baesens, B., Mues, C., Pietsch, S.: Benchmarking classification models for software defect prediction: a proposed framework and novel findings. IEEE Trans. Softw. Eng. 34(4), 485\u2013496 (2008)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"5","key":"3_CR5","doi-asserted-by":"publisher","first-page":"675","DOI":"10.1109\/32.815326","volume":"25","author":"NE Fenton","year":"1999","unstructured":"Fenton, N.E., Neil, M.: A critique of software defect prediction models. IEEE Trans. Softw. Eng. 25(5), 675\u2013689 (1999)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"3","key":"3_CR6","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1109\/TSE.2010.90","volume":"37","author":"Q Song","year":"2011","unstructured":"Song, Q., Jia, Z., Shepperd, M., Ying, S., Liu, J.: A general software defect-proneness prediction framework. IEEE Trans. Softw. Eng. 37(3), 356\u2013370 (2011)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"11","key":"3_CR7","doi-asserted-by":"crossref","first-page":"985","DOI":"10.1109\/TSE.2003.1245300","volume":"29","author":"T. Foss","year":"2003","unstructured":"Foss, T., Stensrud, E., Kitchenham, B.A., Myrtveit, I.: A simulation study of the model evaluation criterion MMRE. IEEE Trans. Softw. Eng. 29(11) (2003)","journal-title":"IEEE Transactions on Software Engineering"},{"key":"3_CR8","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1142\/S0218194012400037","volume":"22","author":"W Afzal","year":"2012","unstructured":"Afzal, W., Torkar, R., Feldt, R.: Resampling methods in software quality classification. Int. J. Software Eng. Knowl. Eng. 22, 203\u2013223 (2012)","journal-title":"Int. J. Software Eng. Knowl. Eng."},{"key":"3_CR9","first-page":"96","volume":"1","author":"D Gray","year":"2011","unstructured":"Gray, D., Bowes, D., Davey, N., Sun, Y., Christianson, B.: The misuse of the NASA metrics data program data sets for automated software defect prediction. IET Semin. Dig. 1, 96\u2013103 (2011)","journal-title":"IET Semin. Dig."},{"key":"3_CR10","volume-title":"Attribute selection and imbalanced data: Problems in software defect prediction","author":"TM Khoshgoftaar","year":"2010","unstructured":"Khoshgoftaar, T.M., Gao, K., Seliya, N.: Attribute selection and imbalanced data: Problems in software defect prediction. IEEE Computer Society, Los Alamitos, CA, USA (2010)"},{"doi-asserted-by":"crossref","unstructured":"Shivaji, S., Whitehead, J.E.J, Akella, R., Kim, S. Reducing features to improve bug prediction. In: Proceedings of the 2009 IEEE\/ACM International Conference on Automated Software Engineering (ASE\u201909), IEEE Computer Society, Washington, DC, USA (2009)","key":"3_CR11","DOI":"10.1109\/ASE.2009.76"},{"doi-asserted-by":"crossref","unstructured":"Rodriguez, D., Ruiz, R., Cuadrado-Gallego, J., Aguilar-Ruiz, J.: Detecting fault modules applying feature selection to classifiers. In: IEEE International Conference on Information Reuse and Integration (IRI\u201907) (2007a)","key":"3_CR12","DOI":"10.1109\/IRI.2007.4296696"},{"doi-asserted-by":"crossref","unstructured":"Rodriguez, D., Ruiz, R., Cuadrado-Gallego, J., Aguilar-Ruiz, J., Garre, M.: Attribute selection in software engineering datasets for detecting fault modules. In: 33rd EUROMICRO Conference on Software Engineering and Advanced Applications (EUROMICRO\u201907) (2007b)","key":"3_CR13","DOI":"10.1109\/EUROMICRO.2007.20"},{"key":"3_CR14","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1016\/S0004-3702(97)00043-X","volume":"97","author":"R Kohavi","year":"1997","unstructured":"Kohavi, R., John, G.H.: Wrappers for feature subset selection. Artif. Intell. 97, 273\u2013324 (1997)","journal-title":"Artif. Intell."},{"key":"3_CR15","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1109\/TKDE.2003.1245283","volume":"15","author":"MA Hall","year":"2003","unstructured":"Hall, M.A., Holmes, G.: Benchmarking attribute selection techniques for discrete class data mining. IEEE Trans. Knowl. Data Eng. 15, 1437\u20131447 (2003)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"3_CR16","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1109\/34.824819","volume":"22","author":"AK Jain","year":"2000","unstructured":"Jain, A.K., Duin, R.P.W., Mao, J.: Statistical pattern recognition: a review. IEEE Trans. Pattern Anal. Mach. Intell. 22, 4\u201337 (2000)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3_CR17","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1109\/MS.2005.151","volume":"22","author":"Z Chen","year":"2005","unstructured":"Chen, Z., Boehm, B., Menzies, T., Port, D.: Finding the right data for software cost modeling. IEEE Softw. 22, 38\u201346 (2005)","journal-title":"IEEE Softw."},{"unstructured":"Janecek, A., Gansterer, W., Demel, M., Ecker, G.: On the relationship between feature selection and classification accuracy. In: Proceedings of the 3rd Workshop on New Challenges for Feature Selection in Data Mining and Knowledge Discovery (FSDM\u201908), Microtome Publishing, Brookline, MA, USA (2008)","key":"3_CR18"},{"doi-asserted-by":"crossref","unstructured":"Burke, E.K., Kendall, G. (eds.): Search methodologies\u2014Introductory tutorials in optimization and decision support techniques. Springer Science and Business Media, Inc., 233 Spring Street, New York, USA (2005)","key":"3_CR19","DOI":"10.1007\/0-387-28356-0"},{"issue":"8","key":"3_CR20","doi-asserted-by":"publisher","first-page":"745","DOI":"10.1016\/j.infsof.2005.08.009","volume":"48","author":"T Dyb\u00e5","year":"2006","unstructured":"Dyb\u00e5, T., Kampenes, V.B., Sj\u00f8berg, D.I.: A systematic review of statistical power in software engineering experiments. Inf. Softw. Technol. 48(8), 745\u2013755 (2006)","journal-title":"Inf. Softw. Technol."},{"key":"3_CR21","first-page":"94","volume-title":"Evolutionary Computation and Optimization Algorithms in Software Engineering: Applications and Techniques","author":"W Afzal","year":"2009","unstructured":"Afzal, W., Torkar, R., Feldt, R., Gorschek, T.: Genetic programming for cross-release fault count predictions in large and complex software projects. In: Chis, M. (ed.) Evolutionary Computation and Optimization Algorithms in Software Engineering: Applications and Techniques, pp. 94\u2013126. IGI Global, Hershey, USA (2009)"},{"issue":"1","key":"3_CR22","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1109\/TSMCB.2005.854499","volume":"36","author":"D Muni","year":"2006","unstructured":"Muni, D., Pal, N., Das, J.: Genetic programming for simultaneous feature selection and classifier design. IEEE Trans. Syst. Man Cybern. B Cybern. 36(1), 106\u2013117 (2006)","journal-title":"IEEE Trans. Syst. Man Cybern. B Cybern."},{"key":"3_CR23","first-page":"229","volume-title":"Lecture Notes in Computer Science","author":"Matthew G. Smith","year":"2003","unstructured":"Smith, M.G., Bull. L.: Feature construction and selection using genetic programming and a genetic algorithm. In: Proceedings of the 6th European Conference on Genetic Programming (EuroGP\u201903), Springer-Verlag, Berlin, Heidelberg (2003)"},{"doi-asserted-by":"crossref","unstructured":"Vivanco, R., Kamei, Y., Monden, A., Matsumoto, K., Jin, D.: Using search-based metric selection and oversampling to predict fault prone modules. In: 2010 23rd Canadian Conference on Electrical and Computer Engineering (CCECE\u201910) (2010)","key":"3_CR24","DOI":"10.1109\/CCECE.2010.5575249"},{"issue":"2","key":"3_CR25","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1109\/5254.671091","volume":"13","author":"J Yang","year":"1998","unstructured":"Yang, J., Honavar, V.: Feature subset selection using a genetic algorithm. IEEE Intell. Syst. and Their Appl. 13(2), 44\u201349 (1998)","journal-title":"IEEE Intell. Syst. and Their Appl."},{"unstructured":"Boetticher, G., Menzies, T., Ostrand, T.: PROMISE repository of empirical software engineering data. \n                  http:\/\/promisedata.org\/\n                  \n                 repository, West Virginia University, Department of Computer Science (2007)","key":"3_CR26"},{"key":"3_CR27","doi-asserted-by":"publisher","first-page":"306","DOI":"10.1109\/ICDM.2002.1183917","volume-title":"Proceedings of the 2002 IEEE International Conference on Data Mining (ICDM\u201902)","author":"LC Molina","year":"2002","unstructured":"Molina, L.C., Belanche, L., Nebot, \u00c0ngela: Feature selection algorithms: a survey and experimental evaluation. Proceedings of the 2002 IEEE International Conference on Data Mining (ICDM\u201902), pp. 306\u2013313. IEEE Computer Society, Washington, DC, USA (2002)"},{"key":"3_CR28","first-page":"1157","volume":"3","author":"I Guyon","year":"2003","unstructured":"Guyon, I., Elisseeff, A.: An introduction to variable and feature selection. J. Mach. Learn. Res. 3, 1157\u20131182 (2003)","journal-title":"J. Mach. Learn. Res."},{"key":"3_CR29","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1016\/S0004-3702(97)00063-5","volume":"97","author":"AL Blum","year":"1997","unstructured":"Blum, A.L., Langley, P.: Selection of relevant features and examples in machine learning. Artif. Intell. 97, 245\u2013271 (1997)","journal-title":"Artif. Intell."},{"issue":"1\u20134","key":"3_CR30","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1016\/S1088-467X(97)00008-5","volume":"1","author":"M Dash","year":"1997","unstructured":"Dash, M., Liu, H.: Feature selection for classification. Intelligent Data Analysis 1(1\u20134), 131\u2013156 (1997)","journal-title":"Intelligent Data Analysis"},{"issue":"4","key":"3_CR31","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1109\/TKDE.2005.66","volume":"17","author":"H Liu","year":"2005","unstructured":"Liu, H., Yu, L.: Toward integrating feature selection algorithms for classification and clustering. IEEE Trans. Knowl. Data Eng. 17(4), 491\u2013502 (2005)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"3_CR32","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1109\/TSE.2011.55","volume":"38","author":"K Dejaeger","year":"2012","unstructured":"Dejaeger, K., Verbeke, W., Martens, D., Baesens, B.: Data mining techniques for software effort estimation: a comparative study. IEEE Trans. Softw. Eng. 38, 375\u2013397 (2012)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"4","key":"3_CR33","first-page":"1","volume":"30","author":"Z Chen","year":"2005","unstructured":"Chen, Z., Menzies, T., Port, D., Boehm, B.: Feature subset selection can improve software cost estimation accuracy. SIGSOFT Softw. Eng. Notes 30(4), 1\u20136 (2005)","journal-title":"SIGSOFT Softw. Eng. Notes"},{"key":"3_CR34","doi-asserted-by":"publisher","first-page":"409","DOI":"10.1007\/s10515-010-0070-z","volume":"17","author":"T Menzies","year":"2010","unstructured":"Menzies, T., Jalali, O., Hihn, J., Baker, D., Lum, K.: Stable rankings for different effort models. Autom. Softw. Eng. 17, 409\u2013437 (2010)","journal-title":"Autom. Softw. Eng."},{"key":"3_CR35","first-page":"1367","volume-title":"Proceedings of the 2002 Genetic and Evolutionary Computation Conference (GECCO\u201902)","author":"C Kirsopp","year":"2002","unstructured":"Kirsopp, C., Shepperd, M.J., Hart, J.: Search heuristics, case-based reasoning and software project effort prediction. Proceedings of the 2002 Genetic and Evolutionary Computation Conference (GECCO\u201902), pp. 1367\u20131374. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (2002)"},{"doi-asserted-by":"crossref","unstructured":"Azzeh, M., Neagu, D., Cowling, P.: Improving analogy software effort estimation using fuzzy feature subset selection algorithm. In: Proceedings of the 4th International Workshop on Predictor Models in Software Engineering (PROMISE\u201908), ACM, New York, NY, USA (2008)","key":"3_CR36","DOI":"10.1145\/1370788.1370805"},{"issue":"3","key":"3_CR37","doi-asserted-by":"crossref","first-page":"5921","DOI":"10.1016\/j.eswa.2008.07.062","volume":"36","author":"Y.F. Li","year":"2009","unstructured":"Li, Y., Xie, M., Goh, T.: A study of mutual information based feature selection for case based reasoning in software cost estimation. Expert Systems with Applications 36(3, Part 2):5921\u20135931 (2009)","journal-title":"Expert Systems with Applications"},{"issue":"1","key":"3_CR38","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1109\/TSE.2007.256941","volume":"33","author":"T Menzies","year":"2007","unstructured":"Menzies, T., Greenwald, J., Frank, A.: Data mining static code attributes to learn defect predictors. IEEE Trans. Softw. Eng. 33(1), 2\u201313 (2007)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"3_CR39","doi-asserted-by":"publisher","first-page":"1040","DOI":"10.1016\/j.ins.2008.12.001","volume":"179","author":"C Catal","year":"2009","unstructured":"Catal, C., Diri, B.: Investigating the effect of dataset size, metrics sets, and feature selection techniques on software fault prediction problem. Inf. Sci. 179, 1040\u20131058 (2009)","journal-title":"Inf. Sci."},{"key":"3_CR40","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1007\/s11219-006-7597-z","volume":"14","author":"TM Khoshgoftaar","year":"2006","unstructured":"Khoshgoftaar, T.M., Seliya, N., Sundaresh, N.: An empirical study of predicting software faults with case-based reasoning. Softw. Qual. Control 14, 85\u2013111 (2006)","journal-title":"Softw. Qual. Control"},{"doi-asserted-by":"crossref","unstructured":"Wang, H., Khoshgoftaar, T., Gao, K., Seliya, N.: High-dimensional software engineering data and feature selection. In: 21st International Conference on Tools with Artificial Intelligence (ICTAI\u201909), pp. 83\u201390 (2009)","key":"3_CR41","DOI":"10.1109\/ICTAI.2009.20"},{"unstructured":"Khoshgoftaar, T.M., Nguyen, L., Gao, K., Rajeevalochanam, J.: Application of an attribute selection method to CBR-based software quality classification. In: Proceedings of the 15th IEEE International Conference on Tools with Artificial Intelligence (ICTAI\u201903), IEEE Computer Society, Washington, DC, USA (2003)","key":"3_CR42"},{"key":"3_CR43","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1142\/S0218539310003883","volume":"17","author":"W Altidor","year":"2010","unstructured":"Altidor, W., Khoshgoftaar, T.M., Gao, K.: Wrapper-based feature ranking techniques for determining relevance of software engineering metrics. Int. J. Reliab. Qual. Saf. Eng. 17, 425\u2013464 (2010)","journal-title":"Int. J. Reliab. Qual. Saf. Eng."},{"key":"3_CR44","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s11219-011-9132-0","volume":"20","author":"K Gao","year":"2012","unstructured":"Gao, K., Khoshgoftaar, T., Seliya, N.: Predicting high-risk program modules by selecting the right software measurements. Softw. Qual. J. 20, 3\u201342 (2012)","journal-title":"Softw. Qual. J."},{"issue":"5","key":"3_CR45","doi-asserted-by":"publisher","first-page":"579","DOI":"10.1002\/spe.1043","volume":"41","author":"K Gao","year":"2011","unstructured":"Gao, K., Khoshgoftaar, T.M., Wang, H., Seliya, N.: Choosing software metrics for defect prediction: an investigation on feature selection techniques. Softw. Pract. Experience 41(5), 579\u2013606 (2011)","journal-title":"Softw. Pract. Experience"},{"key":"3_CR46","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1142\/S0218194012400013","volume":"22","author":"TM Khoshgoftaar","year":"2012","unstructured":"Khoshgoftaar, T.M., Gao, K., Napolitano, A.: An empirical study of feature ranking techniques for software quality prediction. Int. J. Softw. Eng. Knowl. Eng. (IJSEKE) 22, 161\u2013183 (2012)","journal-title":"Int. J. Softw. Eng. Knowl. Eng. (IJSEKE)"},{"key":"3_CR47","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1016\/j.neucom.2011.08.040","volume":"92","author":"H Wang","year":"2012","unstructured":"Wang, H., Khoshgoftaar, T.M., Napolitano, A.: Software measurement data reduction using ensemble techniques. Neurocomputing 92, 124\u2013132 (2012)","journal-title":"Neurocomputing"},{"unstructured":"Quinlan, J.R.: C4.5: programs for machine learning. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (1993)","key":"3_CR48"},{"unstructured":"Novakovic, J.: Using information gain attribute evaluation to classify sonar targets. In: Proceedings of the 17th Telecommunications forum (TELFOR\u201909) (2009)","key":"3_CR49"},{"unstructured":"Kira, K., Rendell, L.A.: The feature selection problem: traditional methods and a new algorithm. In: Proceedings of the 10th National Conference on Artificial Intelligence (AAAI\u201992) (1992)","key":"3_CR50"},{"unstructured":"Sikonja, M., Kononenko, I.: An adaptation of relief for attribute estimation in regression. In: Proceedings of the 14th International Conference on Machine Learning (ICML\u201997) (1997)","key":"3_CR51"},{"unstructured":"Hall, M.A.: Correlation-based feature selection for discrete and numeric class machine learning. In: Proceedings of the 2000 International Conference on Machine Learning (ICML\u201900), Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (2000)","key":"3_CR52"},{"key":"3_CR53","first-page":"319","volume-title":"Proceedings of the 1996 International Conference on Machine Learning (ICML\u201996)","author":"H Liu","year":"1996","unstructured":"Liu, H., Setiono, R.: A probabilistic approach to feature selection\u2014A filter solution. Proceedings of the 1996 International Conference on Machine Learning (ICML\u201996), pp. 319\u2013327. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (1996)"},{"unstructured":"Poli, R., Langdon, W.B., McPhee, N.F.: A field guide to genetic programming. Published via \n                  http:\/\/lulu.com\n                  \n                 and freely available at \n                  http:\/\/www.gp-field-guide.org.uk\n                  \n                . URL: \n                  http:\/\/www.gp-field-guide.org.uk\n                  \n                , (with contributions by Koza, J.R.) (2008)","key":"3_CR54"},{"key":"3_CR55","volume-title":"Genetic programming: on the programming of computers by means of natural selection","author":"JR Koza","year":"1992","unstructured":"Koza, J.R.: Genetic programming: on the programming of computers by means of natural selection. MIT Press, Cambridge, MA, USA (1992)"},{"unstructured":"Silva, S.: GPLAB\u2014A genetic programming toolbox for MATLAB. \n                  http:\/\/gplab.sourceforge.net\n                  \n                , Last checked: 22 Dec 2014 (2007)","key":"3_CR56"},{"issue":"2\u20133","key":"3_CR57","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1023\/A:1007465528199","volume":"29","author":"N Friedman","year":"1997","unstructured":"Friedman, N., Geiger, D., Goldszmidt, M.: Bayesian network classifiers. Mach. Learn. 29(2\u20133), 131\u2013163 (1997)","journal-title":"Mach. Learn."},{"unstructured":"Rish, I.: An empirical study of the naive Bayes classifier. In: Proceedings of the workshop on empirical methods in AI (IJCAI\u201901) (2001)","key":"3_CR58"},{"issue":"3","key":"3_CR59","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1007\/s10462-007-9052-3","volume":"26","author":"S Kotsiantis","year":"2007","unstructured":"Kotsiantis, S., Zaharakis, I., Pintelas, P.: Machine learning: a review of classification and combining techniques. Artif. Intell. Rev. 26(3), 159\u2013190 (2007)","journal-title":"Artif. Intell. Rev."},{"key":"3_CR60","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall, M., Frank, E., Holmes, G., Pfahringer, B., Reutemann, P., Witten, I.H.: The WEKA data mining software: an update. SIGKDD Explor. Newsl. 11, 10\u201318 (2009)","journal-title":"SIGKDD Explor. Newsl."},{"unstructured":"Menzies, T., DiStefano, J., Orrego, A., Chapman, R.M.: Assessing predictors of software defects. In: Proceedings of the Workshop on Predictive Software Models, collocated with ICSM\u201904. URL: \n                  http:\/\/menzies.us\/pdf\/04psm.pdf\n                  \n                 (2004)","key":"3_CR61"},{"issue":"3","key":"3_CR62","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1016\/S0164-1212(00)00079-0","volume":"55","author":"K El-Emam","year":"2001","unstructured":"El-Emam, K., Benlarbi, S., Goel, N., Rai, S.N.: Comparing case-based reasoning classifiers for predicting high risk software components. J. Syst. Softw. 55(3), 301\u2013320 (2001)","journal-title":"J. Syst. Softw."},{"doi-asserted-by":"crossref","unstructured":"Ma, Y., Cukic, B.: Adequate and precise evaluation of quality models in software engineering studies. In: Proceedings of the 3rd International Workshop on Predictor Models in Software Engineering (PROMISE\u201907), IEEE Computer Society, pp 1, Washington, DC, USA(2007)","key":"3_CR63","DOI":"10.1109\/PROMISE.2007.1"},{"issue":"8","key":"3_CR64","doi-asserted-by":"publisher","first-page":"861","DOI":"10.1016\/j.patrec.2005.10.010","volume":"27","author":"T Fawcett","year":"2006","unstructured":"Fawcett, T.: An introduction to ROC analysis. Pattern Recogn. Lett. 27(8), 861\u2013874 (2006)","journal-title":"Pattern Recogn. Lett."},{"issue":"1","key":"3_CR65","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","volume":"143","author":"J A Hanley","year":"1982","unstructured":"Hanley, J.A., McNeil, B.J.: The meaning and use of the area under a receiver operating characteristic (ROC) curve. Radiology 143(1):29\u201336 (1982)","journal-title":"Radiology"},{"unstructured":"Ling, C.X., Huang, J., Zhang, H.: AUC: a statistically consistent and more discriminating measure than accuracy. In: Proceedings of the Eighteenth International Joint Conference on Artificial Intelligence (IJCAI\u201903) (2003)","key":"3_CR66"},{"unstructured":"Yousef, W.A., Wagner, R.F., Loew, M.H.: Comparison of non-parametric methods for assessing classifier performance in terms of ROC parameters. In: Proceedings of the 33rd Applied Imagery Pattern Recognition Workshop (AIPR\u201904), IEEE Computer Society, Washington, DC, USA (2004)","key":"3_CR67"},{"doi-asserted-by":"crossref","unstructured":"Jiang, Y., Cukic, B., Menzies, T., Bartlow, N.: Comparing design and code metrics for software quality prediction. In: Proceedings of the 4th international workshop on predictor models in software engineering (PROMISE\u201908), ACM, New York, NY, USA (2008)","key":"3_CR68","DOI":"10.1145\/1370788.1370793"},{"doi-asserted-by":"crossref","unstructured":"Jiang, Y., Cukic, B., Menzies, T.: Fault prediction using early lifecycle data. In: Proceedings of the 18th IEEE International Symposium on Software Reliability (ISSRE\u201907), IEEE Computer Society, Washington, DC, USA (2007)","key":"3_CR69","DOI":"10.1109\/ISSRE.2007.24"},{"key":"3_CR70","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1016\/S0031-3203(96)00142-2","volume":"30","author":"AP Bradley","year":"1997","unstructured":"Bradley, A.P.: The use of the area under the ROC curve in the evaluation of machine learning algorithms. Pattern Recogn. 30, 1145\u20131159 (1997)","journal-title":"Pattern Recogn."},{"issue":"3","key":"3_CR71","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1049\/ip-sen:20010506","volume":"148","author":"B.A. Kitchenham","year":"2001","unstructured":"Kitchenham, B.A., Pickard, L.M., MacDonell, S., Shepperd, M.: What accuracy statistics really measure? IEE Proc. Softw. 148(3) (2001)","journal-title":"IEE Proceedings - Software"},{"issue":"5","key":"3_CR72","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1109\/TSE.2005.58","volume":"31","author":"I Myrtveit","year":"2005","unstructured":"Myrtveit, I., Stensrud, E., Shepperd, M.: Reliability and validity in comparative studies of software prediction models. IEEE Trans. Softw. Eng. 31(5), 380\u2013391 (2005)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"3_CR73","doi-asserted-by":"publisher","first-page":"251","DOI":"10.1023\/B:GENP.0000030196.55525.f7","volume":"5","author":"WB Langdon","year":"2004","unstructured":"Langdon, W.B., Buxton, B.F.: Genetic programming for mining DNA chip data from cancer patients. Genet. Program Evolvable Mach. 5, 251\u2013257 (2004)","journal-title":"Genet. Program Evolvable Mach."},{"key":"3_CR74","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4615-4625-2","volume-title":"Experimentation in software engineering: an introduction","author":"C Wohlin","year":"2000","unstructured":"Wohlin, C., Runeson, P., H\u00f6st, M., Ohlsson, M., Regnell, B., Wessl\u00e9n, A.: Experimentation in software engineering: an introduction. Kluwer Academic Publishers, USA (2000)"},{"unstructured":"Kohavi, R.: A study of cross-validation and bootstrap for accuracy estimation and model selection. In: Proceedings of the 14th International Joint conference on Artificial Intelligence (IJCAI\u201995), Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (1995)","key":"3_CR75"}],"container-title":["Studies in Computational Intelligence","Computational Intelligence and Quantitative Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-25964-2_3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T06:23:50Z","timestamp":1559370230000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-25964-2_3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319259628","9783319259642"],"references-count":75,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-25964-2_3","relation":{},"ISSN":["1860-949X","1860-9503"],"issn-type":[{"type":"print","value":"1860-949X"},{"type":"electronic","value":"1860-9503"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"15 January 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}