{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T17:46:58Z","timestamp":1740160018401,"version":"3.37.3"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"S2","license":[{"start":{"date-parts":[[2016,12,24]],"date-time":"2016-12-24T00:00:00Z","timestamp":1482537600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Syst Assur Eng Manag"],"published-print":{"date-parts":[[2017,11]]},"DOI":"10.1007\/s13198-016-0556-6","type":"journal-article","created":{"date-parts":[[2016,12,24]],"date-time":"2016-12-24T19:42:37Z","timestamp":1482608557000},"page":"974-982","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Identifying and eliminating less complex instances from software fault data"],"prefix":"10.1007","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7777-1370","authenticated-orcid":false,"given":"Raed","family":"Shatnawi","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,12,24]]},"reference":[{"issue":"1","key":"556_CR1","first-page":"37","volume":"6","author":"D Aha","year":"1991","unstructured":"Aha D, Kibler D (1991) Instance-based learning algorithms. Mach Learn 6(1):37\u201366","journal-title":"Mach Learn"},{"issue":"5","key":"556_CR2","doi-asserted-by":"crossref","first-page":"1042","DOI":"10.1016\/j.jss.2011.12.006","volume":"85","author":"J Al Dallal","year":"2012","unstructured":"Al Dallal J (2012) The impact of accounting for special methods in the measurement of object-oriented class cohesion on refactoring and fault prediction activities. J Syst Softw 85(5):1042\u20131057","journal-title":"J Syst Softw"},{"key":"556_CR3","unstructured":"Boetticher G (2006) Improving credibility of machine learner models in software engineering. In: Advanced machine learner applications in software engineering, software engineering and knowledge engineering, pp 52\u201372"},{"issue":"21","key":"556_CR4","doi-asserted-by":"crossref","first-page":"4867","DOI":"10.1016\/j.ins.2011.06.017","volume":"181","author":"C Catal","year":"2011","unstructured":"Catal C, Alan O, Balkan K (2011) Class noise detection based on software metrics and ROC curves. Inf Sci 181(21):4867\u20134877","journal-title":"Inf Sci"},{"key":"556_CR5","doi-asserted-by":"crossref","unstructured":"Challagulla VU, Bastani FB, Yen I, Paul RA (2005) Empirical assessment of machine learning based software defect prediction techniques. In: Tenth IEEE international workshop on object-oriented real-time dependable systems. pp 263\u2013270","DOI":"10.1109\/WORDS.2005.32"},{"issue":"1","key":"556_CR6","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"N Chawla","year":"2002","unstructured":"Chawla N, Bowyer K, Hall L, Kegelmeyer W (2002) SMOTE: synthetic minority over-sampling technique. J Artif Intell Res 16(1):321\u2013357","journal-title":"J Artif Intell Res"},{"issue":"6","key":"556_CR7","doi-asserted-by":"crossref","first-page":"476","DOI":"10.1109\/32.295895","volume":"20","author":"SR Chidamber","year":"1994","unstructured":"Chidamber SR, Kemerer CF (1994) A metrics suite for object oriented design. IEEE Trans Softw Eng 20(6):476\u2013493","journal-title":"IEEE Trans Softw Eng"},{"key":"556_CR8","doi-asserted-by":"crossref","unstructured":"D\u2019Ambros M, Lanza M, Robbes R (2010) An extensive comparison of bug prediction approaches. In: Proceedings of MSR 2010 (7th IEEE working conference on mining software repositories). pp 31\u201341","DOI":"10.1109\/MSR.2010.5463279"},{"key":"556_CR9","doi-asserted-by":"crossref","unstructured":"Erni K, Lewerentz C (1996) Applying design-metrics to object-oriented frameworks. In: Proceedings of the third international software metrics symposium. pp 25\u201326","DOI":"10.1109\/METRIC.1996.492444"},{"key":"556_CR10","unstructured":"Fawcett T (2004) ROC graphs: notes and practical considerations for researchers. Technical report, HP Laboratories, Page Mill Road, Palo Alto, 38 pages"},{"issue":"5","key":"556_CR11","doi-asserted-by":"crossref","first-page":"579","DOI":"10.1002\/spe.1043","volume":"41","author":"K Gao","year":"2011","unstructured":"Gao K, Khoshgoftaar K, Wang H, Seliya N (2011) Choosing software metrics for defect prediction: an investigation on feature selection techniques. Softw Pract Exp 41(5):579\u2013606","journal-title":"Softw Pract Exp"},{"issue":"1","key":"556_CR12","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1007\/s11219-011-9132-0","volume":"20","author":"K Gao","year":"2012","unstructured":"Gao K, Khoshgoftaar TM, Seliya N (2012) Predicting high-risk program modules by selecting the right software measurements. Softw Qual J 20(1):3\u201342","journal-title":"Softw Qual J"},{"key":"556_CR13","doi-asserted-by":"crossref","unstructured":"Gray D, Bowes D, Davey N, Sun Y, Christianson B (2011) The misuse of the NASA metrics data program data sets for automated software defect prediction. In: Evaluation and assessment in software engineering (EASE)","DOI":"10.1049\/ic.2011.0012"},{"key":"556_CR01","doi-asserted-by":"crossref","unstructured":"Gyimothy T, Ferenc R, Siket I (2005) Empirical validation of object-oriented metrics on open source software for fault prediction, IEEE Trans Softw Eng 31(10):897\u2013910","DOI":"10.1109\/TSE.2005.112"},{"issue":"1","key":"556_CR14","first-page":"10","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten I (2009) The WEKA data mining software, an update. Special Interest Group Knowl Discov Data Min Explor Newsl 11(1):10\u201318","journal-title":"Special Interest Group Knowl Discov Data Min Explor Newsl"},{"issue":"6","key":"556_CR15","doi-asserted-by":"crossref","first-page":"1276","DOI":"10.1109\/TSE.2011.103","volume":"38","author":"T Hall","year":"2011","unstructured":"Hall T, Beecham S, Bowes D, Gray D, Counsell S (2011) A systematic review of fault prediction performance in software engineering. IEEE Trans Softw Eng 38(6):1276\u20131304","journal-title":"IEEE Trans Softw Eng"},{"issue":"5","key":"556_CR16","first-page":"49","volume":"24","author":"M Hamill","year":"2014","unstructured":"Hamill M, Goseva-Popstojanova K (2014) Exploring the missing link: an empirical study of software fixes. Softw Test Verif Reliab 24(5):49\u201371","journal-title":"Softw Test Verif Reliab"},{"issue":"9","key":"556_CR17","first-page":"1264","volume":"21","author":"H He","year":"2009","unstructured":"He H, Garcia E (2009) Learning from imbalanced data. IEEE Trans Knowl Data Eng 21(9):1264\u20131284","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"556_CR18","unstructured":"Jiang Y, Cukic B, Menzies T (2007) Can data transformation help in the detection of fault-prone modules? In: Proceedings of the 2008 workshop on defects in large software systems. pp 16\u201320"},{"key":"556_CR19","doi-asserted-by":"crossref","first-page":"561","DOI":"10.1007\/s10664-008-9079-3","volume":"13","author":"Y Jiang","year":"2008","unstructured":"Jiang Y, Cukic B, Ma Y (2008) Techniques for evaluating fault prediction models. Empir Softw Eng 13:561\u2013595","journal-title":"Empir Softw Eng"},{"key":"556_CR20","unstructured":"Jindal R, Malhotra R, Jain A (2016) Prediction of defect severity by mining software project reports. Int J Syst Assur Eng Manag 1\u201318"},{"key":"556_CR02","unstructured":"John GH, Langley P (1995) Estimating continuous distributions in Bayesian classifiers. In: Besnard P, Hanks S (eds) Proceedings of the Eleventh Conference on Uncertainty in Artificial Intelligence, pp 338\u2013345"},{"issue":"1","key":"556_CR21","first-page":"21","volume":"9","author":"M Jureczko","year":"2015","unstructured":"Jureczko M, Madeyski L (2015) Cross\u2013project defect prediction with respect to code ownership model: an empirical study. e-Inform Softw Eng J 9(1):21\u201335","journal-title":"e-Inform Softw Eng J"},{"key":"556_CR22","doi-asserted-by":"crossref","unstructured":"Kaur A, Kaur K, Chopra D (2016) An empirical study of software entropy based bug prediction using machine learning. Int J Syst Assur Eng Manag 1\u201318","DOI":"10.1007\/s13198-016-0479-2"},{"key":"556_CR23","doi-asserted-by":"crossref","unstructured":"Kim S, Zimmermann T, Whitehead E, Zeller A (2007) Predicting faults from cached history. In: Proceedings of the 29th international conference on software engineering (ICSE 2007), Minneapolis, 20\u201326 May","DOI":"10.1109\/ICSE.2007.66"},{"key":"556_CR24","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1145\/1370788.1370799","volume-title":"Proceedings of the 4th international workshop on predictor models in software engineering (PROMISE \u201808)","author":"GA Liebchen","year":"2008","unstructured":"Liebchen GA, Shepperd M (2008) Data sets and data quality in software engineering. Proceedings of the 4th international workshop on predictor models in software engineering (PROMISE \u201808). ACM, New York, pp 39\u201344"},{"issue":"2","key":"556_CR25","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1109\/TSE.2007.70768","volume":"34","author":"A Marcus","year":"2008","unstructured":"Marcus A, Poshyvanyk D, Ferenc R (2008) Using the conceptual cohesion of classes for fault prediction in object-oriented systems. IEEE Trans Softw Eng 34(2):287\u2013300","journal-title":"IEEE Trans Softw Eng"},{"key":"556_CR26","unstructured":"Menzies T, DiStefano J, Orrego A, Chapman R (2004) Assessing predictors of software defects. In: Predictive software models workshop"},{"key":"556_CR27","doi-asserted-by":"crossref","first-page":"375","DOI":"10.1007\/s10515-010-0069-5","volume":"17","author":"T Menzies","year":"2010","unstructured":"Menzies T, Milton Z, Turhan B, Cukic B, Jiang Y, Bener A (2010) Defect prediction from static code features: current results, limitations, new approaches. Autom Softw Eng 17:375\u2013407","journal-title":"Autom Softw Eng"},{"key":"556_CR28","doi-asserted-by":"crossref","unstructured":"Mertik M, Lenic M, Stiglic G, Kokol P (2006) Estimating software quality with advanced data mining techniques. In: International conference on software engineering advances. p 19","DOI":"10.1109\/ICSEA.2006.261275"},{"key":"556_CR29","doi-asserted-by":"crossref","unstructured":"Petri\u0107 J, Bowes D, Hall T, Christianson B, Baddoo N (2016) The jinx on the NASA software defect data sets. In: Proceedings of the 20th international conference on evaluation and assessment in software engineering (EASE \u201816). Article 13, 5 pages","DOI":"10.1145\/2915970.2916007"},{"key":"556_CR30","volume-title":"C4.5: Programs for machine learning","author":"JR Quinlan","year":"1993","unstructured":"Quinlan JR (1993) C4.5: Programs for machine learning. Morgan Kaufmann Publishers, San Mateo"},{"issue":"1","key":"556_CR31","first-page":"67","volume":"2","author":"JC Riquelme","year":"2008","unstructured":"Riquelme JC, Ruiz R, Rodr\u00edguez D, Moreno J (2008) Finding defective modules from highly unbalanced datasets. Actas del 8\u00b0 taller sobre el apoyo a la decisi\u00f3n en ingenier\u00eda del software 2(1):67\u201374","journal-title":"Actas del 8\u00b0 taller sobre el apoyo a la decisi\u00f3n en ingenier\u00eda del software"},{"key":"556_CR32","doi-asserted-by":"crossref","unstructured":"Schr\u00f6ter A, Zimmermann T, Zeller A (2006) Predicting component failures at design time. In: Proceedings of the 2006 ACM\/IEEE international symposium on empirical software engineering. ACM, pp 18\u201327","DOI":"10.1145\/1159733.1159739"},{"key":"556_CR33","doi-asserted-by":"crossref","first-page":"571","DOI":"10.1016\/j.ins.2010.12.016","volume":"259","author":"C Seiffert","year":"2014","unstructured":"Seiffert C, Khoshgoftaar TM, Hulse JV, Folleco A (2014) An empirical study of the classification performance of learners on imbalanced and noisy software quality data. Inf Sci 259:571\u2013595","journal-title":"Inf Sci"},{"issue":"2","key":"556_CR34","doi-asserted-by":"crossref","first-page":"216","DOI":"10.1109\/TSE.2010.9","volume":"36","author":"R Shatnawi","year":"2010","unstructured":"Shatnawi R (2010) A quantitative investigation of the acceptable risk levels of object-oriented metrics in open-source systems. IEEE Trans Softw Eng 36(2):216\u2013225","journal-title":"IEEE Trans Softw Eng"},{"issue":"9","key":"556_CR35","doi-asserted-by":"crossref","first-page":"1208","DOI":"10.1109\/TSE.2013.11","volume":"39","author":"M Shepperd","year":"2013","unstructured":"Shepperd M, Song Q, Sun Z, Mair C (2013) Data quality: some comments on the NASA software defect datasets. IEEE Trans Softw Eng 39(9):1208\u20131215","journal-title":"IEEE Trans Softw Eng"},{"key":"556_CR36","volume-title":"FLAIRS Conference","author":"H Wang","year":"2011","unstructured":"Wang H, Khoshgoftaar TM, Seliya N (2011) How many software metrics should be selected for defect prediction? In: Murray RC, McCarthy PM (eds) FLAIRS Conference. AAAI Press, Palo Alto"},{"issue":"10","key":"556_CR37","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1109\/TSE.2006.102","volume":"32","author":"Y Zhou","year":"2006","unstructured":"Zhou Y, Leung H (2006) Empirical analysis of object-oriented design metrics for predicting high and low severity faults. IEEE Trans Softw Eng 32(10):771\u2013789","journal-title":"IEEE Trans Softw Eng"},{"issue":"1","key":"556_CR38","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/2556777","volume":"23","author":"Y Zhou","year":"2014","unstructured":"Zhou Y, Xu B, Leung H, Chen L (2014) An in-depth study of the potentially confounding effect of class size in fault prediction. ACM Trans Softw Eng Methodol 23(1):1\u201351","journal-title":"ACM Trans Softw Eng Methodol"}],"container-title":["International Journal of System Assurance Engineering and Management"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s13198-016-0556-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13198-016-0556-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13198-016-0556-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,16]],"date-time":"2019-09-16T19:03:50Z","timestamp":1568660630000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s13198-016-0556-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,12,24]]},"references-count":40,"journal-issue":{"issue":"S2","published-print":{"date-parts":[[2017,11]]}},"alternative-id":["556"],"URL":"https:\/\/doi.org\/10.1007\/s13198-016-0556-6","relation":{},"ISSN":["0975-6809","0976-4348"],"issn-type":[{"type":"print","value":"0975-6809"},{"type":"electronic","value":"0976-4348"}],"subject":[],"published":{"date-parts":[[2016,12,24]]}}}