{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T13:19:03Z","timestamp":1773839943646,"version":"3.50.1"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2016,3,22]],"date-time":"2016-03-22T00:00:00Z","timestamp":1458604800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Nature Science Foundation of China","doi-asserted-by":"crossref","award":["61272273"],"award-info":[{"award-number":["61272273"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Nature Science Foundation of China","doi-asserted-by":"crossref","award":["61073113"],"award-info":[{"award-number":["61073113"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Graduate Student Innovation Research Project of Jiangsu Province in China","award":["CXZZ12_0478"],"award-info":[{"award-number":["CXZZ12_0478"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Autom Softw Eng"],"published-print":{"date-parts":[[2017,3]]},"DOI":"10.1007\/s10515-016-0194-x","type":"journal-article","created":{"date-parts":[[2016,3,22]],"date-time":"2016-03-22T11:04:41Z","timestamp":1458644681000},"page":"47-69","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":102,"title":["Label propagation based semi-supervised learning for software defect prediction"],"prefix":"10.1007","volume":"24","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2346-580X","authenticated-orcid":false,"given":"Zhi-Wu","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Xiao-Yuan","family":"Jing","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Tie-Jian","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,3,22]]},"reference":[{"issue":"1","key":"194_CR1","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GE Batista","year":"2004","unstructured":"Batista, G.E., Prati, R.C., Monard, M.C.: A study of the behavior of several methods for balancing machine learning training data. ACM Sigkdd Explorations Newsletter. 6(1), 20\u201329 (2004)","journal-title":"ACM Sigkdd Explorations Newsletter."},{"issue":"11","key":"194_CR2","first-page":"2399","volume":"7","author":"M Belkin","year":"2006","unstructured":"Belkin, M., Niyogi, P., Sindhwani, V.: Manifold regularization: A geometric framework for learning from labeled and unlabeled examples. J. Mach. Learn. Res. 7(11), 2399\u20132434 (2006)","journal-title":"J. Mach. Learn. Res."},{"issue":"4","key":"194_CR3","doi-asserted-by":"crossref","first-page":"7346","DOI":"10.1016\/j.eswa.2008.10.027","volume":"36","author":"C Catal","year":"2009","unstructured":"Catal, C., Diri, B.: A systematic review of software fault prediction studies. Expert Syst. Appl. 36(4), 7346\u20137354 (2009a)","journal-title":"Expert Syst. Appl."},{"issue":"5","key":"194_CR4","doi-asserted-by":"crossref","first-page":"458","DOI":"10.1111\/j.1468-0394.2009.00509.x","volume":"26","author":"C Catal","year":"2009","unstructured":"Catal, C., Diri, B.: Unlabelled extra data do not always mean extra performance for semi-supervised fault prediction. Expert Syst. 26(5), 458\u2013471 (2009b)","journal-title":"Expert Syst."},{"issue":"1","key":"194_CR5","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1515\/jisys-2013-0030","volume":"23","author":"C Catal","year":"2014","unstructured":"Catal, C.: A comparison of semi-supervised classification approaches for software defect prediction. J. Intell. Syst. 23(1), 75\u201382 (2014)","journal-title":"J. Intell. Syst."},{"issue":"12","key":"194_CR6","doi-asserted-by":"crossref","first-page":"1755","DOI":"10.1093\/ptj\/77.12.1755","volume":"77","author":"Y Chan","year":"1997","unstructured":"Chan, Y., Walmsley, R.P.: Learning and understanding the Kruskal-Wallis one-way analysis-of-variance-by-ranks test for differences among three or more independent groups. Phys. Ther. 77(12), 1755\u20131761 (1997)","journal-title":"Phys. Ther."},{"key":"194_CR7","unstructured":"Chapelle, O., Zien, A.: Semi-supervised classification by low density separation. In: Proceedings of the 10th International Workshop on Artificial Intelligence and Statistics, pp. 57\u201364 (2005)"},{"key":"194_CR8","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla, N.V., Bowyer, K.W., Hall, L.O., Kegelmeyer, W.P.: SMOTE: synthetic minority over-sampling technique. J. Artifici. Intell. Res. 16, 321\u2013357 (2002)","journal-title":"J. Artifici. Intell. Res."},{"issue":"1","key":"194_CR9","doi-asserted-by":"crossref","first-page":"174","DOI":"10.1109\/TPAMI.2007.70765","volume":"30","author":"M Culp","year":"2008","unstructured":"Culp, M., Michailidis, G.: Graph-based semisupervised learning. IEEE Trans. Pattern Anal. Mach. Intell. 30(1), 174\u2013179 (2008)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"8","key":"194_CR10","doi-asserted-by":"crossref","first-page":"797","DOI":"10.1109\/32.879815","volume":"26","author":"N Fenton","year":"2000","unstructured":"Fenton, N., Ohlsson, N.: Quantitative analysis of faults and failures in a complex software system. IEEE Trans. Softw. Eng. 26(8), 797\u2013814 (2000)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"194_CR11","unstructured":"Gao, K., Khoshgoftaar, T. M.: Software defect prediction for high-dimensional and class-imbalanced data. In: Proceedings of the 23rd International Conference on Software Engineering and Knowledge Engineering, pp. 89\u201394 (2011)"},{"issue":"1","key":"194_CR12","first-page":"145004","volume":"21","author":"K Gao","year":"2014","unstructured":"Gao, K., Khoshgoftaar, T.M., Wald, R.: The use of under- and oversampling within ensemble feature selection and classification for\u00a0software\u00a0quality\u00a0prediction. Int. J. Reliab. Qual. Saf. Eng. 21(1), 145004 (2014)","journal-title":"Int. J. Reliab. Qual. Saf. Eng."},{"key":"194_CR13","unstructured":"Goldman, S., Zhou, Y.: Enhancing supervised learning with unlabeled data. In: Proceedings of the 17th International Conference on Machine Learning, pp. 327\u2013334 (2000)"},{"key":"194_CR14","unstructured":"Grandvalet, Y., Bengio, Y.: Semi-supervised learning by entropy minimization. In: Advances in neural information processing systems, pp. 529\u2013536 (2004)"},{"key":"194_CR15","doi-asserted-by":"crossref","unstructured":"Gray, D., Bowes, D., Davey, N., Sun, Y., Christianson, B.: The misuse of the NASA metrics data program data sets for automated software defect prediction. In: Proceedings of 15th Annual Conference on Evaluation and Assessment in Software Engineering, pp. 96\u2013103 (2011)","DOI":"10.1049\/ic.2011.0012"},{"issue":"6","key":"194_CR16","doi-asserted-by":"crossref","first-page":"1276","DOI":"10.1109\/TSE.2011.103","volume":"38","author":"T Hall","year":"2012","unstructured":"Hall, T., Beecham, S., Bowes, D., Gray, D., Counsell, S.: A systematic literature review on fault prediction performance in software engineering. IEEE Trans. Softw. Eng. 38(6), 1276\u20131304 (2012)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"194_CR17","unstructured":"He, X., Cai, D., Niyogi, P.: Laplacian score for feature selection. In: Advances in Neural Information Processing Systems, pp. 507\u2013514 (2005)"},{"issue":"2","key":"194_CR18","doi-asserted-by":"crossref","first-page":"328","DOI":"10.1007\/s11390-011-9439-0","volume":"26","author":"Y Jiang","year":"2011","unstructured":"Jiang, Y., Li, M., Zhou, Z.H.: Software defect detection with ROCUS. J. Comput. Sci. Technol. 26(2), 328\u2013342 (2011)","journal-title":"J. Comput. Sci. Technol."},{"key":"194_CR19","doi-asserted-by":"crossref","unstructured":"Jing, X. Y., Ying, S., Zhang, Z. W., Wu, S. S., Liu, J.: Dictionary learning based software defect prediction. In:\u00a0Proceedings of the 36th International Conference on Software Engineering, pp. 414-423 (2014a)","DOI":"10.1145\/2568225.2568320"},{"key":"194_CR20","doi-asserted-by":"crossref","unstructured":"Jing, X. Y., Zhang, Z. W., Ying, S., Wang, F., Zhu, Y. P.: Software defect prediction based on collaborative representation classification. In:\u00a0Companion Proceedings of the 36th International Conference on Software Engineering, pp. 632\u2013633 (2014b)","DOI":"10.1145\/2591062.2591151"},{"key":"194_CR21","unstructured":"Joachims, T.: Transductive inference for text classification using support vector machines. In: Proceedings of the 16th International Conference on Machine Learning, pp 200\u2013209 (1999)"},{"key":"194_CR22","doi-asserted-by":"crossref","unstructured":"Khoshgoftaar, T. M., Gao, K., Seliya, N.: Attribute selection and imbalanced data: problems in software defect prediction. In: Proceedings of the 22nd IEEE International Conference on Tools with Artificial Intelligence, pp. 137\u2013144 (2010)","DOI":"10.1109\/ICTAI.2010.27"},{"key":"194_CR23","unstructured":"Kubat, M., Matwin, S.: Addressing the curse of imbalanced training sets: one-sided selection. In: Proceedings of the 14th International Conference on Machine Learning, pp 179\u2013186 (1997)"},{"key":"194_CR24","doi-asserted-by":"crossref","first-page":"388","DOI":"10.1016\/j.infsof.2014.07.005","volume":"58","author":"IH Laradji","year":"2015","unstructured":"Laradji, I.H., Alshayeb, M., Ghouti, L.: Software defect prediction using ensemble learning on selected features. Inf. Softw. Technol. 58, 388\u2013402 (2015)","journal-title":"Inf. Softw. Technol."},{"issue":"2","key":"194_CR25","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1007\/s10515-011-0092-1","volume":"19","author":"M Li","year":"2012","unstructured":"Li, M., Zhang, H., Wu, R., Zhou, Z.H.: Sample-based software defect prediction with active and semi-supervised learning. Autom. Softw. Eng. 19(2), 201\u2013230 (2012)","journal-title":"Autom. Softw. Eng."},{"key":"194_CR26","unstructured":"Li, S., Fu, Y.: Low-rank coding with b-matching constraint for semi-supervised classification. In:\u00a0Proceedings of the 23th International Joint Conference on Artificial Intelligence, pp. 1472\u20131478 (2013)"},{"key":"194_CR27","doi-asserted-by":"crossref","unstructured":"Lu, H., Cukic, B., Culp, M.: An iterative semi-supervised approach to software fault prediction. In:\u00a0Proceedings of the 7th International Conference on Predictive Models in Software Engineering\u00a0(Article 15) (2011)","DOI":"10.1145\/2020390.2020405"},{"key":"194_CR28","doi-asserted-by":"crossref","unstructured":"Lu, H., Cukic, B., Culp, M.: Software defect prediction using semi-supervised learning with dimension reduction. In:\u00a0Proceedings of the 27th IEEE\/ACM International Conference on Automated Software Engineering, pp. 314\u2013317 (2012)","DOI":"10.1145\/2351676.2351734"},{"key":"194_CR29","doi-asserted-by":"crossref","unstructured":"Lyu, M. R.: Software reliability engineering: a roadmap. In:\u00a02007 Future of Software Engineering, pp. 153\u2013170 (2007)","DOI":"10.1109\/FOSE.2007.24"},{"key":"194_CR30","doi-asserted-by":"crossref","first-page":"308","DOI":"10.1109\/TSE.1976.233837","volume":"4","author":"TJ McCabe","year":"1976","unstructured":"McCabe, T.J.: A complexity measure. IEEE Trans. Softw. Eng. 4, 308\u2013320 (1976)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"1","key":"194_CR31","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1109\/TSE.2007.256941","volume":"33","author":"T Menzies","year":"2007","unstructured":"Menzies, T., Greenwald, J., Frank, A.: Data mining static code attributes to learn defect predictors. IEEE Trans. Softw. Eng. 33(1), 2\u201313 (2007)","journal-title":"IEEE Trans. Softw. Eng."},{"key":"194_CR32","unstructured":"Miller, D. J., Uyar, H. S.: A mixture of experts classifier with learning based on both labelled and unlabelled data. In: Advances in neural information processing systems, pp. 571\u2013577 (1997)"},{"key":"194_CR33","doi-asserted-by":"crossref","unstructured":"Nam, J., Pan, S. J., Kim, S.: Transfer defect learning. In: Proceedings of the 35th International Conference on Software Engineering, pp. 382\u2013391 (2013)","DOI":"10.1109\/ICSE.2013.6606584"},{"issue":"2\u20133","key":"194_CR34","doi-asserted-by":"crossref","first-page":"103","DOI":"10.1023\/A:1007692713085","volume":"39","author":"K Nigam","year":"2000","unstructured":"Nigam, K., McCallum, A.K., Thrun, S., Mitchell, T.: Text classification from labeled and unlabeled documents using EM. Mach. Learn. 39(2\u20133), 103\u2013134 (2000)","journal-title":"Mach. Learn."},{"key":"194_CR35","doi-asserted-by":"crossref","unstructured":"Pelayo, L, Dick, S.: Applying novel resampling strategies to software defect prediction. In: Proceedings of the 2007 Annual Meeting of the North American Fuzzy Information Processing Society, pp. 69\u201372 (2007)","DOI":"10.1109\/NAFIPS.2007.383813"},{"issue":"3","key":"194_CR36","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1007\/s11219-007-9013-8","volume":"15","author":"N Seliya","year":"2007","unstructured":"Seliya, N., Khoshgoftaar, T.M.: Software quality estimation with limited fault data: a semi-supervised learning perspective. Softw. Qual. J. 15(3), 327\u2013344 (2007a)","journal-title":"Softw. Qual. J."},{"issue":"2","key":"194_CR37","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1109\/TSMCA.2006.889473","volume":"37","author":"N Seliya","year":"2007","unstructured":"Seliya, N., Khoshgoftaar, T.M.: Software quality analysis of unlabeled program modules with semisupervised clustering. IEEE Trans. Syst. Man. Cyber. 37(2), 201\u2013211 (2007b)","journal-title":"IEEE Trans. Syst. Man. Cyber."},{"issue":"5","key":"194_CR38","doi-asserted-by":"crossref","first-page":"1087","DOI":"10.1109\/36.312897","volume":"32","author":"BM Shahshahani","year":"1994","unstructured":"Shahshahani, B.M., Landgrebe, D.: The effect of unlabeled samples in reducing the small sample size problem and mitigating the Hughes phenomenon. IEEE Trans. Geosci. Remote Sens. 32(5), 1087\u20131095 (1994)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"issue":"9","key":"194_CR39","doi-asserted-by":"crossref","first-page":"1208","DOI":"10.1109\/TSE.2013.11","volume":"39","author":"M Shepperd","year":"2013","unstructured":"Shepperd, M., Song, Q., Sun, Z., Mair, C.: Data quality: some comments on the NASA software defect datasets. IEEE Trans. Softw. Eng. 39(9), 1208\u20131215 (2013)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"6","key":"194_CR40","doi-asserted-by":"crossref","first-page":"1806","DOI":"10.1109\/TSMCC.2012.2226152","volume":"42","author":"ZB Sun","year":"2012","unstructured":"Sun, Z.B., Song, Q.B., Zhu, X.Y.: Using coding based ensemble learning to improve software defect prediction. IEEE Trans. Syst. Man Cyber. C 42(6), 1806\u20131817 (2012)","journal-title":"IEEE Trans. Syst. Man Cyber. C"},{"issue":"5","key":"194_CR41","doi-asserted-by":"crossref","first-page":"540","DOI":"10.1007\/s10664-008-9103-7","volume":"14","author":"B Turhan","year":"2009","unstructured":"Turhan, B., Menzies, T., Bener, A.: On the relative value of cross-company and within-company data for defect prediction. Empirical Softw. Eng. 14(5), 540\u2013578 (2009)","journal-title":"Empirical Softw. Eng."},{"issue":"1","key":"194_CR42","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1109\/TKDE.2007.190672","volume":"20","author":"F Wang","year":"2008","unstructured":"Wang, F., Zhang, C.: Label propagation through linear neighborhoods. IEEE Trans. Knowl. Data Eng. 20(1), 55\u201367 (2008)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"2","key":"194_CR43","doi-asserted-by":"crossref","first-page":"434","DOI":"10.1109\/TR.2013.2259203","volume":"62","author":"S Wang","year":"2013","unstructured":"Wang, S., Yao, X.: Using class imbalance learning for software defect prediction. IEEE Trans. Reliab. 62(2), 434\u2013443 (2013)","journal-title":"IEEE Trans. Reliab."},{"issue":"2","key":"194_CR44","doi-asserted-by":"crossref","first-page":"210","DOI":"10.1109\/TPAMI.2008.79","volume":"31","author":"J Wright","year":"2009","unstructured":"Wright, J., Yang, A.Y., Ganesh, A., Sastry, S.S., Ma, Y.: Robust Face Recognition via Sparse Representation. IEEE Trans. Pattern Anal. Mach. Intell. 31(2), 210\u2013227 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"194_CR45","doi-asserted-by":"crossref","unstructured":"Xu, J., Man, H.: Dictionary learning based on laplacian score in sparse coding. In:\u00a0Machine Learning and Data Mining in Pattern Recognition, pp.253\u2013264 (2011)","DOI":"10.1007\/978-3-642-23199-5_19"},{"issue":"16","key":"194_CR46","first-page":"321","volume":"16","author":"D Zhou","year":"2004","unstructured":"Zhou, D., Bousquet, O., Lal, T.N., Weston, J., Sch\u00f6lkopf, B.: Learning with local and global consistency. Adv. Neural Inf. Process. Syst. 16(16), 321\u2013328 (2004)","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"11","key":"194_CR47","doi-asserted-by":"crossref","first-page":"1529","DOI":"10.1109\/TKDE.2005.186","volume":"17","author":"Z-H Zhou","year":"2005","unstructured":"Zhou, Z.-H., Li, M.: Tri-training: Exploiting unlabeled data using three classifiers. IEEE Trans. Knowl. Data Eng. 17(11), 1529\u20131541 (2005)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"11","key":"194_CR48","doi-asserted-by":"crossref","first-page":"1479","DOI":"10.1109\/TKDE.2007.190644","volume":"19","author":"Z-H Zhou","year":"2007","unstructured":"Zhou, Z.-H., Li, M.: Semi-supervised regression with co-training style algorithms. IEEE Trans. Knowl. Data Eng. 19(11), 1479\u20131493 (2007)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"194_CR49","unstructured":"Zhu, X.: Semi-supervised learning with graphs. PhD thesis, Carnegie Mellon University (2005)"},{"key":"194_CR50","unstructured":"Zhu, X., Ghahramani, Z.: Learning from labeled and unlabeled data with label propagation. Technical Report CMU-CALD-02-107, Carnegie Mellon University (2002)"},{"key":"194_CR51","unstructured":"Zhu, X., Ghahramani, Z., Lafferty, J.: Semi-supervised learning using gaussian fields and harmonic functions. In:\u00a0Proceedings of the 20th International Conference on Machine Learning, pp. 912\u2013919 (2003)"}],"container-title":["Automated Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-016-0194-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10515-016-0194-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-016-0194-x","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-016-0194-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,9,17]],"date-time":"2020-09-17T15:56:21Z","timestamp":1600358181000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10515-016-0194-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3,22]]},"references-count":51,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,3]]}},"alternative-id":["194"],"URL":"https:\/\/doi.org\/10.1007\/s10515-016-0194-x","relation":{},"ISSN":["0928-8910","1573-7535"],"issn-type":[{"value":"0928-8910","type":"print"},{"value":"1573-7535","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,3,22]]}}}