{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T23:17:14Z","timestamp":1771024634526,"version":"3.50.1"},"reference-count":85,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"8","license":[{"start":{"date-parts":[[2021,8,1]],"date-time":"2021-08-01T00:00:00Z","timestamp":1627776000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,8,1]],"date-time":"2021-08-01T00:00:00Z","timestamp":1627776000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,8,1]],"date-time":"2021-08-01T00:00:00Z","timestamp":1627776000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2018YFB1003904"],"award-info":[{"award-number":["2018YFB1003904"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"name":"NSFC Program","award":["61602403"],"award-info":[{"award-number":["61602403"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IIEEE Trans. Software Eng."],"published-print":{"date-parts":[[2021,8,1]]},"DOI":"10.1109\/tse.2019.2929761","type":"journal-article","created":{"date-parts":[[2019,7,18]],"date-time":"2019-07-18T19:59:40Z","timestamp":1563479980000},"page":"1559-1586","source":"Crossref","is-referenced-by-count":70,"title":["The Impact of Mislabeled Changes by SZZ on Just-in-Time Defect Prediction"],"prefix":"10.1109","volume":"47","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5234-0152","authenticated-orcid":false,"given":"Yuanrui","family":"Fan","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6302-3256","authenticated-orcid":false,"given":"Xin","family":"Xia","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4525-3266","authenticated-orcid":false,"given":"Daniel Alencar","family":"da Costa","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4367-7201","authenticated-orcid":false,"given":"David","family":"Lo","sequence":"additional","affiliation":[]},{"given":"Ahmed E.","family":"Hassan","sequence":"additional","affiliation":[]},{"given":"Shanping","family":"Li","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2016.2584050"},{"key":"ref72","first-page":"812","article-title":"The impact of mislabelling on the performance and interpretation of defect prediction models","author":"tantithamthavorn","year":"2015","journal-title":"Proceedings of the International Conference on Software Engineering ICSE'94"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2018.2876537"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1145\/3183519.3183547"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.2307\/3001968"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1145\/1390817.1390826"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2018.2794977"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/1985793.1985859"},{"key":"ref75","first-page":"5","article-title":"Understanding widespread changes: A taxonomic study","author":"wang","year":"2013","journal-title":"Proc European Conf Software Maintenance and Reengineering"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2007.70773"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1145\/1370750.1370754"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-017-9514-4"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2005.50"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1002\/SERIES1345"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-015-9376-6"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2013.6606585"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2012.70"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-015-9400-x"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2013.6693087"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICSME.2017.51"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/MSR.2017.4"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1145\/1852786.1852792"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.2307\/2529204"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2012.43"},{"key":"ref28","first-page":"1","article-title":"rms: Regression modeling strategies","author":"harrell","year":"2019"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/MSR.2017.14"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-3462-1"},{"key":"ref65","first-page":"1","article-title":"When do changes induce fixes?","volume":"30","author":"?liwerski","year":"2005","journal-title":"Proc of International Workshop on Mining Software Repositories"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2012.19"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2009.5070510"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/MS.2010.63"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2018.2836442"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2015.139"},{"key":"ref2","first-page":"103","article-title":"Bonferroni and &#x0160;id&#x00E1;k corrections for multiple comparisons","volume":"3","author":"abdi","year":"2007","journal-title":"Encyclopedia of Measurement and Statistics N"},{"key":"ref1","year":"2018"},{"key":"ref20","author":"fowler","year":"1999","journal-title":"Refactoring Improving the Design of Existing Code"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/2597073.2597075"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3106237.3106257"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/1806799.1806871"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/2372251.2372285"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2009.3"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2011.103"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2017.2693980"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2012.83"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2005.74"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.2307\/1402731"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1145\/1013886.1007524"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/SANER.2018.8330225"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/1368088.1368114"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1002\/bltj.2229"},{"key":"ref53","article-title":"VCD: Visualizing categorical data","author":"meyer","year":"2017"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/s10515-010-0069-5"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1002\/stvr.1570"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2010.10.024"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2006.23"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.4324\/9781315806730"},{"key":"ref13","article-title":"Ma-SZZ implementation for SVN repositories","author":"da costa","year":"2019"},{"key":"ref14","article-title":"Refactoring-aware SZZ (RA-SZZ) implementation","author":"da costa","year":"2019"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2016.2616306"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/QRS.2015.14"},{"key":"ref16","first-page":"107","article-title":"Comparing text-based and dependence-based approaches for determining the origins of bugs","volume":"26","author":"davies","year":"2014","journal-title":"Journal of Software: Evolution and Process"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2017.03.007"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007413511361"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1002\/0470011815.b2a15150"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1201\/9780429246593"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1145\/2950290.2950353"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2018.2864217"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2016.2543218"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/1882291.1882308"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/1463788.1463819"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/1595696.1595716"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/SCAM.2012.20"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1145\/1137983.1138001"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1023\/A:1010933404324"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CSMR.2013.19"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/1868328.1868356"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICST.2013.38"},{"key":"ref46","first-page":"18","article-title":"Classification and regression by RandomForest","volume":"2","author":"liaw","year":"2002","journal-title":"R News"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-016-9467-z"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177730491"},{"key":"ref47","article-title":"Naivebayes: High performance implementation of the naive bayes algorithm","author":"majka","year":"2019"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2008.90"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICECCS.2014.25"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2008.35"},{"key":"ref43","first-page":"179","article-title":"Addressing the curse of imbalanced training sets: One-sided selection","volume":"97","author":"kubat","year":"1997","journal-title":"Proc Int Conf Mach Learn"}],"container-title":["IEEE Transactions on Software Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/32\/9512528\/08765743.pdf?arnumber=8765743","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T14:50:06Z","timestamp":1652194206000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8765743\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,1]]},"references-count":85,"journal-issue":{"issue":"8"},"URL":"https:\/\/doi.org\/10.1109\/tse.2019.2929761","relation":{},"ISSN":["0098-5589","1939-3520","2326-3881"],"issn-type":[{"value":"0098-5589","type":"print"},{"value":"1939-3520","type":"electronic"},{"value":"2326-3881","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,8,1]]}}}