{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T10:03:13Z","timestamp":1763114593413,"version":"3.37.3"},"reference-count":74,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2023,3,7]],"date-time":"2023-03-07T00:00:00Z","timestamp":1678147200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,3,7]],"date-time":"2023-03-07T00:00:00Z","timestamp":1678147200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2023,5]]},"DOI":"10.1007\/s10618-023-00925-9","type":"journal-article","created":{"date-parts":[[2023,4,4]],"date-time":"2023-04-04T15:17:56Z","timestamp":1680621476000},"page":"1301-1325","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["A two-step anomaly detection based method for PU classification in imbalanced data sets"],"prefix":"10.1007","volume":"37","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3254-2555","authenticated-orcid":false,"given":"Carlos","family":"Ortega V\u00e1zquez","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8781-3906","authenticated-orcid":false,"given":"Seppe","family":"vanden Broucke","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6151-0504","authenticated-orcid":false,"given":"Jochen","family":"De Weerdt","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,7]]},"reference":[{"issue":"12","key":"925_CR1","doi-asserted-by":"publisher","first-page":"1215","DOI":"10.1002\/int.10143","volume":"18","author":"J Abell\u00e1n","year":"2003","unstructured":"Abell\u00e1n J, Moral S (2003) Building classification trees using the total uncertainty criterion. Int J Intell Syst 18(12):1215\u20131225","journal-title":"Int J Intell Syst"},{"key":"925_CR2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-47578-3","volume-title":"Outlier Analysis","author":"CC Aggarwal","year":"2017","unstructured":"Aggarwal CC (2017) Outlier Analysis. Springer, New York"},{"key":"925_CR3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-54765-7","volume-title":"Outlier Ensembles: An Introduction","author":"CC Aggarwal","year":"2017","unstructured":"Aggarwal CC, Sathe S (2017) Outlier Ensembles: An Introduction. Springer, Cham, Switzerland"},{"key":"925_CR4","unstructured":"Alcal\u00e1-Fdez J, Fern\u00e1ndez A, Luengo J, Derrac J, Garc\u00eda S, S\u00e1nchez L, Herrera F (2011) Keel data-mining software tool: data set repository, integration of algorithms and experimental analysis framework. J Multiple-Valued Logic & Soft Comput. 17"},{"key":"925_CR5","doi-asserted-by":"publisher","DOI":"10.1002\/9781119146841","volume-title":"Fraud Analytics Using Descriptive, Predictive, and Social Network Techniques: a Guide to Data Science for Fraud Detection","author":"B Baesens","year":"2015","unstructured":"Baesens B, Van Vlasselaer V, Verbeke W (2015) Fraud Analytics Using Descriptive, Predictive, and Social Network Techniques: a Guide to Data Science for Fraud Detection. John Wiley & Sons, New Jersey"},{"key":"925_CR6","doi-asserted-by":"crossref","unstructured":"Baesens B, H\u00f6ppner S, Ortner I, Verdonck T (2021) robRose: a robust approach for dealing with imbalanced data in fraud detection. Stat Methods Appl 1\u201321","DOI":"10.1007\/s10260-021-00573-7"},{"key":"925_CR7","doi-asserted-by":"publisher","first-page":"719","DOI":"10.1007\/s10994-020-05877-5","volume":"109","author":"J Bekker","year":"2020","unstructured":"Bekker J, Davis J (2020) Learning from positive and unlabeled data: a survey. Mach Learn 109:719\u2013760","journal-title":"Mach Learn"},{"key":"925_CR8","doi-asserted-by":"crossref","unstructured":"Bekker J, Davis J (2018) Estimating the class prior in positive and unlabeled data through decision tree induction. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol 32","DOI":"10.1609\/aaai.v32i1.11715"},{"key":"925_CR9","doi-asserted-by":"crossref","unstructured":"Bekker J, Robberechts P, Davis J (2019) Beyond the selected completely at random assumption for learning from positive and unlabeled data. In: Joint European Conference on Machine Learning and Knowledge Discovery in Databases, pp 71\u201385. Springer","DOI":"10.1007\/978-3-030-46147-8_5"},{"issue":"2","key":"925_CR10","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1145\/335191.335388","volume":"29","author":"M Breunig","year":"2000","unstructured":"Breunig M, Kriegel H, Ng R, Sander J (2000) LOF: identifying density-based local outliers. Sigmod Rec 29(2):93\u2013104","journal-title":"Sigmod Rec"},{"key":"925_CR11","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1613\/jair.606","volume":"11","author":"C Brodley","year":"1999","unstructured":"Brodley C, Friedl M (1999) Identifying mislabeled training data. J Artif Intell Res 11:131\u2013167","journal-title":"J Artif Intell Res"},{"issue":"4","key":"925_CR12","doi-asserted-by":"publisher","first-page":"891","DOI":"10.1007\/s10618-015-0444-8","volume":"30","author":"GO Campos","year":"2016","unstructured":"Campos GO, Zimek A, Sander J, Campello RJ, Micenkov\u00e1 B, Schubert E, Assent I, Houle ME (2016) On the evaluation of unsupervised outlier detection: measures, datasets, and an empirical study. Data Min Knowl Disc 30(4):891\u2013927","journal-title":"Data Min Knowl Disc"},{"issue":"12","key":"925_CR13","doi-asserted-by":"publisher","first-page":"4451","DOI":"10.1016\/j.patcog.2012.05.002","volume":"45","author":"J Cao","year":"2012","unstructured":"Cao J, Kwong S, Wang R (2012) A noise-detection based adaboost algorithm for mislabeled data. Pattern Recogn 45(12):4451\u20134465","journal-title":"Pattern Recogn"},{"key":"925_CR14","doi-asserted-by":"crossref","unstructured":"Caron L, Dionne G (1999) Insurance fraud estimation: more evidence from the quebec automobile insurance industry, 175\u2013182","DOI":"10.1007\/978-1-4615-4058-8_9"},{"key":"925_CR15","doi-asserted-by":"crossref","unstructured":"Chapelle O, Sch\u00f6lkopf B, Zien A, et al (2006) Semi-supervised learning, vol. 2. Cambridge: MIT Press. Cortes C, Mohri M(2014). Domain adaptation and sample bias correction theory and algorithm for regression. Theoretical Computer Science. 519:103126","DOI":"10.1016\/j.tcs.2013.09.027"},{"key":"925_CR16","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"issue":"2","key":"925_CR17","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1007\/s10618-008-0087-0","volume":"17","author":"NV Chawla","year":"2008","unstructured":"Chawla NV, Cieslak DA, Hall LO, Joshi A (2008) Automatically countering imbalance and its empirical relationship to cost. Data Min Knowl Disc 17(2):225\u2013252","journal-title":"Data Min Knowl Disc"},{"key":"925_CR18","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) Xgboost: A scalable tree boosting system. In: Krishnapuram B, Shah M, Smola AJ, Aggarwal CC, Shen D, Rastogi R (eds.) Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining 13-17, 2016, pp 785\u2013794. ACM, San Francisco","DOI":"10.1145\/2939672.2939785"},{"key":"925_CR19","unstructured":"Christoffel M, Niu G, Sugiyama M (2016) Class-prior estimation for learning from positive and unlabeled data. In: Asian Conference on Machine Learning, pp 221\u2013236. PMLR"},{"key":"925_CR20","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1016\/j.neucom.2014.10.081","volume":"160","author":"M Claesen","year":"2015","unstructured":"Claesen M, De Smet F, Suykens JA, De Moor B (2015) A robust ensemble approach to learn from positive and unlabeled data using svm base models. Neurocomputing 160:73\u201384","journal-title":"Neurocomputing"},{"issue":"10","key":"925_CR21","doi-asserted-by":"publisher","first-page":"4915","DOI":"10.1016\/j.eswa.2014.02.026","volume":"41","author":"A Dal Pozzolo","year":"2014","unstructured":"Dal Pozzolo A, Caelen O, Le Borgne Y-A, Waterschoot S, Bontempi G (2014) Learned lessons in credit card fraud detection from a practitioner perspective. Expert Syst Appl 41(10):4915\u20134928. https:\/\/doi.org\/10.1016\/j.eswa.2014.02.026","journal-title":"Expert Syst Appl"},{"key":"925_CR22","doi-asserted-by":"crossref","unstructured":"De\u00a0Comit\u00e9 F, Denis F, Gilleron R, Letouzey F (1999) Positive and unlabeled examples help learning. In: International Conference on Algorithmic Learning Theory, pp 219\u2013230 . Springer","DOI":"10.1007\/3-540-46769-6_18"},{"key":"925_CR23","first-page":"1","volume":"7","author":"J Dem\u0161ar","year":"2006","unstructured":"Dem\u0161ar J (2006) Statistical comparisons of classifiers over multiple data sets. The J Mach Learn Res 7:1\u201330","journal-title":"The J Mach Learn Res"},{"issue":"1","key":"925_CR24","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.tcs.2005.09.007","volume":"348","author":"F Denis","year":"2005","unstructured":"Denis F, Gilleron R, Letouzey F (2005) Learning from positive and unlabeled examples. Theor Comput Sci 348(1):70\u201383","journal-title":"Theor Comput Sci"},{"issue":"4","key":"925_CR25","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1007\/s10994-016-5604-6","volume":"106","author":"MC du Plessis","year":"2017","unstructured":"du Plessis MC, Niu G, Sugiyama M (2017) Class-prior estimation for learning from positive and unlabeled data. Mach Learn 106(4):463\u2013492","journal-title":"Mach Learn"},{"key":"925_CR26","unstructured":"Du\u00a0Plessis M, Niu G, Sugiyama M (2015) Convex formulation for learning from positive and unlabeled data. In: International Conference on Machine Learning, pp 1386\u20131394. PMLR"},{"key":"925_CR27","doi-asserted-by":"crossref","unstructured":"Elkan C, Noto K (2008) Learning classifiers from only positive and unlabeled data. In: Proceedings of the 14th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp 213\u2013220","DOI":"10.1145\/1401890.1401920"},{"key":"925_CR28","unstructured":"Emmott A, Das S, Dietterich T, Fern A, Wong W-K (2015) A meta-analysis of the anomaly detection problem. Preprint at https:\/\/arxiv.org\/pdf\/1503.01158.pdf"},{"issue":"18","key":"925_CR29","doi-asserted-by":"publisher","first-page":"2378","DOI":"10.1016\/j.fss.2007.12.023","volume":"159","author":"A Fern\u00e1ndez","year":"2008","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, del Jesus MJ, Herrera F (2008) A study of the behaviour of linguistic fuzzy rule based classification systems in the framework of imbalanced data-sets. Fuzzy Sets Syst 159(18):2378\u20132398","journal-title":"Fuzzy Sets Syst"},{"key":"925_CR30","doi-asserted-by":"crossref","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati RC, Krawczyk B, Herrera F (2018) Learning from Imbalanced Data Sets vol. 11. Springer","DOI":"10.1007\/978-3-319-98074-4"},{"issue":"5","key":"925_CR31","doi-asserted-by":"publisher","first-page":"845","DOI":"10.1109\/TNNLS.2013.2292894","volume":"25","author":"B Frenay","year":"2014","unstructured":"Frenay B, Verleysen M (2014) Classification in the presence of label noise: a survey. IEEE Trans Neural Netw Learn Syst 25(5):845\u2013869","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"issue":"1","key":"925_CR32","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1016\/j.knosys.2011.06.013","volume":"25","author":"V Garc\u00eda","year":"2012","unstructured":"Garc\u00eda V, S\u00e1nchez JS, Mollineda RA (2012) On the effectiveness of preprocessing methods when dealing with different levels of class imbalance. Knowl-Based Syst 25(1):13\u201321","journal-title":"Knowl-Based Syst"},{"issue":"3","key":"925_CR33","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1177\/1471082X0700700303","volume":"7","author":"R Gerlach","year":"2007","unstructured":"Gerlach R, Stamey J (2007) Bayesian model selection for logistic regression with misclassified outcomes. Stat Model 7(3):255\u2013273","journal-title":"Stat Model"},{"key":"925_CR34","unstructured":"Hariri S, Kind MC, Brunner RJ (2018) Extended isolation forest. arXiv preprint arXiv:1811.02141"},{"key":"925_CR35","unstructured":"He H, Bai Y, Garcia EA, Li S (2008) Adasyn: adaptive synthetic sampling approach for imbalanced learning. In: 2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence), pp 1322\u20131328 . IEEE"},{"key":"925_CR36","unstructured":"He F, Liu T, Webb GI, Tao D (2018) Instance-dependent PU learning by bayesian optimal relabeling. Preprint at https:\/\/arxiv.org\/pdf\/1808.02180.pdf"},{"key":"925_CR37","doi-asserted-by":"publisher","first-page":"127343","DOI":"10.1109\/ACCESS.2020.3008150","volume":"8","author":"L Huang","year":"2020","unstructured":"Huang L, Zhao J, Zhu B, Chen H, Broucke SV (2020) An experimental investigation of calibration techniques for imbalanced data. Ieee Access 8:127343\u2013127352","journal-title":"Ieee Access"},{"key":"925_CR38","doi-asserted-by":"crossref","unstructured":"Khoshgoftaar TM, Rebours P (2004) Generating multiple noise elimination filters with the ensemble-partitioning filter. In: Proceedings of the 2004 IEEE International Conference on Information Reuse and Integration, 2004. IRI 2004., pp 369\u2013375 . IEEE","DOI":"10.1109\/IRI.2004.1431489"},{"issue":"3","key":"925_CR39","doi-asserted-by":"publisher","first-page":"552","DOI":"10.1109\/TSMCA.2010.2084081","volume":"41","author":"TM Khoshgoftaar","year":"2010","unstructured":"Khoshgoftaar TM, Van Hulse J, Napolitano A (2010) Comparing boosting and bagging techniques with noisy and imbalanced data. IEEE Trans Syst Man Cybern-Part A: Syst Humans 41(3):552\u2013568","journal-title":"IEEE Trans Syst Man Cybern-Part A: Syst Humans"},{"key":"925_CR40","unstructured":"Kiryo R, Niu G, du Plessis MC, Sugiyama M (2017) Positive-unlabeled learning with non-negative risk estimator. In: Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems, Long Beach, pp 1675\u20131685"},{"key":"925_CR41","doi-asserted-by":"crossref","unstructured":"Kriegel H-P, Schubert M, Zimek A (2008) Angle-based outlier detection in high-dimensional data. In: Proceedings of the 14th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp 444\u2013452","DOI":"10.1145\/1401890.1401946"},{"key":"925_CR42","unstructured":"Lee WS, Liu B (2003) Learning with positive and unlabeled examples using weighted logistic regression. In: ICML, vol 3, pp 448\u2013455"},{"key":"925_CR43","unstructured":"Li X, Liu B (2003) Learning to classify texts using positive and unlabeled data. In: IJCAI, vol 3, pp 587\u2013592"},{"key":"925_CR44","doi-asserted-by":"crossref","unstructured":"Liu FT, Ting KM, Zhou Z-H (2008) Isolation forest. In: 2008 Eighth IEEE International Conference on Data Mining, pp 413\u2013422. IEEE","DOI":"10.1109\/ICDM.2008.17"},{"key":"925_CR45","doi-asserted-by":"crossref","unstructured":"Liu FT, Ting KM, Zhou Z-H (2010) On detecting clustered anomalies using sciforest. In: Joint European Conference on Machine Learning and Knowledge Discovery in Databases, pp 274\u2013290. Springer","DOI":"10.1007\/978-3-642-15883-4_18"},{"key":"925_CR46","doi-asserted-by":"crossref","unstructured":"Liu FT, Ting KM, Zhou Z-H (2012) Isolation-based anomaly detection. ACM Trans Knowl Discov Data (TKDD) 6(1):1\u201339","DOI":"10.1145\/2133360.2133363"},{"key":"925_CR47","unstructured":"Liu B, Dai Y, Li X, Lee WS, Yu PS (2003) Building text classifiers using positive and unlabeled examples. In: Third IEEE International Conference on Data Mining, pp 179\u2013186 . IEEE"},{"key":"925_CR48","unstructured":"Liu B, Lee WS, Yu PS, Li X (2002) Partially supervised classification of text documents. In: ICML, vol 2, pp 387\u2013394. Citeseer"},{"key":"925_CR49","doi-asserted-by":"crossref","unstructured":"Lukashevich H, Nowak S, Dunker P (2009) Using one-class svm outliers detection for verification of collaboratively tagged image training sets, pp 682\u2013685. IEEE, New York","DOI":"10.1109\/ICME.2009.5202588"},{"issue":"17","key":"925_CR50","doi-asserted-by":"publisher","first-page":"2114","DOI":"10.1093\/bioinformatics\/btl346","volume":"22","author":"A Malossini","year":"2006","unstructured":"Malossini A, Blanzieri E, Ng RT (2006) Detecting potential labeling errors in microarrays by data perturbation. Bioinformatics 22(17):2114\u20132121","journal-title":"Bioinformatics"},{"issue":"3","key":"925_CR51","doi-asserted-by":"publisher","first-page":"1146","DOI":"10.1109\/TSMCB.2012.2223460","volume":"43","author":"N Manwani","year":"2013","unstructured":"Manwani N, Sastry P (2013) Noise tolerance under risk minimization. IEEE Trans Cybern 43(3):1146\u20131151","journal-title":"IEEE Trans Cybern"},{"key":"925_CR52","doi-asserted-by":"crossref","unstructured":"Matic N, Guyon I, Bottou L, Denker J, Vapnik V (1992) Computer aided cleaning of large databases for character recognition. In: 11th IAPR International Conference on Pattern Recognition. Vol. II. Conference B: Pattern Recognition Methodology and Systems, pp 330\u2013331","DOI":"10.1109\/ICPR.1992.201784"},{"key":"925_CR53","doi-asserted-by":"crossref","unstructured":"Mignone P, Pio G, D\u017eeroski S, Ceci M (2020a) Multi-task learning for the simultaneous reconstruction of the human and mouse gene regulatory networks. Sci Rep 10(1):1\u201315","DOI":"10.1038\/s41598-020-78033-7"},{"key":"925_CR54","doi-asserted-by":"crossref","unstructured":"Mignone P, Pio G, D\u2019Elia D, Ceci M (2020b) Exploiting transfer learning for the reconstruction of the human gene regulatory network. Bioinformatics 36(5):1553\u20131561","DOI":"10.1093\/bioinformatics\/btz781"},{"key":"925_CR55","doi-asserted-by":"publisher","first-page":"201","DOI":"10.1016\/j.patrec.2013.06.010","volume":"37","author":"F Mordelet","year":"2014","unstructured":"Mordelet F, Vert J-P (2014) A bagging svm to learn from positive and unlabeled examples. Pattern Recogn Lett 37:201\u2013209","journal-title":"Pattern Recogn Lett"},{"key":"925_CR56","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1016\/j.dss.2014.03.001","volume":"62","author":"S Moro","year":"2014","unstructured":"Moro S, Cortez P, Rita P (2014) A data-driven approach to predict the success of bank telemarketing. Decis Supp Syst 62:22\u201331","journal-title":"Decis Supp Syst"},{"key":"925_CR57","unstructured":"Northcutt CG, Wu T, Chuang IL (2017) Learning with confident examples: Rank pruning for robust classification with noisy labels. In: Proceedings of the Thirty-Third Conference on Uncertainty in Artificial Intelligence, UAI 2017, Aug 11-15, 2017. AUAI Press, Sydney"},{"key":"925_CR58","unstructured":"Oracle (2015) Oracle Database Online Documentation 12c . https:\/\/docs.oracle.com\/database\/121\/"},{"issue":"1","key":"925_CR59","first-page":"71","volume":"101","author":"CJ P\u00e9rez","year":"2007","unstructured":"P\u00e9rez CJ, Gir\u00f3n FJ, Mart\u00edn J, Ruiz M, Rojano C (2007) Misclassified multinomial data: a bayesian approach. RACSAM 101(1):71\u201380","journal-title":"RACSAM"},{"key":"925_CR60","unstructured":"Ramaswamy HG, Scott C, Tewari A (2016) Mixture proportion estimation via kernel embeddings of distributions. In: Proceedings of the 33nd International Conference on Machine Learning, ICML 2016, New York City, NY, USA, June 19-24, 2016. JMLR Workshop and Conference Proceedings, vol. 48, pp 2052\u20132060. JMLR.org"},{"key":"925_CR61","unstructured":"Scott C, Blanchard G, Handy G (2013) Classification with asymmetric label noise: consistency and maximal denoising. COLT 2013 - The 26th Annual Conference on Learning Theory, vol 30. JMLR Workshop and Conference Proceedings. JMLR.org, New Jersey, pp 489\u2013511"},{"key":"925_CR62","unstructured":"Shebuti R (2016) ODDS library. http:\/\/odds.cs.stonybrook.edu"},{"key":"925_CR63","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1016\/j.dss.2018.04.001","volume":"111","author":"E Stripling","year":"2018","unstructured":"Stripling E, Baesens B, Chizi B, Vanden Broucke S (2018) Isolation-based conditional anomaly detection on mixed-attribute data to uncover workers\u2019 compensation fraud. Decis Supp Syst 111:13\u201326","journal-title":"Decis Supp Syst"},{"issue":"1","key":"925_CR64","doi-asserted-by":"publisher","first-page":"1039","DOI":"10.1016\/j.eswa.2010.07.143","volume":"38","author":"L \u0160ubelj","year":"2011","unstructured":"\u0160ubelj L, Furlan v, Bajec M (2011) An expert system for detecting automobile insurance fraud using social network analysis. Expert Syst Appl 38(1):1039\u20131052","journal-title":"Expert Syst Appl"},{"key":"925_CR65","doi-asserted-by":"crossref","unstructured":"Su G, Chen W, Xu M (2021) Positive-unlabeled learning from imbalanced data. In: International Joint Conferences on Artificial Intelligence IJCAI, pp 2995\u20133001. ijcai.org, Montreal","DOI":"10.24963\/ijcai.2021\/412"},{"key":"925_CR66","doi-asserted-by":"publisher","unstructured":"Sun J, Zhao F, Wang C, Chen S (2007) Identifying and correcting mislabeled training instances. In: Future Generation Communication and Networking (FGCN 2007), vol 1, pp 244\u2013250. https:\/\/doi.org\/10.1109\/FGCN.2007.146","DOI":"10.1109\/FGCN.2007.146"},{"issue":"2","key":"925_CR67","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1007\/s10115-013-0706-y","volume":"42","author":"I Triguero","year":"2015","unstructured":"Triguero I, Garc\u00eda S, Herrera F (2015) Self-labeled techniques for semi-supervised learning: taxonomy, software and empirical study. Knowl Inf Syst 42(2):245\u2013284","journal-title":"Knowl Inf Syst"},{"key":"925_CR68","doi-asserted-by":"publisher","unstructured":"Van Hulse J, Khoshgoftaar T (2009) Knowledge discovery from imbalanced and noisy data. Data & Knowledge Engineering 68(12), 1513\u20131542 . https:\/\/doi.org\/10.1016\/j.datak.2009.08.005.Including Special Section: 21st IEEE International Symposium on Computer-Based Medical Systems (IEEE CBMS 2008)","DOI":"10.1016\/j.datak.2009.08.005."},{"issue":"2","key":"925_CR69","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1145\/2641190.2641198","volume":"15","author":"J Vanschoren","year":"2013","unstructured":"Vanschoren J, van Rijn JN, Bischl B, Torgo L (2013) Openml: networked science in machine learning. SIGKDD Explor 15(2):49\u201360. https:\/\/doi.org\/10.1145\/2641190.2641198","journal-title":"SIGKDD Explor"},{"key":"925_CR70","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1016\/j.compbiolchem.2018.05.022","volume":"76","author":"A Vasighizaker","year":"2018","unstructured":"Vasighizaker A, Jalili S (2018) C-pugp: a cluster-based positive unlabeled learning method for disease gene prediction and prioritization. Comput Biol Chem 76:23\u201331","journal-title":"Comput Biol Chem"},{"issue":"3","key":"925_CR71","doi-asserted-by":"publisher","first-page":"304","DOI":"10.1109\/TKDE.2006.46","volume":"18","author":"H Xiong","year":"2006","unstructured":"Xiong H, Pandey G, Steinbach M, Kumar V (2006) Enhancing data analysis with noise removal. IEEE Trans Knowl Data Eng 18(3):304\u2013319","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"925_CR72","doi-asserted-by":"crossref","unstructured":"Yu S, Li C (2007) Pe-puc: a graph based pu-learning approach for text classification. In: International Workshop on Machine Learning and Data Mining in Pattern Recognition, pp 574\u2013584. Springer","DOI":"10.1007\/978-3-540-73499-4_43"},{"issue":"1","key":"925_CR73","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1093\/nsr\/nwx106","volume":"5","author":"Z-H Zhou","year":"2018","unstructured":"Zhou Z-H (2018) A brief introduction to weakly supervised learning. Natl Sci Rev 5(1):44\u201353","journal-title":"Natl Sci Rev"},{"issue":"1","key":"925_CR74","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1057\/s41274-016-0176-1","volume":"69","author":"B Zhu","year":"2018","unstructured":"Zhu B, Baesens B, Backiel A, vanden Broucke SK (2018) Benchmarking sampling techniques for imbalance learning in churn prediction. J Oper Res Soc 69(1):49\u201365","journal-title":"J Oper Res Soc"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-023-00925-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10618-023-00925-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-023-00925-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,17]],"date-time":"2024-10-17T18:18:59Z","timestamp":1729189139000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10618-023-00925-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,7]]},"references-count":74,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,5]]}},"alternative-id":["925"],"URL":"https:\/\/doi.org\/10.1007\/s10618-023-00925-9","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"type":"print","value":"1384-5810"},{"type":"electronic","value":"1573-756X"}],"subject":[],"published":{"date-parts":[[2023,3,7]]},"assertion":[{"value":"3 February 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 February 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 March 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}