{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T19:55:40Z","timestamp":1766087740140,"version":"3.37.3"},"reference-count":78,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100010198","name":"Ministerio de Econom\u00eda, Industria y Competitividad, Gobierno de Espa\u00f1a","doi-asserted-by":"publisher","award":["TIN2017-89517-P"],"award-info":[{"award-number":["TIN2017-89517-P"]}],"id":[{"id":"10.13039\/501100010198","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006393","name":"Universidad de Granada","doi-asserted-by":"crossref","award":["PRII2018-02"],"award-info":[{"award-number":["PRII2018-02"]}],"id":[{"id":"10.13039\/501100006393","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Ministerio de Universidades","award":["FPU17\/04069"],"award-info":[{"award-number":["FPU17\/04069"]}]},{"name":"Proyecto Regional Andaluz","award":["P18-FR-4961"],"award-info":[{"award-number":["P18-FR-4961"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1007\/s10115-021-01577-1","type":"journal-article","created":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T17:10:19Z","timestamp":1622567419000},"page":"1961-1989","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["Revisiting data complexity metrics based on morphology for overlap and imbalance: snapshot, new overlap number of balls metrics and singular problems prospect"],"prefix":"10.1007","volume":"63","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4106-3182","authenticated-orcid":false,"given":"Jos\u00e9 Daniel","family":"Pascual-Triana","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"David","family":"Charte","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Marta","family":"Andr\u00e9s\u00a0Arroyo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alberto","family":"Fern\u00e1ndez","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Francisco","family":"Herrera","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,6,1]]},"reference":[{"key":"1577_CR1","doi-asserted-by":"publisher","DOI":"10.1201\/b17320","author":"C Aggarwal","year":"2014","unstructured":"Aggarwal C (2014) Data classification: algorithms and applications data classification: algorithms and applications. Chapman & Hall\/CRC. https:\/\/doi.org\/10.1201\/b17320","journal-title":"Chapman & Hall\/CRC"},{"issue":"2","key":"1577_CR2","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1007\/s10115-018-1183-0","volume":"58","author":"M Ahmed","year":"2019","unstructured":"Ahmed M (2019) Data summarization: a survey. Knowl Information Syst 58(2):249\u2013273. https:\/\/doi.org\/10.1007\/s10115-018-1183-0","journal-title":"Knowl Information Syst"},{"issue":"4","key":"1577_CR3","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1016\/j.patrec.2012.09.003","volume":"34","author":"R Alejo","year":"2013","unstructured":"Alejo R, Valdovinos RM, Garc\u00eda V, Pacheco-Sanchez JH (2013) A hybrid method to face class overlap and class imbalance on neural networks and multi-class scenarios. Pattern Recognit Lett 34(4):380\u2013388. https:\/\/doi.org\/10.1016\/j.patrec.2012.09.003","journal-title":"Pattern Recognit Lett"},{"key":"1577_CR4","volume-title":"Machine learning: the new AI","author":"E Alpaydin","year":"2016","unstructured":"Alpaydin E (2016) Machine learning: the new AI. MIT Press, Cambridge"},{"key":"1577_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.knosys.2014.09.002","volume":"73","author":"S Alshomrani","year":"2015","unstructured":"Alshomrani S, Bawakid A, Shim SO, Fern\u00e1ndez A, Herrera F (2015) A proposal for evolutionary fuzzy systems using feature weighting: dealing with overlapping in imbalanced datasets. Knowl-Based Syst 73:1\u201317. https:\/\/doi.org\/10.1016\/j.knosys.2014.09.002","journal-title":"Knowl-Based Syst"},{"key":"1577_CR6","doi-asserted-by":"publisher","DOI":"10.1109\/ICRAIE.2014.6909245","author":"G Anuradha Gupta","year":"2014","unstructured":"Anuradha Gupta G (2014) A self explanatory review of decision tree classifiers. ICRAIE. https:\/\/doi.org\/10.1109\/ICRAIE.2014.6909245","journal-title":"ICRAIE"},{"key":"1577_CR7","first-page":"1","volume":"2400","author":"A Astorino","year":"2019","unstructured":"Astorino A, Fuduli A, Gaudioso M, Vocaturo E (2019) Multiple instance learning algorithm for medical image classification. SEBD 2400:1\u20138","journal-title":"SEBD"},{"key":"1577_CR8","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1016\/j.eswa.2017.04.006","volume":"83","author":"F Barboza","year":"2017","unstructured":"Barboza F, Kimura H, Altman E (2017) Machine learning models and bankruptcy prediction. Expert Syst Appl 83:405\u2013417. https:\/\/doi.org\/10.1016\/j.eswa.2017.04.006","journal-title":"Expert Syst Appl"},{"key":"1577_CR9","doi-asserted-by":"publisher","first-page":"1383","DOI":"10.1016\/j.patrec.2006.01.006","volume":"27","author":"R Baumgartner","year":"2006","unstructured":"Baumgartner R, Somorjai R (2006) Data complexity assesment in undersampled classification of high dimensional biomedical data. Pattern Recog Lett 27:1383\u20131389. https:\/\/doi.org\/10.1016\/j.patrec.2006.01.006","journal-title":"Pattern Recog Lett"},{"key":"1577_CR10","doi-asserted-by":"publisher","DOI":"10.1016\/j.artmed.2019.101785","author":"D Ben-Israel","year":"2020","unstructured":"Ben-Israel D, Jacobs W, Casha S, Lang S, Ryu W, de Lotbiniere-Bassett M, Cadotte D (2020) The impact of machine learning on patient care: a systematic review. Artifi Intell Med. https:\/\/doi.org\/10.1016\/j.artmed.2019.101785","journal-title":"Artifi Intell Med"},{"issue":"10","key":"1577_CR11","first-page":"281","volume":"13","author":"J Bergstra","year":"2012","unstructured":"Bergstra J, Bengio Y (2012) Random search for hyper-parameter optimization. J Mach Learn Res 13(10):281\u2013305","journal-title":"J Mach Learn Res"},{"issue":"1","key":"1577_CR12","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/TEVC.2004.840153","volume":"9","author":"E Bernad\u00f3-Mansilla","year":"2005","unstructured":"Bernad\u00f3-Mansilla E, Ho T (2005) Domain of competence of XCS classifier system in complexity measurement space. IEEE Trans Evol Comput 9(1):82\u2013104. https:\/\/doi.org\/10.1109\/TEVC.2004.840153","journal-title":"IEEE Trans Evol Comput"},{"issue":"6","key":"1577_CR13","doi-asserted-by":"publisher","first-page":"705","DOI":"10.1016\/j.ijar.2011.01.007","volume":"52","author":"C Bielza","year":"2011","unstructured":"Bielza C, Li G, Larra\u00f1aga P (2011) Multi-dimensional classification with bayesian networks. Int J Approx Reason 52(6):705\u2013727. https:\/\/doi.org\/10.1016\/j.ijar.2011.01.007","journal-title":"Int J Approx Reason"},{"doi-asserted-by":"crossref","unstructured":"Borchani H, Varando G, Bielza C, Larra\u00f1aga P (2015) A survey on multi-output regression. Wiley Interdiscip. Rev. Data Min. Knowl. Discov. 5(5):216\u2013233. https:\/\/doi.org\/10.1002\/widm.1157","key":"1577_CR14","DOI":"10.1002\/widm.1157"},{"issue":"9","key":"1577_CR15","doi-asserted-by":"publisher","first-page":"1757","DOI":"10.1016\/j.patcog.2004.03.009","volume":"37","author":"MR Boutell","year":"2004","unstructured":"Boutell MR, Luo J, Shen X, Brown CM (2004) Learning multi-label scene classification. Pattern Recognit 37(9):1757\u20131771. https:\/\/doi.org\/10.1016\/j.patcog.2004.03.009","journal-title":"Pattern Recognit"},{"issue":"12","key":"1577_CR16","doi-asserted-by":"publisher","first-page":"4820","DOI":"10.1016\/j.eswa.2013.02.025","volume":"40","author":"JR Cano","year":"2013","unstructured":"Cano JR (2013) Analysis of data complexity measures for classification. Expert Syst Appl 40(12):4820\u20134831. https:\/\/doi.org\/10.1016\/j.eswa.2013.02.025","journal-title":"Expert Syst Appl"},{"key":"1577_CR17","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.10.009","author":"MA Carbonneau","year":"2016","unstructured":"Carbonneau MA, Cheplygina V, Granger E, Gagnon G (2016) Multiple instance learning: a survey of problem characteristics and applications. Pattern Recognit. https:\/\/doi.org\/10.1016\/j.patcog.2017.10.009","journal-title":"Pattern Recognit"},{"issue":"1","key":"1577_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s13748-018-00167-7","volume":"8","author":"D Charte","year":"2019","unstructured":"Charte D, Charte F, Garc\u00eda S, Herrera F (2019) A snapshot on nonstandard supervised learning problems: taxonomy, relationships, problem transformations and algorithm adaptations. Prog Artif Intell 8(1):1\u201314. https:\/\/doi.org\/10.1007\/s13748-018-00167-7","journal-title":"Prog Artif Intell"},{"key":"1577_CR19","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/j.neucom.2014.08.091","volume":"163","author":"F Charte","year":"2015","unstructured":"Charte F, Rivera AJ, del Jesus MJ, Herrera F (2015) Addressing imbalance in multilabel classification: measures and random resampling algorithms. Neurocomputing 163:3\u201316. https:\/\/doi.org\/10.1016\/j.neucom.2014.08.091","journal-title":"Neurocomputing"},{"issue":"4","key":"1577_CR20","doi-asserted-by":"publisher","first-page":"701","DOI":"10.1109\/TFUZZ.2018.2866967","volume":"27","author":"J C\u00f3zar","year":"2019","unstructured":"C\u00f3zar J, Fern\u00e1ndez A, Herrera F, G\u00e1mez JA (2019) A metahierarchical rule decision system to design robust fuzzy classifiers based on data complexity. IEEE Trans Fuzzy Syst 27(4):701\u2013715. https:\/\/doi.org\/10.1109\/TFUZZ.2018.2866967","journal-title":"IEEE Trans Fuzzy Syst"},{"doi-asserted-by":"crossref","unstructured":"Das S, Datta S, Chaudhuri BB (2018) Handling data irregularities in classification: foundations, trends, and future challenges. Pattern Recognit. 81:674\u2013693. https:\/\/doi.org\/10.1016\/j.patcog.2018.03.008","key":"1577_CR21","DOI":"10.1016\/j.patcog.2018.03.008"},{"issue":"4","key":"1577_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pone.0121945","volume":"10","author":"B Diedenhofen","year":"2015","unstructured":"Diedenhofen B, Musch J (2015) cocor: a comprehensive solution for the statistical comparison of correlations. PLOS ONE 10(4):1\u201312. https:\/\/doi.org\/10.1371\/journal.pone.0121945","journal-title":"PLOS ONE"},{"unstructured":"Diederhofen B cocor function | R Documentation. URL https:\/\/www.rdocumentation.org\/packages\/cocor\/versions\/1.1-3\/topics\/cocor","key":"1577_CR23"},{"key":"1577_CR24","doi-asserted-by":"publisher","DOI":"10.1142\/S0129065717500289","author":"A Fern\u00e1ndez","year":"2017","unstructured":"Fern\u00e1ndez A, Carmona CJ, Del Jesus MJ, Herrera F (2017) A pareto based ensemble with feature and instance selection for learning from multi-class imbalanced datasets. Int J Neural Syst. https:\/\/doi.org\/10.1142\/S0129065717500289","journal-title":"Int J Neural Syst"},{"doi-asserted-by":"publisher","unstructured":"Fern\u00e1ndez A, Garc\u00eda S, Galar M, Prati R, Krawczyk B, Herrera F (2018). Learning from Imbalanced Data Sets Springer. https:\/\/doi.org\/10.1007\/978-3-319-98074-4","key":"1577_CR25","DOI":"10.1007\/978-3-319-98074-4"},{"key":"1577_CR26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-05318-5_1","volume-title":"Hyperparameter optimization","author":"M Feurer","year":"2019","unstructured":"Feurer M, Hutter F (2019) Hyperparameter optimization. Springer, Berlin. https:\/\/doi.org\/10.1007\/978-3-030-05318-5_1"},{"key":"1577_CR27","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1016\/j.ins.2013.12.053","volume":"264","author":"M Galar","year":"2014","unstructured":"Galar M, Fern\u00e1ndez A, Barrenechea E, Herrera F (2014) Empowering difficult classes with a similarity-based aggregation in multi-class classification problems. Inf Sci 264:135\u2013157. https:\/\/doi.org\/10.1016\/j.ins.2013.12.053","journal-title":"Inf Sci"},{"doi-asserted-by":"crossref","unstructured":"Galar M, Fern\u00e1ndez A, Tartas EB, Sola HB, Herrera F (2011) An overview of ensemble methods for binary classifiers in multi-class problems: experimental study on one-vs-one and one-vs-all schemes. Pattern Recognit 44(8):1761\u20131776. https:\/\/doi.org\/10.1016\/j.patcog.2011.01.017","key":"1577_CR28","DOI":"10.1016\/j.patcog.2011.01.017"},{"key":"1577_CR29","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2014.10.085","author":"LPF Garcia","year":"2015","unstructured":"Garcia LPF, Carvalho ACPdLFd, Lorena AC (2015) Effect of label noise in the complexity of classification problems. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2014.10.085","journal-title":"Neurocomputing"},{"key":"1577_CR30","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.knosys.2015.12.006","volume":"98","author":"S Garc\u00eda","year":"2016","unstructured":"Garc\u00eda S, Luengo J, Herrera F (2016) Tutorial on practical tips of the most influential data preprocessing algorithms in data mining. Knowl-Based Syst 98:1\u201329. https:\/\/doi.org\/10.1016\/j.knosys.2015.12.006","journal-title":"Knowl-Based Syst"},{"issue":"7","key":"1577_CR31","doi-asserted-by":"publisher","first-page":"1734","DOI":"10.1109\/TKDE.2016.2545658","volume":"28","author":"X Geng","year":"2016","unstructured":"Geng X (2016) Label distribution learning. IEEE Trans Knowl Data Eng 28(7):1734\u20131748. https:\/\/doi.org\/10.1109\/TKDE.2016.2545658","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"7","key":"1577_CR32","doi-asserted-by":"publisher","first-page":"1403","DOI":"10.1109\/TNNLS.2014.2342533","volume":"26","author":"B Gu","year":"2015","unstructured":"Gu B, Sheng V, Tay K, Romano W, Li S (2015) Incremental support vector learning for ordinal regression. IEEE Trans Neural Netw Learn Syst 26(7):1403\u20131416. https:\/\/doi.org\/10.1109\/TNNLS.2014.2342533","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"unstructured":"Gupta MR, Bengio S, Weston J (2014) Training highly multiclass classifiers. J Mach Learn Res 15(1):1461\u20131492. https:\/\/dl.acm.org\/doi\/10.5555\/2627435.2638582","key":"1577_CR33"},{"issue":"2","key":"1577_CR34","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1023\/A:1010920819831","volume":"45","author":"DJ Hand","year":"2001","unstructured":"Hand DJ, Till RJ (2001) A simple generalisation of the area under the ROC curve for multiple class classification problems. Mach Learn 45(2):171\u2013186. https:\/\/doi.org\/10.1023\/A:1010920819831","journal-title":"Mach Learn"},{"key":"1577_CR35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-41111-8","volume-title":"Multilabel Classification : Problem Analysis, Metrics and Techniques","author":"F Herrera","year":"2016","unstructured":"Herrera F, Charte F, Rivera AJ, Jesus MJd (2016) Multilabel Classification : Problem Analysis, Metrics and Techniques. Springer, Berlin. https:\/\/doi.org\/10.1007\/978-3-319-41111-8"},{"key":"1577_CR36","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-47759-6","volume-title":"Multiple instance learning: foundations and algorithms","author":"F Herrera","year":"2016","unstructured":"Herrera F, Ventura S, Bello R, Cornelis C, Zafra A, S\u00e1nchez-Tarrag\u00f3 D, Vluymans S (2016) Multiple instance learning: foundations and algorithms. Springer, Berlin. https:\/\/doi.org\/10.1007\/978-3-319-47759-6"},{"issue":"3","key":"1577_CR37","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1109\/34.990132","volume":"24","author":"TK Ho","year":"2002","unstructured":"Ho TK, Basu M (2002) Complexity measures of supervised classification problems. IEEE Trans Pattern Anal Mach Intell 24(3):289\u2013300. https:\/\/doi.org\/10.1109\/34.990132","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"doi-asserted-by":"publisher","unstructured":"Hoekstra A, Duin R (1996) On the nonlinearity of pattern classifiers. In: Proceedings of 13th International Conference on Pattern Recognition, vol.\u00a04, pp. 271\u2013275 vol.4. https:\/\/doi.org\/10.1109\/ICPR.1996.547429. ISSN: 1051-4651","key":"1577_CR38","DOI":"10.1109\/ICPR.1996.547429"},{"unstructured":"Hornik K Weka$$\\_$$classifier$$\\_$$trees function | R Documentation. URL https:\/\/www.rdocumentation.org\/packages\/RWeka\/versions\/0.4-42\/topics\/Weka_classifier_trees","key":"1577_CR39"},{"issue":"16\u201317","key":"1577_CR40","doi-asserted-by":"publisher","first-page":"1897","DOI":"10.1016\/j.artint.2008.08.002","volume":"172","author":"E H\u00fcllermeier","year":"2008","unstructured":"H\u00fcllermeier E, F\u00fcrnkranz J, Cheng W, Brinker K (2008) Label ranking by learning pairwise preferences. Artif Intell 172(16\u201317):1897\u20131916. https:\/\/doi.org\/10.1016\/j.artint.2008.08.002","journal-title":"Artif Intell"},{"key":"1577_CR41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-05318-5","volume-title":"Automated machine learning - methods, systems challenges","author":"F Hutter","year":"2019","unstructured":"Hutter F, Kotthoff L, Vanschoren J (2019) Automated machine learning - methods, systems challenges. Springer, Berlin"},{"unstructured":"Katakis I, Tsoumakas G, Vlahavas I (2008) Multilabel text classification for automated tag suggestion. Proc. ECML PKDD08 Discovery Challenge p.\u00a09","key":"1577_CR42"},{"issue":"3","key":"1577_CR43","doi-asserted-by":"publisher","first-page":"601","DOI":"10.1007\/s10115-018-1220-z","volume":"59","author":"B Krawczyk","year":"2019","unstructured":"Krawczyk B, Triguero I, Garc\u00eda S, Wo\u017aniak M, Herrera F (2019) Instance reduction for one-class classification. Knowl Inf Syst 59(3):601\u2013628. https:\/\/doi.org\/10.1007\/s10115-018-1220-z","journal-title":"Knowl Inf Syst"},{"key":"1577_CR44","doi-asserted-by":"publisher","DOI":"10.1186\/s40537-018-0151-6","author":"J Leevy","year":"2018","unstructured":"Leevy J, Khoshgoftaar T, Bauder R, Seliya N (2018) A survey on addressing high-class imbalance in big data. J Big Data. https:\/\/doi.org\/10.1186\/s40537-018-0151-6","journal-title":"J Big Data"},{"issue":"2","key":"1577_CR45","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1109\/TKDE.2014.2327034","volume":"27","author":"E Leyva","year":"2015","unstructured":"Leyva E, Gonz\u00e1lez A, P\u00e9rez R (2015) A set of complexity measures designed for applying meta-learning to instance selection. IEEE Trans Knowl Data Eng 27(2):354\u2013367. https:\/\/doi.org\/10.1109\/TKDE.2014.2327034","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1577_CR46","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1016\/j.neucom.2011.03.054","volume":"75","author":"A Lorena","year":"2012","unstructured":"Lorena A, Costa I, Spola\u00f4r N, de Souto M (2012) Analysis of complexity indices for classification problems: cancer gene expression data. Neurocomputing 75:33\u201342. https:\/\/doi.org\/10.1016\/j.neucom.2011.03.054","journal-title":"Neurocomputing"},{"doi-asserted-by":"crossref","unstructured":"Lorena AC, Garcia LPF, Lehmann J, Souto MCP, Ho TK (2019) How Complex is your classification problem? A survey on measuring classification complexity. ACM Comput Surv 52(5):34. https:\/\/doi.org\/10.1145\/3347711","key":"1577_CR47","DOI":"10.1145\/3347711"},{"issue":"10","key":"1577_CR48","doi-asserted-by":"publisher","first-page":"1909","DOI":"10.1007\/s00500-010-0625-8","volume":"15","author":"J Luengo","year":"2011","unstructured":"Luengo J, Fern\u00e1ndez A, Garc\u00eda S, Herrera F (2011) Addressing data complexity for imbalanced data sets: analysis of SMOTE-based oversampling and evolutionary undersampling. Soft Comput 15(10):1909\u20131936. https:\/\/doi.org\/10.1007\/s00500-010-0625-8","journal-title":"Soft Comput"},{"key":"1577_CR49","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-39105-8","volume-title":"Big data preprocessing: enabling smart data","author":"J Luengo","year":"2020","unstructured":"Luengo J, Garc\u00eda-Gil D, Ram\u00edrez-Gallego S, Garc\u00eda S, Herrera F (2020) Big data preprocessing: enabling smart data. Springer, Berlin. https:\/\/doi.org\/10.1007\/978-3-030-39105-8"},{"issue":"1","key":"1577_CR50","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/j.fss.2009.04.001","volume":"161","author":"J Luengo","year":"2010","unstructured":"Luengo J, Herrera F (2010) Domains of competence of fuzzy rule based classification systems with data complexity measures: A case of study using a fuzzy hybrid genetic based machine learning method. Fuzzy Sets Syst 161(1):3\u201319. https:\/\/doi.org\/10.1016\/j.fss.2009.04.001","journal-title":"Fuzzy Sets Syst"},{"issue":"1","key":"1577_CR51","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.ins.2011.09.022","volume":"185","author":"J Luengo","year":"2012","unstructured":"Luengo J, Herrera F (2012) Shared domains of competence of approximate learning models using measures of separability of classes. Inf Sci 185(1):43\u201365. https:\/\/doi.org\/10.1016\/j.ins.2011.09.022","journal-title":"Inf Sci"},{"issue":"1","key":"1577_CR52","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1007\/s10115-013-0700-4","volume":"42","author":"J Luengo","year":"2015","unstructured":"Luengo J, Herrera F (2015) An automatic extraction method of the domains of competence for learning classifiers using data complexity measures. Knowl Inf Syst 42(1):147\u2013180. https:\/\/doi.org\/10.1007\/s10115-013-0700-4","journal-title":"Knowl Inf Syst"},{"key":"1577_CR53","doi-asserted-by":"publisher","DOI":"10.1007\/s13721-016-0125-6","author":"G Luo","year":"2016","unstructured":"Luo G (2016) A review of automatic selection methods for machine learning algorithms and hyper-parameter values. Netw Model Anal Health Inform Bioinform. https:\/\/doi.org\/10.1007\/s13721-016-0125-6","journal-title":"Netw Model Anal Health Inform Bioinform"},{"key":"1577_CR54","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1016\/j.patcog.2019.02.023","volume":"91","author":"A Luque","year":"2019","unstructured":"Luque A, Carrasco A, Mart\u00edn A, de\u00a0lasde\u00a0las Heras AA (2019) The impact of class imbalance in classification performance metrics based on the binary confusion matrix. Pattern Recognit 91:216\u2013231. https:\/\/doi.org\/10.1016\/j.patcog.2019.02.023","journal-title":"Pattern Recognit"},{"key":"1577_CR55","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1016\/j.ins.2013.07.007","volume":"250","author":"V L\u00f3pez","year":"2013","unstructured":"L\u00f3pez V, Fern\u00e1ndez A, Garc\u00eda S, Palade V, Herrera F (2013) An insight into classification with imbalanced data: empirical results and current trends on using data intrinsic characteristics. Inf Sci 250:113\u2013141. https:\/\/doi.org\/10.1016\/j.ins.2013.07.007","journal-title":"Inf Sci"},{"key":"1577_CR56","doi-asserted-by":"publisher","DOI":"10.23940\/ijpe.18.08.p5.16951704","author":"Y Ma","year":"2018","unstructured":"Ma Y (2018) Data complexity analysis for software defect detection. Int J Perform Eng. https:\/\/doi.org\/10.23940\/ijpe.18.08.p5.16951704","journal-title":"Int J Perform Eng"},{"unstructured":"Manukyan A, Ceyhan E (2016) Classification of Imbalanced Data with a Geometric Digraph Family. J. Mach. Learn. Res. https:\/\/dl.acm.org\/doi\/abs\/10.5555\/2946645.3053471","key":"1577_CR57"},{"issue":"10","key":"1577_CR58","doi-asserted-by":"publisher","first-page":"2823","DOI":"10.1007\/s13042-018-00906-1","volume":"10","author":"J Mart\u00ednez Torres","year":"2019","unstructured":"Mart\u00ednez Torres J, Iglesias Comesa\u00f1a C, Garc\u00eda-Nieto PJ (2019) Review: machine learning techniques applied to cybersecurity. Int J Mach Learn Cybern 10(10):2823\u20132836. https:\/\/doi.org\/10.1007\/s13042-018-00906-1","journal-title":"Int J Mach Learn Cybern"},{"issue":"2","key":"1577_CR59","doi-asserted-by":"publisher","first-page":"473","DOI":"10.1088\/0031-9155\/56\/2\/012","volume":"56","author":"M Mazurowski","year":"2011","unstructured":"Mazurowski M, Malof J, Tourassi G (2011) Comparative analysis of instance selection algorithms for instance-based classifiers in the context of medical decision support. Phys Med Biol 56(2):473\u2013489. https:\/\/doi.org\/10.1088\/0031-9155\/56\/2\/012","journal-title":"Phys Med Biol"},{"unstructured":"Meyer D naiveBayes function | R Documentation. URL https:\/\/www.rdocumentation.org\/packages\/e1071\/versions\/1.7-2\/topics\/naiveBayes","key":"1577_CR60"},{"doi-asserted-by":"publisher","unstructured":"Morais G, Prati RC (2013) Complex Network Measures for Data Set Characterization. In: 2013 Brazilian Conference on Intelligent Systems, pp. 12\u201318. https:\/\/doi.org\/10.1109\/BRACIS.2013.11","key":"1577_CR61","DOI":"10.1109\/BRACIS.2013.11"},{"key":"1577_CR62","doi-asserted-by":"publisher","DOI":"10.1007\/s10115-016-1003-3","author":"L Mor\u00e1n-Fern\u00e1ndez","year":"2016","unstructured":"Mor\u00e1n-Fern\u00e1ndez L, Bol\u00f3n-Canedo V, Alonso-Betanzos A (2016) Can classification performance be predicted by complexity measures? a study using microarray data. Knowl Inf Syst. https:\/\/doi.org\/10.1007\/s10115-016-1003-3","journal-title":"Knowl Inf Syst"},{"key":"1577_CR63","first-page":"1","volume":"196","author":"A Orriols-Puig","year":"2010","unstructured":"Orriols-Puig A, Macia N, Ho TK (2010) Documentation for the data complexity library in C++. Universitat Ramon Llull, La Salle 196:1\u201340","journal-title":"Universitat Ramon Llull, La Salle"},{"doi-asserted-by":"crossref","unstructured":"Prati RC, Luengo J, Herrera F (2019) Emerging topics and challenges of learning from noisy data in nonstandard classification: a survey beyond binary class noise. Knowl Inf Syst 60:63\u201397. https:\/\/doi.org\/10.1007\/s10115-018-1244-4","key":"1577_CR64","DOI":"10.1007\/s10115-018-1244-4"},{"doi-asserted-by":"publisher","unstructured":"Rodriguez D, Dolado J, Tuya J (2015) Bayesian concepts in software testing: An initial review. In: A-TEST 2015: Proceedings of the 6th International Workshop on Automating Test Case Design, Selection and Evaluation, pp. 41\u201346. https:\/\/doi.org\/10.1145\/2804322.2804329","key":"1577_CR65","DOI":"10.1145\/2804322.2804329"},{"unstructured":"Schliep K kknn function | R Documentation. https:\/\/www.rdocumentation.org\/packages\/kknn\/versions\/1.3.1%20\/topics\/kknn","key":"1577_CR66"},{"unstructured":"Scopus: Document Search. URL https:\/\/www.scopus.com\/search\/form.uri?display=basic","key":"1577_CR67"},{"key":"1577_CR68","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781107298019","volume-title":"Understanding Machine Learning: From Theory to Algorithms","author":"S Shalev-Shwartz","year":"2014","unstructured":"Shalev-Shwartz S, Ben-David S (2014) Understanding Machine Learning: From Theory to Algorithms. Cambridge University Press, USA"},{"key":"1577_CR69","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2003.1251146","author":"S Singh","year":"2003","unstructured":"Singh S (2003) Multiresolution estimates of classification complexity. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2003.1251146","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1577_CR70","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-13-3029-2","volume-title":"Multiview Machine Learning","author":"S Sun","year":"2019","unstructured":"Sun S, Mao L, Dong Z, Wu L (2019) Multiview Machine Learning, 1st edn. Springer, Berlin","edition":"1"},{"issue":"1","key":"1577_CR71","doi-asserted-by":"publisher","first-page":"355","DOI":"10.1016\/j.patcog.2012.07.009","volume":"46","author":"JA S\u00e1ez","year":"2013","unstructured":"S\u00e1ez JA, Luengo J, Herrera F (2013) Predicting noise filtering efficacy with data complexity measures for nearest neighbor classification. Pattern Recognit 46(1):355\u2013364. https:\/\/doi.org\/10.1016\/j.patcog.2012.07.009","journal-title":"Pattern Recognit"},{"doi-asserted-by":"publisher","unstructured":"Tanwani AK, Farooq M (2010) Classification Potential vs. Classification Accuracy: A Comprehensive Study of Evolutionary Algorithms with Biomedical Datasets. In: Bacardit J, Browne W, Drugowitsch, J Bernad\u00f3-Mansilla E, Butz MV (eds) Learning Classifier Systems Lecture Notes in Computer Science, (pp. 127\u2013144) Springer, Berlin. doi: https:\/\/doi.org\/10.1007\/978-3-642-17508-4_9","key":"1577_CR72","DOI":"10.1007\/978-3-642-17508-4_9"},{"issue":"1","key":"1577_CR73","doi-asserted-by":"publisher","first-page":"1238","DOI":"10.2991\/ijcis.10.1.82","volume":"10","author":"I Triguero","year":"2017","unstructured":"Triguero I, Gonz\u00e1lez S, Moyano JM, Garc\u00eda S, Alcal\u00e1-Fdez J, Luengo J, Fern\u00e1ndez A, Jes\u00fas MJd, S\u00e1nchez L, Herrera F (2017) KEEL 3.0: an open source software for multi-stage analysis in data mining. Int J Comput Intell Syst 10(1):1238\u20131249. https:\/\/doi.org\/10.2991\/ijcis.10.1.82","journal-title":"Int J Comput Intell Syst"},{"key":"1577_CR74","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.ins.2019.08.062","volume":"509","author":"P Vuttipittayamongkol","year":"2020","unstructured":"Vuttipittayamongkol P, Elyan E (2020) Neighbourhood-based undersampling approach for handling imbalanced and overlapped data. Inf Sci 509:47\u201370. https:\/\/doi.org\/10.1016\/j.ins.2019.08.062","journal-title":"Inf Sci"},{"issue":"2","key":"1577_CR75","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1515\/fcds-2017-0007","volume":"42","author":"S Wojciechowski","year":"2017","unstructured":"Wojciechowski S, Wilk S (2017) Difficulty factors and preprocessing in imbalanced data sets: an experimental study on artificial data. Found Comput Decis Sci 42(2):149\u2013176. https:\/\/doi.org\/10.1515\/fcds-2017-0007","journal-title":"Found Comput Decis Sci"},{"key":"1577_CR76","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.inffus.2017.02.007","volume":"38","author":"J Zhao","year":"2017","unstructured":"Zhao J, Xie X, Xu X, Sun S (2017) Multi-view learning overview: recent progress and new challenges. Inf Fusion 38:43\u201354. https:\/\/doi.org\/10.1016\/j.inffus.2017.02.007","journal-title":"Inf Fusion"},{"unstructured":"Zhu X (2005) Semi-supervised learning with graphs. phd, Carnegie Mellon University, USA. AAI3179046 ISBN-10: 0542190591","key":"1577_CR77"},{"issue":"4","key":"1577_CR78","doi-asserted-by":"publisher","first-page":"399","DOI":"10.1037\/1082-989X.12.4.399","volume":"12","author":"GY Zou","year":"2007","unstructured":"Zou GY (2007) Toward using confidence intervals to compare correlations. Psychol Methods 12(4):399\u2013413. https:\/\/doi.org\/10.1037\/1082-989X.12.4.399","journal-title":"Psychol Methods"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-021-01577-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10115-021-01577-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-021-01577-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,6,18]],"date-time":"2021-06-18T07:09:37Z","timestamp":1624000177000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10115-021-01577-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,1]]},"references-count":78,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["1577"],"URL":"https:\/\/doi.org\/10.1007\/s10115-021-01577-1","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"type":"print","value":"0219-1377"},{"type":"electronic","value":"0219-3116"}],"subject":[],"published":{"date-parts":[[2021,6,1]]},"assertion":[{"value":"19 July 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 April 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 May 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 June 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}}]}}