{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T12:22:00Z","timestamp":1777465320258,"version":"3.51.4"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2016,10,14]],"date-time":"2016-10-14T00:00:00Z","timestamp":1476403200000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2017,6]]},"DOI":"10.1007\/s10115-016-1003-3","type":"journal-article","created":{"date-parts":[[2016,10,14]],"date-time":"2016-10-14T02:16:21Z","timestamp":1476411381000},"page":"1067-1090","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":35,"title":["Can classification performance be predicted by complexity measures? A study using microarray data"],"prefix":"10.1007","volume":"51","author":[{"given":"L.","family":"Mor\u00e1n-Fern\u00e1ndez","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"V.","family":"Bol\u00f3n-Canedo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"A.","family":"Alonso-Betanzos","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,10,14]]},"reference":[{"key":"1003_CR1","volume-title":"Data complexity in pattern recognition","author":"TK Ho","year":"2006","unstructured":"Ho TK, Basu M (2006) Data complexity in pattern recognition. Springer, Berlin"},{"issue":"2","key":"1003_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/980972.980974","volume":"5","author":"G Piatetsky","year":"2003","unstructured":"Piatetsky G, Tamayo P (2003) Microarray data mining: facing the challenges. ACM SIGKDD Explor Newsl 5(2):1\u20135","journal-title":"ACM SIGKDD Explor Newsl"},{"issue":"19","key":"1003_CR3","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1016\/j.ins.2014.05.042","volume":"282","author":"V Bol\u00f3n-Canedo","year":"2014","unstructured":"Bol\u00f3n-Canedo V, S\u00e1nchez-Maro\u00f1o N, Alonso-Betanzos A, Herrera F (2014) A review of microarray datasets and applied feature selection methods. Inf Sci 282(19):111\u2013135","journal-title":"Inf Sci"},{"issue":"19","key":"1003_CR4","doi-asserted-by":"publisher","first-page":"2507","DOI":"10.1093\/bioinformatics\/btm344","volume":"23","author":"Y Saeys","year":"2007","unstructured":"Saeys Y, Inza I, Larra\u00f1aga P (2007) A review of feature selection techniques in bioinformatics. Bioinformatics 23(19):2507\u20132517","journal-title":"Bioinformatics"},{"issue":"1","key":"1003_CR5","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/TEVC.2004.840153","volume":"9","author":"E Bernad\u00f3-Mansilla","year":"2005","unstructured":"Bernad\u00f3-Mansilla E, Ho TK (2005) Domain of competence of XCS classifier system in complexity measures space. IEEE Trans Evol Comput 9(1):82\u2013104","journal-title":"IEEE Trans Evol Comput"},{"issue":"3","key":"1003_CR6","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1007\/s10044-007-0061-2","volume":"10","author":"JS S\u00e1nchez","year":"2007","unstructured":"S\u00e1nchez JS, Mollineda RA, Sotoca JM (2007) An analysis of how training data complexity affects the nearest neighbor classifiers. Pattern Anal Appl 10(3):189\u2013201","journal-title":"Pattern Anal Appl"},{"key":"1003_CR7","doi-asserted-by":"publisher","unstructured":"Mollineda RA, S\u00e1nchez JS, Sotoca JM (2005) Data characterization for effective prototype selection. In: First edition of the Iberian conference on pattern recognition and image analysis (ibPRIA, 2005) Lecture Notes in Computer Science. Springer, Berlin, pp 3523","DOI":"10.1007\/11492542_4"},{"issue":"3","key":"1003_CR8","doi-asserted-by":"publisher","first-page":"1054","DOI":"10.1016\/j.patcog.2012.09.022","volume":"46","author":"N Maci\u00e0","year":"2013","unstructured":"Maci\u00e0 N, Bernad\u00f3-Mansilla E, Orriols-Puig A, Ho TK (2013) Learner excellence biased by data set selection: a case for data characterisation and artificial data sets. Pattern Recogn 46(3):1054\u20131066","journal-title":"Pattern Recogn"},{"issue":"1","key":"1003_CR9","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1016\/j.neucom.2011.03.054","volume":"75","author":"AC Lorena","year":"2012","unstructured":"Lorena AC, Costa IG, Spola\u00f4r N, de Souto MC (2012) Analysis of complexity indices for classification problems: cancer gene expression data. Neurocomputing 75(1):33\u201342","journal-title":"Neurocomputing"},{"issue":"2","key":"1003_CR10","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1016\/j.artmed.2008.08.004","volume":"45","author":"O Okun","year":"2009","unstructured":"Okun O, Priisalu H (2009) Dataset complexity in gene expression based cancer classification using ensembles of k-nearest neighbors. Artif Intel Med 45(2):151\u2013162","journal-title":"Artif Intel Med"},{"issue":"5439","key":"1003_CR11","doi-asserted-by":"publisher","first-page":"531","DOI":"10.1126\/science.286.5439.531","volume":"286","author":"TR Golub","year":"1999","unstructured":"Golub TR et al (1999) Molecular classification of cancer: class discovery and class prediction by gene expression monitoring. J Sci 286(5439):531\u2013537","journal-title":"J Sci"},{"key":"1003_CR12","doi-asserted-by":"publisher","unstructured":"Ding C, Peng H (2003) Minimum redundancy feature selection from microarray gene expression data. In: Proceedings of the computacional systems bioinformatics conference, pp 523\u2013529","DOI":"10.1109\/CSB.2003.1227396"},{"key":"1003_CR13","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/j.compbiolchem.2004.11.001","volume":"29","author":"Y Wanga","year":"2005","unstructured":"Wanga Y, Tetkoa IV, Hallb MA, Frankb E, Faciusa A, Mayera KFX, Mewesa HW (2005) Gene selection from microarray data for cancer classification-a machine learning approach. Comput Biol Chem 29:37\u201346","journal-title":"Comput Biol Chem"},{"key":"1003_CR14","unstructured":"Xing E, Jordan M, Karp R (2001) Feature selection for high-dimensional genomic microarray data. In: Proceedings of the 18th internacional conference on machine learning, pp 601\u2013608"},{"key":"1003_CR15","unstructured":"Data Complexity Library in C++. [Online]. Available: http:\/\/dcol.sourceforge.net\/"},{"key":"1003_CR16","unstructured":"Alberts B, Johnson A, Lewis J, Raff M, Roberts K, Walter P (2004) Molecular biology of the cell. Garland Science"},{"key":"1003_CR17","doi-asserted-by":"publisher","unstructured":"Novianti PW, Jong VL, Roes KCB, Eijkemans MJC (2015) Factors affecting the accuracy of a class prediction model in gene expression data. BMC Bioinformatics 16(1):199","DOI":"10.1186\/s12859-015-0610-4"},{"issue":"1","key":"1003_CR18","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1109\/MSP.2007.273062","volume":"24","author":"U Braga-Neto","year":"2007","unstructured":"Braga-Neto U (2007) Fads and fallacies in the name of small-sample microarray classification\u2014a highlight of misunderstanding and erroneous usage in the applications of genomic signal processing. Sig Process Mag IEEE 24(1):91\u201399","journal-title":"Sig Process Mag IEEE"},{"issue":"1","key":"1003_CR19","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1016\/j.patcog.2011.06.019","volume":"45","author":"JG Moreno-Torres","year":"2012","unstructured":"Moreno-Torres JG, Raeder T, Alaiz-Rodr\u00edguez R, Chawla NV, Herrera F (2012) A unifying view on dataset shift in classification. Pattern Recogn 45(1):521\u2013530","journal-title":"Pattern Recogn"},{"key":"1003_CR20","unstructured":"Broad Institute. Cancer program data sets. [Online]. Available http:\/\/www.broadinstitute.org\/cgi-bin\/cancer\/datasets.cgi"},{"key":"1003_CR21","unstructured":"Technology Agency\u00a0for Sciency and Research. Kent ridge bio-medical dataset repository. [Online]. Available: http:\/\/datam.i2r.a-star.edu.sg\/datasets\/krbd\/"},{"key":"1003_CR22","unstructured":"Arizona\u00a0State University. Feature selection datasets. [Online]. Available: http:\/\/featureselection.asu.edu\/datasets.php"},{"key":"1003_CR23","unstructured":"Statnikov A, Aliferis C, Tsardinos I. Gems: gene expression model selector. [Online]. Available: http:\/\/www.gems-system.org\/"},{"issue":"1","key":"1003_CR24","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH (2009) The weka data mining software: an update. ACM SIGKDD Explor Newsl 11(1):10\u201318","journal-title":"ACM SIGKDD Explor Newsl"},{"key":"1003_CR25","unstructured":"Rish I (2001) An empirical study of the naive bayes classifier. In: IJCAI 2001 workshop on empirical methods in artifical intelligence 3(22):41\u201346"},{"key":"1003_CR26","volume-title":"Statistical learning theory","author":"VN Vapnik","year":"1998","unstructured":"Vapnik VN (1998) Statistical learning theory. Wiley, New York"},{"key":"1003_CR27","volume-title":"C4.5: programs for machine learning","author":"J Ross Quinlan","year":"1993","unstructured":"Ross Quinlan J (1993) C4.5: programs for machine learning. Morgan Kaufmann Publishers Inc, New York"},{"issue":"1","key":"1003_CR28","first-page":"37","volume":"6","author":"DW Aha","year":"1991","unstructured":"Aha DW, Kibler D, Albert MK (1991) Instance-based learning algorithms. Mach Learn 6(1):37\u201366","journal-title":"Mach Learn"},{"key":"1003_CR29","doi-asserted-by":"crossref","unstructured":"Bol\u00f3n-Canedo V, S\u00e1nchez-Maro\u00f1o N, Alonso-Betanzos A (2015) Recent advances and emerging challenges of feature selection in the context of big data. Knowl Based Syst","DOI":"10.1007\/978-3-319-21858-8_6"},{"key":"1003_CR30","unstructured":"Hall M (1999) Correlation-based feature selection for machine learning. PhD thesis"},{"issue":"1\u20132","key":"1003_CR31","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1016\/S0004-3702(03)00079-1","volume":"151","author":"M Dash","year":"2003","unstructured":"Dash M, Liu H (2003) Consistency-based search in feature selection. J Artif Intel 151(1\u20132):155\u2013176","journal-title":"J Artif Intel"},{"key":"1003_CR32","unstructured":"Supplementary material. [Online]. Available: http:\/\/www.lidiagroup.org\/index.php\/en\/materials-en.html"},{"key":"1003_CR33","first-page":"1289","volume":"3","author":"G Forman","year":"2003","unstructured":"Forman G (2003) An extensive empirical study of feature selection metrics for text classification. J Mach Learn Res 3:1289\u20131305","journal-title":"J Mach Learn Res"},{"issue":"5","key":"1003_CR34","doi-asserted-by":"publisher","first-page":"5947","DOI":"10.1016\/j.eswa.2010.11.028","volume":"38","author":"V Bol\u00f3n-Canedo","year":"2011","unstructured":"Bol\u00f3n-Canedo V, S\u00e1nchez-Maro\u00f1o N, Alonso-Betanzos A (2011) Feature selection and classification in multiple class datasets: an application to KDD Cup 99 dataset. Expert Syst Appl 38(5):5947\u20135957","journal-title":"Expert Syst Appl"},{"issue":"3","key":"1003_CR35","doi-asserted-by":"publisher","first-page":"201","DOI":"10.1080\/00031305.2015.1005128","volume":"69","author":"A-L Boulesteix","year":"2015","unstructured":"Boulesteix A-L, Hable R, Lauer S, Eugster MJA (2015) A statistical framework for hypothesis testing in real data comparison studies. Am Stat 69(3):201\u2013212","journal-title":"Am Stat"},{"issue":"Jan","key":"1003_CR36","first-page":"1","volume":"7","author":"J Dem\u0161ar","year":"2006","unstructured":"Dem\u0161ar J (2006) Statistical comparisons of classifiers over multiple data sets. J Mach Learn Res 7(Jan):1\u201330","journal-title":"J Mach Learn Res"},{"key":"1003_CR37","unstructured":"Navarro FFG (2011) Feature selection in cancer research: microarray gene expression and in vivo 1h-mrs domains. PhD thesis, Universitat Polit\u00e8cnica de Catalunya"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10115-016-1003-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-016-1003-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-016-1003-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,14]],"date-time":"2019-09-14T11:50:06Z","timestamp":1568461806000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10115-016-1003-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,10,14]]},"references-count":37,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2017,6]]}},"alternative-id":["1003"],"URL":"https:\/\/doi.org\/10.1007\/s10115-016-1003-3","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"value":"0219-1377","type":"print"},{"value":"0219-3116","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,10,14]]}}}