{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T08:39:12Z","timestamp":1776847152362,"version":"3.51.2"},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2013,4,5]],"date-time":"2013-04-05T00:00:00Z","timestamp":1365120000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2013,12]]},"DOI":"10.1186\/1471-2105-14-119","type":"journal-article","created":{"date-parts":[[2013,4,5]],"date-time":"2013-04-05T15:32:42Z","timestamp":1365175962000},"source":"Crossref","is-referenced-by-count":227,"title":["An AUC-based permutation variable importance measure for random forests"],"prefix":"10.1186","volume":"14","author":[{"given":"Silke","family":"Janitza","sequence":"first","affiliation":[]},{"given":"Carolin","family":"Strobl","sequence":"additional","affiliation":[]},{"given":"Anne-Laure","family":"Boulesteix","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,4,5]]},"reference":[{"key":"5789_CR1","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L: Random forests. Machine Learning. 2001, 45: 5-32. 10.1023\/A:1010933404324.","journal-title":"Machine Learning"},{"issue":"6","key":"5789_CR2","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1002\/widm.1072","volume":"2","author":"AL Boulesteix","year":"2012","unstructured":"Boulesteix AL, Janitza S, Kruppa J, K\u00f6nig I: Overview of random forest methodology and practical guidance with emphasis on computational biology and bioinformatics. Wiley Interdisciplinary Reviews: Data Mining and Knowledge Discovery. 2012, 2 (6): 493-507. 10.1002\/widm.1072.","journal-title":"Wiley Interdisciplinary Reviews: Data Mining and Knowledge Discovery"},{"issue":"2","key":"5789_CR3","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1093\/aje\/kwq086","volume":"172","author":"F Briggs","year":"2010","unstructured":"Briggs F, Goldstein B, McCauley J, Zuvich R, De Jager P, Rioux J, Ivinson A, Compston A, Hafler D, Hauser S: Variation within DNA repair pathway genes and risk of multiple sclerosis. Am J Epidemiol. 2010, 172 (2): 217-10.1093\/aje\/kwq086.","journal-title":"Am J Epidemiol"},{"issue":"6","key":"5789_CR4","doi-asserted-by":"publisher","first-page":"1368","DOI":"10.1158\/1055-9965.EPI-07-2830","volume":"17","author":"J Chang","year":"2008","unstructured":"Chang J, Yeh R, Wiencke J, Wiemels J, Smirnov I, Pico A, Tihan T, Patoka J, Miike R, Sison J: Pathway analysis of single-nucleotide polymorphisms potentially associated with glioblastoma multiforme susceptibility using random forests. Cancer Epidemiol Biomarkers Prev. 2008, 17 (6): 1368-1373. 10.1158\/1055-9965.EPI-07-2830.","journal-title":"Cancer Epidemiol Biomarkers Prev"},{"issue":"5","key":"5789_CR5","doi-asserted-by":"publisher","first-page":"473","DOI":"10.1007\/s00439-010-0943-z","volume":"129","author":"C Liu","year":"2011","unstructured":"Liu C, Ackerman H, Carulli J: A genome-wide screen of gene-gene interactions for rheumatoid arthritis susceptibility. Hum Genet. 2011, 129 (5): 473-485. 10.1007\/s00439-010-0943-z.","journal-title":"Hum Genet"},{"issue":"4","key":"5789_CR6","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1007\/s00439-009-0782-y","volume":"127","author":"K Nicodemus","year":"2010","unstructured":"Nicodemus K, Callicott J, Higier R, Luna A, Nixon D, Lipska B, Vakkalanka R, Giegling I, Rujescu D, Clair D: Evidence of statistical epistasis between DISC1, CIT and NDEL1 impacting risk for schizophrenia: biological validation with functional neuroimaging. Hum Genet. 2010, 127 (4): 441-452. 10.1007\/s00439-009-0782-y.","journal-title":"Hum Genet"},{"issue":"Suppl 1","key":"5789_CR7","doi-asserted-by":"publisher","first-page":"S62","DOI":"10.1186\/1753-6561-1-s1-s62","volume":"1","author":"Y Sun","year":"2007","unstructured":"Sun Y, Cai Z, Desai K, Lawrance R, Leff R, Jawaid A, Kardia S, Yang H: Classification of rheumatoid arthritis status with candidate gene and genome-wide single-nucleotide polymorphisms using random forests. BMC Proceedings. 2007, 1 (Suppl 1): S62-10.1186\/1753-6561-1-s1-s62.","journal-title":"BMC Proceedings"},{"key":"5789_CR8","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1186\/1471-2105-11-523","volume":"11","author":"R Blagus","year":"2010","unstructured":"Blagus R, Lusa L: Class prediction for high-dimensional class-imbalanced data. BMC Bioinformatics. 2010, 11: 523-10.1186\/1471-2105-11-523.","journal-title":"BMC Bioinformatics"},{"key":"5789_CR9","volume-title":"Brief Bioinform","author":"WJ Lin","year":"2012","unstructured":"Lin WJ, Chen J: Class-imbalanced classifiers for high-dimensional data. Brief Bioinform. 2012"},{"key":"5789_CR10","first-page":"310","volume-title":"Tools with Artificial Intelligence, 2007","author":"T Khoshgoftaar","year":"2007","unstructured":"Khoshgoftaar T, Golawala M, Van Hulse J: An empirical study of learning from imbalanced data using random forest. Tools with Artificial Intelligence, 2007. 2007, ICTAI 2007: 19th IEEE International Conference on, Volume 2, IEEE, 310-317."},{"issue":"4","key":"5789_CR11","doi-asserted-by":"publisher","first-page":"720","DOI":"10.1016\/j.nonrwa.2005.04.006","volume":"7","author":"Y Huang","year":"2006","unstructured":"Huang Y, Hung C, Jiau H: Evaluation of neural networks and data mining methods on a credit assessment task for class imbalance problem. Nonlinear Analysis: Real World Applications. 2006, 7 (4): 720-747. 10.1016\/j.nonrwa.2005.04.006.","journal-title":"Nonlinear Analysis: Real World Applications"},{"issue":"3","key":"5789_CR12","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1023\/A:1009700419189","volume":"1","author":"T Fawcett","year":"1997","unstructured":"Fawcett T, Provost F: Adaptive fraud detection. Data Mining and Knowledge Discovery. 1997, 1 (3): 291-316. 10.1023\/A:1009700419189.","journal-title":"Data Mining and Knowledge Discovery"},{"issue":"2","key":"5789_CR13","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1023\/A:1007452223027","volume":"30","author":"M Kubat","year":"1998","unstructured":"Kubat M, Holte R, Matwin S: Machine learning for the detection of oil spills in satellite radar images. Machine Learning. 1998, 30 (2): 195-215. 10.1023\/A:1007452223027.","journal-title":"Machine Learning"},{"key":"5789_CR14","volume-title":"Using random forest to learn imbalanced data","author":"C Chen","year":"2004","unstructured":"Chen C, Liaw A, Breiman L: Using random forest to learn imbalanced data. 2004, University of California, Berkeley: Tech. rep, [\n                    http:\/\/statistics.berkeley.edu\/tech-reports\/666\n                    \n                  ]"},{"issue":"3","key":"5789_CR15","doi-asserted-by":"publisher","first-page":"5445","DOI":"10.1016\/j.eswa.2008.06.121","volume":"36","author":"Y Xie","year":"2009","unstructured":"Xie Y, Li X, Ngai E, Ying W: Customer churn prediction using improved balanced random forests. Expert Systems with Applications. 2009, 36 (3): 5445-5449. 10.1016\/j.eswa.2008.06.121.","journal-title":"Expert Systems with Applications"},{"key":"5789_CR16","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"G Batista","year":"2004","unstructured":"Batista G, Prati R, Monard M: A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explorations Newsletter. 2004, 6: 20-29. 10.1145\/1007730.1007735.","journal-title":"ACM SIGKDD Explorations Newsletter"},{"key":"5789_CR17","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1111\/j.0824-7935.2004.t01-1-00228.x","volume":"20","author":"A Estabrooks","year":"2004","unstructured":"Estabrooks A, Jo T, Japkowicz N: A multiple resampling method for learning from imbalanced data sets. Computational Intelligence. 2004, 20: 18-36. 10.1111\/j.0824-7935.2004.t01-1-00228.x.","journal-title":"Computational Intelligence"},{"key":"5789_CR18","first-page":"935","volume-title":"Experimental perspectives on learning from imbalanced data","author":"J Van Hulse","year":"2007","unstructured":"Van Hulse J, Khoshgoftaar T, Napolitano A: Experimental perspectives on learning from imbalanced data. 2007, ACM: In Proceedings of the 24th International Conference on Machine Learning, 935-942."},{"issue":"12","key":"5789_CR19","doi-asserted-by":"publisher","first-page":"1513","DOI":"10.1016\/j.datak.2009.08.005","volume":"68","author":"J Van Hulse","year":"2009","unstructured":"Van Hulse J, Khoshgoftaar T: Knowledge discovery from imbalanced and noisy data. Data & Knowledge Engineering. 2009, 68 (12): 1513-1542. 10.1016\/j.datak.2009.08.005.","journal-title":"Data & Knowledge Engineering"},{"issue":"5","key":"5789_CR20","doi-asserted-by":"crossref","first-page":"429","DOI":"10.3233\/IDA-2002-6504","volume":"6","author":"N Japkowicz","year":"2002","unstructured":"Japkowicz N, Stephen S: The class imbalance problem: A systematic study. Intelligent Data Analysis. 2002, 6 (5): 429-449.","journal-title":"Intelligent Data Analysis"},{"key":"5789_CR21","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1186\/1472-6947-11-51","volume":"11","author":"M Khalilia","year":"2011","unstructured":"Khalilia M, Chakraborty S, Popescu M: Predicting disease risks from highly imbalanced data using random forest. BMC Med Inform Decis Mak. 2011, 11: 51-10.1186\/1472-6947-11-51.","journal-title":"BMC Med Inform Decis Mak"},{"key":"5789_CR22","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1186\/1471-2105-8-25","volume":"8","author":"C Strobl","year":"2007","unstructured":"Strobl C, Boulesteix AL, Zeileis A, Hothorn T: Bias in random forest variable importance measures: Illustrations, sources and a solution. BMC Bioinformatics. 2007, 8: 25-10.1186\/1471-2105-8-25.","journal-title":"BMC Bioinformatics"},{"issue":"15","key":"5789_CR23","doi-asserted-by":"publisher","first-page":"1884","DOI":"10.1093\/bioinformatics\/btp331","volume":"25","author":"KK Nicodemus","year":"2009","unstructured":"Nicodemus KK, Malley JD: Predictor correlation impacts machine learning algorithms: implications for genomic studies. Bioinformatics. 2009, 25 (15): 1884-1890. 10.1093\/bioinformatics\/btp331.","journal-title":"Bioinformatics"},{"issue":"4","key":"5789_CR24","doi-asserted-by":"publisher","first-page":"369","DOI":"10.1093\/bib\/bbr016","volume":"12","author":"KK Nicodemus","year":"2011","unstructured":"Nicodemus KK: Letter to the editor: On the stability and ranking of predictors from random forest variable importance measures. Brief Bioinform. 2011, 12 (4): 369-373. 10.1093\/bib\/bbr016.","journal-title":"Brief Bioinform"},{"key":"5789_CR25","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1093\/bib\/bbr053","volume":"13","author":"AL Boulesteix","year":"2012","unstructured":"Boulesteix AL, Bender A, Bermejo JL, Strobl C: Random forest Gini importance favours SNPs with large minor allele frequency: assessment, sources and recommendations. Brief Bioinform. 2012, 13: 292-304. 10.1093\/bib\/bbr053.","journal-title":"Brief Bioinform"},{"issue":"2","key":"5789_CR26","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1159\/000330778","volume":"72","author":"M Calle","year":"2011","unstructured":"Calle M, Urrea V, Boulesteix AL, Malats N: AUC-RF: A new strategy for genomic profiling with random forest. Hum Hered. 2011, 72 (2): 121-132. 10.1159\/000330778.","journal-title":"Hum Hered"},{"issue":"3","key":"5789_CR27","doi-asserted-by":"publisher","first-page":"651","DOI":"10.1198\/106186006X133933","volume":"15","author":"T Hothorn","year":"2006","unstructured":"Hothorn T, Hornik K, Zeileis A: Unbiased recursive partitioning: A conditional inference framework. J Comput Graph Stat. 2006, 15 (3): 651-674. 10.1198\/106186006X133933.","journal-title":"J Comput Graph Stat"},{"key":"5789_CR28","volume-title":"The statistical evaluation of medical tests for classification and prediction","author":"M Pepe","year":"2004","unstructured":"Pepe M: The statistical evaluation of medical tests for classification and prediction. 2004, USA: Oxford University Press"},{"key":"5789_CR29","first-page":"0","volume-title":"Party: a laboratory for recursive partytioning","author":"T Hothorn","year":"2012","unstructured":"Hothorn T, Hornik K, Zeileis A: Party: a laboratory for recursive partytioning. 2012, R package version, 0-3. URL \n                    http:\/\/cran.r-project.org\/package=party"},{"key":"5789_CR30","doi-asserted-by":"publisher","first-page":"132","DOI":"10.1186\/1471-2105-5-132","volume":"5","author":"M Cummings","year":"2004","unstructured":"Cummings M, Myers D: Simple statistical models predict C-to-U edited sites in plant mitochondrial RNA. BMC Bioinformatics. 2004, 5: 132-10.1186\/1471-2105-5-132.","journal-title":"BMC Bioinformatics"},{"key":"5789_CR31","doi-asserted-by":"publisher","first-page":"110","DOI":"10.1186\/1471-2105-11-110","volume":"11","author":"KK Nicodemus","year":"2010","unstructured":"Nicodemus KK, Malley J, Strobl C, Ziegler A: The behavior of random forest permutation-based variable importance measures under predictor correlation. BMC Bioinformatics. 2010, 11: 110-10.1186\/1471-2105-11-110.","journal-title":"BMC Bioinformatics"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-14-119.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-14-119\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-14-119.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,1,22]],"date-time":"2019-01-22T05:27:06Z","timestamp":1548134826000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-14-119"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,4,5]]},"references-count":31,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2013,12]]}},"alternative-id":["5789"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-14-119","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,4,5]]},"article-number":"119"}}