{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T20:02:41Z","timestamp":1778097761767,"version":"3.51.4"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2016,11,29]],"date-time":"2016-11-29T00:00:00Z","timestamp":1480377600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001659","name":"Deutsche Forschungsgemeinschaft","doi-asserted-by":"publisher","award":["BO3139\/2-2"],"award-info":[{"award-number":["BO3139\/2-2"]}],"id":[{"id":"10.13039\/501100001659","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001659","name":"Deutsche Forschungsgemeinschaft","doi-asserted-by":"publisher","award":["BO3139\/6-1"],"award-info":[{"award-number":["BO3139\/6-1"]}],"id":[{"id":"10.13039\/501100001659","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Adv Data Anal Classif"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1007\/s11634-016-0276-4","type":"journal-article","created":{"date-parts":[[2016,11,29]],"date-time":"2016-11-29T05:04:04Z","timestamp":1480395844000},"page":"885-915","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":173,"title":["A computationally fast variable importance test for random forests for high-dimensional data"],"prefix":"10.1007","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0948-1501","authenticated-orcid":false,"given":"Silke","family":"Janitza","sequence":"first","affiliation":[]},{"given":"Ender","family":"Celik","sequence":"additional","affiliation":[]},{"given":"Anne-Laure","family":"Boulesteix","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,11,29]]},"reference":[{"key":"276_CR1","doi-asserted-by":"crossref","first-page":"6745","DOI":"10.1073\/pnas.96.12.6745","volume":"96","author":"U Alon","year":"1999","unstructured":"Alon U, Barkai N, Notterman DA, Gish K, Ybarra S, Mack D, Levine AJ (1999) Broad patterns of gene expression revealed by clustering analysis of tumor and normal colon tissues probed by oligonucleotide arrays. Proc Natl Acad Sci 96:6745\u20136750","journal-title":"Proc Natl Acad Sci"},{"key":"276_CR2","doi-asserted-by":"crossref","first-page":"1340","DOI":"10.1093\/bioinformatics\/btq134","volume":"26","author":"A Altmann","year":"2010","unstructured":"Altmann A, Tolo\u015fi L, Sander O, Lengauer T (2010) Permutation importance: a corrected feature importance measure. Bioinformatics 26:1340\u20131347","journal-title":"Bioinformatics"},{"key":"276_CR3","doi-asserted-by":"crossref","first-page":"e1004191","DOI":"10.1371\/journal.pcbi.1004191","volume":"4","author":"A-L Boulesteix","year":"2015","unstructured":"Boulesteix A-L (2015) Ten simple rules for reducing overoptimistic reporting in methodological computational research. PLoS Comput Biol 4:e1004191","journal-title":"PLoS Comput Biol"},{"key":"276_CR4","doi-asserted-by":"crossref","first-page":"292","DOI":"10.1093\/bib\/bbr053","volume":"13","author":"AL Boulesteix","year":"2012","unstructured":"Boulesteix AL, Bender A, Bermejo JL, Strobl C (2012) Random forest Gini importance favours SNPs with large minor allele frequency: assessment, sources and recommendations. Brief Bioinform 13:292\u2013304","journal-title":"Brief Bioinform"},{"key":"276_CR5","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Mach Learn 45:5\u201332","journal-title":"Mach Learn"},{"key":"276_CR6","unstructured":"Breiman L, C.\u00a0A (2008) Random forests. http:\/\/www.stat.berkeley.edu\/users\/breiman\/RandomForests\/cc_home.htm"},{"key":"276_CR7","doi-asserted-by":"crossref","first-page":"1061","DOI":"10.1093\/bioinformatics\/btf867","volume":"19","author":"M Dettling","year":"2003","unstructured":"Dettling M, B\u00fchlmann P (2003) Boosting for tumor classification with gene expression data. Bioinformatics 19:1061\u20131069","journal-title":"Bioinformatics"},{"key":"276_CR8","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1186\/1471-2105-7-3","volume":"7","author":"R D\u00edaz-Uriarte","year":"2006","unstructured":"D\u00edaz-Uriarte R, De Andres SA (2006) Gene selection and classification of microarray data using random forest. BMC Bioinform 7:3","journal-title":"BMC Bioinform"},{"key":"276_CR9","doi-asserted-by":"crossref","first-page":"531","DOI":"10.1126\/science.286.5439.531","volume":"286","author":"TR Golub","year":"1999","unstructured":"Golub TR, Slonim DK, Tamayo P, Huard C, Gaasenbeek M, Mesirov JP, Coller H, Loh ML, Downing JR, Caligiuri MA et al (1999) Molecular classification of cancer: class discovery and class prediction by gene expression monitoring. Science 286:531\u2013537","journal-title":"Science"},{"key":"276_CR10","unstructured":"Gregorutti B, Michel B, Saint-Pierre P (2013) Correlation and variable importance in random forests. arXiv preprint arXiv:1310.5726"},{"key":"276_CR11","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1016\/j.csda.2012.09.020","volume":"60","author":"A Hapfelmeier","year":"2013","unstructured":"Hapfelmeier A, Ulm K (2013) A new variable selection approach using random forests. Comput Stat Data Anal 60:50\u201369","journal-title":"Comput Stat Data Anal"},{"key":"276_CR12","doi-asserted-by":"crossref","first-page":"651","DOI":"10.1198\/106186006X133933","volume":"15","author":"T Hothorn","year":"2006","unstructured":"Hothorn T, Hornik K, Zeileis A (2006) Unbiased recursive partitioning: a conditional inference framework. J Comput Graph Stat 15:651\u2013674","journal-title":"J Comput Graph Stat"},{"key":"276_CR13","doi-asserted-by":"crossref","first-page":"1766","DOI":"10.1093\/bioinformatics\/bts238","volume":"28","author":"VA Huynh-Thu","year":"2012","unstructured":"Huynh-Thu VA, Saeys Y, Wehenkel L, Geurts P (2012) Statistical interpretation of machine learning-based feature importance scores for biomarker discovery. Bioinformatics 28:1766\u20131774","journal-title":"Bioinformatics"},{"key":"276_CR14","doi-asserted-by":"crossref","first-page":"519","DOI":"10.1214\/07-EJS039","volume":"1","author":"H Ishwaran","year":"2007","unstructured":"Ishwaran H (2007) Variable importance in binary regression trees and forests. Electron J Stat 1:519\u2013537","journal-title":"Electron J Stat"},{"key":"276_CR15","doi-asserted-by":"crossref","first-page":"841","DOI":"10.1214\/08-AOAS169","volume":"2","author":"H Ishwaran","year":"2008","unstructured":"Ishwaran H, Kogalur UB, Blackstone EH, Lauer MS (2008) Random survival forests. Ann Appl Stat 2:841\u2013860","journal-title":"Ann Appl Stat"},{"key":"276_CR16","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1186\/1471-2105-14-119","volume":"14","author":"S Janitza","year":"2013","unstructured":"Janitza S, Strobl C, Boulesteix AL (2013) An AUC-based permutation variable importance measure for random forests. BMC Bioinform 14:119","journal-title":"BMC Bioinform"},{"key":"276_CR17","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1016\/j.csda.2015.10.005","volume":"96","author":"S Janitza","year":"2016","unstructured":"Janitza S, Tutz G, Boulesteix A-L (2016) Random forest for ordinal responses: prediction and variable selection. Comput Stat Data Anal 96:57\u201373","journal-title":"Comput Stat Data Anal"},{"key":"276_CR18","doi-asserted-by":"crossref","first-page":"589","DOI":"10.1198\/016214501753168271","volume":"96","author":"H Kim","year":"2001","unstructured":"Kim H, Loh W-Y (2001) Classification trees with unbiased multiway splits. J Am Stat Assoc 96:589\u2013604","journal-title":"J Am Stat Assoc"},{"key":"276_CR19","first-page":"18","volume":"2","author":"A Liaw","year":"2002","unstructured":"Liaw A, Wiener M (2002) Classification and regression by randomForest. R News 2:18\u201322","journal-title":"R News"},{"key":"276_CR20","unstructured":"Louppe G, Wehenkel L, Sutera A, Geurts P (2013) Understanding variable importances in forests of randomized trees. In: Burges CJC, Bottou L, Welling M, Ghahramani Z, Weinberger KQ (eds) Advances in neural information processing systems, pp 431\u2013439"},{"key":"276_CR21","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1159\/000330579","volume":"72","author":"AM Molinaro","year":"2011","unstructured":"Molinaro AM, Carriero N, Bjornson R, Hartge P, Rothman N, Chatterjee N (2011) Power of data mining methods to detect genetic associations and interactions. Hum Hered 72:85\u201397","journal-title":"Hum Hered"},{"key":"276_CR22","doi-asserted-by":"crossref","first-page":"369","DOI":"10.1093\/bib\/bbr016","volume":"12","author":"K Nicodemus","year":"2011","unstructured":"Nicodemus K (2011) Letter to the editor: on the stability and ranking of predictors from random forest variable importance measures. Brief Bioinform 12:369\u2013373","journal-title":"Brief Bioinform"},{"key":"276_CR23","doi-asserted-by":"crossref","first-page":"1884","DOI":"10.1093\/bioinformatics\/btp331","volume":"25","author":"K Nicodemus","year":"2009","unstructured":"Nicodemus K, Malley J (2009) Predictor correlation impacts machine learning algorithms: implications for genomic studies. Bioinformatics 25:1884\u20131890","journal-title":"Bioinformatics"},{"key":"276_CR24","volume-title":"The statistical evaluation of medical tests for classification and prediction","author":"M Pepe","year":"2004","unstructured":"Pepe M (2004) The statistical evaluation of medical tests for classification and prediction. Oxford University Press, USA"},{"key":"276_CR25","doi-asserted-by":"crossref","first-page":"1544","DOI":"10.2202\/1544-6115.1585","volume":"9","author":"B Phipson","year":"2010","unstructured":"Phipson B, Smyth G (2010) Permutation P-values should never be zero: calculating exact P-values when permutations are randomly drawn. Stat Appl Genet Mol Biol 9:1544\u20136115","journal-title":"Stat Appl Genet Mol Biol"},{"key":"276_CR26","doi-asserted-by":"crossref","first-page":"360","DOI":"10.1038\/nature14221","volume":"518","author":"P Polak","year":"2015","unstructured":"Polak P, Karli\u0107 R, Koren A, Thurman R, Sandstrom R, Lawrence MS, Reynolds A, Rynes E, Vlahovi\u010dek K, Stamatoyannopoulos JA et al (2015) Cell-of-origin chromatin organization shapes the mutational landscape of cancer. Nature 518:360\u2013364","journal-title":"Nature"},{"key":"276_CR27","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/415436a","volume":"415","author":"SL Pomeroy","year":"2002","unstructured":"Pomeroy SL, Tamayo P, Gaasenbeek M, Sturla LM, Angelo M, McLaughlin ME, Kim JY, Goumnerova LC, Black PM, Lau C et al (2002) Prediction of central nervous system embryonal tumour outcome based on gene expression. Nature 415:436\u2013442","journal-title":"Nature"},{"key":"276_CR28","doi-asserted-by":"crossref","first-page":"S7","DOI":"10.1186\/1755-8794-7-S1-S7","volume":"7","author":"MC Prosperi","year":"2014","unstructured":"Prosperi MC, Marinho S, Simpson A, Custovic A, Buchan IE (2014) Predicting phenotypes of asthma and eczema with machine learning. BMC Med Genomics 7:S7","journal-title":"BMC Med Genomics"},{"key":"276_CR29","doi-asserted-by":"crossref","first-page":"112","DOI":"10.1038\/gene.2008.80","volume":"10","author":"DM Reif","year":"2009","unstructured":"Reif DM, Motsinger-Reif AA, McKinney BA, Rock MT, Crowe J, Moore JH (2009) Integrated analysis of genetic and proteomic data identifies biomarkers associated with adverse events following smallpox vaccination. Genes Immun 10:112\u2013119","journal-title":"Genes Immun"},{"key":"276_CR30","doi-asserted-by":"crossref","first-page":"1752","DOI":"10.1093\/bioinformatics\/btq257","volume":"26","author":"DF Schwarz","year":"2010","unstructured":"Schwarz DF, K\u00f6nig IR, Ziegler A (2010) On safari to random jungle: a fast implementation of random forests for high-dimensional data. Bioinformatics 26:1752\u20131758","journal-title":"Bioinformatics"},{"key":"276_CR31","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1016\/S1535-6108(02)00030-2","volume":"1","author":"D Singh","year":"2002","unstructured":"Singh D, Febbo PG, Ross K, Jackson DG, Manola J, Ladd C, Tamayo P, Renshaw AA, D\u2019Amico AV, Richie JP et al (2002) Gene expression correlates of clinical prostate cancer behavior. Cancer Cell 1:203\u2013209","journal-title":"Cancer Cell"},{"key":"276_CR32","doi-asserted-by":"crossref","unstructured":"Strobl C, Boulesteix A-L, Kneib T, Augustin T, Zeileis A (2008) Conditional variable importance for random forests. BMC Bioinform 9:307","DOI":"10.1186\/1471-2105-9-307"},{"key":"276_CR33","doi-asserted-by":"crossref","unstructured":"Strobl C, Boulesteix AL, Zeileis A, Hothorn T (2007) Bias in random forest variable importance measures: Illustrations, sources and a solution. BMC Bioinform 8:25","DOI":"10.1186\/1471-2105-8-25"},{"key":"276_CR34","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1037\/a0016973","volume":"14","author":"C Strobl","year":"2009","unstructured":"Strobl C, Malley J, Tutz G (2009) An introduction to recursive partitioning: rationale, application, and characteristics of classification and regression trees, bagging, and random forests. Psychol Methods 14:323\u2013348","journal-title":"Psychol Methods"},{"key":"276_CR35","first-page":"59","volume-title":"Proceedings of the 18th international conference on computational statistics","author":"C Strobl","year":"2008","unstructured":"Strobl C, Zeileis A (2008) Danger: high power!\u2014exploring the statistical properties of a test for random forest variable importance. In: Brito P (ed) Proceedings of the 18th international conference on computational statistics. Porto, Portugal (CD-ROM), Springer, Heidelberg, pp 59\u201366"},{"key":"276_CR36","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1186\/s13040-016-0087-3","volume":"9","author":"S Szymczak","year":"2016","unstructured":"Szymczak S, Holzinger E, Dasgupta A, Malley JD, Molloy AN, Mills JL, Brody LC, Stambolian D, Bailey-Wilson JE (2016) r2VIM: a new variable selection method for random forests in genome-wide association studies. BioData Min 9:7","journal-title":"BioData Min"},{"key":"276_CR37","first-page":"S75","volume":"2","author":"AC Tan","year":"2003","unstructured":"Tan AC, Gilbert D (2003) Ensemble machine learning on gene expression data for cancer classification. Appl Bioinform 2:S75\u2013S83","journal-title":"Appl Bioinform"},{"key":"276_CR38","doi-asserted-by":"crossref","first-page":"S68","DOI":"10.1186\/1753-6561-3-s7-s68","volume":"3","author":"R Tang","year":"2009","unstructured":"Tang R, Sinnwell JP, Li J, Rider DN, de Andrade M, Biernacka JM (2009) Identification of genes and haplotypes that predict rheumatoid arthritis using random forests. BMC Proc 3:S68","journal-title":"BMC Proc"},{"key":"276_CR39","doi-asserted-by":"crossref","unstructured":"van\u2019t Veer LJ, Dai H, Van De Vijver MJ, He YD, Hart AA, Mao M, Peterse HL, van der Kooy K, Marton MJ, Witteveen AT et al (2002) Gene expression profiling predicts clinical outcome of breast cancer. Nature 415:530\u2013536","DOI":"10.1038\/415530a"},{"key":"276_CR40","doi-asserted-by":"crossref","first-page":"60","DOI":"10.1186\/s12859-016-0900-5","volume":"17","author":"H Wang","year":"2016","unstructured":"Wang H, Yang F, Luo Z (2016) An experimental study of the intrinsic stability of random forest variable importance measures. BMC Bioinform 17:60","journal-title":"BMC Bioinform"},{"key":"276_CR41","doi-asserted-by":"publisher","unstructured":"Wang-Sattler R, Yu Z, Herder C, Messias AC, Floegel A, He Y, Heim K, Campillos M, Holzapfel C, Thorand B et\u00a0al (2012) Novel biomarkers for pre-diabetes identified by metabolomics. Mol Syst Biol 8:615. doi: 10.1038\/msb.2012.43","DOI":"10.1038\/msb.2012.43"},{"key":"276_CR42","doi-asserted-by":"crossref","unstructured":"Wright MN, Ziegler A (2016) ranger: a fast implementation of random forests for high dimensional data in C++ and R. J Stat Softw (in press)","DOI":"10.18637\/jss.v077.i01"},{"key":"276_CR43","doi-asserted-by":"crossref","first-page":"222","DOI":"10.1038\/nature11053","volume":"486","author":"T Yatsunenko","year":"2012","unstructured":"Yatsunenko T, Rey FE, Manary MJ, Trehan I, Dominguez-Bello MG, Contreras M, Magris M, Hidalgo G, Baldassano RN, Anokhin AP et al (2012) Human gut microbiome viewed across age and geography. Nature 486:222\u2013227","journal-title":"Nature"},{"key":"276_CR44","first-page":"1770","volume":"110","author":"R Zhu","year":"2015","unstructured":"Zhu R, Zeng D, Kosorok MR (2015) Reinforcement learning trees. JASA 110:1770\u20131784","journal-title":"Reinforcement learning trees. JASA"}],"container-title":["Advances in Data Analysis and Classification"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11634-016-0276-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11634-016-0276-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11634-016-0276-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,15]],"date-time":"2019-09-15T21:55:05Z","timestamp":1568584505000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11634-016-0276-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,11,29]]},"references-count":44,"aliases":["10.1007\/s11634-016-0270-x"],"journal-issue":{"issue":"4","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["276"],"URL":"https:\/\/doi.org\/10.1007\/s11634-016-0276-4","relation":{},"ISSN":["1862-5347","1862-5355"],"issn-type":[{"value":"1862-5347","type":"print"},{"value":"1862-5355","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,11,29]]}}}