{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,21]],"date-time":"2025-10-21T15:15:53Z","timestamp":1761059753824},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2014,6,22]],"date-time":"2014-06-22T00:00:00Z","timestamp":1403395200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"published-print":{"date-parts":[[2014,12]]},"DOI":"10.1186\/1758-2946-6-34","type":"journal-article","created":{"date-parts":[[2014,6,21]],"date-time":"2014-06-21T21:02:42Z","timestamp":1403384562000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":19,"title":["Using beta binomials to estimate classification uncertainty for ensemble models"],"prefix":"10.1186","volume":"6","author":[{"given":"Robert D","family":"Clark","sequence":"first","affiliation":[]},{"given":"Wenkel","family":"Liang","sequence":"additional","affiliation":[]},{"given":"Adam C","family":"Lee","sequence":"additional","affiliation":[]},{"given":"Michael S","family":"Lawless","sequence":"additional","affiliation":[]},{"given":"Robert","family":"Fraczkiewicz","sequence":"additional","affiliation":[]},{"given":"Marvin","family":"Waldman","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,6,22]]},"reference":[{"key":"610_CR1","doi-asserted-by":"publisher","first-page":"1361","DOI":"10.1289\/ehp.5758","volume":"111","author":"L Eriksson","year":"2003","unstructured":"Eriksson L, Jaworska J, Worth AP, Cronin MTD, McDowell RM, Gramatica P: Methods for reliability and uncertainty assessment and for applicability evaluations of classification- and regression-based QSARs. Environ Health Perspect. 2003, 111: 1361-1375.","journal-title":"Environ Health Perspect"},{"key":"610_CR2","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1007\/978-1-4020-9783-6_13","volume-title":"Advances in Computational Chemistry and Physics Volume 8: Recent Advances in QSAR Studies","author":"AP Worth","year":"2010","unstructured":"Worth AP: The role of QSAR methodology in the regulatory assessment of chemicals. Advances in Computational Chemistry and Physics Volume 8: Recent Advances in QSAR Studies. Edited by: Puzyn T, Leszczynski J, Cronin MT. 2010, Netherlands: Springer, 367-"},{"key":"610_CR3","doi-asserted-by":"crossref","first-page":"111","DOI":"10.1177\/026119291304100111","volume":"41","author":"U Sahlin","year":"2013","unstructured":"Sahlin U: Uncertainty in QSAR Predictions. Altern Lab Anim. 2013, 41: 111-125.","journal-title":"Altern Lab Anim"},{"key":"610_CR4","doi-asserted-by":"publisher","first-page":"1315","DOI":"10.1016\/j.jmgm.2008.01.002","volume":"26","author":"S Weaver","year":"2008","unstructured":"Weaver S, Gleeson MP: The importance of the domain of applicability in QSAR modeling. J Mol Graph Model. 2008, 26: 1315-1326.","journal-title":"J Mol Graph Model"},{"key":"610_CR5","doi-asserted-by":"publisher","first-page":"1249","DOI":"10.1289\/ehp.7125","volume":"112","author":"W Tong","year":"2004","unstructured":"Tong W, Xie Q, Hong H, Shi L, Fang H, Perkins R: Assessment of prediction confidence and domain extrapolation of two structure\u2013activity relationship models for predicting estrogen receptor binding activity. Environ Health Perspect. 2004, 112: 1249-1254.","journal-title":"Environ Health Perspect"},{"key":"610_CR6","doi-asserted-by":"publisher","first-page":"1733","DOI":"10.1021\/ci800151m","volume":"48","author":"IV Tetko","year":"2008","unstructured":"Tetko IV, Sushko I, Pandey AK, Zhu H, Tropsha A, Papa E, \u00d6berg T, Todeschini R, Fourches D, Varnek A: Critical assessment of QSAR models of environmental toxicity against Tetrahymena pyriformis: Focusing on applicability domain and overfitting by variable selection. J Chem Inf Model. 2008, 48: 1733-1746.","journal-title":"J Chem Inf Model"},{"key":"610_CR7","doi-asserted-by":"publisher","first-page":"1046","DOI":"10.1021\/ci990131n","volume":"40","author":"B Beck","year":"2000","unstructured":"Beck B, Breindl A, Clark T: QM\/NN QSPR models with error estimation: Vapor pressure and logP. J Chem Inf Comput Sci. 2000, 40: 1046-1051.","journal-title":"J Chem Inf Comput Sci"},{"key":"610_CR8","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1186\/1758-2946-1-11","volume":"1","author":"RD Clark","year":"2009","unstructured":"Clark RD: DPRESS: localizing estimates of predictive uncertainty. J Cheminform. 2009, 1: 11-","journal-title":"J Cheminform"},{"key":"610_CR9","doi-asserted-by":"publisher","first-page":"551","DOI":"10.1002\/minf.201000177","volume":"30","author":"U Sahlin","year":"2011","unstructured":"Sahlin U, Jeliazkova N, \u00d6berg T: Applicability domain dependent predictive uncertainty in QSAR regressions. Mol Inf. 2011, 30: 551-564.","journal-title":"Mol Inf"},{"key":"610_CR10","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/s10822-013-9639-5","volume":"27","author":"DJ Wood","year":"2013","unstructured":"Wood DJ, Carlsson L, Eklund M, Norinder U, St\u00e5lring J: QSAR with experimental and predictive distributions: an information theoretic approach for assessing model quality. J Comput Aided Mol Des. 2013, 27: 203-219.","journal-title":"J Comput Aided Mol Des"},{"key":"610_CR11","doi-asserted-by":"publisher","first-page":"368","DOI":"10.1021\/ci300554t","volume":"53","author":"CE Keefer","year":"2013","unstructured":"Keefer CE, Kauffman GW, Gupta RR: Interpretable, probability-based confidence metric for continuous quantitative structure\u2013activity relationship models. J Chem Inf Model. 2013, 53: 368-383.","journal-title":"J Chem Inf Model"},{"key":"610_CR12","doi-asserted-by":"publisher","first-page":"2837","DOI":"10.1021\/ci400482e","volume":"53","author":"RP Sheridan","year":"2013","unstructured":"Sheridan RP: Using random forest to model the domain applicability of another random forest model. J Chem Inf Model. 2013, 53: 2837-2850.","journal-title":"J Chem Inf Model"},{"key":"610_CR13","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1002\/minf.201200131","volume":"33","author":"U Sahlin","year":"2014","unstructured":"Sahlin U, Jeliazkova N, \u00d6berg T: Applicability domain dependent predictive uncertainty in QSAR regressions. Mol Inf. 2014, 33: 26-35.","journal-title":"Mol Inf"},{"key":"610_CR14","doi-asserted-by":"publisher","first-page":"202","DOI":"10.1002\/cem.1296","volume":"24","author":"I Sushko","year":"2010","unstructured":"Sushko I, Novotarskyi S, K\u00f6rner R, Pandey AK, Kovalishyn VV, Prokopenko VV, Tetko IV: Applicability domain for in silico models to achieve accuracy of experimental measurements. J Chemometrics. 2010, 24: 202-208.","journal-title":"J Chemometrics"},{"key":"610_CR15","doi-asserted-by":"publisher","first-page":"2094","DOI":"10.1021\/ci100253r","volume":"50","author":"I Sushko","year":"2010","unstructured":"Sushko I, Novotarskyi S, K\u00f6rner R, Pandey AK, Cherkasov A, Li J, Gramatica P, Hansen K, Schroeter T, Klaus-Robert M\u00fcller K-R, Xi L, Liu H, Yao X, \u00d6berg T, Hormozdiari F, Dao P, Sahinalp C, Todeschini R, Polishchuk P, Artemenko A, Kuz\u2019min V, Martin TM, Douglas MDM, Fourches D, Muratov E, Tropsha A, Baskin I, Horvath D, Marcou G, Muller C, et al: Applicability domains for classification problems: benchmarking of distance to models for Ames mutagenicity set. J Chem Inf Model. 2010, 50: 2094-2111.","journal-title":"J Chem Inf Model"},{"key":"610_CR16","doi-asserted-by":"publisher","first-page":"9480","DOI":"10.1021\/ja00025a009","volume":"113","author":"N Bodor","year":"1991","unstructured":"Bodor N, Harget A, Huang M-J: Neural network studies.1. Estimation of the aqueous solubility of organic compounds. J Am Chem Soc. 1991, 113: 9480-9483.","journal-title":"J Am Chem Soc"},{"key":"610_CR17","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1111\/j.0006-341X.1999.00149.x","volume":"55","author":"JK Lindsey","year":"1999","unstructured":"Lindsey JK: Response surfaces for overdispersion in the study of the conditions for fish eggs hatching. Biometrics. 1999, 55: 149-155.","journal-title":"Biometrics"},{"key":"610_CR18","first-page":"255","volume":"35","author":"E D\u00e1vila","year":"2012","unstructured":"D\u00e1vila E, L\u00f3pez LA, D\u00edaz LG: A statistical model for analyzing interdependent complex of plant pathogens. Rev Colomb Estad. 2012, 35: 255-270.","journal-title":"Rev Colomb Estad"},{"key":"610_CR19","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1016\/j.artmed.2007.07.003","volume":"41","author":"H Moon","year":"2007","unstructured":"Moon H, Ahn H, Kodell RL, Baek S, Lin C-J, Lee T, Chen JJ: Ensemble methods for classification of patients for personalized medicine with high-dimensional data. Artif Intell Med. 2007, 41: 197-207.","journal-title":"Artif Intell Med"},{"key":"610_CR20","volume-title":"Handbook of Mathematical Functions with Formulas, Graphs, and Mathematical Tables, Tenth Printing","year":"1972","unstructured":"Handbook of Mathematical Functions with Formulas, Graphs, and Mathematical Tables, Tenth Printing. Edited by: Abramowitz M, Stegun IA. 1972, Washington: National Bureau of Standards"},{"key":"610_CR21","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1080\/01621459.1951.10500769","volume":"46","author":"FJ Massey Jr","year":"1951","unstructured":"Massey FJ: The Kolmogorov-Smirnov test for goodness of fit. J Am Stat Assoc. 1951, 46: 68-78.","journal-title":"J Am Stat Assoc"},{"key":"610_CR22","unstructured":"Simulations Plus, Inc: ADMET Predictor\u2122. [ http:\/\/www.simulations-plus.com ]"},{"key":"610_CR23","first-page":"168","volume-title":"EuroQSAR 2002: Designing Drugs and Crop Protectants: Processes, Problems and Solutions","author":"JC Dearden","year":"2003","unstructured":"Dearden JC, Netzeva TI, Bibby R: A comparison of commercially available software for the prediction of partition coefficient. EuroQSAR 2002: Designing Drugs and Crop Protectants: Processes, Problems and Solutions. Edited by: Ford M, Livingstone D, Dearden J, Van de Waterbeemd H. 2003, Oxford: Blackwell Publishing, 168-169."},{"key":"610_CR24","doi-asserted-by":"publisher","first-page":"861","DOI":"10.1002\/jps.21494","volume":"98","author":"R Mannhold","year":"2009","unstructured":"Mannhold R, Poda GI, Ostermann C, Tetko IV: Calculation of molecular lipophilicity: State-of-the-art and comparison of log P methods on more than 96,000 compounds. J Pharm Sci. 2009, 98: 861-893.","journal-title":"J Pharm Sci"},{"key":"610_CR25","doi-asserted-by":"publisher","first-page":"1351","DOI":"10.1002\/sim.1761","volume":"23","author":"MJ Sweeting","year":"2004","unstructured":"Sweeting MJ, Sutton AJ, Lambert PC: What to add to nothing? Use and avoidance of continuity corrections in meta-analysis of sparse data. Stat Med. 2004, 23: 1351-1375.","journal-title":"Stat Med"},{"key":"610_CR26","doi-asserted-by":"publisher","first-page":"2077","DOI":"10.1021\/ci900161g","volume":"49","author":"K Hansen","year":"2009","unstructured":"Hansen K, Sebastian Mika S, Schroeter T, Sutter A, Ter Laak A, Steger-Hartmann T, Heinrich N, M\u00fcller K-R: Benchmark data set for in silico prediction of Ames mutagenicity. J Chem Inf Model. 2009, 49: 2077-2081.","journal-title":"J Chem Inf Model"},{"key":"610_CR27","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1080\/15287398809531194","volume":"25","author":"R Benigni","year":"1988","unstructured":"Benigni R, Giuliani A: Computer-assisted analysis of interlaboratory Ames test variability. J Toxicol Environ Health. 1988, 25: 135-148.","journal-title":"J Toxicol Environ Health"},{"key":"610_CR28","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1002\/1097-0142(1950)3:1<32::AID-CNCR2820030106>3.0.CO;2-3","volume":"3","author":"WJ Youden","year":"1950","unstructured":"Youden WJ: Index for rating diagnostic tests. Cancer. 1950, 3: 32-35.","journal-title":"Cancer"},{"key":"610_CR29","volume-title":"PubChem Bioassay","author":"National Institutes of Health","year":"1851","unstructured":"National Institutes of Health: AID 1851 \u2013 PubChem BioAssay Summary. PubChem Bioassay. 1851, [ http:\/\/pubchem.ncbi.nlm.nih.gov\/assay\/assay.cgi?aid=1851 ; accessed 10 July 2013]"},{"key":"610_CR30","doi-asserted-by":"publisher","first-page":"783","DOI":"10.1002\/minf.201200065","volume":"31","author":"H Sun","year":"2012","unstructured":"Sun H, Veith H, Xia M, Austin CP, Tice RR, Huang R: Prediction of cytochrome P450 profiles of environmental chemicals with QSAR Models built from drug-like molecules. Mol Inform. 2012, 31: 783-792.","journal-title":"Mol Inform"},{"key":"610_CR31","first-page":"123","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L: Bagging predictors. Mach Learn. 1996, 24: 123-140.","journal-title":"Mach Learn"},{"key":"610_CR32","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1021\/ed075p119","volume":"75","author":"DC Harris","year":"1998","unstructured":"Harris DC: Nonlinear least-squares curve fitting with microsoft excel solver. J Chem Ed. 1998, 75: 119-121.","journal-title":"J Chem Ed"},{"key":"610_CR33","unstructured":"BioByte Corp: BioByte Master Database. [ http:\/\/www.biobyte.com ]"},{"key":"610_CR34","doi-asserted-by":"publisher","first-page":"1050","DOI":"10.1038\/nbt.1581","volume":"27","author":"H Veith","year":"2009","unstructured":"Veith H, Southall N, Huang R, James T, Fayne D, Artemenko N, Shen M, Inglese J, Austin CP, Lloyd DG, Auld DS: Comprehensive characterization of cytochrome P450 isozyme selectivity across chemical libraries. Nat Biotechnol. 2009, 27: 1050-1055.","journal-title":"Nat Biotechnol"},{"key":"610_CR35","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1021\/ci025590u","volume":"43","author":"A Yan","year":"2003","unstructured":"Yan A, Gasteiger J: Prediction of aqueous solubility of organic compounds based on a 3D structure representation. J Chem Inf Comput Sci. 2003, 43: 429-434.","journal-title":"J Chem Inf Comput Sci"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1758-2946-6-34\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1758-2946-6-34.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1758-2946-6-34.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,11]],"date-time":"2019-08-11T16:19:21Z","timestamp":1565540361000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/1758-2946-6-34"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,6,22]]},"references-count":35,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2014,12]]}},"alternative-id":["610"],"URL":"https:\/\/doi.org\/10.1186\/1758-2946-6-34","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,6,22]]},"assertion":[{"value":"5 March 2014","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 June 2014","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 June 2014","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"34"}}