{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T10:11:16Z","timestamp":1778321476634,"version":"3.51.4"},"reference-count":74,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,6,28]],"date-time":"2017-06-28T00:00:00Z","timestamp":1498608000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"},{"start":{"date-parts":[[2017,6,28]],"date-time":"2017-06-28T00:00:00Z","timestamp":1498608000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS 1337899"],"award-info":[{"award-number":["CNS 1337899"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s13321-017-0226-y","type":"journal-article","created":{"date-parts":[[2017,6,28]],"date-time":"2017-06-28T11:42:38Z","timestamp":1498650158000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":248,"title":["Deep-learning: investigating deep neural networks hyper-parameters and comparison of performance to shallow methods for modeling bioactivity data"],"prefix":"10.1186","volume":"9","author":[{"given":"Alexios","family":"Koutsoukas","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Keith J.","family":"Monaghan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoli","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4929-2617","authenticated-orcid":false,"given":"Jun","family":"Huan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,6,28]]},"reference":[{"key":"226_CR1","first-page":"44","volume":"5","author":"W Bains","year":"2002","unstructured":"Bains W, Gilbert R, Sviridenko L, Gascon JM, Scoffin R, Birchall K, Harvey I, Caldwell J (2002) Evolutionary computational methods to predict oral bioavailability QSPRs. Curr Opin Drug Discov Dev 5:44\u201351","journal-title":"Curr Opin Drug Discov Dev"},{"key":"226_CR2","first-page":"692","volume":"41","author":"SC Basak","year":"2001","unstructured":"Basak SC, Mills D (2001) Quantitative structure\u2013property relationships (QSPRs) for the estimation of vapor pressure: a hierarchical approach using mathematical structural descriptors. J Chem Inf Model 41:692\u2013701","journal-title":"J Chem Inf Model"},{"key":"226_CR3","doi-asserted-by":"publisher","first-page":"2889","DOI":"10.1021\/cr200066h","volume":"112","author":"T Le","year":"2012","unstructured":"Le T, Epa VC, Burden FR, Winkler DA (2012) Quantitative structure\u2013property relationship modeling of diverse materials properties. Chem Rev 112:2889\u20132919","journal-title":"Chem Rev"},{"key":"226_CR4","doi-asserted-by":"crossref","unstructured":"Cronin MTD (2010) Quantitative structure\u2013activity relationships (QSARs)\u2014applications and methodology. In: Puzyn T, Leszczynski J, Cronin MT (eds) Recent advances in QSAR studies methods and applications. Springer, pp 3\u201311","DOI":"10.1007\/978-1-4020-9783-6_1"},{"key":"226_CR5","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/clpt.2011.300","volume":"91","author":"NL Kruhlak","year":"2012","unstructured":"Kruhlak NL, Benz RD, Zhou H, Colatsky TJ (2012) (Q)SAR modeling and safety assessment in regulatory review. Clin Pharmacol Ther 91:529\u2013534","journal-title":"Clin Pharmacol Ther"},{"key":"226_CR6","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1016\/j.drudis.2009.09.010","volume":"15","author":"C Merlot","year":"2010","unstructured":"Merlot C (2010) Computational toxicology\u2014a tool for early safety evaluation. Drug Discov Today 15:16\u201322","journal-title":"Drug Discov Today"},{"key":"226_CR7","doi-asserted-by":"publisher","first-page":"2554","DOI":"10.1016\/j.jprot.2011.05.011","volume":"74","author":"A Koutsoukas","year":"2011","unstructured":"Koutsoukas A, Simms B, Kirchmair J, Bond PJ, Whitmore AV, Zimmer S, Young MP, Jenkins JL, Glick M, Glen RC, Bender A (2011) From in silico target prediction to multi-target drug design: current databases, methods and applications. J Proteomics 74:2554\u20132574","journal-title":"J Proteomics"},{"key":"226_CR8","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1385\/MB:27:2:139","volume":"27","author":"DA Winkler","year":"2004","unstructured":"Winkler DA (2004) Neural networks as robust tools in drug lead discovery and development. Mol Biotechnol 27:139\u2013168","journal-title":"Mol Biotechnol"},{"key":"226_CR9","first-page":"1460","volume":"42","author":"PD Mosier","year":"2002","unstructured":"Mosier PD, Jurs PC (2002) QSAR\/QSPR studies using probabilistic neural networks and generalized regression neural networks. J Chem Inf Model 42:1460\u20131470","journal-title":"J Chem Inf Model"},{"key":"226_CR10","doi-asserted-by":"publisher","first-page":"3183","DOI":"10.1021\/jm980697n","volume":"42","author":"FR Burden","year":"1999","unstructured":"Burden FR (1999) Robust QSAR models using bayesian regularized neural networks. J Med Chem 42:3183\u20133187","journal-title":"J Med Chem"},{"key":"226_CR11","doi-asserted-by":"publisher","first-page":"450","DOI":"10.1021\/ci970100x","volume":"38","author":"J Huuskonen","year":"1998","unstructured":"Huuskonen J, Salo M, Taskinen J (1998) Aqueous solubility prediction of drugs based on molecular topology and neural network modeling. J Chem Inf Comput Sci 38:450\u2013456","journal-title":"J Chem Inf Comput Sci"},{"key":"226_CR12","first-page":"121","volume":"39","author":"B Lucic","year":"1999","unstructured":"Lucic B, Trinajstic N (1999) Multivariate regression outperforms several robust architectures of neural networks in QSAR modeling. J Chem Inf Model 39:121\u2013132","journal-title":"J Chem Inf Model"},{"key":"226_CR13","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1016\/S0166-1280(02)00619-X","volume":"622","author":"SP Niculescu","year":"2003","unstructured":"Niculescu SP (2003) Artificial neural networks and genetic algorithms in QSAR. J Mol Struct (Thoechem) 622:71\u201383","journal-title":"J Mol Struct (Thoechem)"},{"key":"226_CR14","first-page":"903","volume":"42","author":"DK Agrafiotis","year":"2002","unstructured":"Agrafiotis DK, Cedeno W, Lobanov VS (2002) On the use of neural network ensembles in QSAR and QSPR. J Chem Inf Model 42:903\u2013911","journal-title":"J Chem Inf Model"},{"key":"226_CR15","doi-asserted-by":"publisher","first-page":"800","DOI":"10.1021\/ci050022a","volume":"45","author":"R Guha","year":"2005","unstructured":"Guha R, Jurs PC (2005) Interpreting computational neural network QSAR models: a measure of descriptor importance. J Chem Inf Model 45:800\u2013806","journal-title":"J Chem Inf Model"},{"key":"226_CR16","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1016\/S0223-5234(99)80052-X","volume":"34","author":"DT Manallack","year":"1999","unstructured":"Manallack DT, Livingstone DJ (1999) Neural networks in drug discovery: have they lived up to their promise? Eur J Med Chem 34:195\u2013208","journal-title":"Eur J Med Chem"},{"key":"226_CR17","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/S0893-6080(99)00094-5","volume":"13","author":"G Schneider","year":"2000","unstructured":"Schneider G (2000) Neural networks are useful tools for drug design. Neural Netw 13:15\u201316","journal-title":"Neural Netw"},{"key":"226_CR18","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1002\/minf.201501008","volume":"35","author":"E Gawehn","year":"2016","unstructured":"Gawehn E, Hiss JA, Schneider G (2016) Deep learning in drug discovery. Mol Inform 35:3\u201314","journal-title":"Mol Inform"},{"key":"226_CR19","doi-asserted-by":"publisher","first-page":"263","DOI":"10.1021\/ci500747n","volume":"55","author":"J Ma","year":"2015","unstructured":"Ma J, Sheridan RP, Liaw A, Dahl GE, Svetnik V (2015) Deep neural nets as a method for quantitative structure\u2013activity relationships. J Chem Inf Model 55:263\u2013274","journal-title":"J Chem Inf Model"},{"key":"226_CR20","first-page":"80","volume":"3","author":"GK Andreas Mayr","year":"2016","unstructured":"Andreas Mayr GK, Unterthiner T, Hochreiter S (2016) DeepTox: toxicity prediction using deep learning. Front Environ Sci 3:80","journal-title":"Front Environ Sci"},{"key":"226_CR21","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1109\/MCI.2010.938364","volume":"5","author":"I Arel","year":"2010","unstructured":"Arel I, Rose DC, Karnowski TP (2010) Deep machine learning\u2014a new frontier in artificial intelligence research [research frontier]. IEEE Comput Intell Mag 5:13\u201318","journal-title":"IEEE Comput Intell Mag"},{"key":"226_CR22","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton G (2015) Deep learning. Nature 521:436\u2013444","journal-title":"Nature"},{"key":"226_CR23","doi-asserted-by":"publisher","first-page":"1798","DOI":"10.1109\/TPAMI.2013.50","volume":"35","author":"Y Bengio","year":"2013","unstructured":"Bengio Y, Courville A, Vincent P (2013) Representation learning: a review and new perspectives. IEEE Trans Pattern Anal Mach Intell 35:1798\u20131828","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"226_CR24","first-page":"469","volume":"2010","author":"G Dahl","year":"2010","unstructured":"Dahl G, Mohamed A-R, Hinton GE (2010) Phone recognition with the mean-covariance restricted Boltzmann machine. Adv Neural Inf Process Syst 2010:469\u2013477","journal-title":"Adv Neural Inf Process Syst"},{"key":"226_CR25","doi-asserted-by":"crossref","unstructured":"Ciresan D, Meier U, Schmidhuber J (2012) Multi-column deep neural networks for image classification. In: Proceedings of the IEEE international conference on computer vision and pattern recognition (CVPR), pp 3642\u20133649","DOI":"10.1109\/CVPR.2012.6248110"},{"key":"226_CR26","doi-asserted-by":"publisher","first-page":"3207","DOI":"10.1162\/NECO_a_00052","volume":"22","author":"DC Cire\u015fan","year":"2010","unstructured":"Cire\u015fan DC, Meier U, Gambardella LM, Schmidhuber J (2010) Deep, big, simple neural nets for handwritten digit recognition. Neural Comput 22:3207\u20133220","journal-title":"Neural Comput"},{"key":"226_CR27","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/S0167-7012(00)00201-3","volume":"43","author":"IA Basheer","year":"2000","unstructured":"Basheer IA, Hajmeer M (2000) Artificial neural networks: fundamentals, computing, design, and application. J Microbiol Methods 43:3\u201331","journal-title":"J Microbiol Methods"},{"key":"226_CR28","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1007\/BF02478259","volume":"5","author":"WS McCulloch","year":"1943","unstructured":"McCulloch WS, Pitts W (1943) A logical calculus of the ideas immanent in nervous activity. Bull Math Biophys 5:115\u2013133","journal-title":"Bull Math Biophys"},{"key":"226_CR29","first-page":"1","volume":"10","author":"H Larochelle","year":"2009","unstructured":"Larochelle H, Bengio Y, Louradour M, Lamblin P (2009) Exploring strategies for training deep neural networks. J Mach Learn Res 10:1\u201340","journal-title":"J Mach Learn Res"},{"key":"226_CR30","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1038\/323533a0","volume":"323","author":"DE Rumelhart","year":"1986","unstructured":"Rumelhart DE, Hinton GE, Williams RJ (1986) Learning representations by back-propagating errors. Nature 323:533\u2013536","journal-title":"Nature"},{"key":"226_CR31","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava N, Hinton G, Krizhevsky A, Sutskever I, Salakhutdinov R (2014) Dropout: a simple way to prevent neural networks from overfitting. J Mach Learn Res 15:1929\u20131958","journal-title":"J Mach Learn Res"},{"key":"226_CR32","doi-asserted-by":"publisher","first-page":"879","DOI":"10.1109\/JPROC.2008.917757","volume":"96","author":"JD Owens","year":"2008","unstructured":"Owens JD, Houston M, Luebke D, Green S, Stone JE, Phillips JC (2008) GPU computing. Proc IEEE 96:879\u2013899","journal-title":"Proc IEEE"},{"key":"226_CR33","doi-asserted-by":"publisher","first-page":"1563","DOI":"10.1021\/ci400187y","volume":"53","author":"A Lusci","year":"2013","unstructured":"Lusci A, Pollastri G, Baldi P (2013) Deep architectures and deep learning in chemoinformatics: the prediction of aqueous solubility for drug-like molecules. J Chem Inf Model 53:1563\u20131575","journal-title":"J Chem Inf Model"},{"key":"226_CR34","doi-asserted-by":"publisher","first-page":"2085","DOI":"10.1021\/acs.jcim.5b00238","volume":"55","author":"Y Xu","year":"2015","unstructured":"Xu Y, Dai Z, Chen F, Gao S, Pei J, Lai L (2015) Deep learning for drug-induced liver injury. J Chem Inf Model 55:2085\u20132093","journal-title":"J Chem Inf Model"},{"key":"226_CR35","doi-asserted-by":"publisher","first-page":"2524","DOI":"10.1021\/acs.molpharmaceut.6b00248","volume":"13","author":"A Aliper","year":"2016","unstructured":"Aliper A, Plis S, Artemov A, Ulloa A, Mamoshina P, Zhavoronkov A (2016) Deep learning applications for predicting pharmacological properties of drugs and drug repurposing using transcriptomic data. Mol Pharm 13:2524\u20132530","journal-title":"Mol Pharm"},{"key":"226_CR36","unstructured":"Aspuru-Guzik A, Duvenaud D, Maclaurin D, Aguilera-Iparraguire J, Gomez-Bombarelli R, Hirzel TD, Adams RP (2015) Convolutional networks on graphs for learning molecular fingerprints. In: Proceedings of neural information processing systems, Quebec, pp 2224\u20132232"},{"key":"226_CR37","unstructured":"Team TTD, Al-Rfou R, Alain G, Almahairi A, Angermueller C, Bahdanau D, Ballas N, Bastien F, Bayer J, Belikov A (2016) Theano: a Python framework for fast computation of mathematical expressions. arXiv preprint arXiv:1605.02688"},{"key":"226_CR38","doi-asserted-by":"crossref","unstructured":"Jia Y, Shelhamer E, Donahue J, Karayev S, Long J, Girshick R, Guadarrama S, Darrell T (2014) Caffe: convolutional architecture for fast feature embedding. In: Proceedings of the ACM international conference on multimedia, 2014. ACM, pp 675\u2013678","DOI":"10.1145\/2647868.2654889"},{"key":"226_CR39","doi-asserted-by":"crossref","unstructured":"Zeiler MD, Ranzato M, Monga R, Mao M, Yang K, Le QV, Nguyen P, Senior A, Vanhoucke V, Dean J, Hinton GE (2013) On rectified linear units for speech processing. In: Proceedings of IEEE international conference on acoustics, speech and signal processing, Vancouver, pp 3517\u20133521","DOI":"10.1109\/ICASSP.2013.6638312"},{"key":"226_CR40","doi-asserted-by":"publisher","first-page":"319","DOI":"10.1021\/ci2003126","volume":"52","author":"P Tiikkainen","year":"2012","unstructured":"Tiikkainen P, Franke L (2012) Analysis of commercial and public bioactivity databases. J Chem Inf Model 52:319\u2013326","journal-title":"J Chem Inf Model"},{"key":"226_CR41","doi-asserted-by":"publisher","first-page":"685","DOI":"10.1016\/j.drudis.2012.02.013","volume":"17","author":"AJ Williams","year":"2012","unstructured":"Williams AJ, Ekins S, Tkachenko V (2012) Towards a gold standard: regarding quality in public domain chemistry databases and approaches to improving the situation. Drug Discov Today 17:685\u2013701","journal-title":"Drug Discov Today"},{"key":"226_CR42","doi-asserted-by":"publisher","first-page":"5165","DOI":"10.1021\/jm300131x","volume":"55","author":"C Kramer","year":"2012","unstructured":"Kramer C, Kalliokoski T, Gedeck P, Vulpetti A (2012) The experimental uncertainty of heterogeneous PublicKiData. J Med Chem 55:5165\u20135173","journal-title":"J Med Chem"},{"key":"226_CR43","doi-asserted-by":"publisher","first-page":"1213","DOI":"10.1016\/j.drudis.2016.03.015","volume":"21","author":"C Kramer","year":"2016","unstructured":"Kramer C, Dahl G, Tyrchan C, Ulander J (2016) A comprehensive company database analysis of biological assay variability. Drug Discov Today 21:1213\u20131221","journal-title":"Drug Discov Today"},{"key":"226_CR44","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1177\/1087057103260590","volume":"9","author":"M Glick","year":"2004","unstructured":"Glick M (2004) Enrichment of extremely noisy high-throughput screening data using a Naive Bayes classifier. J Biomol Screen 9:32\u201336","journal-title":"J Biomol Screen"},{"key":"226_CR45","doi-asserted-by":"publisher","first-page":"857","DOI":"10.1007\/s10822-008-9240-5","volume":"22","author":"R Guha","year":"2008","unstructured":"Guha R (2008) On the interpretation and interpretability of quantitative structure\u2013activity relationship models. J Comput Aided Mol Des 22:857\u2013871","journal-title":"J Comput Aided Mol Des"},{"key":"226_CR46","doi-asserted-by":"publisher","first-page":"2551","DOI":"10.1021\/ci9002206","volume":"49","author":"L Carlsson","year":"2009","unstructured":"Carlsson L, Helgee EA, Boyer S (2009) Interpretation of nonlinear QSAR models applied to AMES mutagenicity data. J Chem Inf Model 49:2551\u20132558","journal-title":"J Chem Inf Model"},{"key":"226_CR47","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1186\/1758-2946-3-11","volume":"3","author":"L Rosenbaum","year":"2011","unstructured":"Rosenbaum L, Hinselmann G, Jahn A, Zell A (2011) Interpreting linear support vector machine models with heat map molecule coloring. J Cheminform 3:11","journal-title":"J Cheminform"},{"key":"226_CR48","doi-asserted-by":"publisher","first-page":"D1083","DOI":"10.1093\/nar\/gkt1031","volume":"42","author":"AP Bento","year":"2014","unstructured":"Bento AP, Gaulton A, Hersey A, Bellis LJ, Chambers J, Davies M, Kr\u00fcger FA, Light Y, Mak L, McGlinchey S, Nowotka M, Papadatos G, Santos R, Overington JP (2014) The ChEMBL bioactivity database: an update. Nucleic Acids Res 42:D1083\u2013D1090","journal-title":"Nucleic Acids Res"},{"key":"226_CR49","doi-asserted-by":"publisher","first-page":"D1100","DOI":"10.1093\/nar\/gkr777","volume":"40","author":"A Gaulton","year":"2011","unstructured":"Gaulton A, Bellis LJ, Bento AP, Chambers J, Davies M, Hersey A, Light Y, McGlinchey S, Michalovich D, Al-Lazikani B, Overington JP (2011) ChEMBL: a large-scale bioactivity database for drug discovery. Nucleic Acids Res 40:D1100\u2013D1107","journal-title":"Nucleic Acids Res"},{"key":"226_CR50","unstructured":"Molecular Operating Environment (MOE) 2013.08. Chemical Computing Group Inc.: Sherbooke St. West, Suite #910, Montreal, QC, Canada, H3A 2R7, 2016"},{"key":"226_CR51","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1021\/ci100050t","volume":"50","author":"D Rogers","year":"2010","unstructured":"Rogers D, Hahn M (2010) Extended-connectivity fingerprints. J Chem Inf Model 50:742\u2013754","journal-title":"J Chem Inf Model"},{"key":"226_CR52","unstructured":"Landrum G. RDKit: Open-source cheminformatics. http:\/\/www.rdkit.org"},{"key":"226_CR53","doi-asserted-by":"publisher","first-page":"108","DOI":"10.1021\/ci800249s","volume":"49","author":"A Bender","year":"2009","unstructured":"Bender A, Jenkins JL, Scheiber J, Sukuru SCK, Glick M, Davies JW (2009) How similar are similarity searching methods? A principal component analysis of molecular descriptor space. J Chem Inf Model 49:108\u2013119","journal-title":"J Chem Inf Model"},{"key":"226_CR54","unstructured":"McCallum A, Nigam K (1998) A comparison of event models for Naive Bayes text classification. In: Proceedings of the AAAI-98 workshop on learning for text categorization, vol 752, pp 41\u201348"},{"key":"226_CR55","series-title":"Lecture notes in computer science","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1007\/BFb0026666","volume-title":"Machine learning: ECML-98. ECML 1998","author":"DD Lewis","year":"1998","unstructured":"Lewis DD (1998) Naive (Bayes) at forty: the independence assumption in information retrieval. In: N\u00e9dellec C, Rouveirol C (eds) Machine learning: ECML-98. ECML 1998. Lecture notes in computer science, vol 1398. Springer, Berlin, Heidelberg, pp 4\u201315"},{"key":"226_CR56","first-page":"841","volume":"14","author":"A Jordan","year":"2002","unstructured":"Jordan A (2002) On discriminative vs. generative classifiers: a comparison of logistic regression and naive bayes. Adv Neural Inf Process Syst 14:841","journal-title":"Adv Neural Inf Process Syst"},{"key":"226_CR57","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V (2011) Scikit-learn: machine learning in Python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"226_CR58","doi-asserted-by":"crossref","first-page":"175","DOI":"10.1080\/00031305.1992.10475879","volume":"46","author":"NS Altman","year":"1992","unstructured":"Altman NS (1992) An introduction to kernel and nearest-neighbor nonparametric regression. Am Stat 46:175\u2013185","journal-title":"Am Stat"},{"key":"226_CR59","first-page":"1947","volume":"43","author":"V Svetnik","year":"2003","unstructured":"Svetnik V, Liaw A, Tong C, Culberson JC, Sheridan RP, Feuston BP (2003) Random forest: a classification and regression tool for compound classification and QSAR modeling. J Chem Inf Model 43:1947\u20131958","journal-title":"J Chem Inf Model"},{"key":"226_CR60","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Mach Learn 45:5\u201332","journal-title":"Mach Learn"},{"key":"226_CR61","doi-asserted-by":"publisher","first-page":"2507","DOI":"10.1093\/bioinformatics\/btm344","volume":"23","author":"Y Saeys","year":"2007","unstructured":"Saeys Y, Inza I, Larranaga P (2007) A review of feature selection techniques in bioinformatics. Bioinformatics 23:2507\u20132517","journal-title":"Bioinformatics"},{"key":"226_CR62","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1471-2105-7-3","volume":"7","author":"R D\u00edaz-Uriarte","year":"2006","unstructured":"D\u00edaz-Uriarte R, Alvarez de Andr\u00e9s S (2006) Gene selection and classification of microarray data using random forest. BMC Bioinform 7:3","journal-title":"BMC Bioinform"},{"key":"226_CR63","doi-asserted-by":"publisher","first-page":"468","DOI":"10.1002\/wcms.1183","volume":"4","author":"JBO Mitchell","year":"2014","unstructured":"Mitchell JBO (2014) Machine learning methods in chemoinformatics. Wiley Interdiscipl Rev Comput Mol Sci 4:468\u2013481","journal-title":"Wiley Interdiscipl Rev Comput Mol Sci"},{"key":"226_CR64","first-page":"99","volume":"36","author":"SJ Barrett","year":"2006","unstructured":"Barrett SJ, Langdon WB (2006) Advances in the application of machine learning techniques in drug discovery. Des Dev 36:99\u2013110","journal-title":"Des Dev"},{"key":"226_CR65","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes C, Vapnik V (1995) Support-vector networks. Mach Learn 20:273\u2013297","journal-title":"Mach Learn"},{"key":"226_CR66","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1961189.1961199","volume":"2","author":"C-C Chang","year":"2011","unstructured":"Chang C-C, Lin C-J (2011) Libsvm. ACM Trans Intell Syst Technol 2:1\u201327","journal-title":"ACM Trans Intell Syst Technol"},{"key":"226_CR67","first-page":"1871","volume":"9","author":"R-E Fan","year":"2008","unstructured":"Fan R-E, Chang K-W, Hsieh C-J, Wang X-R, Lin C-J (2008) LIBLINEAR: a library for large linear classification. J Mach Learn Res 9:1871\u20131874","journal-title":"J Mach Learn Res"},{"key":"226_CR68","doi-asserted-by":"publisher","first-page":"3211","DOI":"10.1021\/ci500344v","volume":"54","author":"J Alvarsson","year":"2014","unstructured":"Alvarsson J, Eklund M, Andersson C, Carlsson L, Spjuth O, Wikberg JE (2014) Benchmarking study of parameter variation when using signature fingerprints together with support vector machines. J Chem Inf Model 54:3211\u20133217","journal-title":"J Chem Inf Model"},{"key":"226_CR69","unstructured":"Chu H. OpenLDAP lighting memory-mapped database. http:\/\/symas.com\/mdb\/"},{"key":"226_CR70","unstructured":"Group TH. Hierarchical data format (HDF). www.hdfgroup.org"},{"key":"226_CR71","doi-asserted-by":"publisher","first-page":"442","DOI":"10.1016\/0005-2795(75)90109-9","volume":"405","author":"BW Matthews","year":"1975","unstructured":"Matthews BW (1975) Comparison of the predicted and observed secondary structure of T4 phage lysozyme. Biochim Biophys Acta (BBA) Protein Struct 405:442\u2013451","journal-title":"Biochim Biophys Acta (BBA) Protein Struct"},{"key":"226_CR72","doi-asserted-by":"publisher","first-page":"412","DOI":"10.1093\/bioinformatics\/16.5.412","volume":"16","author":"P Baldi","year":"2000","unstructured":"Baldi P, Brunak S, Chauvin Y, Andersen CAF, Nielsen H (2000) Assessing the accuracy of prediction algorithms for classification: an overview. Bioinformatics 16:412\u2013424","journal-title":"Bioinformatics"},{"key":"226_CR73","doi-asserted-by":"publisher","first-page":"80","DOI":"10.2307\/3001968","volume":"1","author":"F Wilcoxon","year":"1945","unstructured":"Wilcoxon F (1945) Individual comparisons by ranking methods. Biom Bull 1:80","journal-title":"Biom Bull"},{"key":"226_CR74","unstructured":"Team RC (2014) In: ISBN 3-900051-07-0"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-017-0226-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13321-017-0226-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-017-0226-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,25]],"date-time":"2024-06-25T01:32:43Z","timestamp":1719279163000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-017-0226-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,6,28]]},"references-count":74,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["226"],"URL":"https:\/\/doi.org\/10.1186\/s13321-017-0226-y","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,6,28]]},"assertion":[{"value":"30 September 2016","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 May 2017","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 June 2017","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"42"}}