{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T07:41:30Z","timestamp":1773042090153,"version":"3.50.1"},"reference-count":51,"publisher":"American Chemical Society (ACS)","issue":"4","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J. Chem. Inf. Model."],"published-print":{"date-parts":[[2013,4,22]]},"DOI":"10.1021\/ci4000536","type":"journal-article","created":{"date-parts":[[2013,3,6]],"date-time":"2013-03-06T19:18:06Z","timestamp":1362597486000},"page":"958-971","source":"Crossref","is-referenced-by-count":44,"title":["Oversampling to Overcome Overfitting: Exploring the Relationship between Data Set Composition, Molecular Descriptors, and Predictive Modeling Methods"],"prefix":"10.1021","volume":"53","author":[{"given":"Chia-Yun","family":"Chang","sequence":"first","affiliation":[{"name":"School of Pharmacy, College of Medicine, National Taiwan University, No.1, Sec.1, Jen-Ai Road,\rTaipei, Taiwan 100"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ming-Tsung","family":"Hsu","sequence":"additional","affiliation":[{"name":"Genome\rand Systems Biology Degree Program, College of Life Science, National Taiwan University, No.1 Sec.4, Roosevelt Road,\rTaipei, Taiwan 106"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Emilio Xavier","family":"Esposito","sequence":"additional","affiliation":[{"name":"exeResearch, LLC, 32 University Drive, East Lansing,\rMichigan 48823, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yufeng J.","family":"Tseng","sequence":"additional","affiliation":[{"name":"School of Pharmacy, College of Medicine, National Taiwan University, No.1, Sec.1, Jen-Ai Road,\rTaipei, Taiwan 100"},{"name":"Genome\rand Systems Biology Degree Program, College of Life Science, National Taiwan University, No.1 Sec.4, Roosevelt Road,\rTaipei, Taiwan 106"},{"name":"Department of Computer Science and Information\rEngineering, National Taiwan University, No.1 Sec.4, Roosevelt Road, Taipei, Taiwan 106"},{"name":"Graduate Institute of Biomedical Electronics and\rBioinformatics, National Taiwan University, No.1 Sec.4, Roosevelt Road, Taipei, Taiwan 106"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"316","published-online":{"date-parts":[[2013,3,15]]},"reference":[{"key":"ref1\/cit1","doi-asserted-by":"crossref","first-page":"1047","DOI":"10.1289\/ehp.1001925","volume":"118","author":"Rusyn I.","year":"2010","journal-title":"Environ. Health Perspect."},{"key":"ref2\/cit2","doi-asserted-by":"crossref","first-page":"997","DOI":"10.1016\/j.drudis.2010.07.007","volume":"15","author":"Shukla S. J.","year":"2010","journal-title":"Drug Discovery Today"},{"key":"ref3\/cit3","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1146\/annurev-publhealth-031210-101153","volume":"32","author":"Krewski D.","year":"2011","journal-title":"Annu. Rev. Public Health"},{"key":"ref4\/cit4","doi-asserted-by":"crossref","first-page":"473","DOI":"10.1208\/s12248-012-9358-1","volume":"14","author":"Sun H.","year":"2012","journal-title":"AAPS J."},{"key":"ref5\/cit5","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1016\/j.drudis.2007.12.007","volume":"13","author":"Muster W.","year":"2008","journal-title":"Drug Discovery Today"},{"key":"ref6\/cit6","doi-asserted-by":"crossref","first-page":"16","DOI":"10.1016\/j.drudis.2009.09.010","volume":"15","author":"Merlot C.","year":"2010","journal-title":"Drug Discovery Today"},{"key":"ref7\/cit7","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1016\/j.drudis.2011.10.022","volume":"17","author":"Modi S.","year":"2012","journal-title":"Drug Discovery Today"},{"key":"ref8\/cit8","doi-asserted-by":"crossref","first-page":"2729","DOI":"10.1039\/a905764a","volume":"2","author":"Selassie C. D.","year":"1999","journal-title":"J. Chem. Soc., Perkin Trans."},{"key":"ref9\/cit9","doi-asserted-by":"crossref","first-page":"508","DOI":"10.1039\/b718860a","volume":"10","author":"Garcia-Lorenzo A.","year":"2008","journal-title":"Green Chem."},{"key":"ref10\/cit10","doi-asserted-by":"crossref","first-page":"367","DOI":"10.1007\/s10822-008-9192-9","volume":"22","author":"Guha R.","year":"2008","journal-title":"J. Comput.-Aided Mol. Des."},{"key":"ref11\/cit11","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1016\/S0166-1280(02)00616-4","volume":"622","author":"Cronin M. T. D.","year":"2003","journal-title":"J. Mol. Struct.: THEOCHEM"},{"key":"ref12\/cit12","doi-asserted-by":"crossref","first-page":"284","DOI":"10.1289\/ehp.10727","volume":"116","author":"Xia M.","year":"2008","journal-title":"Environ. Health Perspect."},{"key":"ref13\/cit13","doi-asserted-by":"crossref","first-page":"3310","DOI":"10.1093\/bioinformatics\/btp589","volume":"25","author":"Li Q.","year":"2009","journal-title":"Bioinformatics"},{"key":"ref14\/cit14","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1111\/j.0824-7935.2004.t01-1-00228.x","volume":"20","author":"Estabrooks A.","year":"2004","journal-title":"Comput. Intell."},{"key":"ref15\/cit15","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1145\/1321440.1321461","volume-title":"Proceedings of the sixteenth ACM conference on Conference on information and knowledge management","author":"Ertekin S.","year":"2007"},{"key":"ref16\/cit16","doi-asserted-by":"crossref","first-page":"677","DOI":"10.1109\/DAS.2008.74","volume-title":"Proceedings of the 2008 The Eighth IAPR International Workshop on Document Analysis Systems","author":"Gazzah S.","year":"2008"},{"key":"ref17\/cit17","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1109\/TSMCB.2008.2002909","volume":"39","author":"Tang Y.","year":"2009","journal-title":"Trans. Sys. Man Cyber. Part B"},{"key":"ref18\/cit18","doi-asserted-by":"crossref","first-page":"191","DOI":"10.1016\/j.dss.2009.07.011","volume":"48","author":"Sun A. X.","year":"2009","journal-title":"Decis. Support Syst."},{"key":"ref19\/cit19","doi-asserted-by":"crossref","first-page":"557","DOI":"10.1016\/j.patcog.2006.01.009","volume":"40","author":"Xie J. G.","year":"2007","journal-title":"Pattern Recognit."},{"key":"ref20\/cit20","volume-title":"Neural Networks: A Comprehensive Foundation","author":"Haykin S. S.","year":"1998"},{"key":"ref21\/cit21","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"Breiman L.","year":"2001","journal-title":"Mach. Learn."},{"key":"ref22\/cit22","first-page":"81","volume":"1","author":"Quinlan J. R.","year":"1986","journal-title":"Mach. Learn."},{"key":"ref23\/cit23","doi-asserted-by":"crossref","first-page":"241","DOI":"10.1186\/1471-2105-9-241","volume":"9","author":"Judson R.","year":"2008","journal-title":"BMC Bioinf."},{"key":"ref24\/cit24","doi-asserted-by":"crossref","first-page":"232","DOI":"10.1007\/s12539-011-0102-9","volume":"3","author":"Sharma A.","year":"2011","journal-title":"Interdiscip. Sci.:, Comput. Life Sci."},{"key":"ref25\/cit25","doi-asserted-by":"crossref","first-page":"1947","DOI":"10.1021\/ci034160g","volume":"43","author":"Svetnik V.","year":"2003","journal-title":"J. Chem. Inf. Comput. Sci."},{"key":"ref26\/cit26","doi-asserted-by":"crossref","first-page":"2481","DOI":"10.1021\/ci900203n","volume":"49","author":"Polishchuk P. G.","year":"2009","journal-title":"J. Chem. Inf. Model."},{"key":"ref27\/cit27","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1016\/j.tox.2005.08.019","volume":"217","author":"Zhao C. Y.","year":"2006","journal-title":"Toxicology"},{"key":"ref28\/cit28","doi-asserted-by":"crossref","first-page":"5714","DOI":"10.1021\/cr900238d","volume":"110","author":"Katritzky A. R.","year":"2010","journal-title":"Chem. Rev."},{"key":"ref29\/cit29","doi-asserted-by":"crossref","first-page":"536","DOI":"10.1021\/ci050358k","volume":"46","author":"von Korff M.","year":"2006","journal-title":"J. Chem. Inf. Model."},{"key":"ref30\/cit30","doi-asserted-by":"crossref","first-page":"312","DOI":"10.1021\/jm040835a","volume":"48","author":"Kazius J.","year":"2005","journal-title":"J. Med. Chem."},{"key":"ref31\/cit31","doi-asserted-by":"crossref","first-page":"1630","DOI":"10.1021\/ci049869h","volume":"44","author":"Xue Y.","year":"2004","journal-title":"J. Chem. Inf. Comput. Sci."},{"key":"ref32\/cit32","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1007\/s10822-011-9511-4","volume":"26","author":"Tseng Y. J.","year":"2012","journal-title":"J. Comput.-Aided Mol. Des."},{"key":"ref33\/cit33","volume-title":"Pharmacophores and Pharmacophore Searches","author":"Renner S.","year":"2006"},{"key":"ref34\/cit34","doi-asserted-by":"crossref","first-page":"1660","DOI":"10.1021\/ci300060b","volume":"52","author":"Su B. H.","year":"2012","journal-title":"J. Chem. Inf. Model."},{"key":"ref35\/cit35","doi-asserted-by":"crossref","first-page":"934","DOI":"10.1021\/tx200099j","volume":"24","author":"Shen M. Y.","year":"2011","journal-title":"Chem. Res. Toxicol."},{"key":"ref36\/cit36","doi-asserted-by":"crossref","first-page":"1526","DOI":"10.1021\/ci049898s","volume":"44","author":"Senese C. L.","year":"2004","journal-title":"J. Chem. Inf. Comput. Sci."},{"key":"ref37\/cit37","unstructured":"Molecular Operating Environment (MOE). Chemical Computing Group Inc.:1010 Sherbooke St. West, Suite #910, Montreal, QC, Canada, H3A 2R7, 2011."},{"key":"ref38\/cit38","unstructured":"MOE (Molecular Operating Environment). Chemical Computing Group, Inc.:Montreal, Canada, 2008."},{"key":"ref39\/cit39","unstructured":"Lin, A.QuaSAR-Descriptor. November 2012. Available fromhttp:\/\/www.chemcomp.com\/journal\/descr.htm."},{"key":"ref40\/cit40","doi-asserted-by":"crossref","first-page":"2894","DOI":"10.1002\/(SICI)1521-3773(19991004)38:19<2894::AID-ANIE2894>3.0.CO;2-F","volume":"38","author":"Schneider G.","year":"1999","journal-title":"Angew. Chem., Int. Ed. Engl."},{"key":"ref41\/cit41","volume-title":"Statistical Learning Theory","author":"Vapnik V. N.","year":"1998"},{"key":"ref42\/cit42","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4757-3264-1","volume-title":"The Nature of Statistical Learning Theory","author":"Vapnik V. N.","year":"2000"},{"key":"ref43\/cit43","first-page":"18","volume":"2","author":"Liaw A.","year":"2002","journal-title":"R News"},{"key":"ref44\/cit44","unstructured":"Team, R. D. C.R: A language and environment for statistical computing;R Foundation for Statistical Computing:Vienna, Austria, 2011."},{"key":"ref45\/cit45","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1961189.1961199","volume":"2","author":"Chang C.-C.","year":"2011","journal-title":"ACM Trans. Intell. Syst. Technol."},{"key":"ref46\/cit46","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1177\/001316446002000104","volume":"20","author":"Cohen J. A.","year":"1960","journal-title":"Educ. Psychol. Meas."},{"key":"ref47\/cit47","doi-asserted-by":"crossref","first-page":"2345","DOI":"10.1021\/ci700157b","volume":"47","author":"Rucker C.","year":"2007","journal-title":"J. Chem. Inf. Model."},{"key":"ref48\/cit48","unstructured":"PubChem Substructure Fingerprint, 2009."},{"key":"ref49\/cit49","first-page":"133","volume":"14","author":"Schwartzman R. A.","year":"1993","journal-title":"Endocr. Rev."},{"key":"ref50\/cit50","doi-asserted-by":"crossref","first-page":"725","DOI":"10.1016\/S0006-3495(01)75737-2","volume":"81","author":"Groot R. D.","year":"2001","journal-title":"Biophys. J."},{"key":"ref51\/cit51","doi-asserted-by":"crossref","first-page":"2143","DOI":"10.1246\/bcsj.69.2143","volume":"69","author":"Nakamura E.","year":"1996","journal-title":"Bull. Chem. Soc. Jpn."}],"container-title":["Journal of Chemical Information and Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/ci4000536","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,16]],"date-time":"2023-04-16T08:53:07Z","timestamp":1681635187000},"score":1,"resource":{"primary":{"URL":"https:\/\/pubs.acs.org\/doi\/10.1021\/ci4000536"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,3,15]]},"references-count":51,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2013,4,22]]}},"alternative-id":["10.1021\/ci4000536"],"URL":"https:\/\/doi.org\/10.1021\/ci4000536","relation":{},"ISSN":["1549-9596","1549-960X"],"issn-type":[{"value":"1549-9596","type":"print"},{"value":"1549-960X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,3,15]]}}}