{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,19]],"date-time":"2026-03-19T18:06:46Z","timestamp":1773943606999,"version":"3.50.1"},"publisher-location":"New York, NY","reference-count":30,"publisher":"Springer US","isbn-type":[{"value":"9781071601495","type":"print"},{"value":"9781071601501","type":"electronic"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-1-0716-0150-1_5","type":"book-chapter","created":{"date-parts":[[2020,1,16]],"date-time":"2020-01-16T13:29:19Z","timestamp":1579181359000},"page":"97-109","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["Importance of Data Curation in QSAR Studies Especially While Modeling Large-Size Datasets"],"prefix":"10.1007","author":[{"given":"Pravin","family":"Ambure","sequence":"first","affiliation":[]},{"given":"M. Nat\u00e1lia Dias Soeiro","family":"Cordeiro","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,1,17]]},"reference":[{"issue":"17-18","key":"5_CR1","doi-asserted-by":"publisher","first-page":"747","DOI":"10.1016\/j.drudis.2011.07.007","volume":"16","author":"Antony J. Williams","year":"2011","unstructured":"Williams AJ, Ekins S (2011) A quality alert and call for improved curation of public chemistry databases. \u200eDrug Discov Today 16:747\u2013750","journal-title":"Drug Discovery Today"},{"issue":"9","key":"5_CR2","doi-asserted-by":"publisher","first-page":"897","DOI":"10.1007\/s10822-015-9865-0","volume":"29","author":"M Waldman","year":"2015","unstructured":"Waldman M, Fraczkiewicz R, Clark RD (2015) Tales from the war on error: the art and science of curating QSAR data. J Comput Aided Mol Des 29(9):897\u2013910","journal-title":"J Comput Aided Mol Des"},{"key":"5_CR3","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/j.ddtec.2015.01.005","volume":"14","author":"A Hersey","year":"2015","unstructured":"Hersey A, Chambers J, Bellis L, Bento AP, Gaulton A, Overington JP (2015) Chemical databases: curation or integration by user-defined equivalence? Drug Discov Today Technol 14:17\u201324","journal-title":"Drug Discov Today Technol"},{"issue":"D1","key":"5_CR4","doi-asserted-by":"publisher","first-page":"D1202","DOI":"10.1093\/nar\/gkv951","volume":"44","author":"S Kim","year":"2015","unstructured":"Kim S, Thiessen PA, Bolton EE, Chen J, Fu G, Gindulyte A, Han L, He J, He S, Shoemaker BA (2015) PubChem substance and compound databases. Nucleic Acids Res 44(D1):D1202\u2013D1213","journal-title":"Nucleic Acids Res"},{"issue":"D1","key":"5_CR5","doi-asserted-by":"publisher","first-page":"D1100","DOI":"10.1093\/nar\/gkr777","volume":"40","author":"A Gaulton","year":"2011","unstructured":"Gaulton A, Bellis LJ, Bento AP, Chambers J, Davies M, Hersey A, Light Y, McGlinchey S, Michalovich D, Al-Lazikani B (2011) ChEMBL: a large-scale bioactivity database for drug discovery. Nucleic Acids Res 40(D1):D1100\u2013D1107","journal-title":"Nucleic Acids Res"},{"issue":"Suppl_1","key":"5_CR6","first-page":"D198","volume":"35","author":"T Liu","year":"2006","unstructured":"Liu T, Lin Y, Wen X, Jorissen RN, Gilson MK (2006) BindingDB: a web-accessible database of experimentally determined protein\u2013ligand binding affinities. Nucleic Acids Res 35(Suppl_1):D198\u2013D201","journal-title":"Nucleic Acids Res"},{"issue":"Suppl_1","key":"5_CR7","doi-asserted-by":"publisher","first-page":"D344","DOI":"10.1093\/nar\/gkm791","volume":"36","author":"K Degtyarenko","year":"2007","unstructured":"Degtyarenko K, De Matos P, Ennis M, Hastings J, Zbinden M, McNaught A, Alc\u00e1ntara R, Darsow M, Guedj M, Ashburner M (2007) ChEBI: a database and ontology for chemical entities of biological interest. Nucleic Acids Res 36(Suppl_1):D344\u2013D350","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"5_CR8","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1021\/ci049714+","volume":"45","author":"JJ Irwin","year":"2005","unstructured":"Irwin JJ, Shoichet BK (2005) ZINC\u2212 a free database of commercially available compounds for virtual screening. J Chem Inf Model 45(1):177\u2013182","journal-title":"J Chem Inf Model"},{"issue":"11","key":"5_CR9","doi-asserted-by":"publisher","first-page":"1123","DOI":"10.1021\/ed100697w","volume":"87","author":"Harry E. Pence","year":"2010","unstructured":"Pence HE, Williams A (2010) ChemSpider: an online chemical information resource. J Chem Educ 87(11):1123\u20131124","journal-title":"Journal of Chemical Education"},{"issue":"11\u201312","key":"5_CR10","doi-asserted-by":"publisher","first-page":"1337","DOI":"10.1002\/qsar.200810084","volume":"27","author":"D Young","year":"2008","unstructured":"Young D, Martin T, Venkatapathy R, Harten P (2008) Are the chemical structures in your QSAR correct? QSAR Comb Sci 27(11\u201312):1337\u20131345","journal-title":"QSAR Comb Sci"},{"issue":"13\u201314","key":"5_CR11","doi-asserted-by":"publisher","first-page":"685","DOI":"10.1016\/j.drudis.2012.02.013","volume":"17","author":"AJ Williams","year":"2012","unstructured":"Williams AJ, Ekins S, Tkachenko V (2012) Towards a gold standard: regarding quality in public domain chemistry databases and approaches to improving the situation. Drug Discov Today 17(13\u201314):685\u2013701","journal-title":"Drug Discov Today"},{"issue":"11","key":"5_CR12","doi-asserted-by":"publisher","first-page":"5165","DOI":"10.1021\/jm300131x","volume":"55","author":"C Kramer","year":"2012","unstructured":"Kramer C, Kalliokoski T, Gedeck P, Vulpetti A (2012) The experimental uncertainty of heterogeneous public K i data. J Med Chem 55(11):5165\u20135173","journal-title":"J Med Chem"},{"issue":"10","key":"5_CR13","doi-asserted-by":"publisher","first-page":"2499","DOI":"10.1021\/ci400099q","volume":"53","author":"P Tiikkainen","year":"2013","unstructured":"Tiikkainen P, Bellis L, Light Y, Franke L (2013) Estimating error rates in bioactivity databases. J Chem Inf Model 53(10):2499\u20132505","journal-title":"J Chem Inf Model"},{"issue":"4","key":"5_CR14","doi-asserted-by":"publisher","first-page":"e61007","DOI":"10.1371\/journal.pone.0061007","volume":"8","author":"T Kalliokoski","year":"2013","unstructured":"Kalliokoski T, Kramer C, Vulpetti A, Gedeck P (2013) Comparability of mixed IC50 data\u2013a statistical analysis. PLoS One 8(4):e61007","journal-title":"PLoS One"},{"issue":"9","key":"5_CR15","doi-asserted-by":"publisher","first-page":"885","DOI":"10.1007\/s10822-015-9860-5","volume":"29","author":"G Papadatos","year":"2015","unstructured":"Papadatos G, Gaulton A, Hersey A, Overington JP (2015) Activity, assay and target data curation and quality in the ChEMBL database. J Comput Aided Mol Des 29(9):885\u2013896","journal-title":"J Comput Aided Mol Des"},{"issue":"11","key":"5_CR16","doi-asserted-by":"publisher","first-page":"911","DOI":"10.1080\/1062936X.2016.1253611","volume":"27","author":"K Mansouri","year":"2016","unstructured":"Mansouri K, Grulke C, Richard A, Judson R, Williams A (2016) An automated curation procedure for addressing chemical errors and inconsistencies in public datasets used in QSAR modelling. SAR QSAR Environ Res 27(11):911\u2013937","journal-title":"SAR QSAR Environ Res"},{"issue":"1","key":"5_CR17","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1145\/1656274.1656280","volume":"11","author":"MR Berthold","year":"2009","unstructured":"Berthold MR, Cebron N, Dill F, Gabriel TR, K\u00f6tter T, Meinl T, Ohl P, Thiel K, Wiswedel B (2009) KNIME-the Konstanz information miner: version 2.0 and beyond. AcM SIGKDD Explorations Newsletter 11(1):26\u201331","journal-title":"AcM SIGKDD Explorations Newsletter"},{"issue":"1","key":"5_CR18","doi-asserted-by":"crossref","first-page":"75","DOI":"10.2478\/s11532-010-0116-x","volume":"9","author":"A Toropova","year":"2011","unstructured":"Toropova A, Toropov A, Benfenati E, Gini G (2011) QSAR modelling toxicity toward rats of inorganic substances by means of CORAL. Open Chem 9(1):75\u201385","journal-title":"Open Chem"},{"issue":"2","key":"5_CR19","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1016\/j.chemolab.2010.12.007","volume":"105","author":"A Toropova","year":"2011","unstructured":"Toropova A, Toropov A, Benfenati E, Gini G (2011) Co-evolutions of correlations for QSAR of toxicity of organometallic and inorganic substances: an unexpected good prediction based on a model that seems untrustworthy. Chemom Intell Lab Syst 105(2):215\u2013219","journal-title":"Chemom Intell Lab Syst"},{"issue":"7","key":"5_CR20","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1021\/ci100176x","volume":"50","author":"D Fourches","year":"2010","unstructured":"Fourches D, Muratov E, Tropsha A (2010) Trust, but verify: on the importance of chemical structure curation in cheminformatics and QSAR modeling research. J Chem Inf Model 50(7):1189\u20131204","journal-title":"J Chem Inf Model"},{"issue":"6\u20137","key":"5_CR21","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1002\/minf.201200006","volume":"31","author":"I Oprisiu","year":"2012","unstructured":"Oprisiu I, Varlamova E, Muratov E, Artemenko A, Marcou G, Polishchuk P, Kuz\u2019min V, Varnek A (2012) QSPR approach to predict nonadditive properties of mixtures. Application to bubble point temperatures of binary mixtures of liquids. Mol Inform 31(6\u20137):491\u2013502","journal-title":"Mol Inform"},{"issue":"2","key":"5_CR22","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1021\/ci9902696","volume":"40","author":"F Csizmadia","year":"2000","unstructured":"Csizmadia F (2000) JChem: Java applets and modules supporting chemical database handling from web browsers. J Chem Inf Comput Sci 40(2):323\u2013324","journal-title":"J Chem Inf Comput Sci"},{"issue":"1","key":"5_CR23","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1186\/s13321-018-0315-6","volume":"10","author":"D Gadaleta","year":"2018","unstructured":"Gadaleta D, Lombardo A, Toma C, Benfenati E (2018) A new semi-automated workflow for chemical data retrieval and quality checking for modeling applications. J Chem 10(1):60","journal-title":"J Chem"},{"issue":"4","key":"5_CR24","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1093\/bioinformatics\/btt718","volume":"30","author":"D Fourches","year":"2013","unstructured":"Fourches D, Sassano MF, Roth BL, Tropsha A (2013) HTS navigator: freely accessible cheminformatics software for analyzing high-throughput screening data. Bioinformatics 30(4):588\u2013589","journal-title":"Bioinformatics"},{"issue":"6","key":"5_CR25","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1007\/s10822-011-9440-2","volume":"25","author":"I Sushko","year":"2011","unstructured":"Sushko I, Novotarskyi S, K\u00f6rner R, Pandey AK, Rupp M, Teetz W, Brandmaier S, Abdelaziz A, Prokopenko VV, Tanchuk VY (2011) Online chemical modeling environment (OCHEM): web platform for data storage, model development and publishing of chemical information. J Comput Aided Mol Des 25(6):533\u2013554","journal-title":"J Comput Aided Mol Des"},{"issue":"9","key":"5_CR26","doi-asserted-by":"publisher","first-page":"3786","DOI":"10.1021\/jm500317a","volume":"57","author":"C Kramer","year":"2014","unstructured":"Kramer C, Fuchs JE, Whitebread S, Gedeck P, Liedl KR (2014) Matched molecular pair analysis: significance and the impact of experimental uncertainty. J Med Chem 57(9):3786\u20133802","journal-title":"J Med Chem"},{"issue":"7","key":"5_CR27","doi-asserted-by":"publisher","first-page":"1243","DOI":"10.1021\/acs.jcim.6b00129","volume":"56","author":"D Fourches","year":"2016","unstructured":"Fourches D, Muratov E, Tropsha A (2016) Trust, but verify II: a practical guide to chemogenomics data curation. J Chem Inf Model 56(7):1243\u20131252","journal-title":"J Chem Inf Model"},{"key":"5_CR28","first-page":"161","volume-title":"Methods in Molecular Biology","author":"Marlene T. Kim","year":"2016","unstructured":"Kim MT, Wang W, Sedykh A, Zhu H (2016) Curating and preparing high-throughput screening data for quantitative structure-activity relationship modeling. In: High-throughput screening assays in toxicology. Springer, Humana Press, New York, NY, pp 161\u2013172"},{"issue":"1","key":"5_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13321-017-0256-5","volume":"10","author":"S Kausar","year":"2018","unstructured":"Kausar S, Falcao AO (2018) An automated framework for QSAR model building. J Chem 10(1):1","journal-title":"J Chem"},{"key":"5_CR30","doi-asserted-by":"publisher","first-page":"1282","DOI":"10.1080\/07391102.2018.1456975","volume":"37","author":"P Ambure","year":"2019","unstructured":"Ambure P, Bhat J, Puzyn T, Roy K (2019) Identifying natural compounds as multi-target-directed ligands against Alzheimer\u2019s disease: an in silico approach. J Biomol Struct Dyn 37:1282\u20131306","journal-title":"J Biomol Struct Dyn"}],"container-title":["Methods in Pharmacology and Toxicology","Ecotoxicological QSARs"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-1-0716-0150-1_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,2,22]],"date-time":"2021-02-22T11:10:59Z","timestamp":1613992259000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-1-0716-0150-1_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9781071601495","9781071601501"],"references-count":30,"URL":"https:\/\/doi.org\/10.1007\/978-1-0716-0150-1_5","relation":{},"ISSN":["1557-2153","1940-6053"],"issn-type":[{"value":"1557-2153","type":"print"},{"value":"1940-6053","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"17 January 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}