{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T07:32:14Z","timestamp":1770535934085,"version":"3.49.0"},"reference-count":60,"publisher":"American Chemical Society (ACS)","issue":"4","license":[{"start":{"date-parts":[[2023,2,9]],"date-time":"2023-02-09T00:00:00Z","timestamp":1675900800000},"content-version":"unspecified","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100004325","name":"AstraZeneca","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004325","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000266","name":"Engineering and Physical Sciences Research Council","doi-asserted-by":"publisher","award":["EP\/S035990\/1"],"award-info":[{"award-number":["EP\/S035990\/1"]}],"id":[{"id":"10.13039\/501100000266","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100004316","name":"International Business Machines Corporation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004316","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100004330","name":"GlaxoSmithKline","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004330","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J. Chem. Inf. Model."],"published-print":{"date-parts":[[2023,2,27]]},"DOI":"10.1021\/acs.jcim.2c01189","type":"journal-article","created":{"date-parts":[[2023,2,9]],"date-time":"2023-02-09T20:46:23Z","timestamp":1675975583000},"page":"1099-1113","source":"Crossref","is-referenced-by-count":21,"title":["Blinded Predictions and Post Hoc Analysis of the Second Solubility Challenge Data: Exploring Training Data and Feature Set Selection for Machine and Deep Learning Models"],"prefix":"10.1021","volume":"63","author":[{"given":"Jonathan G. M.","family":"Conn","sequence":"first","affiliation":[{"name":"Department of Pure and Applied Chemistry, University of Strathclyde, Thomas Graham Building, 295 Cathedral Street, Glasgow G1 1XL, U.K."}]},{"given":"James W.","family":"Carter","sequence":"additional","affiliation":[{"name":"Department of Pure and Applied Chemistry, University of Strathclyde, Thomas Graham Building, 295 Cathedral Street, Glasgow G1 1XL, U.K."}]},{"given":"Justin J. A.","family":"Conn","sequence":"additional","affiliation":[{"name":"Department of Pure and Applied Chemistry, University of Strathclyde, Thomas Graham Building, 295 Cathedral Street, Glasgow G1 1XL, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7319-8885","authenticated-orcid":true,"given":"Vigneshwari","family":"Subramanian","sequence":"additional","affiliation":[{"name":"Drug Metabolism and Pharmacokinetics, Research and Early Development, Respiratory & Immunology, BioPharmaceuticals R&D, AstraZeneca, Pepparedsleden 1, SE-431 83 G\u00f6teborg, Sweden"}]},{"given":"Andrew","family":"Baxter","sequence":"additional","affiliation":[{"name":"GSK Medicines Research Centre, Gunnels Wood Road, Stevenage SG1 2NY, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4970-6461","authenticated-orcid":true,"given":"Ola","family":"Engkvist","sequence":"additional","affiliation":[{"name":"Medicinal Chemistry, Research and Early Development, Cardiovascular, Renal and Metabolism (CVRM), BioPharmaceuticals R&D, AstraZeneca, SE-431 50 G\u00f6teborg, Sweden"},{"name":"Department of Computer Science and Engineering, Chalmers University of Technology, SE-412 96 G\u00f6teborg, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4620-9363","authenticated-orcid":true,"given":"Antonio","family":"Llinas","sequence":"additional","affiliation":[{"name":"Drug Metabolism and Pharmacokinetics, Research and Early Development, Respiratory & Immunology, BioPharmaceuticals R&D, AstraZeneca, Pepparedsleden 1, SE-431 83 G\u00f6teborg, Sweden"}]},{"given":"Ekaterina L.","family":"Ratkova","sequence":"additional","affiliation":[{"name":"Medicinal Chemistry, Research and Early Development, Cardiovascular, Renal and Metabolism (CVRM), BioPharmaceuticals R&D, AstraZeneca, SE-431 50 G\u00f6teborg, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0958-9830","authenticated-orcid":true,"given":"Stephen D.","family":"Pickett","sequence":"additional","affiliation":[{"name":"Computational Sciences, GlaxoSmithKline R&D Pharmaceuticals, Stevenage SG1 2NY, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2323-6898","authenticated-orcid":true,"given":"James L.","family":"McDonagh","sequence":"additional","affiliation":[{"name":"IBM Research Europe, Hartree Centre, SciTech Daresbury, Warrington, Cheshire WA4 4AD, U.K."}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4356-9144","authenticated-orcid":true,"given":"David S.","family":"Palmer","sequence":"additional","affiliation":[{"name":"Department of Pure and Applied Chemistry, University of Strathclyde, Thomas Graham Building, 295 Cathedral Street, Glasgow G1 1XL, U.K."}]}],"member":"316","published-online":{"date-parts":[[2023,2,9]]},"reference":[{"key":"ref1\/cit1","first-page":"82","volume":"5","author":"Lipinski C.","year":"2002","journal-title":"Am. Pharm. Rev."},{"key":"ref2\/cit2","doi-asserted-by":"publisher","DOI":"10.1039\/C5CP00288E"},{"key":"ref3\/cit3","doi-asserted-by":"publisher","DOI":"10.1002\/0471722804"},{"key":"ref4\/cit4","doi-asserted-by":"publisher","DOI":"10.2174\/1389557518666180727164417"},{"key":"ref5\/cit5","doi-asserted-by":"publisher","DOI":"10.1039\/D0CP03596C"},{"key":"ref6\/cit6","doi-asserted-by":"publisher","DOI":"10.3390\/molecules26206185"},{"key":"ref7\/cit7","doi-asserted-by":"publisher","DOI":"10.1021\/acsomega.2c00697"},{"key":"ref8\/cit8","doi-asserted-by":"publisher","DOI":"10.1021\/acsomega.2c00642"},{"key":"ref9\/cit9","doi-asserted-by":"publisher","DOI":"10.1016\/j.ailsci.2021.100021"},{"key":"ref10\/cit10","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.1c00331"},{"key":"ref11\/cit11","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-020-0414-z"},{"key":"ref12\/cit12","doi-asserted-by":"publisher","DOI":"10.3103\/S0146411617020043"},{"key":"ref13\/cit13","doi-asserted-by":"publisher","DOI":"10.1002\/jcc.25213"},{"key":"ref14\/cit14","doi-asserted-by":"publisher","DOI":"10.5599\/admet.766"},{"key":"ref15\/cit15","doi-asserted-by":"publisher","DOI":"10.1021\/mp500103r"},{"key":"ref16\/cit16","doi-asserted-by":"publisher","DOI":"10.1002\/jps.20302"},{"key":"ref17\/cit17","doi-asserted-by":"publisher","DOI":"10.1063\/1.4983754"},{"key":"ref18\/cit18","doi-asserted-by":"publisher","DOI":"10.1063\/1.5040366"},{"key":"ref19\/cit19","doi-asserted-by":"publisher","DOI":"10.1063\/1.4968045"},{"key":"ref20\/cit20","doi-asserted-by":"publisher","DOI":"10.1039\/C8CP01786G"},{"key":"ref21\/cit21","doi-asserted-by":"publisher","DOI":"10.1063\/1.5117281"},{"key":"ref22\/cit22","doi-asserted-by":"publisher","DOI":"10.1021\/ct300345m"},{"key":"ref23\/cit23","doi-asserted-by":"publisher","DOI":"10.1021\/ci4005805"},{"key":"ref24\/cit24","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jctc.1c00130"},{"key":"ref25\/cit25","doi-asserted-by":"publisher","DOI":"10.1021\/acs.molpharmaceut.9b01138"},{"key":"ref26\/cit26","doi-asserted-by":"publisher","DOI":"10.1021\/ci800058v"},{"key":"ref27\/cit27","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.9b00345"},{"key":"ref28\/cit28","doi-asserted-by":"publisher","DOI":"10.1021\/mp7000878"},{"key":"ref29\/cit29","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.0c00701"},{"key":"ref30\/cit30","doi-asserted-by":"publisher","DOI":"10.1016\/S0960-894X(00)00172-4"},{"key":"ref31\/cit31","doi-asserted-by":"publisher","DOI":"10.1023\/A:1014224900524"},{"key":"ref32\/cit32","doi-asserted-by":"publisher","DOI":"10.1021\/jm020986i"},{"key":"ref33\/cit33","doi-asserted-by":"publisher","DOI":"10.1021\/ci970100x"},{"key":"ref34\/cit34","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejps.2012.10.028"},{"key":"ref35\/cit35","doi-asserted-by":"publisher","DOI":"10.1021\/ac048767n"},{"key":"ref36\/cit36","doi-asserted-by":"publisher","DOI":"10.1021\/ci400692n"},{"key":"ref37\/cit37","doi-asserted-by":"publisher","DOI":"10.1021\/ci800406y"},{"key":"ref38\/cit38","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejmech.2010.05.059"},{"key":"ref39\/cit39","doi-asserted-by":"publisher","DOI":"10.1002\/cem.3349"},{"key":"ref40\/cit40","doi-asserted-by":"publisher","DOI":"10.1201\/EBK1439802458"},{"key":"ref41\/cit41","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-019-0151-1"},{"key":"ref42\/cit42","unstructured":"Quacpac Toolkit 2021.1.1; OpenEye Scientific\nSoftware: Santa Fe, NM. http:\/\/www.eyesopen.com (accessed 2021-05-01)."},{"key":"ref43\/cit43","doi-asserted-by":"publisher","DOI":"10.1186\/1758-2946-3-33"},{"key":"ref44\/cit44","unstructured":"Open Babel Package, version 3.1.1. http:\/\/openbabel.org (accessed 2020-11-01)."},{"key":"ref45\/cit45","unstructured":"PubChem. Sketcher V2.4. https:\/\/pubchem.ncbi.nlm.nih.gov\/\/edit3\/index.html (accessed\n2020-11-01)."},{"key":"ref46\/cit46","unstructured":"NCI\/CADD Chemical Identifier\nResolver. https:\/\/cactus.nci.nih.gov\/chemical\/structure (accessed 2020-11-01)."},{"key":"ref47\/cit47","unstructured":"RDKit: Open-source cheminformatics. https:\/\/www.rdkit.org\/ (accessed\n2021-02-01)."},{"key":"ref48\/cit48","doi-asserted-by":"publisher","DOI":"10.1002\/spe.4380211102"},{"key":"ref49\/cit49","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-018-0258-y"},{"key":"ref50\/cit50","unstructured":"Chemical Computing\nGroup ULC Molecular Operating Environment\n(MOE), 2018.01; 1010 Sherbrooke St. West,\nSuite #910, Montreal, QC, Canada H3A 2R7, 2019."},{"key":"ref51\/cit51","unstructured":"Schr\u00f6dinger Release 2017; LigPrep,\nSchr\u00f6dinger, LLC: New York, 2017. https:\/\/www.schrodinger.com\/products\/ligprep (accessed 2020-11-01)."},{"key":"ref52\/cit52","volume-title":"Deep Learning for the Life Sciences","author":"Ramsundar B.","year":"2019"},{"key":"ref53\/cit53","first-page":"2825","volume":"12","author":"Pedregosa F.","year":"2011","journal-title":"J. Mach. Learn. Res."},{"key":"ref54\/cit54","unstructured":"Tensorflow: A\nsystem for large-scale machine learning. https:\/\/www.tensorflow.org\/ (accessed 2021-02-01)."},{"key":"ref55\/cit55","unstructured":"Duvenaud, D.; Maclaurin, D.; Aguilera-Iparraguirre, J.; G\u00f3mez-Bombarelli, R.; Hirzel, T.; Aspuru-Guzik, A.; Adams, R. P. Convolutional networks on graphs for learning molecular fingerprints. 2015, arXiv:1509.09292.  arXiv preprint. https:\/\/arxiv.org\/abs\/1509.09292 (accessed 2023-01-30)."},{"key":"ref56\/cit56","doi-asserted-by":"publisher","DOI":"10.1021\/ci400187y"},{"key":"ref57\/cit57","doi-asserted-by":"publisher","DOI":"10.1007\/s10822-016-9938-8"},{"key":"ref58\/cit58","doi-asserted-by":"publisher","DOI":"10.1021\/ci990307l"},{"key":"ref59\/cit59","doi-asserted-by":"publisher","DOI":"10.1039\/D1SC05259D"},{"key":"ref60\/cit60","doi-asserted-by":"publisher","DOI":"10.1021\/ci060164k"}],"container-title":["Journal of Chemical Information and Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/acs.jcim.2c01189","content-type":"application\/pdf","content-version":"vor","intended-application":"unspecified"},{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/acs.jcim.2c01189","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,25]],"date-time":"2023-04-25T22:32:26Z","timestamp":1682461946000},"score":1,"resource":{"primary":{"URL":"https:\/\/pubs.acs.org\/doi\/10.1021\/acs.jcim.2c01189"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,2,9]]},"references-count":60,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2023,2,27]]}},"alternative-id":["10.1021\/acs.jcim.2c01189"],"URL":"https:\/\/doi.org\/10.1021\/acs.jcim.2c01189","relation":{},"ISSN":["1549-9596","1549-960X"],"issn-type":[{"value":"1549-9596","type":"print"},{"value":"1549-960X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,2,9]]}}}