{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T03:58:05Z","timestamp":1773719885298,"version":"3.50.1"},"reference-count":61,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T00:00:00Z","timestamp":1733356800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T00:00:00Z","timestamp":1733356800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"Portuguese Foundation for Science and Technology","award":["SFRH\/BD\/144314\/2019"],"award-info":[{"award-number":["SFRH\/BD\/144314\/2019"]}]},{"name":"Portuguese Foundation for Science and Technology","award":["DFA\/BD\/08789\/2021"],"award-info":[{"award-number":["DFA\/BD\/08789\/2021"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"DOI":"10.1186\/s13321-024-00937-7","type":"journal-article","created":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T08:07:49Z","timestamp":1733386069000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":16,"title":["Deepmol: an automated machine and deep learning framework for computational chemistry"],"prefix":"10.1186","volume":"16","author":[{"given":"Jo\u00e3o","family":"Correia","sequence":"first","affiliation":[]},{"given":"Jo\u00e3o","family":"Capela","sequence":"additional","affiliation":[]},{"given":"Miguel","family":"Rocha","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,5]]},"reference":[{"issue":"10","key":"937_CR1","doi-asserted-by":"publisher","first-page":"2520","DOI":"10.3390\/molecules23102520","volume":"23","author":"G Hessler","year":"2018","unstructured":"Hessler G, Baringhaus KH (2018) Artificial intelligence in drug design. Molecules 23(10):2520. https:\/\/doi.org\/10.3390\/molecules23102520","journal-title":"Molecules"},{"key":"937_CR2","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1016\/j.ddtec.2020.05.001","volume":"32\u201333","author":"J Shen","year":"2019","unstructured":"Shen J, Nicolaou CA (2019) Molecular property prediction: recent trends in the era of artificial intelligence. Drug Discov Today: Technol 32\u201333:29\u201336. https:\/\/doi.org\/10.1016\/j.ddtec.2020.05.001","journal-title":"Drug Discov Today: Technol"},{"issue":"20","key":"937_CR3","doi-asserted-by":"publisher","first-page":"2233","DOI":"10.1002\/cphc.202000518","volume":"21","author":"J Gasteiger","year":"2020","unstructured":"Gasteiger J (2020) Chemistry in times of artificial intelligence. ChemPhysChem 21(20):2233\u20132242. https:\/\/doi.org\/10.1002\/cphc.202000518","journal-title":"ChemPhysChem"},{"issue":"2","key":"937_CR4","doi-asserted-by":"publisher","first-page":"263","DOI":"10.1021\/acs.accounts.0c00699","volume":"54","author":"WP Walters","year":"2020","unstructured":"Walters WP, Barzilay R (2020) Applications of deep learning in molecule generation and molecular property prediction. Acc Chem Res 54(2):263\u2013270. https:\/\/doi.org\/10.1021\/acs.accounts.0c00699","journal-title":"Acc Chem Res"},{"issue":"15","key":"937_CR5","doi-asserted-by":"publisher","DOI":"10.1088\/1367-2630\/15\/9\/095003","volume":"9","author":"G Montavon","year":"2013","unstructured":"Montavon G, Rupp M, Gobre V, Vazquez-Mayagoitia A, Hansen K, Tkatchenko A et al (2013) Machine learning of molecular electronic properties in chemical compound space. New J Phys 9(15):095003. https:\/\/doi.org\/10.1088\/1367-2630\/15\/9\/095003","journal-title":"New J Phys"},{"issue":"11","key":"937_CR6","doi-asserted-by":"publisher","first-page":"4125","DOI":"10.1038\/s41467-020-17844-8","volume":"8","author":"A Tkatchenko","year":"2020","unstructured":"Tkatchenko A (2020) Machine learning for chemical discovery. Nat Commun 8(11):4125. https:\/\/doi.org\/10.1038\/s41467-020-17844-8","journal-title":"Nat Commun"},{"issue":"96","key":"937_CR7","doi-asserted-by":"publisher","first-page":"1027","DOI":"10.1021\/cr950202r","volume":"1","author":"M Karelson","year":"1996","unstructured":"Karelson M, Lobanov VS, Katritzky AR (1996) Quantum-chemical descriptors in QSAR\/QSPR studies. Chem Rev 1(96):1027\u20131044. https:\/\/doi.org\/10.1021\/cr950202r","journal-title":"Chem Rev"},{"issue":"77","key":"937_CR8","doi-asserted-by":"publisher","first-page":"507","DOI":"10.1002\/cplu.201200038","volume":"7","author":"WM Berhanu","year":"2012","unstructured":"Berhanu WM, Pillai GG, Oliferenko AA, Katritzky AR (2012) Quantitative structure-activity\/property relationships: the ubiquitous links between cause and effect. ChemPlusChem 7(77):507\u2013517. https:\/\/doi.org\/10.1002\/cplu.201200038","journal-title":"ChemPlusChem"},{"issue":"9","key":"937_CR9","doi-asserted-by":"publisher","first-page":"60","DOI":"10.3390\/math9010060","volume":"12","author":"PCS Costa","year":"2020","unstructured":"Costa PCS, Evangelista JS, Leal I, Miranda PCML (2020) Chemical graph theory for property modeling in QSAR and QSPR-charming QSAR and QSPR. Mathematics 12(9):60. https:\/\/doi.org\/10.3390\/math9010060","journal-title":"Mathematics"},{"issue":"124","key":"937_CR10","doi-asserted-by":"publisher","DOI":"10.1016\/j.jmgm.2023.108564","volume":"11","author":"IL Guidotti","year":"2023","unstructured":"Guidotti IL, Neis A, Martinez DP, Seixas FK, Machado K, Kremer FS (2023) Bambu and its applications in the discovery of active molecules against melanoma. J Mol Graph Model 11(124):108564. https:\/\/doi.org\/10.1016\/j.jmgm.2023.108564","journal-title":"J Mol Graph Model"},{"issue":"1","key":"937_CR11","doi-asserted-by":"publisher","first-page":"334","DOI":"10.1124\/pr.112.007336","volume":"66","author":"G Sliwoski","year":"2014","unstructured":"Sliwoski G, Kothiwale S, Meiler J, Lowe Edward W, J, (2014) Computational methods in drug discovery. Pharmacol Rev 66(1):334\u2013395. https:\/\/doi.org\/10.1124\/pr.112.007336","journal-title":"Pharmacol Rev"},{"key":"937_CR12","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1093\/bib\/bbaa321","volume":"7","author":"Z Wu","year":"2021","unstructured":"Wu Z, Zhu M, Kang Y, Leung ELH, Lei T, Shen C et al (2021) Do we need different machine learning algorithms for QSAR modeling? A comprehensive assessment of 16 machine learning algorithms on 14 QSAR data sets. Brief Bioinform 7:22. https:\/\/doi.org\/10.1093\/bib\/bbaa321","journal-title":"Brief Bioinform"},{"key":"937_CR13","doi-asserted-by":"crossref","unstructured":"Xu Y (2022) In: Deep Neural Networks for QSAR; p. 233\u2013260","DOI":"10.1007\/978-1-0716-1787-8_10"},{"issue":"12","key":"937_CR14","doi-asserted-by":"publisher","DOI":"10.1016\/j.drudis.2022.103373","volume":"27","author":"Z Li","year":"2022","unstructured":"Li Z, Jiang M, Wang S, Zhang S (2022) Deep learning methods for molecular representation and property prediction. Drug Discov Today 27(12):103373. https:\/\/doi.org\/10.1016\/j.drudis.2022.103373","journal-title":"Drug Discov Today"},{"key":"937_CR15","doi-asserted-by":"publisher","DOI":"10.3389\/fchem.2022.852893","author":"\u00c1 Orosz","year":"2022","unstructured":"Orosz \u00c1, H\u00e9berger K, R\u00e1cz A (2022) Comparison of descriptor- and fingerprint sets in machine learning models for ADME-tox targets. Front Chem. https:\/\/doi.org\/10.3389\/fchem.2022.852893","journal-title":"Front Chem"},{"key":"937_CR16","doi-asserted-by":"publisher","first-page":"5736","DOI":"10.1038\/s41467-023-41512-2","volume":"14","author":"G Turon","year":"2023","unstructured":"Turon G, Hlozek J, Woodland JG et al (2023) First fully-automated AI\/ML virtual screening cascade implemented at a drug discovery centre in Africa. Nat Commun 14:5736. https:\/\/doi.org\/10.1038\/s41467-023-41512-2","journal-title":"Nat Commun"},{"issue":"14","key":"937_CR17","doi-asserted-by":"publisher","first-page":"5365","DOI":"10.1021\/acs.jcim.4c00457","volume":"64","author":"L Mervin","year":"2024","unstructured":"Mervin L, Voronov A, Kabeshov M, Engkvist O (2024) QSARtuna: an automated qsar modeling platform for molecular property prediction in drug design. J Chem Inform Model 64(14):5365\u20135374. https:\/\/doi.org\/10.1021\/acs.jcim.4c00457","journal-title":"J Chem Inform Model"},{"key":"937_CR18","doi-asserted-by":"crossref","unstructured":"Akiba T, Sano S, Yanase T, Ohta T, Koyama M (2019) Optuna: A Next-generation Hyperparameter Optimization Framework. In: Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","DOI":"10.1145\/3292500.3330701"},{"key":"937_CR19","unstructured":": RDKit: Open-source cheminformatics. http:\/\/www.rdkit.org"},{"key":"937_CR20","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O et al (2011) Scikit-learn: machine learning in python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"937_CR21","unstructured":"Abadi M, Agarwal A, Barham P, Brevdo E, Chen Z, Citro C, et\u00a0al.: TensorFlow: Large-Scale Machine Learning on Heterogeneous Systems. Software available from tensorflow.org. Available from: https:\/\/www.tensorflow.org\/"},{"key":"937_CR22","unstructured":"Ramsundar B, Eastman P, Walters P, Pande V, Leswing K, Wu Z (2019) Deep Learning for the Life Sciences. O\u2019Reilly Media. https:\/\/www.amazon.com\/Deep-Learning-Life-Sciences-Microscopy\/dp\/1492039837"},{"key":"937_CR23","unstructured":"Huang K, Fu T, Gao W, Zhao Y, Roohani Y, Leskovec J, et\u00a0al. (2021) Therapeutics Data Commons: Machine Learning Datasets and Tasks for Drug Discovery and Development. In: Vanschoren J, Yeung S, editors. Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks. vol.\u00a01. Curran. Available from: https:\/\/datasets-benchmarks-proceedings.neurips.cc\/paper_files\/paper\/2021\/file\/4c56ff4ce4aaf9573aa5dff913df997a-Paper-round1.pdf"},{"issue":"1","key":"937_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1021\/acs.jcim.7b00425","volume":"58","author":"D Probst","year":"2018","unstructured":"Probst D, Reymond JL (2018) SmilesDrawer: parsing and drawing SMILES-encoded molecular structures using client-side javascript. J Chem Inform Model 58(1):1\u20137. https:\/\/doi.org\/10.1021\/acs.jcim.7b00425","journal-title":"J Chem Inform Model"},{"issue":"5","key":"937_CR25","doi-asserted-by":"publisher","first-page":"1030","DOI":"10.1021\/ci960343+","volume":"36","author":"J Gasteiger","year":"1996","unstructured":"Gasteiger J, Sadowski J, Schuur J, Selzer P, Steinhauer L, Steinhauer V (1996) Chemical information in 3D space. J Chem Inform Comput Sci 36(5):1030\u20131037. https:\/\/doi.org\/10.1021\/ci960343+","journal-title":"J Chem Inform Comput Sci"},{"key":"937_CR26","volume-title":"Handbook of computational chemistry","author":"J Polanski","year":"2017","unstructured":"Polanski J, Gasteiger J (2017) Computer representation of chemical compounds. In: Leszczynski Jerzy, Kaczmarek-Kedziera Anna, Puzyn Tomasz, Papadopoulos Manthos G, Reis Heribert, Shukla Manoj K (eds) Handbook of computational chemistry. Springer International Publishing, New York"},{"key":"937_CR27","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1002\/wcms.1603","volume":"9","author":"DS Wigh","year":"2022","unstructured":"Wigh DS, Goodman JM, Lapkin AA (2022) A review of molecular representation in the age of machine learning. WIREs Comput Mol Sci 9:12. https:\/\/doi.org\/10.1002\/wcms.1603","journal-title":"WIREs Comput Mol Sci"},{"issue":"27","key":"937_CR28","doi-asserted-by":"publisher","first-page":"911","DOI":"10.1080\/1062936X.2016.1253611","volume":"11","author":"K Mansouri","year":"2016","unstructured":"Mansouri K, Grulke CM, Richard AM, Judson RS, Williams AJ (2016) An automated curation procedure for addressing chemical errors and inconsistencies in public datasets used in QSAR modelling. SAR and QSAR Environ Res 11(27):911\u2013937. https:\/\/doi.org\/10.1080\/1062936X.2016.1253611","journal-title":"SAR and QSAR Environ Res"},{"issue":"7","key":"937_CR29","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1021\/ci100176x","volume":"50","author":"D Fourches","year":"2010","unstructured":"Fourches D, Muratov E, Tropsha A (2010) Trust, but verify: on the importance of chemical structure curation in cheminformatics and QSAR modeling research. J Chem Inform Model 50(7):1189\u20131204. https:\/\/doi.org\/10.1021\/ci100176x","journal-title":"J Chem Inform Model"},{"key":"937_CR30","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-020-00456-1","author":"AP Bento","year":"2020","unstructured":"Bento AP, Hersey A, F\u00e9lix E, Landrum G, Gaulton A, Atkinson F et al (2020) An open source chemical structure curation pipeline using RDKit. J Cheminform. https:\/\/doi.org\/10.1186\/s13321-020-00456-1","journal-title":"J Cheminform"},{"key":"937_CR31","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-018-0293-8","author":"VD H\u00e4hnke","year":"2018","unstructured":"H\u00e4hnke VD, Kim S, Bolton EE (2018) PubChem chemical structure standardization. J Cheminform. https:\/\/doi.org\/10.1186\/s13321-018-0293-8","journal-title":"J Cheminform"},{"key":"937_CR32","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-015-0072-8","author":"K Karapetyan","year":"2015","unstructured":"Karapetyan K, Batchelor C, Sharpe D, Tkachenko V, Williams AJ (2015) The chemical validation and standardization platform (CVSP): large-scale automated validation of chemical structure datasets. J Cheminform. https:\/\/doi.org\/10.1186\/s13321-015-0072-8","journal-title":"J Cheminform"},{"key":"937_CR33","volume-title":"Molecular descriptors for chemoinformatics","author":"V Consonni","year":"2009","unstructured":"Consonni V, Todeschini R (2009) Molecular descriptors for chemoinformatics. John Wiley & Sons, Hoboken"},{"key":"937_CR34","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4020-9783-6_3","author":"R Todeschini","year":"2010","unstructured":"Todeschini R, Consonni V (2010) Molecular descriptors. Recent Adv QSAR Stud. https:\/\/doi.org\/10.1007\/978-1-4020-9783-6_3","journal-title":"Recent Adv QSAR Stud"},{"issue":"10","key":"937_CR35","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1186\/s13321-018-0258-y","volume":"12","author":"H Moriwaki","year":"2018","unstructured":"Moriwaki H, Tian YS, Kawashita N, Takagi T (2018) Mordred: a molecular descriptor calculator. J Cheminform 12(10):4. https:\/\/doi.org\/10.1186\/s13321-018-0258-y","journal-title":"J Cheminform"},{"issue":"61","key":"937_CR36","doi-asserted-by":"publisher","first-page":"1560","DOI":"10.1021\/acs.jcim.0c01127","volume":"4","author":"X Li","year":"2021","unstructured":"Li X, Fourches D (2021) SMILES pair encoding: a data-driven substructure tokenization algorithm for deep learning. J Chem Inform Model 4(61):1560\u20131569. https:\/\/doi.org\/10.1021\/acs.jcim.0c01127","journal-title":"J Chem Inform Model"},{"issue":"30","key":"937_CR37","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1007\/s10822-016-9938-8","volume":"8","author":"S Kearnes","year":"2016","unstructured":"Kearnes S, McCloskey K, Berndl M, Pande V, Riley P (2016) Molecular graph convolutions: moving beyond fingerprints. J Comput-Aided Mol Des 8(30):595\u2013608. https:\/\/doi.org\/10.1007\/s10822-016-9938-8","journal-title":"J Comput-Aided Mol Des"},{"key":"937_CR38","unstructured":"Duvenaud DK, Maclaurin D, Iparraguirre J, Bombarell R, Hirzel T, Aspuru-Guzik A, et\u00a0al. (2015) Convolutional networks on graphs for learning molecular fingerprints. Advances in neural information processing systems. 28"},{"key":"937_CR39","doi-asserted-by":"publisher","DOI":"10.4855\/arXiv.1805.11973","author":"N De Cao","year":"2018","unstructured":"De Cao N, Kipf T (2018) MolGAN: an implicit generative model for small molecular graphs. arXiv preprint. https:\/\/doi.org\/10.48550\/arXiv.1805.11973","journal-title":"arXiv preprint"},{"key":"937_CR40","unstructured":"Montavon G, Hansen K, Fazli S, Rupp M, Biegler F, Ziehe A, et\u00a0al. (2012) Learning invariant representations of molecules for atomization energy prediction. Advances in neural information processing systems. 25"},{"key":"937_CR41","doi-asserted-by":"publisher","DOI":"10.1863\/jss.v036.i11","author":"MB Kursa","year":"2010","unstructured":"Kursa MB, Rudnicki WR (2010) Feature selection with the boruta package. J Stat Softw. https:\/\/doi.org\/10.1863\/jss.v036.i11","journal-title":"J Stat Softw"},{"key":"937_CR42","doi-asserted-by":"publisher","DOI":"10.1515\/jib-2022-0006","author":"D Baptista","year":"2022","unstructured":"Baptista D, Correia J, Pereira B, Rocha M (2022) Evaluating molecular representations in machine learning models for drug response prediction and interpretability. J Integr Bioinform. https:\/\/doi.org\/10.1515\/jib-2022-0006","journal-title":"J Integr Bioinform"},{"key":"937_CR43","doi-asserted-by":"crossref","unstructured":"Capela J, Correia J, Pereira V, Rocha M (2022) Development of Deep Learning approaches to predict relationships between chemical structures and sweetness. In: 2022 International Joint Conference on Neural Networks (IJCNN). IEEE. Available from: https:\/\/doi.org\/10.1109\/ijcnn55064.2022.9891992","DOI":"10.1109\/IJCNN55064.2022.9891992"},{"issue":"4","key":"937_CR44","doi-asserted-by":"publisher","first-page":"747","DOI":"10.1021\/ci9803381","volume":"39","author":"D Butina","year":"1999","unstructured":"Butina D (1999) Unsupervised data base clustering based on daylight\u2019s fingerprint and tanimoto similarity: a fast and automated way to cluster small and large data sets. J Chem Inform Comput Sci 39(4):747\u2013750. https:\/\/doi.org\/10.1021\/ci9803381","journal-title":"J Chem Inform Comput Sci"},{"issue":"11","key":"937_CR45","doi-asserted-by":"publisher","first-page":"2840","DOI":"10.1021\/ci300400a","volume":"52","author":"C Xu","year":"2012","unstructured":"Xu C, Cheng F, Chen L, Du Z, Li W, Liu G et al (2012) In silico prediction of chemical Ames mutagenicity. J Chem Inform Model 52(11):2840\u20132847","journal-title":"J Chem Inform Model"},{"key":"937_CR46","doi-asserted-by":"publisher","DOI":"10.1186\/s40537-019-0192-5","author":"JM Johnson","year":"2019","unstructured":"Johnson JM, Khoshgoftaar TM (2019) Survey on deep learning with class imbalance. J Big Data. https:\/\/doi.org\/10.1186\/s40537-019-0192-5","journal-title":"J Big Data"},{"issue":"9","key":"937_CR47","doi-asserted-by":"publisher","first-page":"4180","DOI":"10.1021\/acs.jcim.9b01162","volume":"60","author":"S Korkmaz","year":"2020","unstructured":"Korkmaz S (2020) Deep learning-based imbalanced data classification for drug discovery. J Chem Inform Model 60(9):4180\u20134190. https:\/\/doi.org\/10.1021\/acs.jcim.9b01162","journal-title":"J Chem Inform Model"},{"issue":"17","key":"937_CR48","first-page":"1","volume":"18","author":"G Lema\u00eetre","year":"2017","unstructured":"Lema\u00eetre G, Nogueira F, Aridas CK (2017) Imbalanced-learn: a python toolbox to tackle the curse of imbalanced datasets in machine learning. J Mach Learn Res 18(17):1\u20135","journal-title":"J Mach Learn Res"},{"key":"937_CR49","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) SMOTE: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357. https:\/\/doi.org\/10.1613\/jair.953","journal-title":"J Artif Intell Res"},{"key":"937_CR50","unstructured":"Batista GEAPA, Bazzan ALC, Monard MC (2003) Balancing Training Data for Automated Annotation of Keywords: a Case Study. In: WOB"},{"issue":"1","key":"937_CR51","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GEAPA Batista","year":"2004","unstructured":"Batista GEAPA, Prati RC, Monard MC (2004) A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explor Newslett 6(1):20\u201329. https:\/\/doi.org\/10.1145\/1007730.1007735","journal-title":"ACM SIGKDD Explor Newslett"},{"key":"937_CR52","unstructured":"Lundberg SM, Lee SI (2017) A unified approach to interpreting model predictions. Advances in neural information processing systems. 30"},{"issue":"4\u20135","key":"937_CR53","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1016\/j.jpba.2008.03.023","volume":"47","author":"CY Ma","year":"2008","unstructured":"Ma CY, Yang SY, Zhang H, Xiang ML, Huang Q, Wei YQ (2008) Prediction models of human plasma protein binding rate and oral bioavailability derived by using GA-CG-SVM method. J Pharm Biomed Anal 47(4\u20135):677\u2013682","journal-title":"J Pharm Biomed Anal"},{"key":"937_CR54","doi-asserted-by":"crossref","unstructured":"Baptista D, Correia J, Pereira B, Rocha M (2021) A Comparison of Different Compound Representations for Drug Sensitivity Prediction. In: Practical Applications of Computational Biology and Bioinformatics, 15th International Conference (PACBB 2021). Springer International Publishing. p. 145\u2013154. Available from: https:\/\/doi.org\/10.1007\/978-3-030-86258-9_15","DOI":"10.1007\/978-3-030-86258-9_15"},{"issue":"D1","key":"937_CR55","doi-asserted-by":"publisher","first-page":"D1373","DOI":"10.1093\/nar\/gkac956","volume":"51","author":"S Kim","year":"2022","unstructured":"Kim S, Chen J, Cheng T, Gindulyte A, He J, He S et al (2022) PubChem 2023 update. Nucleic Acids Res 51(D1):D1373\u2013D1380. https:\/\/doi.org\/10.1093\/nar\/gkac956","journal-title":"Nucleic Acids Res"},{"key":"937_CR56","unstructured":"Capela J, Cheixo J, de\u00a0Ridder D, Rocha M, Dias O (2024) Automated Machine Learning to Predict the Precursors of Plant Specialized Metabolites. Manuscript submitted"},{"issue":"5","key":"937_CR57","doi-asserted-by":"publisher","first-page":"960","DOI":"10.1111\/cbdd.13479","volume":"93","author":"SR Tangadpalliwar","year":"2019","unstructured":"Tangadpalliwar SR, Vishwakarma S, Nimbalkar R, Garg P (2019) ChemSuite: a package for chemoinformatics calculations and machine learning. Chem Biol Drug Des 93(5):960\u2013964. https:\/\/doi.org\/10.1111\/cbdd.13479","journal-title":"Chem Biol Drug Des"},{"issue":"4","key":"937_CR58","doi-asserted-by":"publisher","first-page":"1955","DOI":"10.1021\/acs.jcim.9b01053","volume":"60","author":"AJ Minnich","year":"2020","unstructured":"Minnich AJ, McLoughlin K, Tse M, Deng J, Weber A, Murad N et al (2020) AMPL: a data-driven modeling pipeline for drug discovery. J Chem Inform Model 60(4):1955\u20131968. https:\/\/doi.org\/10.1021\/acs.jcim.9b01053","journal-title":"J Chem Inform Model"},{"issue":"1","key":"937_CR59","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1021\/acs.jcim.0c00971","volume":"61","author":"M Korshunova","year":"2021","unstructured":"Korshunova M, Ginsburg B, Tropsha A, Isayev O (2021) OpenChem: a deep learning toolkit for computational chemistry and drug design. J Chem Inform Model 61(1):7\u201313. https:\/\/doi.org\/10.1021\/acs.jcim.0c00971","journal-title":"J Chem Inform Model"},{"key":"937_CR60","doi-asserted-by":"publisher","DOI":"10.3389\/fphar.2022.833099","author":"BP Brown","year":"2022","unstructured":"Brown BP, Vu O, Geanes AR, Kothiwale S, Butkiewicz M, Lowe EW et al (2022) Introduction to the biochemical library (BCL): an application-based open-source toolkit for integrated cheminformatics and machine learning in computer-aided drug discovery. Front Pharmacol. https:\/\/doi.org\/10.3389\/fphar.2022.833099","journal-title":"Front Pharmacol"},{"key":"937_CR61","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.4c00863","author":"J Sieg","year":"2024","unstructured":"Sieg J, Feldmann CW, Hemmerich J, Stork C, Sandfort F, Eiden P et al (2024) MolPipeline: a python package for processing molecules with RDKit in scikit-learn. J Chem Inform Model. https:\/\/doi.org\/10.1021\/acs.jcim.4c00863","journal-title":"J Chem Inform Model"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-024-00937-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13321-024-00937-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-024-00937-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T09:06:48Z","timestamp":1733389608000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-024-00937-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,5]]},"references-count":61,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2024,12]]}},"alternative-id":["937"],"URL":"https:\/\/doi.org\/10.1186\/s13321-024-00937-7","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2024.05.27.595849","asserted-by":"object"}]},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,5]]},"assertion":[{"value":"5 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 November 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 December 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"136"}}