{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T17:33:02Z","timestamp":1773855182301,"version":"3.50.1"},"reference-count":87,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T00:00:00Z","timestamp":1757894400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T00:00:00Z","timestamp":1757894400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Comput Aided Mol Des"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s10822-025-00657-6","type":"journal-article","created":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T06:30:25Z","timestamp":1757917825000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Synergy of advanced machine learning and deep neural networks with consensus molecular docking for virtual screening of anaplastic lymphoma kinase 
inhibitors"],"prefix":"10.1007","volume":"39","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8693-030X","authenticated-orcid":false,"given":"The-Chuong","family":"Trinh","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3532-2064","authenticated-orcid":false,"given":"Tieu-Long","family":"Phan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7640-0807","authenticated-orcid":false,"given":"Van-Thinh","family":"To","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0271-2696","authenticated-orcid":false,"given":"Thanh-An","family":"Pham","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0001-5379-1593","authenticated-orcid":false,"given":"Gia-Bao","family":"Truong","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2473-6309","authenticated-orcid":false,"given":"Lai Hoang Son","family":"Le","sequence":"additional","affiliation":[]},{"given":"Xuan-Truc Dinh","family":"Tran","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0952-1633","authenticated-orcid":false,"given":"Tuyen Ngoc","family":"Truong","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,15]]},"reference":[{"key":"657_CR1","unstructured":"Observatory G-GC (2020) Journal. https:\/\/gco.iarc.fr\/. Accessed 2020"},{"key":"657_CR2","unstructured":"Society AC (2023) Journal. https:\/\/www.cancer.org\/. Accessed 2023"},{"key":"657_CR3","unstructured":"Targeted Therapy to Treat Cancer (2023) https:\/\/www.cancer.gov\/about-cancer\/treatment\/types\/targeted-therapies. Accessed 15 May 2023"},{"issue":"1","key":"657_CR4","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1146\/annurev.bi.48.070179.001205","volume":"48","author":"G Carpenter","year":"1979","unstructured":"Carpenter G, Cohen S (1979) Epidermal growth factor. 
Annu Rev Biochem 48(1):193\u2013216","journal-title":"Annu Rev Biochem"},{"issue":"8","key":"657_CR5","doi-asserted-by":"publisher","first-page":"1105","DOI":"10.1200\/JCO.2012.44.5353","volume":"31","author":"AT Shaw","year":"2013","unstructured":"Shaw AT, Engelman JA (2013) Alk in lung cancer: past, present, and future. J Clin Oncol 31(8):1105\u20131111","journal-title":"J Clin Oncol"},{"issue":"1","key":"657_CR6","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1038\/s41556-018-0195-z","volume":"21","author":"D Pei","year":"2019","unstructured":"Pei D, Shu X, Gassama-Diagne A, Thiery JP (2019) Mesenchymal-epithelial transition in development and reprogramming. Nat Cell Biol 21(1):44\u201353","journal-title":"Nat Cell Biol"},{"issue":"2","key":"657_CR7","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1097\/SLA.0b013e3181ae333f","volume":"250","author":"A Machens","year":"2009","unstructured":"Machens A, Lorenz K, Dralle H (2009) Individualization of lymph node dissection in ret (rearranged during transfection) carriers at risk for medullary thyroid cancer: value of pretherapeutic calcitonin levels. Ann Surg 250(2):305\u2013310","journal-title":"Ann Surg"},{"issue":"6","key":"657_CR8","doi-asserted-by":"publisher","first-page":"789","DOI":"10.1161\/ATVBAHA.108.179663","volume":"29","author":"N Ferrara","year":"2009","unstructured":"Ferrara N (2009) Vascular endothelial growth factor. Arterioscler Thromb Vasc Biol 29(6):789\u2013791","journal-title":"Arterioscler Thromb Vasc Biol"},{"key":"657_CR9","doi-asserted-by":"publisher","first-page":"175883592097561","DOI":"10.1177\/1758835920975613","volume":"12","author":"A Forsythe","year":"2020","unstructured":"Forsythe A, Zhang W, Phillip Strauss U, Fellous M, Korei M, Keating K (2020) A systematic review and meta-analysis of neurotrophic tyrosine receptor kinase gene fusion frequencies in solid tumors. 
Therap Adv Med Oncol 12:1758835920975613","journal-title":"Therap Adv Med Oncol"},{"key":"657_CR10","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1016\/j.lungcan.2021.08.003","volume":"160","author":"CC Cheung","year":"2021","unstructured":"Cheung CC, Smith AC, Albadine R, Bigras G, Bojarski A, Couture C, Cutz J-C, Huang W-Y, Ionescu D, Itani D et al (2021) Canadian ros proto-oncogene 1 study (cros) for multi-institutional implementation of ros1 testing in non-small cell lung cancer. Lung Cancer 160:127\u2013135","journal-title":"Lung Cancer"},{"issue":"1","key":"657_CR11","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1016\/j.jtcvs.2020.05.097","volume":"163","author":"Z Ma","year":"2022","unstructured":"Ma Z, Zhang Y, Deng C, Fu F, Deng L, Li Y, Chen H (2022) The prognostic value of kirsten rat sarcoma viral oncogene homolog mutations in resected lung adenocarcinoma differs according to clinical features. J Thorac Cardiovasc Surg 163(1):73\u201385","journal-title":"J Thorac Cardiovasc Surg"},{"issue":"23","key":"657_CR12","doi-asserted-by":"publisher","first-page":"15056","DOI":"10.3390\/ijms232315056","volume":"23","author":"J Wu","year":"2022","unstructured":"Wu J, Lin Z (2022) Non-small cell lung cancer targeted therapy: drugs and mechanisms of drug resistance. Int J Mol Sci 23(23):15056","journal-title":"Int J Mol Sci"},{"issue":"4","key":"657_CR13","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1038\/sj.onc.1200849","volume":"14","author":"T Iwahara","year":"1997","unstructured":"Iwahara T, Fujimoto J, Wen D, Cupples R, Bucay N, Arakawa T, Mori S, Ratzkin B, Yamamoto T (1997) Molecular characterization of alk, a receptor tyrosine kinase expressed specifically in the nervous system. 
Oncogene 14(4):439\u2013449","journal-title":"Oncogene"},{"issue":"5","key":"657_CR14","doi-asserted-by":"publisher","first-page":"448","DOI":"10.1016\/j.modgep.2005.11.006","volume":"6","author":"E Vernersson","year":"2006","unstructured":"Vernersson E, Khoo NK, Henriksson ML, Roos G, Palmer RH, Hallberg B (2006) Characterization of the expression of the alk receptor tyrosine kinase in mice. Gene Expr Patterns 6(5):448\u2013461","journal-title":"Gene Expr Patterns"},{"issue":"1","key":"657_CR15","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1016\/j.phrs.2012.11.007","volume":"68","author":"R Roskoski Jr","year":"2013","unstructured":"Roskoski R Jr (2013) Anaplastic lymphoma kinase (alk): structure, oncogenic activation, and pharmacological inhibition. Pharmacol Res 68(1):68\u201394","journal-title":"Pharmacol Res"},{"issue":"12","key":"657_CR16","doi-asserted-by":"publisher","first-page":"1691","DOI":"10.1080\/15384047.2015.1095407","volume":"16","author":"Z Zhao","year":"2015","unstructured":"Zhao Z, Verma V, Zhang M (2015) Anaplastic lymphoma kinase: role in cancer and therapy perspective. Cancer Biol Therapy 16(12):1691\u20131701","journal-title":"Cancer Biol Therapy"},{"key":"657_CR17","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1007\/s12010-017-2650-x","volume":"185","author":"N James","year":"2018","unstructured":"James N, Shanthi V, Ramanathan K (2018) Drug design for alk-positive nsclc: an integrated pharmacophore-based 3d qsar and virtual screening strategy. Appl Biochem Biotechnol 185:289\u2013315","journal-title":"Appl Biochem Biotechnol"},{"key":"657_CR18","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1016\/j.molstruc.2014.03.036","volume":"1067","author":"Z Ke","year":"2014","unstructured":"Ke Z, Lu T, Liu H, Yuan H, Ran T, Zhang Y, Yao S, Xiong X, Xu J, Xu A et al (2014) 3d-qsar and molecular fragment replacement study on diaminopyrimidine and pyrrolotriazine alk inhibitors. 
J Mol Struct 1067:127\u2013137","journal-title":"J Mol Struct"},{"key":"657_CR19","doi-asserted-by":"publisher","first-page":"2576","DOI":"10.1007\/s00044-013-0853-4","volume":"23","author":"P Wang","year":"2014","unstructured":"Wang P, Cai J, Chen J, Li L, Sun C, Xue B, Ji M (2014) 3d-qsar and docking studies of piperidine carboxamide derivatives as alk inhibitors. Med Chem Res 23:2576\u20132583","journal-title":"Med Chem Res"},{"issue":"1","key":"657_CR20","doi-asserted-by":"publisher","first-page":"0246126","DOI":"10.1371\/journal.pone.0246126","volume":"16","author":"GZ Espinoza","year":"2021","unstructured":"Espinoza GZ, Angelo RM, Oliveira PR, Honorio KM (2021) Evaluating deep learning models for predicting alk-5 inhibition. PLoS ONE 16(1):0246126","journal-title":"PLoS ONE"},{"issue":"15","key":"657_CR21","doi-asserted-by":"publisher","first-page":"4951","DOI":"10.3390\/molecules27154951","volume":"27","author":"RD Jawarkar","year":"2022","unstructured":"Jawarkar RD, Sharma P, Jain N, Gandhi A, Mukerjee N, Al-Mutairi AA, Zaki ME, Al-Hussain SA, Samad A, Masand VH et al (2022) Qsar, molecular docking, md simulation and mmgbsa calculations approaches to recognize concealed pharmacophoric features requisite for the optimization of alk tyrosine kinase inhibitors as anticancer leads. Molecules 27(15):4951","journal-title":"Molecules"},{"key":"657_CR22","doi-asserted-by":"crossref","unstructured":"Akiba T, Sano S, Yanase T, Ohta T, Koyama M (2019) Optuna: a next-generation hyperparameter optimization framework. 
In: Proceedings of the 25th ACM SIGKDD international conference on knowledge discovery & data mining, pp 2623\u20132631","DOI":"10.1145\/3292500.3330701"},{"key":"657_CR23","doi-asserted-by":"crossref","unstructured":"Sakamoto K, Lawson L, Milner J (1997) Allyl sulfides from garlic suppress the in vitro proliferation of human a549 lung tumor cells","DOI":"10.1080\/01635589709514617"},{"issue":"D1","key":"657_CR24","doi-asserted-by":"publisher","first-page":"1100","DOI":"10.1093\/nar\/gkr777","volume":"40","author":"A Gaulton","year":"2012","unstructured":"Gaulton A, Bellis LJ, Bento AP, Chambers J, Davies M, Hersey A, Light Y, McGlinchey S, Michalovich D, Al-Lazikani B et al (2012) Chembl: a large-scale bioactivity database for drug discovery. Nucleic Acids Res 40(D1):1100\u20131107","journal-title":"Nucleic Acids Res"},{"issue":"5","key":"657_CR25","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1016\/j.ccr.2011.04.004","volume":"19","author":"H Sakamoto","year":"2011","unstructured":"Sakamoto H, Tsukaguchi T, Hiroshima S, Kodama T, Kobayashi T, Fukami TA, Oikawa N, Tsukuda T, Ishii N, Aoki Y (2011) Ch5424802, a selective alk inhibitor capable of blocking the resistant gatekeeper mutant. Cancer Cell 19(5):679\u2013690","journal-title":"Cancer Cell"},{"issue":"4","key":"657_CR26","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1016\/j.ddtec.2004.11.007","volume":"1","author":"CA Lipinski","year":"2004","unstructured":"Lipinski CA (2004) Lead-and drug-like compounds: the rule-of-five revolution. Drug Discov Today Technol 1(4):337\u2013341","journal-title":"Drug Discov Today Technol"},{"key":"657_CR27","unstructured":"Landrum G (2016) RDKit: open-source cheminformatics. http:\/\/www.rdkit.org\/. https:\/\/github.com\/rdkit\/rdkit. 
Release 2016_09_5, Reference: 149, 650"},{"key":"657_CR28","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V et al (2011) Scikit-learn: machine learning in python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"issue":"17","key":"657_CR29","first-page":"1","volume":"18","author":"G Lema\u00eetre","year":"2017","unstructured":"Lema\u00eetre G, Nogueira F, Aridas CK (2017) Imbalanced-learn: a python toolbox to tackle the curse of imbalanced datasets in machine learning. J Mach Learn Res 18(17):1\u20135","journal-title":"J Mach Learn Res"},{"issue":"1","key":"657_CR30","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1186\/s13321-018-0258-y","volume":"10","author":"H Moriwaki","year":"2018","unstructured":"Moriwaki H, Tian Y-S, Kawashita N, Takagi T (2018) Mordred: a molecular descriptor calculator. J Cheminform 10(1):4","journal-title":"J Cheminform"},{"issue":"1","key":"657_CR31","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1021\/acs.jcim.7b00616","volume":"58","author":"S Jaeger","year":"2018","unstructured":"Jaeger S, Fulle S, Turk S (2018) Mol2vec: unsupervised machine learning approach with chemical intuition. J Chem Inf Model 58(1):27\u201335","journal-title":"J Chem Inf Model"},{"key":"657_CR32","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1016\/j.ymeth.2014.08.005","volume":"71","author":"A Cereto-Massagu\u00e9","year":"2015","unstructured":"Cereto-Massagu\u00e9 A, Ojeda MJ, Valls C, Mulero M, Garcia-Vallv\u00e9 S, Pujadas G (2015) Molecular fingerprint similarity search in virtual screening. 
Methods 71:58\u201363","journal-title":"Methods"},{"issue":"10","key":"657_CR33","doi-asserted-by":"publisher","first-page":"4536","DOI":"10.1021\/acs.jcim.0c00469","volume":"60","author":"LJ Martin","year":"2020","unstructured":"Martin LJ, Bowen MT (2020) Comparing fingerprints for ligand-based virtual screening: a fast and scalable approach for unbiased evaluation. J Chem Inf Model 60(10):4536\u20134545","journal-title":"J Chem Inf Model"},{"issue":"10","key":"657_CR34","doi-asserted-by":"publisher","first-page":"5054","DOI":"10.1021\/acs.jcim.1c00589","volume":"61","author":"D Warszycki","year":"2021","unstructured":"Warszycki D, Struski \u0141, Smieja M, Kafel R, Kurczab R (2021) Pharmacoprint: a combination of a pharmacophore fingerprint and artificial intelligence as a tool for computer-aided drug design. J Chem Inf Model 61(10):5054\u20135065","journal-title":"J Chem Inf Model"},{"key":"657_CR35","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13321-020-00445-4","volume":"12","author":"A Capecchi","year":"2020","unstructured":"Capecchi A, Probst D, Reymond J-L (2020) One molecular fingerprint to rule them all: drugs, biomolecules, and the metabolome. J Cheminform 12:1\u201315","journal-title":"J Cheminform"},{"key":"657_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13321-018-0321-8","volume":"10","author":"D Probst","year":"2018","unstructured":"Probst D, Reymond J-L (2018) A probabilistic molecular fingerprint for big data settings. J Cheminform 10:1\u201312","journal-title":"J Cheminform"},{"key":"657_CR37","doi-asserted-by":"crossref","unstructured":"Breunig MM, Kriegel H-P, Ng RT, Sander J (2000) Lof: identifying density-based local outliers. 
In: Proceedings of the 2000 ACM sigmod international conference on management of data, pp 93\u2013104","DOI":"10.1145\/342009.335388"},{"issue":"18","key":"657_CR38","doi-asserted-by":"publisher","first-page":"2395","DOI":"10.1161\/CIRCULATIONAHA.106.682658","volume":"117","author":"MP LaValley","year":"2008","unstructured":"LaValley MP (2008) Logistic regression. Circulation 117(18):2395\u20132399","journal-title":"Circulation"},{"issue":"2","key":"657_CR39","doi-asserted-by":"publisher","first-page":"1883","DOI":"10.4249\/scholarpedia.1883","volume":"4","author":"LE Peterson","year":"2009","unstructured":"Peterson LE (2009) K-nearest neighbor. Scholarpedia 4(2):1883","journal-title":"Scholarpedia"},{"issue":"12","key":"657_CR40","doi-asserted-by":"publisher","first-page":"1565","DOI":"10.1038\/nbt1206-1565","volume":"24","author":"WS Noble","year":"2006","unstructured":"Noble WS (2006) What is a support vector machine? Nat Biotechnol 24(12):1565\u20131567","journal-title":"Nat Biotechnol"},{"key":"657_CR41","doi-asserted-by":"crossref","unstructured":"Cutler A, Cutler DR, Stevens JR (2012) Random forests. Ensemble machine learning: methods and applications, 157\u2013175","DOI":"10.1007\/978-1-4419-9326-7_5"},{"key":"657_CR42","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s10994-006-6226-1","volume":"63","author":"P Geurts","year":"2006","unstructured":"Geurts P, Ernst D, Wehenkel L (2006) Extremely randomized trees. Mach Learn 63:3\u201342","journal-title":"Mach Learn"},{"key":"657_CR43","doi-asserted-by":"crossref","unstructured":"Schapire RE (2013) Explaining adaboost. In: Empirical inference: Festschrift in Honor of Vladimir N. Vapnik, pp 37\u201352. Springer","DOI":"10.1007\/978-3-642-41136-6_5"},{"key":"657_CR44","doi-asserted-by":"crossref","unstructured":"Friedman JH (2001) Greedy function approximation: a gradient boosting machine. 
Ann Stat 1189\u20131232","DOI":"10.1214\/aos\/1013203451"},{"key":"657_CR45","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) Xgboost: a scalable tree boosting system. In: Proceedings of the 22nd ACM Sigkdd international conference on knowledge discovery and data mining, pp 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"657_CR46","unstructured":"Dorogush AV, Ershov V, Gulin A (2018) Catboost: gradient boosting with categorical features support. arXiv preprint arXiv:1810.11363"},{"key":"657_CR47","volume-title":"Neural networks: a comprehensive foundation","author":"S Haykin","year":"1994","unstructured":"Haykin S (1994) Neural networks: a comprehensive foundation. Prentice Hall PTR, New Jersey"},{"key":"657_CR48","doi-asserted-by":"crossref","unstructured":"Rey D, Neuh\u00e4user M (2011) Wilcoxon-signed-rank test. In: International encyclopedia of statistical science, pp 1658\u20131659. Springer","DOI":"10.1007\/978-3-642-04898-2_616"},{"key":"657_CR49","unstructured":"scikit-learn developers. sklearn.naive_bayes.GaussianNB \u2013 scikit-learn documentation. https:\/\/scikit-learn.org\/stable\/modules\/generated\/sklearn.naive_bayes.GaussianNB.html"},{"key":"657_CR50","unstructured":"scikit-learn developers. sklearn.naive_bayes.BernoulliNB \u2013 scikit-learn documentation. https:\/\/scikit-learn.org\/stable\/modules\/generated\/sklearn.naive_bayes.BernoulliNB.html"},{"key":"657_CR51","unstructured":"Riffenburgh RH (1957) Linear discriminant analysis"},{"key":"657_CR52","unstructured":"scikit-learn developers. Linear and Quadratic Discriminant Analysis \u2013 scikit-learn documentation. https:\/\/scikit-learn.org\/stable\/modules\/lda_qda.html"},{"key":"657_CR53","doi-asserted-by":"crossref","unstructured":"Rokach L, Maimon O (2005) Decision trees. 
Data mining and knowledge discovery handbook, 165\u2013192","DOI":"10.1007\/0-387-25465-X_9"},{"key":"657_CR54","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"key":"657_CR55","unstructured":"Watanabe S (2023) Tree-structured parzen estimator: Understanding its algorithm components and their roles for better empirical performance. arXiv preprint arXiv:2304.11127"},{"key":"657_CR56","unstructured":"Paszke A, Gross S, Massa F, Lerer A, Bradbury J, Chanan G, Killeen T, Lin Z, Gimelshein N, Antiga L, et al (2019) Advances in neural information processing systems. Curran Associates, Inc 32, 8024\u20138035"},{"issue":"1","key":"657_CR57","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava N, Hinton G, Krizhevsky A, Sutskever I, Salakhutdinov R (2014) Dropout: a simple way to prevent neural networks from overfitting. J Mach Learn Res 15(1):1929\u20131958","journal-title":"J Mach Learn Res"},{"key":"657_CR58","unstructured":"Agarap AF (2018) Deep learning using rectified linear units (relu). arXiv preprint arXiv:1803.08375"},{"issue":"1\u20132","key":"657_CR59","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/S0020-0255(96)00200-9","volume":"99","author":"S Narayan","year":"1997","unstructured":"Narayan S (1997) The generalized sigmoid activation function: competitive supervised learning. Inf Sci 99(1\u20132):69\u201382","journal-title":"Inf Sci"},{"issue":"6","key":"657_CR60","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2017) Imagenet classification with deep convolutional neural networks. 
Commun ACM 60(6):84\u201390","journal-title":"Commun ACM"},{"key":"657_CR61","unstructured":"Krogh A, Hertz J (1991) A simple weight decay can improve generalization. Adv Neural Inf Process Syst 4"},{"key":"657_CR62","unstructured":"Kingma DP (2014) Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980"},{"key":"657_CR63","doi-asserted-by":"crossref","unstructured":"Refaeilzadeh P, Tang L, Liu H (2009) Cross-validation. In: Encyclopedia of database systems, pp 532\u2013538. Springer","DOI":"10.1007\/978-0-387-39940-9_565"},{"key":"657_CR64","doi-asserted-by":"crossref","unstructured":"Goutte C, Gaussier E (2005) A probabilistic interpretation of precision, recall and f-score, with implication for evaluation. In: European conference on information retrieval, pp 345\u2013359. Springer","DOI":"10.1007\/978-3-540-31865-1_25"},{"key":"657_CR65","doi-asserted-by":"crossref","unstructured":"Zhang E, Zhang Y (2009) Average precision. Encyclopedia of database systems, 192\u2013193","DOI":"10.1007\/978-0-387-39940-9_482"},{"issue":"9","key":"657_CR66","doi-asserted-by":"publisher","first-page":"1263","DOI":"10.1109\/TKDE.2008.239","volume":"21","author":"H He","year":"2009","unstructured":"He H, Garcia EA (2009) Learning from imbalanced data. IEEE Trans Knowl Data Eng 21(9):1263\u20131284","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"7","key":"657_CR67","doi-asserted-by":"publisher","first-page":"1762","DOI":"10.1021\/ci9000579","volume":"49","author":"H Dragos","year":"2009","unstructured":"Dragos H, Gilles M, Alexandre V (2009) Predicting the predictability: a unified approach to the applicability domain problem of qsar models. 
J Chem Inf Model 49(7):1762\u20131776","journal-title":"J Chem Inf Model"},{"key":"657_CR68","doi-asserted-by":"publisher","unstructured":"Trinh T-C, Phan T-L, To V-T, Truong G-B, Pham T-A, Le H-SL, Van\u00a0Nguyen P-C, Truong TN (2023) A graph neural network model enables accurate prediction of anaplastic lymphoma kinase inhibitors compared to other machine learning models. In: 2023 15th International Conference on Knowledge and Systems Engineering (KSE), pp. 1\u20136. https:\/\/doi.org\/10.1109\/KSE59128.2023.10299477. IEEE","DOI":"10.1109\/KSE59128.2023.10299477"},{"issue":"11","key":"657_CR69","doi-asserted-by":"publisher","first-page":"559","DOI":"10.1080\/14786440109462720","volume":"2","author":"K Pearson","year":"1901","unstructured":"Pearson K (1901) Liii. on lines and planes of closest fit to systems of points in space. Lond Edinb Dublin Philos Mag J Sci 2(11):559\u2013572","journal-title":"Lond Edinb Dublin Philos Mag J Sci"},{"issue":"3","key":"657_CR70","doi-asserted-by":"publisher","first-page":"379","DOI":"10.1021\/ci970437z","volume":"38","author":"DR Flower","year":"1998","unstructured":"Flower DR (1998) On the properties of bit string-based measures of chemical similarity. J Chem Inf Comput Sci 38(3):379\u2013386","journal-title":"J Chem Inf Comput Sci"},{"key":"657_CR71","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13321-015-0069-3","volume":"7","author":"D Bajusz","year":"2015","unstructured":"Bajusz D, R\u00e1cz A, H\u00e9berger K (2015) Why is tanimoto index an appropriate choice for fingerprint-based similarity calculations? J Cheminform 7:1\u201313","journal-title":"J Cheminform"},{"key":"657_CR72","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-39940-9","volume-title":"Encyclopedia of database systems","author":"L Liu","year":"2009","unstructured":"Liu L, \u00d6zsu MT (2009) Encyclopedia of database systems, vol 6. 
Springer, Berlin"},{"issue":"2","key":"657_CR73","doi-asserted-by":"publisher","first-page":"895","DOI":"10.1021\/acs.jcim.8b00545","volume":"59","author":"M Su","year":"2018","unstructured":"Su M, Yang Q, Du Y, Feng G, Liu Z, Li Y, Wang R (2018) Comparative assessment of scoring functions: the casf-2016 update. J Chem Inf Model 59(2):895\u2013913","journal-title":"J Chem Inf Model"},{"issue":"7","key":"657_CR74","doi-asserted-by":"publisher","first-page":"1982","DOI":"10.1021\/acs.jcim.2c01504","volume":"63","author":"J Ding","year":"2023","unstructured":"Ding J, Tang S, Mei Z, Wang L, Huang Q, Hu H, Ling M, Wu J (2023) Vina-gpu 2.0: further accelerating autodock vina and its derivatives with graphics processing units. J Chem Inf Model 63(7):1982\u20131998","journal-title":"J Chem Inf Model"},{"issue":"1","key":"657_CR75","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1186\/s13321-021-00522-2","volume":"13","author":"AT McNutt","year":"2021","unstructured":"McNutt AT, Francoeur P, Aggarwal R, Masuda T, Meli R, Ragoza M, Sunseri J, Koes DR (2021) Gnina 1.0: molecular docking with deep learning. J Cheminform 13(1):43","journal-title":"J Cheminform"},{"issue":"2","key":"657_CR76","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1002\/jcc.21334","volume":"31","author":"O Trott","year":"2010","unstructured":"Trott O, Olson AJ (2010) Autodock vina: improving the speed and accuracy of docking with a new scoring function, efficient optimization, and multithreading. J Comput Chem 31(2):455\u2013461","journal-title":"J Comput Chem"},{"issue":"2","key":"657_CR77","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1016\/S0893-6080(05)80023-1","volume":"5","author":"DH Wolpert","year":"1992","unstructured":"Wolpert DH (1992) Stacked generalization. 
Neural Netw 5(2):241\u2013259","journal-title":"Neural Netw"},{"issue":"1","key":"657_CR78","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1023\/A:1018046112532","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L (1996) Stacked regressions. Mach Learn 24(1):49\u201364","journal-title":"Mach Learn"},{"key":"657_CR79","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1016\/j.addr.2012.09.019","volume":"64","author":"CA Lipinski","year":"2012","unstructured":"Lipinski CA, Lombardo F, Dominy BW, Feeney PJ (2012) Experimental and computational approaches to estimate solubility and permeability in drug discovery and development settings. Adv Drug Deliv Rev 64:4\u201317","journal-title":"Adv Drug Deliv Rev"},{"issue":"2","key":"657_CR80","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1038\/nchem.1243","volume":"4","author":"GR Bickerton","year":"2012","unstructured":"Bickerton GR, Paolini GV, Besnard J, Muresan S, Hopkins AL (2012) Quantifying the chemical beauty of drugs. Nat Chem 4(2):90\u201398","journal-title":"Nat Chem"},{"key":"657_CR81","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1758-2946-1-8","volume":"1","author":"P Ertl","year":"2009","unstructured":"Ertl P, Schuffenhauer A (2009) Estimation of synthetic accessibility score of drug-like molecules based on molecular complexity and fragment contributions. J Cheminform 1:1\u201311","journal-title":"J Cheminform"},{"issue":"22","key":"657_CR82","doi-asserted-by":"publisher","first-page":"10026","DOI":"10.1021\/acs.jmedchem.9b00004","volume":"62","author":"YA Ivanenkov","year":"2019","unstructured":"Ivanenkov YA, Zagribelnyy BA, Aladinskiy VA (2019) Are we opening the door to a new era of medicinal chemistry or being collapsed to a chemical singularity? perspective. 
J Med Chem 62(22):10026\u201310043","journal-title":"J Med Chem"},{"issue":"7","key":"657_CR83","doi-asserted-by":"publisher","first-page":"2719","DOI":"10.1021\/jm901137j","volume":"53","author":"JB Baell","year":"2010","unstructured":"Baell JB, Holloway GA (2010) New substructure filters for removal of pan assay interference compounds (pains) from screening libraries and for their exclusion in bioassays. J Med Chem 53(7):2719\u20132740","journal-title":"J Med Chem"},{"issue":"5","key":"657_CR84","doi-asserted-by":"publisher","first-page":"1244","DOI":"10.1021\/jm1011947","volume":"54","author":"K Nakagawa-Goto","year":"2011","unstructured":"Nakagawa-Goto K, Wu P-C, Lai C-Y, Hamel E, Zhu H, Zhang L, Kozaka T, Ohkoshi E, Goto M, Bastow KF et al (2011) Antitumor agents. 284. new desmosdumotin b analogues with bicyclic b-ring as cytotoxic and antitubulin agents. J Med Chem 54(5):1244\u20131255","journal-title":"J Med Chem"},{"issue":"10","key":"657_CR85","doi-asserted-by":"publisher","first-page":"2974","DOI":"10.1016\/j.bmcl.2013.03.037","volume":"23","author":"Y Zhou","year":"2013","unstructured":"Zhou Y, Xu X, Sun Y, Wang H, Sun H, You Q (2013) Synthesis, cytotoxicity and topoisomerase ii inhibitory activity of lomefloxacin derivatives. Bioorg Med Chem Lett 23(10):2974\u20132978","journal-title":"Bioorg Med Chem Lett"},{"key":"657_CR86","doi-asserted-by":"crossref","unstructured":"Ougolkov AV, Bone ND, Fernandez-Zapico ME, Kay NE, Billadeau DD (2007) Inhibition of glycogen synthase kinase-3 activity leads to epigenetic silencing of nuclear factor $$\\kappa $$b target genes and induction of apoptosis in chronic lymphocytic leukemia b cells. 
Blood J Am Soc Hematol 110(2):735\u2013742","DOI":"10.1182\/blood-2006-12-060947"},{"issue":"9","key":"657_CR87","doi-asserted-by":"publisher","first-page":"2555","DOI":"10.1021\/ci500319f","volume":"54","author":"C Da","year":"2014","unstructured":"Da C, Kireev D (2014) Structural protein ligand interaction fingerprints (splif) for structure-based virtual screening: Method and benchmark study. J Chem Inf Model 54(9):2555\u20132561. https:\/\/doi.org\/10.1021\/ci500319f","journal-title":"J Chem Inf Model"}],"container-title":["Journal of Computer-Aided Molecular Design"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10822-025-00657-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10822-025-00657-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10822-025-00657-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,6]],"date-time":"2025-11-06T18:02:19Z","timestamp":1762452139000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10822-025-00657-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,15]]},"references-count":87,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["657"],"URL":"https:\/\/doi.org\/10.1007\/s10822-025-00657-6","relation":{},"ISSN":["0920-654X","1573-4951"],"issn-type":[{"value":"0920-654X","type":"print"},{"value":"1573-4951","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,15]]},"assertion":[{"value":"9 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 August 
2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"79"}}