{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T17:53:13Z","timestamp":1772819593328,"version":"3.50.1"},"reference-count":69,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2025,3,5]],"date-time":"2025-03-05T00:00:00Z","timestamp":1741132800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,5]],"date-time":"2025-03-05T00:00:00Z","timestamp":1741132800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-025-00991-2","type":"journal-article","created":{"date-parts":[[2025,3,5]],"date-time":"2025-03-05T10:04:00Z","timestamp":1741169040000},"page":"423-436","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":18,"title":["Data-driven federated learning in drug discovery with knowledge distillation"],"prefix":"10.1038","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0392-6154","authenticated-orcid":false,"given":"Thierry","family":"Hanser","sequence":"first","affiliation":[]},{"given":"Ernst","family":"Ahlberg","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9923-0137","authenticated-orcid":false,"given":"Alexander","family":"Amberg","sequence":"additional","affiliation":[]},{"given":"Lennart T.","family":"Anger","sequence":"additional","affiliation":[]},{"given":"Chris","family":"Barber","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0449-2730","authenticated-orcid":false,"given":"Richard J.","family":"Brennan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6860-9515","authenticated-orcid":false,"given":"Alessandro","family":"Brigo","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6345-7989","authenticated-orcid":false,"given":"Annie","family":"Delaunois","sequence":"additional","affiliation":[]},{"given":"Susanne","family":"Glowienke","sequence":"additional","affiliation":[]},{"given":"Nigel","family":"Greene","sequence":"additional","affiliation":[]},{"given":"Laura","family":"Johnston","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0550-4174","authenticated-orcid":false,"given":"Daniel","family":"Kuhn","sequence":"additional","affiliation":[]},{"given":"Lara","family":"Kuhnke","sequence":"additional","affiliation":[]},{"given":"Jean-Fran\u00e7ois","family":"Marchaland","sequence":"additional","affiliation":[]},{"given":"Wolfgang","family":"Muster","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6606-1920","authenticated-orcid":false,"given":"Jeffrey","family":"Plante","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4604-9251","authenticated-orcid":false,"given":"Friedrich","family":"Rippmann","sequence":"additional","affiliation":[]},{"given":"Yogesh","family":"Sabnis","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0265-0974","authenticated-orcid":false,"given":"Friedemann","family":"Schmidt","sequence":"additional","affiliation":[]},{"given":"Ruud","family":"van Deursen","sequence":"additional","affiliation":[]},{"given":"St\u00e9phane","family":"Werner","sequence":"additional","affiliation":[]},{"given":"Angela","family":"White","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6846-7446","authenticated-orcid":false,"given":"Joerg","family":"Wichard","sequence":"additional","affiliation":[]},{"given":"Tomoya","family":"Yukawa","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,3,5]]},"reference":[{"key":"991_CR1","doi-asserted-by":"publisher","first-page":"e271","DOI":"10.1016\/S2589-7500(19)30123-2","volume":"1","author":"X Liu","year":"2019","unstructured":"Liu, X. et al. A comparison of deep learning performance against health-care professionals in detecting diseases from medical imaging: a systematic review and meta-analysis. Lancet Digit. Health 1, e271\u2013e297 (2019).","journal-title":"Lancet Digit. Health"},{"key":"991_CR2","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-021-21466-z","volume":"12","author":"W Zhou","year":"2021","unstructured":"Zhou, W. et al. Ensembled deep learning model outperforms human experts in diagnosing biliary atresia from sonographic gallbladder images. Nat. Commun. 12, 1259 (2021).","journal-title":"Nat. Commun."},{"key":"991_CR3","doi-asserted-by":"publisher","first-page":"746497","DOI":"10.3389\/frai.2021.746497","volume":"4","author":"MY Topaloglu","year":"2021","unstructured":"Topaloglu, M. Y., Morrell, E. M., Rajendran, S. & Topaloglu, U. In the pursuit of privacy: the promises and predicaments of federated learning in healthcare. Front. Artif. Intell. 4, 746497 (2021).","journal-title":"Front. Artif. Intell."},{"key":"991_CR4","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1038\/s42256-022-00601-5","volume":"5","author":"A Brauneck","year":"2023","unstructured":"Brauneck, A. et al. Federated machine learning in data-protection-compliant research. Nat. Mach. Intell. 5, 2\u20134 (2023).","journal-title":"Nat. Mach. Intell."},{"key":"991_CR5","doi-asserted-by":"publisher","first-page":"370","DOI":"10.1038\/s42256-024-00813-x","volume":"6","author":"M Bak","year":"2024","unstructured":"Bak, M. et al. Federated learning is not a cure-all for data ethics. Nat. Mach. Intell. 6, 370\u2013372 (2024).","journal-title":"Nat. Mach. Intell."},{"key":"991_CR6","doi-asserted-by":"publisher","first-page":"371","DOI":"10.1016\/j.neucom.2021.07.098","volume":"465","author":"H Zhu","year":"2021","unstructured":"Zhu, H., Xu, J., Liu, S. & Jin, Y. Federated learning on non-IID data: a survey. Neurocomputing 465, 371\u2013390 (2021).","journal-title":"Neurocomputing"},{"key":"991_CR7","unstructured":"McMahan, B., Moore, E., Ramage, D., Hampson, S. & Arcas, B. A. y. Communication-efficient learning of deep networks from decentralized data. In Proc. 20th International Conference on Artificial Intelligence and Statistics PMLR 54, 1273\u20131282 (2017)."},{"key":"991_CR8","doi-asserted-by":"publisher","unstructured":"Zhou, J. et al. A survey on federated learning and its applications for accelerating industrial internet of things. Preprint at https:\/\/doi.org\/10.48550\/arXiv.2104.10501 (2021).","DOI":"10.48550\/arXiv.2104.10501"},{"key":"991_CR9","doi-asserted-by":"publisher","first-page":"106854","DOI":"10.1016\/j.cie.2020.106854","volume":"149","author":"L Li","year":"2020","unstructured":"Li, L., Fan, Y., Tse, M. & Lin, K.-Y. A review of applications in federated learning. Comput. Ind. Eng. 149, 106854 (2020).","journal-title":"Comput. Ind. Eng."},{"key":"991_CR10","first-page":"50","volume":"37","author":"T Li","year":"2020","unstructured":"Li, T., Sahu, A. K., Talwalkar, A. & Smith, V. Federated learning: challenges, methods, and future directions. IEEE Signal Process. Mag. 37, 50\u201360 (2020).","journal-title":"IEEE Signal Process. Mag."},{"key":"991_CR11","first-page":"131:1","volume":"54","author":"X Yin","year":"2021","unstructured":"Yin, X., Zhu, Y. & Hu, J. A comprehensive survey of privacy-preserving federated learning: a taxonomy, review, and future directions. ACM Comput. Surv. 54, 131:1\u2013131:36 (2021).","journal-title":"ACM Comput. Surv."},{"key":"991_CR12","unstructured":"Kairouz, P. et al. Advances and open problems in federated learning. Foundations and Trends in Machine Learning 14, 1\u2013210, (2021)."},{"key":"991_CR13","doi-asserted-by":"publisher","first-page":"885","DOI":"10.1007\/s10115-022-01664-x","volume":"64","author":"J Liu","year":"2022","unstructured":"Liu, J. et al. From distributed machine learning to federated learning: a survey. Knowl. Inf. Syst. 64, 885\u2013917 (2022).","journal-title":"Knowl. Inf. Syst."},{"key":"991_CR14","doi-asserted-by":"publisher","unstructured":"Kone\u010dn\u00fd, J., McMahan, H. B., Ramage, D. & Richt\u00e1rik, P. Federated optimization: distributed machine learning for on-device intelligence. Preprint at https:\/\/doi.org\/10.48550\/arXiv.1610.02527 (2016).","DOI":"10.48550\/arXiv.1610.02527"},{"key":"991_CR15","doi-asserted-by":"crossref","unstructured":"Abadi, M. et al. Deep learning with differential privacy. In Proc. 2016 ACM SIGSAC Conference on Computer and Communications Security 308\u2013318 (ACM, 2016).","DOI":"10.1145\/2976749.2978318"},{"key":"991_CR16","doi-asserted-by":"crossref","unstructured":"Dwork, C. Differential privacy: a survey of results. In Proc. International Conference on Theory and Applications of Models of Computation (eds Agrawal, M. et al.) 1\u201319 (Springer, 2008).","DOI":"10.1007\/978-3-540-79228-4_1"},{"key":"991_CR17","doi-asserted-by":"crossref","unstructured":"Long, G., Tan, Y., Jiang, J. & Zhang, C. in Federated Learning: Privacy and Incentive (eds Yang, Q. et al.) 240\u2013254 (Springer, 2020).","DOI":"10.1007\/978-3-030-63076-8_17"},{"key":"991_CR18","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1038\/s41746-020-00323-1","volume":"3","author":"N Rieke","year":"2020","unstructured":"Rieke, N. et al. The future of digital health with federated learning. Npj Digit. Med. 3, 119 (2020).","journal-title":"Npj Digit. Med."},{"key":"991_CR19","first-page":"313","volume":"2019","author":"O Choudhury","year":"2020","unstructured":"Choudhury, O. et al. Predicting adverse drug reactions on distributed health data using federated learning. AMIA. Annu. Symp. Proc. 2019, 313\u2013322 (2020).","journal-title":"AMIA. Annu. Symp. Proc."},{"key":"991_CR20","doi-asserted-by":"crossref","unstructured":"Nguyen, D. C. et al. Federated learning for smart healthcare: a survey. ACM Computing Surveys (Csur) 55, 1\u201337 (2022).","DOI":"10.1145\/3501296"},{"key":"991_CR21","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1007\/s11427-021-1946-0","volume":"65","author":"Z Xiong","year":"2022","unstructured":"Xiong, Z. et al. Facing small and biased data dilemma in drug discovery with enhanced federated learning approaches. Sci. China Life Sci. 65, 529\u2013539 (2022).","journal-title":"Sci. China Life Sci."},{"key":"991_CR22","doi-asserted-by":"crossref","unstructured":"Manu, D. et al. FL-DISCO: federated generative adversarial network for graph-based molecule drug discovery: special session paper. In Proc. 2021 IEEE\/ACM International Conference On Computer Aided Design (ICCAD) 1\u20137 (IEEE, 2021).","DOI":"10.1109\/ICCAD51958.2021.9643440"},{"key":"991_CR23","doi-asserted-by":"publisher","first-page":"2371","DOI":"10.1002\/int.22777","volume":"37","author":"S Naz","year":"2022","unstructured":"Naz, S., Phan, K. T. & Chen, Y.-P. P. A comprehensive review of federated learning for COVID-19 detection. Int. J. Intell. Syst. 37, 2371\u20132392 (2022).","journal-title":"Int. J. Intell. Syst."},{"key":"991_CR24","unstructured":"Goldsmith, M. R. et al. in Crop Protection Products for Sustainable Agriculture (eds Rauzan, B. M. & Lorsbach, B. A.) Vol. 1390, 181\u2013200 (American Chemical Society, 2021)."},{"key":"991_CR25","doi-asserted-by":"publisher","first-page":"2331","DOI":"10.1021\/acs.jcim.3c00799","volume":"64","author":"W Heyndrickx","year":"2024","unstructured":"Heyndrickx, W. et al. MELLODDY: cross-pharma federated learning at unprecedented scale unlocks benefits in QSAR without compromising proprietary information. J. Chem. Inf. Model. 64, 2331\u20132344 (2024).","journal-title":"J. Chem. Inf. Model."},{"key":"991_CR26","doi-asserted-by":"publisher","first-page":"102545","DOI":"10.1016\/j.sbi.2023.102545","volume":"79","author":"T Hanser","year":"2023","unstructured":"Hanser, T. Federated learning for molecular discovery. Curr. Opin. Struct. Biol. 79, 102545 (2023).","journal-title":"Curr. Opin. Struct. Biol."},{"key":"991_CR27","doi-asserted-by":"publisher","unstructured":"Kone\u010dn\u00fd, J. et al. Federated learning: strategies for improving communication efficiency. Preprint at https:\/\/doi.org\/10.48550\/arXiv.1610.05492 (2017).","DOI":"10.48550\/arXiv.1610.05492"},{"key":"991_CR28","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-022-29763-x","volume":"13","author":"C Wu","year":"2022","unstructured":"Wu, C., Wu, F., Lyu, L., Huang, Y. & Xie, X. Communication-efficient federated learning via knowledge distillation. Nat. Commun. 13, 2032 (2022).","journal-title":"Nat. Commun."},{"key":"991_CR29","unstructured":"Zhu, X. Semi-Supervised Learning Literature Survey (Univ. Wisconsin, 2005); https:\/\/minds.wisconsin.edu\/handle\/1793\/60444"},{"key":"991_CR30","unstructured":"Hinton, G., Vinyals, O. & Dean, J. Distilling the knowledge in a neural network. Preprint at http:\/\/arxiv.org\/abs\/1503.02531 (2015)."},{"key":"991_CR31","unstructured":"Papernot, N., Abadi, M., Erlingsson, \u00da., Goodfellow, I. & Talwar, K. Semi-supervised knowledge transfer for deep learning from private training data. Preprint at http:\/\/arxiv.org\/abs\/1610.05755 (2016)."},{"key":"991_CR32","unstructured":"Papernot, N. et al. Scalable private learning with PATE. Preprint at http:\/\/arxiv.org\/abs\/1802.08908 (2018)."},{"key":"991_CR33","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/BF00058655","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman, L. Bagging predictors. Mach. Learn. 24, 123\u2013140 (1996).","journal-title":"Mach. Learn."},{"key":"991_CR34","doi-asserted-by":"crossref","unstructured":"Dietterich, T. G. Ensemble methods in machine learning. In Proc. International Workshop on Multiple Classifier Systems (eds Kittler, J. & Roli, F.) 1\u201315 (Springer, 2000).","DOI":"10.1007\/3-540-45014-9_1"},{"key":"991_CR35","doi-asserted-by":"publisher","unstructured":"Li, L., Gou, J., Yu, B., Du, L. & Tao, Z. Y. D. Federated distillation: a survey. Preprint at https:\/\/doi.org\/10.48550\/arXiv.2404.08564 (2024).","DOI":"10.48550\/arXiv.2404.08564"},{"key":"991_CR36","doi-asserted-by":"crossref","unstructured":"Eldar, Y. C. et al. in Machine Learning and Wireless Communications (eds Goldsmith, A. et al.) 457\u2013485 (Cambridge Univ. Press, 2022).","DOI":"10.1017\/9781108966559"},{"key":"991_CR37","doi-asserted-by":"publisher","unstructured":"Li, D. & Wang, J. FedMD: heterogenous federated learning via model distillation. Preprint at https:\/\/doi.org\/10.48550\/arXiv.1910.03581 (2019).","DOI":"10.48550\/arXiv.1910.03581"},{"key":"991_CR38","doi-asserted-by":"publisher","first-page":"191","DOI":"10.1109\/TMC.2021.3070013","volume":"22","author":"S Itahara","year":"2023","unstructured":"Itahara, S., Nishio, T., Koda, Y., Morikura, M. & Yamamoto, K. Distillation-based semi-supervised federated learning for communication-efficient collaborative training with non-IID private data. IEEE Trans. Mob. Comput. 22, 191\u2013205 (2023).","journal-title":"IEEE Trans. Mob. Comput."},{"key":"991_CR39","unstructured":"Sattler, F., Marban, A., Rischke, R. & Samek, W. Communication-efficient federated distillation. Preprint at http:\/\/arxiv.org\/abs\/2012.00632 (2020)."},{"key":"991_CR40","doi-asserted-by":"crossref","unstructured":"Sui, D. et al. FedED: federated learning via ensemble distillation for medical relation extraction. In Proc. 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP) (eds Webber, B. et al.) 2118\u20132128 (Association for Computational Linguistics, 2020).","DOI":"10.18653\/v1\/2020.emnlp-main.165"},{"key":"991_CR41","doi-asserted-by":"crossref","unstructured":"Han, S. et al. FedX: unsupervised federated learning with cross knowledge distillation. In European Conference on Computer Vision. (eds Avidan, S. et al.) 691\u2013707 (Springer Nature Switzerland, 2022).","DOI":"10.1007\/978-3-031-20056-4_40"},{"key":"991_CR42","unstructured":"Jeong, E. et al. Communication-efficient on-device machine learning: federated distillation and augmentation under non-IID private data. Preprint at http:\/\/arxiv.org\/abs\/1811.11479 (2023)."},{"key":"991_CR43","doi-asserted-by":"publisher","unstructured":"Choquette-Choo, C. A. et al. CaPC learning: confidential and private collaborative learning. Preprint at https:\/\/doi.org\/10.48550\/arXiv.2102.05188 (2021).","DOI":"10.48550\/arXiv.2102.05188"},{"key":"991_CR44","unstructured":"PyGrid: a peer-to-peer platform for private data science and federated learning OpenMined Blog https:\/\/blog.openmined.org\/what-is-pygrid-demo\/ (2020)."},{"key":"991_CR45","unstructured":"FLuID POC platform. GitHub https:\/\/github.com\/LhasaLimited\/FLuID_POC (2023)."},{"key":"991_CR46","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1016\/j.pharmthera.2008.05.009","volume":"119","author":"JC Hancox","year":"2008","unstructured":"Hancox, J. C., McPate, M. J., El Harchi, A. & Zhang, Y. H. The hERG potassium channel and hERG screening for drug-induced torsades de pointes. Pharmacol. Ther. 119, 118\u2013132 (2008).","journal-title":"Pharmacol. Ther."},{"key":"991_CR47","unstructured":"Wolford, B. What is GDPR, the EU\u2019s new data protection law? GDPR.eu https:\/\/gdpr.eu\/what-is-gdpr\/ (2018)."},{"key":"991_CR48","doi-asserted-by":"crossref","unstructured":"Shokri, R., Stronati, M., Song, C. & Shmatikov, V. Membership inference attacks against machine learning model. In IEEE Symposium on Security and Privacy (SP) 3\u201318 (IEEE, 2017).","DOI":"10.1109\/SP.2017.41"},{"key":"991_CR49","doi-asserted-by":"crossref","unstructured":"Raipuria, G., Bonthu, S. & Singhal, N. Noise robust training of segmentation model using knowledge distillation. In Proc. Pattern Recognition. ICPR International Workshops and Challenges. ICPR 2021 (eds Del Bimbo, A. et al.) 97\u2013104 (Springer, 2021).","DOI":"10.1007\/978-3-030-68763-2_8"},{"key":"991_CR50","doi-asserted-by":"publisher","first-page":"442","DOI":"10.1016\/0005-2795(75)90109-9","volume":"405","author":"BW Matthews","year":"1975","unstructured":"Matthews, B. W. Comparison of the predicted and observed secondary structure of T4 phage lysozyme. Biochim. Biophys. Acta 405, 442\u2013451 (1975).","journal-title":"Biochim. Biophys. Acta"},{"key":"991_CR51","doi-asserted-by":"publisher","first-page":"1503","DOI":"10.1021\/acs.chemrestox.3c00137","volume":"36","author":"D Bassani","year":"2023","unstructured":"Bassani, D., Brigo, A. & Andrews-Morger, A. Federated learning in computational toxicology: an industrial perspective on the Effiris Hackathon. Chem. Res. Toxicol. 36, 1503\u20131517 (2023).","journal-title":"Chem. Res. Toxicol."},{"key":"991_CR52","doi-asserted-by":"publisher","first-page":"D1388","DOI":"10.1093\/nar\/gkaa971","volume":"49","author":"S Kim","year":"2021","unstructured":"Kim, S. et al. PubChem in 2021: new data content and improved web interfaces. Nucleic Acids Res. 49, D1388\u2013D1395 (2021).","journal-title":"Nucleic Acids Res."},{"key":"991_CR53","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-015-0069-3","volume":"7","author":"D Bajusz","year":"2015","unstructured":"Bajusz, D., R\u00e1cz, A. & H\u00e9berger, K. Why is Tanimoto index an appropriate choice for fingerprint-based similarity calculations? J. Cheminformatics 7, 20 (2015).","journal-title":"J. Cheminformatics"},{"key":"991_CR54","first-page":"199","volume":"9","author":"R Glen","year":"2006","unstructured":"Glen, R. et al. Circular fingerprints: flexible molecular descriptors with applications from physical chemistry to ADME. IDrugs Investig. Drugs J. 9, 199\u2013204 (2006).","journal-title":"IDrugs Investig. Drugs J."},{"key":"991_CR55","doi-asserted-by":"publisher","first-page":"285","DOI":"10.1002\/qsar.19960150402","volume":"15","author":"BD Hudson","year":"1996","unstructured":"Hudson, B. D., Hyde, R. M., Rahr, E., Wood, J. & Osman, J. Parameter based methods for compound selection from chemical databases. Quant. Struct. Act. Relatsh. 15, 285\u2013289 (1996).","journal-title":"Quant. Struct. Act. Relatsh."},{"key":"991_CR56","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1021\/ci100050t","volume":"50","author":"D Rogers","year":"2010","unstructured":"Rogers, D. & Hahn, M. Extended-connectivity fingerprints. J. Chem. Inf. Model. 50, 742\u2013754 (2010).","journal-title":"J. Chem. Inf. Model."},{"key":"991_CR57","doi-asserted-by":"publisher","first-page":"3186","DOI":"10.1021\/jm401411z","volume":"57","author":"G Maggiora","year":"2014","unstructured":"Maggiora, G., Vogt, M., Stumpfe, D. & Bajorath, J. Molecular similarity in medicinal chemistry. J. Med. Chem. 57, 3186\u20133204 (2014).","journal-title":"J. Med. Chem."},{"key":"991_CR58","unstructured":"Maggiora, G. M. Concepts and Applications of Molecular Similarity (eds Johnson, M. A. & Maggiora, G. M.) (John Wiley & Sons, 1990)."},{"key":"991_CR59","doi-asserted-by":"publisher","first-page":"1345","DOI":"10.1109\/TKDE.2009.191","volume":"22","author":"SJ Pan","year":"2010","unstructured":"Pan, S. J. & Yang, Q. A survey on transfer learning. IEEE Trans. Knowl. Data Eng. 22, 1345\u20131359 (2010).","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"991_CR60","doi-asserted-by":"publisher","first-page":"D1100","DOI":"10.1093\/nar\/gkr777","volume":"40","author":"A Gaulton","year":"2012","unstructured":"Gaulton, A. et al. ChEMBL: a large-scale bioactivity database for drug discovery. Nucleic Acids Res. 40, D1100\u2013D1107 (2012).","journal-title":"Nucleic Acids Res."},{"key":"991_CR61","unstructured":"MacQueen, J. Some methods for classification and analysis of multivariate observations. In Proc. Fifth Berkeley Symp. Math. Stat. Probab. (eds Marie Le Cam, L. & Neyman, J.) Vol. 1, 281\u2013298 (1967)."},{"key":"991_CR62","doi-asserted-by":"publisher","first-page":"1224","DOI":"10.1021\/acs.jcim.8b00150","volume":"58","author":"VB Siramshetty","year":"2018","unstructured":"Siramshetty, V. B., Chen, Q., Devarakonda, P. & Preissner, R. The catch-22 of predicting hERG blockade using publicly accessible bioactivity data. J. Chem. Inf. Model. 58, 1224\u20131233 (2018).","journal-title":"J. Chem. Inf. Model."},{"key":"991_CR63","doi-asserted-by":"crossref","unstructured":"Ho, T. K. Random decision forests. In Proc. 3rd International Conference on Document Analysis and Recognition Vol. 1, 278\u2013282 (1995).","DOI":"10.1109\/ICDAR.1995.598994"},{"key":"991_CR64","doi-asserted-by":"publisher","unstructured":"Hanser, T., Barber, C., Marchaland, J. F. & Werner, S. Applicability domain: towards a more formal definition. SAR QSAR Environ. Res. https:\/\/doi.org\/10.1080\/1062936X.2016.1250229 (2016) .","DOI":"10.1080\/1062936X.2016.1250229"},{"key":"991_CR65","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1186\/1758-2946-6-21","volume":"6","author":"T Hanser","year":"2014","unstructured":"Hanser, T. et al. Self organising hypothesis networks: a new approach for representing and structuring SAR knowledge. J. Cheminformatics 6, 21 (2014).","journal-title":"J. Cheminformatics"},{"key":"991_CR66","doi-asserted-by":"publisher","unstructured":"Carhart, R., Smith, D. H. & Venkataraghavan, R. Atom pairs as molecular features in structure-activity studies: definition and applications. J. Chem. Inf. Comput. Sci. https:\/\/doi.org\/10.1021\/ci00046a002 (1985).","DOI":"10.1021\/ci00046a002"},{"key":"991_CR67","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-019-0334-y","volume":"11","author":"T Hanser","year":"2019","unstructured":"Hanser, T., Steinmetz, F. P., Plante, J., Rippmann, F. & Krier, M. Avoiding hERG-liability in drug design via synergetic combinations of different (Q)SAR methodologies and data sources: a case study in an industrial setting. J. Cheminformatics 11, 9 (2019).","journal-title":"J. Cheminformatics"},{"key":"991_CR68","doi-asserted-by":"publisher","unstructured":"Hanser, T., Werner, S. & Plante, J. FLuID POC a simulation platform for federated distillation. Zenodo https:\/\/doi.org\/10.5281\/zenodo.14531198 (2024).","DOI":"10.5281\/zenodo.14531198"},{"key":"991_CR69","first-page":"2579","volume":"9","author":"L van der Maaten","year":"2008","unstructured":"van der Maaten, L. & Hinton, G. Visualizing data using t-SNE. J. Mach. Learn. Res. 9, 2579\u20132605 (2008).","journal-title":"J. Mach. Learn. Res."}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-00991-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-00991-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-00991-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,22]],"date-time":"2025-04-22T15:20:37Z","timestamp":1745335237000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-00991-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,5]]},"references-count":69,"journal-issue":{"issue":"3","published-online":{"date-parts":[[2025,3]]}},"alternative-id":["991"],"URL":"https:\/\/doi.org\/10.1038\/s42256-025-00991-2","relation":{},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,5]]},"assertion":[{"value":"29 February 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 January 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 March 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests, except for R.J.B. who is an employee and shareholder of Sanofi, a pharmaceutical R&D company that may benefit from the outcome of this research.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}