{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T13:36:19Z","timestamp":1772890579740,"version":"3.50.1"},"reference-count":84,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,2,27]],"date-time":"2025-02-27T00:00:00Z","timestamp":1740614400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,2,27]],"date-time":"2025-02-27T00:00:00Z","timestamp":1740614400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"European Union\u2019s Horizon 2020 research and innovation program","award":["956832"],"award-info":[{"award-number":["956832"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"DOI":"10.1186\/s13321-025-00970-0","type":"journal-article","created":{"date-parts":[[2025,2,28]],"date-time":"2025-02-28T12:58:16Z","timestamp":1740747496000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Pretraining graph transformers with atom-in-a-molecule quantum properties for improved ADMET modeling"],"prefix":"10.1186","volume":"17","author":[{"given":"Alessio","family":"Fallani","sequence":"first","affiliation":[]},{"given":"Ramil","family":"Nugmanov","sequence":"additional","affiliation":[]},{"given":"Jose","family":"Arjona-Medina","sequence":"additional","affiliation":[]},{"given":"J\u00f6rg Kurt","family":"Wegner","sequence":"additional","affiliation":[]},{"given":"Alexandre","family":"Tkatchenko","sequence":"additional","affiliation":[]},{"given":"Kostiantyn","family":"Chernichenko","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,27]]},"reference":[{"key":"970_CR1","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevLett.108.058301","volume":"108","author":"M Rupp","year":"2012","unstructured":"Rupp M, Tkatchenko A, M\u00fcller K-R, von Lilienfeld OA (2012) Fast and accurate modeling of molecular atomization energies with machine learning. Phys Rev Lett 108:058301","journal-title":"Phys Rev Lett"},{"key":"970_CR2","doi-asserted-by":"publisher","first-page":"2326","DOI":"10.1021\/acs.jpclett.5b00831","volume":"6","author":"K Hansen","year":"2015","unstructured":"Hansen K, Biegler F, Ramakrishnan R, Pronobis W, von Lilienfeld OA, M\u00fcller K-R, Tkatchenko A (2015) Machine learning predictions of molecular properties: accurate many-body potentials and nonlocality in chemical space. J Phys Chem Lett 6:2326\u20132331","journal-title":"J Phys Chem Lett"},{"key":"970_CR3","doi-asserted-by":"publisher","first-page":"1883","DOI":"10.1007\/978-3-319-44677-6_67","volume-title":"Handbook of materials modeling: methods: theory and modeling","author":"B Huang","year":"2020","unstructured":"Huang B, Symonds NO, von Lilienfeld OA (2020) Handbook of materials modeling: methods: theory and modeling. Springer International Publishing, Cham, pp 1883\u20131909"},{"key":"970_CR4","doi-asserted-by":"publisher","first-page":"1241","DOI":"10.1016\/j.drudis.2018.01.039","volume":"23","author":"H Chen","year":"2018","unstructured":"Chen H, Engkvist O, Wang Y, Olivecrona M, Blaschke T (2018) The rise of deep learning in drug discovery. Drug Discov Today 23:1241\u20131250","journal-title":"Drug Discov Today"},{"key":"970_CR5","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1038\/d41573-022-00025-1","volume":"21","author":"MK Jayatunga","year":"2022","unstructured":"Jayatunga MK, Xie W, Ruder L, Schulze U, Meier C (2022) AI in small-molecule drug discovery: a coming wave. Nat Rev Drug Discov 21:175\u2013176","journal-title":"Nat Rev Drug Discov"},{"key":"970_CR6","doi-asserted-by":"publisher","first-page":"954","DOI":"10.1111\/cbdd.13750","volume":"98","author":"M Bule","year":"2021","unstructured":"Bule M, Jalalimanesh N, Bayrami Z, Baeeri M, Abdollahi M (2021) The rise of deep learning and transformations in bioactivity prediction power of molecular modeling tools. Chem Biol Drug Des 98:954\u2013967","journal-title":"Chem Biol Drug Des"},{"key":"970_CR7","doi-asserted-by":"publisher","first-page":"1353","DOI":"10.1038\/s41551-022-00942-x","volume":"6","author":"MM Li","year":"2022","unstructured":"Li MM, Huang K, Zitnik M (2022) Graph representation learning in biomedicine and healthcare. Nat Biomed Eng 6:1353\u20131369","journal-title":"Nat Biomed Eng"},{"key":"970_CR8","doi-asserted-by":"publisher","first-page":"8705","DOI":"10.1021\/acs.jmedchem.0c00385","volume":"63","author":"KV Chuang","year":"2020","unstructured":"Chuang KV, Gunsalus LM, Keiser MJ (2020) Learning molecular representations for medicinal chemistry. J Med Chem 63:8705\u20138722","journal-title":"J Med Chem"},{"key":"970_CR9","doi-asserted-by":"publisher","first-page":"674","DOI":"10.1039\/D2DD00099G","volume":"2","author":"J Born","year":"2023","unstructured":"Born J, Markert G, Janakarajan N, Kimber TB, Volkamer A, Mart\u00ednez MR, Manica M (2023) Chemical representation learning for toxicity prediction. Digit Discov 2:674\u2013691","journal-title":"Digit Discov"},{"key":"970_CR10","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1038\/s42256-022-00447-x","volume":"4","author":"Y Wang","year":"2022","unstructured":"Wang Y, Wang J, Cao Z, Barati Farimani A (2022) Molecular contrastive learning of representations via graph neural networks. Nat Mach Intell 4:279\u2013287","journal-title":"Nat Mach Intell"},{"key":"970_CR11","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1021\/acs.jcim.3c01753","volume":"64","author":"B Kaufman","year":"2024","unstructured":"Kaufman B, Williams EC, Underkoffler C, Pederson R, Mardirossian N, Watson I, Parkhill J (2024) COATI: multimodal contrastive pretraining for representing and traversing chemical space. J Chem Inf Model 64:1145\u20131157","journal-title":"J Chem Inf Model"},{"key":"970_CR12","doi-asserted-by":"publisher","first-page":"2300059","DOI":"10.1002\/minf.202300059","volume":"42","author":"A Ilnicka","year":"2023","unstructured":"Ilnicka A, Schneider G (2023) Compression of molecular fingerprints with autoencoder networks. Mol Inf 42:2300059","journal-title":"Mol Inf"},{"key":"970_CR13","unstructured":"Sanchez-Fernandez A, Rumetshofer E, Hochreiter S, Klambauer G. Contrastive learning of image- and structure-based representations in drug discovery. ICLR2022 Machine Learning for Drug Discovery. 2022"},{"key":"970_CR14","doi-asserted-by":"publisher","first-page":"542","DOI":"10.1038\/s42256-023-00654-0","volume":"5","author":"Y Fang","year":"2023","unstructured":"Fang Y, Zhang Q, Zhang N, Chen Z, Zhuang X, Shao X, Fan X, Chen H (2023) Knowledge graph-enhanced molecular contrastive learning with functional prompt. Nat Mach Intell 5:542\u2013553","journal-title":"Nat Mach Intell"},{"key":"970_CR15","doi-asserted-by":"publisher","first-page":"085","DOI":"10.1093\/bioinformatics\/btad085","volume":"39","author":"J Wen","year":"2023","unstructured":"Wen J et al (2023) Multimodal representation learning for predicting molecule-disease relations. Bioinformatics 39:085","journal-title":"Bioinformatics"},{"key":"970_CR16","unstructured":"Su B, Du D, Yang Z, Zhou Y, Li J, Rao A, Sun H, Lu Z, Wen J-R. A molecular multimodal foundation model associating molecule graphs with natural language. 2022. arXiv:2209.05481"},{"key":"970_CR17","unstructured":"Wang Z, Jiang T, Wang J, Xuan Q. Multi-modal representation learning for molecular property prediction: sequence, graph, geometry. 2024. arXiv:2401.03369"},{"key":"970_CR18","doi-asserted-by":"publisher","first-page":"3408","DOI":"10.1021\/acs.jcim.0c00451","volume":"60","author":"X Gao","year":"2020","unstructured":"Gao X, Ramezanghorbani F, Isayev O, Smith JS, Roitberg AE (2020) TorchANI: a free and open source PyTorch-based deep learning implementation of the ANI neural network potentials. J Chem Inf Model 60:3408\u20133415","journal-title":"J Chem Inf Model"},{"key":"970_CR19","first-page":"992","volume":"30","author":"K Sch\u00fctt","year":"2017","unstructured":"Sch\u00fctt K, Kindermans P-J, Sauceda Felix HE, Chmiela S, Tkatchenko A, M\u00fcller K-R (2017) SchNet: a continuous-filter convolutional neural network for modeling quantum interactions. Adv Neural Inf Process Syst 30:992\u20131002","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR20","doi-asserted-by":"publisher","first-page":"2453","DOI":"10.1038\/s41467-022-29939-5","volume":"13","author":"S Batzner","year":"2022","unstructured":"Batzner S, Musaelian A, Sun L, Geiger M, Mailoa JP, Kornbluth M, Molinari N, Smidt TE, Kozinsky B (2022) E(3)-equivariant graph neural networks for data-efficient and accurate interatomic potentials. Nat Commun 13:2453","journal-title":"Nat Commun"},{"key":"970_CR21","doi-asserted-by":"publisher","first-page":"6395","DOI":"10.1038\/s41467-023-41948-6","volume":"14","author":"J Deng","year":"2023","unstructured":"Deng J, Yang Z, HW, et al (2023) A systematic study of key elements underlying molecular property prediction. Nat Commun 14:6395","journal-title":"Nat Commun"},{"key":"970_CR22","doi-asserted-by":"publisher","first-page":"8736","DOI":"10.1021\/acs.chemrev.3c00189","volume":"123","author":"B Dou","year":"2023","unstructured":"Dou B, Zhu Z, Merkurjev E, Ke L, Chen L, Jiang J, Zhu Y, Liu J, Zhang B, Wei G-W (2023) Machine learning methods for small data challenges in molecular science. Chem Rev 123:8736\u20138780","journal-title":"Chem Rev"},{"key":"970_CR23","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1186\/s13321-019-0391-2","volume":"11","author":"M Glavatskikh","year":"2019","unstructured":"Glavatskikh M, Leguy J, Hunault G, Cauchy T, Da Mota B (2019) Dataset\u2019s chemical diversity limits the generalizability of machine learning predictions. J Cheminform 11:69","journal-title":"J Cheminform"},{"key":"970_CR24","doi-asserted-by":"crossref","unstructured":"Ektefaie Y, Shen A, Bykova D, Marin M, Zitnik M, Farhat M. Evaluating generalizability of artificial intelligence models for molecular datasets. 2024. bioRxiv","DOI":"10.1101\/2024.02.25.581982"},{"key":"970_CR25","doi-asserted-by":"publisher","first-page":"2100321","DOI":"10.1002\/minf.202100321","volume":"41","author":"F Broccatelli","year":"2022","unstructured":"Broccatelli F, Trager R, Reutlinger M, Karypis G, Li M (2022) Benchmarking accuracy and generalizability of four graph neural networks using large in vitro ADME datasets from different chemical spaces. Mol Inf 41:2100321","journal-title":"Mol Inf"},{"key":"970_CR26","doi-asserted-by":"publisher","first-page":"1045","DOI":"10.1080\/17460441.2021.1901685","volume":"16","author":"Z David","year":"2021","unstructured":"David Z, Huang JCB, Bahmanyar SS (2021) The challenges of generalizability in artificial intelligence for ADME\/Tox endpoint and activity prediction. Expert Opin Drug Discov 16:1045\u20131056","journal-title":"Expert Opin Drug Discov"},{"key":"970_CR27","doi-asserted-by":"publisher","first-page":"9816","DOI":"10.1021\/acs.chemrev.1c00107","volume":"121","author":"JA Keith","year":"2021","unstructured":"Keith JA, Vassilev-Galindo V, Cheng B, Chmiela S, Gastegger M, M\u00fcller K-R, Tkatchenko A (2021) Combining machine learning and computational chemistry for predictive insights into chemical systems. Chem Rev 121:9816\u20139872","journal-title":"Chem Rev"},{"key":"970_CR28","unstructured":"OpenAI et\u00a0al. GPT-4 Technical Report. 2024. arXiv:2303.08774"},{"key":"970_CR29","unstructured":"Touvron H, Lavril T, Izacard G, Martinet X, Lachaux M-A, Lacroix T, Rozi\u00e8re B, Goyal N, Hambro E, Azhar F, Rodriguez A, Joulin A, Grave E, Lample G. LLaMA: Open and Efficient Foundation Language Models. 2023. arXiv:2302.13971"},{"key":"970_CR30","doi-asserted-by":"publisher","first-page":"5077","DOI":"10.1021\/acs.jctc.3c00289","volume":"19","author":"Y Wang","year":"2023","unstructured":"Wang Y, Xu C, Li Z, Barati Farimani A (2023) Denoise pretraining on nonequilibrium molecules for accurate and transferable neural potentials. J Chem Theory Comput 19:5077\u20135087","journal-title":"J Chem Theory Comput"},{"key":"970_CR31","doi-asserted-by":"crossref","unstructured":"Xia J, Zhao C, Hu B, Gao Z, Tan C, Liu Y, Li S, Li SZ. Mole-BERT: Rethinking Pre-training Graph Neural Networks for Molecules. The Eleventh International Conference on Learning Representations. 2023","DOI":"10.26434\/chemrxiv-2023-dngg4"},{"key":"970_CR32","doi-asserted-by":"crossref","unstructured":"Xia J, Zhu Y, Du Y, Li SZ. A Systematic Survey of Chemical Pre-trained Models. Proceedings of the Thirty-Second International Joint Conference on Artificial Intelligence, IJCAI-23. Survey Track. 2023. pp 6787\u20136795","DOI":"10.24963\/ijcai.2023\/760"},{"key":"970_CR33","unstructured":"Hu W, Liu B, Gomes J, Zitnik M, Liang P, Pande V, Leskovec J. Strategies for Pre-training Graph Neural Networks. International Conference on Learning Representations. 2020"},{"key":"970_CR34","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1021\/ci049687n","volume":"45","author":"ME Beck","year":"2005","unstructured":"Beck ME (2005) Do fukui function maxima relate to sites of metabolism? A critical case study. J Chem Inf Model 45:273\u2013282","journal-title":"J Chem Inf Model"},{"key":"970_CR35","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2023.106744","volume":"157","author":"X Wang","year":"2023","unstructured":"Wang X, Wang L, Wang S, Ren Y, Chen W, Li X, Han P, Song T (2023) QuantumTox: utilizing quantum chemistry with ensemble learning for molecular toxicity prediction. Comput Biol Med 157:106744","journal-title":"Comput Biol Med"},{"key":"970_CR36","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1002\/9783527611249.ch24","volume-title":"Pesticide Chemistry","author":"ME Beck","year":"2007","unstructured":"Beck ME, Schindler M (2007) Pesticide Chemistry. John Wiley & Sons, Ltd, Hoboken, pp 227\u2013238"},{"key":"970_CR37","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/j.ddtec.2020.06.004","volume":"32\u201333","author":"AH G\u00f6ller","year":"2019","unstructured":"G\u00f6ller AH (2019) The art of atom descriptor design. Drug Discov Today Technol 32\u201333:37\u201343","journal-title":"Drug Discov Today Technol"},{"key":"970_CR38","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1038\/s41597-021-00812-2","volume":"8","author":"J Hoja","year":"2021","unstructured":"Hoja J, Medrano Sandonas L, Ernst BG, Vazquez-Mayagoitia A, DiStasio RA Jr, Tkatchenko A (2021) QM7-X, a comprehensive dataset of quantum-mechanical properties spanning the chemical space of small organic molecules. Sci Data 8:43","journal-title":"Sci Data"},{"key":"970_CR39","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1038\/s41597-024-03521-8","volume":"11","author":"L Medrano Sandonas","year":"2024","unstructured":"Medrano Sandonas L, Van Rompaey D, Fallani A, Hilfiker M, Hahn D, Perez-Benito L, Verhoeven J, Tresadern G, Kurt Wegner J, Ceulemans H, Tkatchenko A (2024) Dataset for quantum-mechanical exploration of conformers and solvent effects in large drug-like molecules. Sci Data 11:742","journal-title":"Sci Data"},{"key":"970_CR40","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1038\/s41597-022-01390-7","volume":"9","author":"C Isert","year":"2022","unstructured":"Isert C, Atz K, Jim\u00e9nez-Luna J, Schneider G, QMugs, (2022) quantum mechanical properties of drug-like molecules. Sci Data 9:273","journal-title":"Sci Data"},{"key":"970_CR41","doi-asserted-by":"publisher","first-page":"15010","DOI":"10.1038\/npjcompumats.2015.10","volume":"1","author":"S Kirklin","year":"2015","unstructured":"Kirklin S, Saal JE, Meredig B, Thompson A, Doak JW, Aykol M, R\u00fchl S, Wolverton C (2015) The open quantum materials database (OQMD): assessing the accuracy of DFT formation energies. NPJ Comput Mater 1:15010","journal-title":"NPJ Comput Mater"},{"key":"970_CR42","doi-asserted-by":"publisher","first-page":"5891","DOI":"10.1021\/acs.jcim.0c00740","volume":"60","author":"M Nakata","year":"2020","unstructured":"Nakata M, Shimazaki T, Hashimoto M, Maeda T (2020) PubChemQC PM6: data sets of 221 million molecules with optimized molecular geometries and electronic properties. J Chem Inf Model 60:5891\u20135899","journal-title":"J Chem Inf Model"},{"key":"970_CR43","doi-asserted-by":"publisher","first-page":"6059","DOI":"10.1021\/acscatal.0c04525","volume":"11","author":"L Chanussot","year":"2021","unstructured":"Chanussot L et al (2021) Open catalyst 2020 (OC20) dataset and community challenges. ACS Catal 11:6059\u20136072","journal-title":"ACS Catal"},{"key":"970_CR44","doi-asserted-by":"publisher","DOI":"10.1126\/sciadv.1603015","volume":"3","author":"S Chmiela","year":"2017","unstructured":"Chmiela S, Tkatchenko A, Sauceda HE, Poltavsky I, Sch\u00fctt KT, M\u00fcller K-R (2017) Machine learning of accurate energy-conserving molecular force fields. Sci Adv 3:e1603015","journal-title":"Sci Adv"},{"key":"970_CR45","doi-asserted-by":"publisher","first-page":"2241","DOI":"10.1021\/jz200866s","volume":"2","author":"J Hachmann","year":"2011","unstructured":"Hachmann J, Olivares-Amaya R, Atahan-Evrenk S, Amador-Bedolla C, S\u00e1nchez-Carrera RS, Gold-Parker A, Vogt L, Brockway AM, Aspuru-Guzik A (2011) The harvard clean energy project: large-scale computational screening and design of organic photovoltaics on the world community grid. J Phys Chem Lett 2:2241\u20132251","journal-title":"J Phys Chem Lett"},{"key":"970_CR46","doi-asserted-by":"publisher","first-page":"711","DOI":"10.1007\/s10822-014-9747-x","volume":"28","author":"DL Mobley","year":"2014","unstructured":"Mobley DL, Guthrie JP (2014) FreeSolv: a database of experimental and calculated hydration free energies, with input files. J Comput Aided Mol Des 28:711\u2013720","journal-title":"J Comput Aided Mol Des"},{"key":"970_CR47","doi-asserted-by":"publisher","first-page":"D1045","DOI":"10.1093\/nar\/gkv1072","volume":"44","author":"MK Gilson","year":"2015","unstructured":"Gilson MK, Liu T, Baitaluk M, Nicola G, Hwang L, Chong J (2015) BindingDB in 2015: a public database for medicinal chemistry, computational chemistry and systems pharmacology. Nucleic Acids Res 44:D1045\u2013D1053","journal-title":"Nucleic Acids Res"},{"key":"970_CR48","doi-asserted-by":"publisher","DOI":"10.1063\/1.5023802","volume":"148","author":"JS Smith","year":"2018","unstructured":"Smith JS, Nebgen B, Lubbers N, Isayev O, Roitberg AE (2018) Less is more: sampling chemical space with active learning. J Chem Phys 148:241733","journal-title":"J Chem Phys"},{"key":"970_CR49","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2017.193","volume":"4","author":"JS Smith","year":"2017","unstructured":"Smith JS, Isayev O, Roitberg AE (2017) ANI-1, a data set of 20 million calculated off-equilibrium conformations for organic molecules. Sci Data 4:170193","journal-title":"Sci Data"},{"key":"970_CR50","unstructured":"Kl\u00e4ser K, Banaszewski B, Maddrell-Mander S, McLean C, M\u00fcller L, Parviz A, Huang S, Fitzgibbon A. MiniMol: A Parameter-Efficient Foundation Model for Molecular Learning. 2024. arXiv:2404.14986"},{"key":"970_CR51","doi-asserted-by":"publisher","first-page":"5028","DOI":"10.1021\/acs.jcim.4c00772","volume":"64","author":"J Kim","year":"2024","unstructured":"Kim J, Chang W, Ji H, Joung I (2024) Quantum-informed molecular representation learning enhancing ADMET property prediction. J Chem Inf Model 64:5028\u20135040","journal-title":"J Chem Inf Model"},{"key":"970_CR52","unstructured":"Raja A, Zhao H, Tyrchan C, Nittinger E, Bronstein MM, Deane C, Morris GM. On the Effectiveness of Quantum Chemistry Pre-training for Pharmacological Property Prediction. ICML 2024 AI for Science Workshop. 2024"},{"key":"970_CR53","unstructured":"Beaini D et\u00a0al. Towards foundational models for molecular learning on large-scale multi-task datasets. The Twelfth International Conference on Learning Representations. 2024"},{"key":"970_CR54","doi-asserted-by":"publisher","first-page":"6336","DOI":"10.1021\/acs.jcim.2c00245","volume":"62","author":"MA Lim","year":"2022","unstructured":"Lim MA, Yang S, Mai H, Cheng AC (2022) Exploring deep learning of quantum chemical properties for absorption, distribution, metabolism, and excretion predictions. J Chem Inf Model 62:6336\u20136341","journal-title":"J Chem Inf Model"},{"key":"970_CR55","unstructured":"Shoghi N, Kolluru A, Kitchin JR, Ulissi ZW, Zitnick CL, Wood BM. From molecules to materials: pre-training large generalizable models for atomic property prediction. ICLR. 2024"},{"key":"970_CR56","first-page":"28877","volume":"34","author":"C Ying","year":"2021","unstructured":"Ying C, Cai T, Luo S, Zheng S, Ke G, He D, Shen Y, Liu T-Y (2021) Do transformers really perform badly for graph representation? Adv Neural Inf Process Syst 34:28877\u201328888","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR57","doi-asserted-by":"publisher","first-page":"3307","DOI":"10.1021\/acs.jcim.2c00344","volume":"62","author":"R Nugmanov","year":"2022","unstructured":"Nugmanov R, Dyubankova N, Gedich A, Wegner JK (2022) Bidirectional graphormer for reactivity understanding: neural network trained to reaction atom-to-atom mapping task. J Chem Inf Model 62:3307\u20133315","journal-title":"J Chem Inf Model"},{"key":"970_CR58","unstructured":"M\u00fcller L, Galkin M, Morris C, Ramp\u00e1\u0161ek L. Attending to Graph Transformers. Transactions on Machine Learning Research. 2024"},{"key":"970_CR59","doi-asserted-by":"publisher","first-page":"2198","DOI":"10.1039\/D0SC04823B","volume":"12","author":"Y Guan","year":"2021","unstructured":"Guan Y, Coley CW, Wu H, Ranasinghe D, Heid E, Struble TJ, Pattanaik L, Green WH, Jensen KF (2021) Regio-selectivity prediction with a machine-learned reaction representation and on-the-fly quantum mechanical descriptors. Chem Sci 12:2198\u20132208","journal-title":"Chem Sci"},{"key":"970_CR60","doi-asserted-by":"publisher","first-page":"1300","DOI":"10.1021\/acs.jcim.7b00083","volume":"57","author":"M Nakata","year":"2017","unstructured":"Nakata M, Shimazaki T (2017) PubChemQC project: a large-scale first-principles electronic structure database for data-driven chemistry. J Chem Inf Model 57:1300\u20131308","journal-title":"J Chem Inf Model"},{"key":"970_CR61","doi-asserted-by":"publisher","first-page":"1033","DOI":"10.1038\/s41589-022-01131-2","volume":"18","author":"K Huang","year":"2022","unstructured":"Huang K, Fu T, Gao W, Zhao Y, Roohani Y, Leskovec J, Coley CW, Xiao C, Sun J, Zitnik M (2022) Artificial intelligence foundation for therapeutic science. Nat Chem Biol 18:1033\u20131036","journal-title":"Nat Chem Biol"},{"key":"970_CR62","doi-asserted-by":"crossref","unstructured":"Abnar S, Zuidema WH. Quantifying Attention Flow in Transformers. 2020. arXiv:2005.00928","DOI":"10.18653\/v1\/2020.acl-main.385"},{"key":"970_CR63","unstructured":"Devlin J, Chang M-W, Lee K, Toutanova K. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. 2018"},{"key":"970_CR64","unstructured":"Fabian B, Edlich T, Gaspar H, Segler MHS, Meyers J, Fiscato M, Ahmed M. Molecular representation learning with language models and domain-relevant auxiliary tasks. CoRR. 2020. arXiv:2011.13230"},{"key":"970_CR65","unstructured":"Dong Y, Cordonnier J-B, Loukas A. Attention is Not All You Need: Pure Attention Loses Rank Doubly Exponentially with Depth. 2023. arXiv:2103.03404"},{"key":"970_CR66","unstructured":"Topping J, Giovanni FD, Chamberlain BP, Dong X, Bronstein MM. Understanding over-squashing and bottlenecks on graphs via curvature. International Conference on Learning Representations. 2022"},{"key":"970_CR67","unstructured":"Arjona-Medina J, Nugmanov R. Analysis of Atom-level pretraining with Quantum Mechanics (QM) data for Graph Neural Networks Molecular property models. 2024. arXiv:2405.14837"},{"key":"970_CR68","doi-asserted-by":"crossref","unstructured":"Fallani A, Arjona-Medina J, Chernichenko K, Nugmanov R, Wegner JK, Tkatchenko A. Atom-Level Quantum Pretraining Enhances the Spectral Perception of Molecular Graphs in Graphormer. AI in Drug Discovery. Cham, 2025. pp 71\u201381","DOI":"10.1007\/978-3-031-72381-0_7"},{"key":"970_CR69","unstructured":"Fabian B, Edlich T, Gaspar H, Segler M, Meyers J, Fiscato M, Ahmed M (2020) Molecular representation learning with language models and domain-relevant auxiliary tasks. Proc. NeurIPS 2020 Workshop on Machine Learning for Molecules. 2020"},{"key":"970_CR70","doi-asserted-by":"crossref","unstructured":"McInnes L, Healy J, Melville J. UMAP: Uniform Manifold Approximation and Projection for Dimension Reduction. 2018. arXiv:1802.03426","DOI":"10.21105\/joss.00861"},{"key":"970_CR71","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1111\/j.1467-9868.2005.00503.x","volume":"67","author":"H Zou","year":"2005","unstructured":"Zou H, Hastie T (2005) Regularization and variable selection via the elastic net. J R Stat Soc Ser B Stat Methodol 67:301\u2013320","journal-title":"J R Stat Soc Ser B Stat Methodol"},{"key":"970_CR72","unstructured":"Shi H, GAO J, Xu H, Liang X, Li Z, Kong L, Lee SMS, Kwok J. Revisiting Over-smoothing in BERT from the Perspective of Graph. International Conference on Learning Representations. 2022"},{"key":"970_CR73","first-page":"54250","volume":"36","author":"L Noci","year":"2023","unstructured":"Noci L, Li C, Li M, He B, Hofmann T, Maddison CJ, Roy D (2023) The shaped transformer: attention models in the infinite depth-and-width limit. Adv Neural Inf Process Syst 36:54250\u201354281","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR74","first-page":"27198","volume":"35","author":"L Noci","year":"2022","unstructured":"Noci L, Anagnostidis S, Biggio L, Orvieto A, Singh SP, Lucchi A (2022) Signal propagation in transformers: theoretical perspectives and the role of rank collapse. Adv Neural Inf Process Syst 35:27198\u201327211","journal-title":"Adv Neural Inf Process Syst"},{"key":"970_CR75","unstructured":"Roth A, Bause F, Kriege NM, Liebig T. Preventing Representational Rank Collapse in MPNNs by Splitting the Computational Graph. The Third Learning on Graphs Conference. 2024"},{"key":"970_CR76","unstructured":"Roth A, Liebig T. Rank Collapse Causes Over-Smoothing and Over-Correlation in Graph Neural Networks. Proceedings of the Second Learning on Graphs Conference. 2024; pp 35:1\u201335:23"},{"key":"970_CR77","doi-asserted-by":"publisher","first-page":"1749","DOI":"10.1002\/jcc.21177","volume":"30","author":"S Van Damme","year":"2009","unstructured":"Van Damme S, Bultinck P (2009) Conceptual DFT properties-based 3D QSAR: analysis of inhibitors of the nicotine metabolizing CYP2A6 enzyme. J Comput Chem 30:1749\u20131757","journal-title":"J Comput Chem"},{"key":"970_CR78","doi-asserted-by":"publisher","first-page":"589","DOI":"10.3109\/03602539709037593","volume":"29","author":"DF Lewis","year":"1997","unstructured":"Lewis DF (1997) Quantitative structure-activity relationships in substrates, inducers, and inhibitors of cytochrome P4501 (CYP1). Drug Metab Rev 29:589\u2013650","journal-title":"Drug Metab Rev"},{"key":"970_CR79","doi-asserted-by":"publisher","first-page":"1822","DOI":"10.1002\/jcc.21455","volume":"31","author":"C Ai","year":"2010","unstructured":"Ai C, Li Y, Wang Y, Li W, Dong P, Ge G, Yang L (2010) Investigation of binding features: effects on the interaction between CYP2A6 and inhibitors. J Comput Chem 31:1822\u20131831","journal-title":"J Comput Chem"},{"key":"970_CR80","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1016\/j.comptc.2015.03.004","volume":"1060","author":"S Kaya","year":"2015","unstructured":"Kaya S, Kaya C (2015) A new method for calculation of molecular hardness: a theoretical study. Comput Theor Chem 1060:66\u201370","journal-title":"Comput Theor Chem"},{"key":"970_CR81","unstructured":"Bruna J, Zaremba W, Szlam A, LeCun Y. Spectral Networks and Locally Connected Networks on Graphs. 2014. arXiv:1312.6203"},{"key":"970_CR82","unstructured":"Kipf TN, Welling M. Semi-Supervised Classification with Graph Convolutional Networks. 2017. arXiv:1609.02907"},{"key":"970_CR83","unstructured":"Hammond DK, Vandergheynst P, Gribonval R. Wavelets on Graphs via Spectral Graph Theory. 2009. arXiv:0912.3848"},{"key":"970_CR84","unstructured":"Defferrard M, Bresson X, Vandergheynst P. Convolutional Neural Networks on Graphs with Fast Localized Spectral Filtering. 2017. arXiv:1606.09375"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-025-00970-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13321-025-00970-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-025-00970-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,28]],"date-time":"2025-02-28T12:58:30Z","timestamp":1740747510000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-025-00970-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,27]]},"references-count":84,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["970"],"URL":"https:\/\/doi.org\/10.1186\/s13321-025-00970-0","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,27]]},"assertion":[{"value":"11 October 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 February 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 February 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"25"}}