{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T16:54:32Z","timestamp":1772816072773,"version":"3.50.1"},"reference-count":81,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T00:00:00Z","timestamp":1770163200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T00:00:00Z","timestamp":1772755200000},"content-version":"vor","delay-in-days":30,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/s12859-026-06376-5","type":"journal-article","created":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T09:04:24Z","timestamp":1770195864000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Design and evaluation of semantically-valid negative samples integration techniques for scalable semi-automated drug repurposing prediction pipelines in rare disease research"],"prefix":"10.1186","volume":"27","author":[{"given":"Niccol\u00f2","family":"Bianchi","sequence":"first","affiliation":[]},{"given":"Armel E. J. L.","family":"Lefebvre","sequence":"additional","affiliation":[]},{"given":"Katherine J.","family":"Wolstencroft","sequence":"additional","affiliation":[]},{"given":"Marco","family":"Spruit","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,4]]},"reference":[{"key":"6376_CR1","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1016\/j.tips.2021.01.003","volume":"42","author":"HI Roessler","year":"2021","unstructured":"Roessler HI, Knoers NVAM, van Haelst MM, van Haaften G. Drug repurposing for rare diseases. Trends Pharmacol Sci. 2021;42:255\u201367. https:\/\/doi.org\/10.1016\/j.tips.2021.01.003.","journal-title":"Trends Pharmacol Sci"},{"key":"6376_CR2","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1038\/s41576-023-00683-w","volume":"25","author":"KD Kernohan","year":"2024","unstructured":"Kernohan KD, Boycott KM. The expanding diagnostic toolbox for rare genetic diseases. Nat Rev Genet. 2024;25:37\u201349. https:\/\/doi.org\/10.1038\/s41576-023-00683-w.","journal-title":"Nat Rev Genet"},{"key":"6376_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s12276-024-01243-w","volume":"9","author":"H Hwang","year":"2024","unstructured":"Hwang H, Jeon H, Yeo N, Baek D. Big data and deep learning for RNA biology. Nature. 2024;9:1\u201313. https:\/\/doi.org\/10.1038\/s12276-024-01243-w.","journal-title":"Nature"},{"key":"6376_CR4","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1186\/s13023-020-01376-x","volume":"15","author":"K Kerr","year":"2020","unstructured":"Kerr K, McAneney H, Smyth LJ, Bailie C, McKee S, McKnight AJ. A scoping review and proposed workflow for multi-omic rare disease research. Orphanet J Rare Dis. 2020;15:107. https:\/\/doi.org\/10.1186\/s13023-020-01376-x.","journal-title":"Orphanet J Rare Dis"},{"key":"6376_CR5","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1016\/j.ajhg.2015.06.009","volume":"97","author":"JX Chong","year":"2015","unstructured":"...Chong JX, Buckingham KJ, Jhangiani SN, Boehm C, Sobreira N, Smith JD, et al. The genetic basis of mendelian phenotypes: discoveries, challenges, and opportunities. Am J Hum Genet. 2015;97:199\u2013215. https:\/\/doi.org\/10.1016\/j.ajhg.2015.06.009.","journal-title":"Am J Hum Genet"},{"key":"6376_CR6","doi-asserted-by":"publisher","first-page":"704","DOI":"10.3390\/ijerph18020704","volume":"18","author":"D Rojas-Rueda","year":"2021","unstructured":"Rojas-Rueda D, Morales-Zamora E, Alsufyani WA, Herbst CH, AlBalawi SM, Alsukait R, et al. Environmental risk factors and health: an umbrella review of meta-analyses. Int J Environ Res Public Health. 2021;18:704. https:\/\/doi.org\/10.3390\/ijerph18020704.","journal-title":"Int J Environ Res Public Health"},{"key":"6376_CR7","unstructured":"National Organization for Rare Disorders: Barriers to Rare Disease Diagnosis, Care and Treatment in the US: A 30-Year Comparative Analysis. Report (2020). https:\/\/rarediseases.org\/wp-content\/uploads\/2020\/11\/NRD-2088-Barriers-30-Yr-Survey-Report_FNL-2.pdf"},{"key":"6376_CR8","doi-asserted-by":"publisher","first-page":"2928","DOI":"10.1111\/poms.13255","volume":"29","author":"AM Subramanian","year":"2020","unstructured":"Subramanian AM, L\u00e9vesque M, van de Vrande V. \u201cPulling the plug:\u2019\u2019 time allocation between drug discovery and development projects. Prod Oper Manag. 2020;29:2928\u201341. https:\/\/doi.org\/10.1111\/poms.13255.","journal-title":"Prod Oper Manag"},{"key":"6376_CR9","doi-asserted-by":"publisher","first-page":"627","DOI":"10.3390\/molecules26030627","volume":"26","author":"BG de la Torre","year":"2021","unstructured":"de la Torre BG, Albericio F. The pharmaceutical industry in 2020. An analysis of FDA drug approvals from the perspective of molecules. Molecules. 2021;26:627. https:\/\/doi.org\/10.3390\/molecules26030627.","journal-title":"Molecules"},{"issue":"7","key":"6376_CR10","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1038\/s41573-025-01164-x","volume":"24","author":"Z Tanoli","year":"2025","unstructured":"...Tanoli Z, Fern\u00e1ndez-Torras A, \u00d6zcan UO, Kushnir A, Nader KM, Gadiya Y, et al. Computational drug repurposing: approaches, evaluation of in silico resources and case studies. Nat Rev Drug Discov. 2025;24(7):521\u201342. https:\/\/doi.org\/10.1038\/s41573-025-01164-x.","journal-title":"Nat Rev Drug Discov"},{"issue":"9","key":"6376_CR11","doi-asserted-by":"publisher","first-page":"977","DOI":"10.1080\/17460441.2021.1883585","volume":"16","author":"Z Tanoli","year":"2021","unstructured":"Tanoli Z, V\u00e4h\u00e4-Koskela M, Aittokallio T. Artificial intelligence, machine learning, and drug repurposing in cancer. Expert Opin Drug Discov. 2021;16(9):977\u201389. https:\/\/doi.org\/10.1080\/17460441.2021.1883585.","journal-title":"Expert Opin Drug Discov"},{"key":"6376_CR12","doi-asserted-by":"publisher","DOI":"10.1101\/2025.08.18.670836","author":"S Savander","year":"2025","unstructured":"Savander S, Curabaz NN, Abbasi AM, Khan A, Saeed K, Tanoli Z. Data-driven strategies for drug repurposing: insights, recommendations, and case studies. bioRxiv. 2025. https:\/\/doi.org\/10.1101\/2025.08.18.670836.","journal-title":"bioRxiv"},{"key":"6376_CR13","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1186\/s13023-016-0475-2","volume":"11","author":"E Mina","year":"2016","unstructured":"Mina E, van Roon-Mom W, Hettne K, van Zwet E, Goeman J, Neri C, et al. Common disease signatures from gene expression analysis in Huntington\u2019s disease human blood and brain. Orphanet J Rare Dis. 2016;11:97. https:\/\/doi.org\/10.1186\/s13023-016-0475-2.","journal-title":"Orphanet J Rare Dis"},{"key":"6376_CR14","doi-asserted-by":"publisher","DOI":"10.1101\/cshperspect.a024240","volume":"7","author":"M Jimenez-Sanchez","year":"2017","unstructured":"Jimenez-Sanchez M, Licitra F, Underwood BR, Rubinsztein DC. Huntington\u2019s disease: mechanisms of pathogenesis and therapeutic strategies. Cold Spring Harb Perspect Med. 2017;7:024240. https:\/\/doi.org\/10.1101\/cshperspect.a024240.","journal-title":"Cold Spring Harb Perspect Med"},{"key":"6376_CR15","doi-asserted-by":"publisher","first-page":"165","DOI":"10.2174\/1570159X16666180302115032","volume":"17","author":"S Jamwal","year":"2019","unstructured":"Jamwal S, Kumar P. Insight into the emerging role of striatal neurotransmitters in the pathophysiology of Parkinson\u2019s disease and Huntington\u2019s disease: a review. Curr Neuropharmacol. 2019;17:165\u201375. https:\/\/doi.org\/10.2174\/1570159X16666180302115032.","journal-title":"Curr Neuropharmacol"},{"key":"6376_CR16","doi-asserted-by":"publisher","first-page":"497","DOI":"10.1007\/978-1-4939-7825-0","volume-title":"Huntington\u2019s disease","author":"RM Lane","year":"2018","unstructured":"Lane RM, Smith A, Baumann T, Gleichmann M, Norris D, Bennett CF, et al. Translating antisense technology into a treatment for Huntington\u2019s disease. In: Precious SV, Rosser AE, Dunnett SB, editors. Huntington\u2019s disease, vol. 1780. Springer; 2018. p. 497\u2013523. https:\/\/doi.org\/10.1007\/978-1-4939-7825-0."},{"key":"6376_CR17","doi-asserted-by":"publisher","first-page":"1128562","DOI":"10.3389\/fphar.2023.1128562","volume":"14","author":"A Ambesi-Impiombato","year":"2023","unstructured":"Ambesi-Impiombato A, Cox K, Ramboz S, Brunner D, Bansal M, Leahy E. Enrichment analysis of phenotypic data for drug repurposing in rare diseases. Front Pharmacol. 2023;14:1128562. https:\/\/doi.org\/10.3389\/fphar.2023.1128562.","journal-title":"Front Pharmacol"},{"key":"6376_CR18","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1186\/1752-0509-6-63","volume":"6","author":"MC Oldham","year":"2012","unstructured":"Oldham MC, Langfelder P, Horvath S. Network methods for describing sample relationships in genomic datasets: application to Huntington\u2019s disease. BMC Syst Biol. 2012;6:63. https:\/\/doi.org\/10.1186\/1752-0509-6-63.","journal-title":"BMC Syst Biol"},{"key":"6376_CR19","doi-asserted-by":"publisher","first-page":"553","DOI":"10.1002\/mds.28866","volume":"37","author":"A Mohan","year":"2022","unstructured":"Mohan A, Sun Z, Ghosh S, Li Y, Sathe S, Hu J, et al. A machine-learning derived Huntington\u2019s disease progression model: insights for clinical trial design. Mov Disord. 2022;37:553\u201362. https:\/\/doi.org\/10.1002\/mds.28866.","journal-title":"Mov Disord"},{"key":"6376_CR20","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1038\/s41597-024-03171-w","volume":"11","author":"TJ Callahan","year":"2024","unstructured":"...Callahan TJ, Tripodi IJ, Stefanski AL, Cappelletti L, Taneja SB, Wyrwa JM, et al. An open source knowledge graph ecosystem for the life sciences. Sci Data. 2024;11:363. https:\/\/doi.org\/10.1038\/s41597-024-03171-w.","journal-title":"Sci Data"},{"key":"6376_CR21","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2016.18","volume":"3","author":"MD Wilkinson","year":"2016","unstructured":"...Wilkinson MD, Dumontier M, Aalbersberg IJJ, Appleton G, Axton M, Baak A, et al. The fair guiding principles for scientific data management and stewardship. Sci Data. 2016;3:160018. https:\/\/doi.org\/10.1038\/sdata.2016.18.","journal-title":"Sci Data"},{"key":"6376_CR22","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1162\/dint_a_00049","volume":"2","author":"M van Reisen","year":"2020","unstructured":"van Reisen M, Stokmans M, Basajja M, Ong\u2019ayo AO, Kirkpatrick C, Mons B. Towards the tipping point for fair implementation. Data Intell. 2020;2:264\u201375. https:\/\/doi.org\/10.1162\/dint_a_00049.","journal-title":"Data Intell"},{"key":"6376_CR23","unstructured":"National Institutes of Health: 2023 NIH Data Management and Sharing Policy 2023. https:\/\/oir.nih.gov\/sourcebook\/intramural-program-oversight\/intramural-data-sharing\/2023-nih-data-management-sharing-policy"},{"key":"6376_CR24","doi-asserted-by":"publisher","first-page":"15733","DOI":"10.1016\/j.heliyon.2023.e15733","volume":"9","author":"A Mart\u00ednez-Garc\u00eda","year":"2023","unstructured":"Mart\u00ednez-Garc\u00eda A, Alvarez-Romero C, Rom\u00e1n-Villar\u00e1n E, Bernabeu-Wittel M, Luis Parra-Calder\u00f3n C. Fair principles to improve the impact on health research management outcomes. Heliyon. 2023;9:15733. https:\/\/doi.org\/10.1016\/j.heliyon.2023.e15733.","journal-title":"Heliyon"},{"key":"6376_CR25","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1162\/dint_r_00024","volume":"2","author":"A Jacobsen","year":"2020","unstructured":"...Jacobsen A, de Miranda Azevedo R, Juty N, Batista D, Coles S, Cornet R, et al. Fair principles: interpretations and implementation considerations. Data Intell. 2020;2:10\u201329. https:\/\/doi.org\/10.1162\/dint_r_00024.","journal-title":"Data Intell"},{"key":"6376_CR26","doi-asserted-by":"publisher","first-page":"622","DOI":"10.1038\/s41597-022-01710-x","volume":"9","author":"M Barker","year":"2022","unstructured":"Barker M, Chue Hong NP, Katz DS, Lamprecht A, Martinez-Ortiz C, Psomopoulos F, et al. Introducing the fair principles for research software. Sci Data. 2022;9:622. https:\/\/doi.org\/10.1038\/s41597-022-01710-x.","journal-title":"Sci Data"},{"key":"6376_CR27","doi-asserted-by":"publisher","first-page":"1003285","DOI":"10.1371\/journal.pcbi.1003285","volume":"9","author":"GK Sandve","year":"2013","unstructured":"Sandve GK, Nekrutenko A, Taylor J, Hovig E. Ten simple rules for reproducible computational research. PLoS Comput Biol. 2013;9:1003285. https:\/\/doi.org\/10.1371\/journal.pcbi.1003285.","journal-title":"PLoS Comput Biol"},{"key":"6376_CR28","doi-asserted-by":"publisher","first-page":"845","DOI":"10.1093\/nar\/gkz1021","volume":"48","author":"J Pi\u00f1ero","year":"2020","unstructured":"Pi\u00f1ero J, Ram\u00edrez-Anguita JM, Sa\u00fcch-Pitarch J, Ronzano F, Centeno E, Sanz F, et al. The disgenet knowledge platform for disease genomics: 2019 update. Nucleic Acids Res. 2020;48:845\u201355. https:\/\/doi.org\/10.1093\/nar\/gkz1021.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR29","doi-asserted-by":"publisher","first-page":"20869","DOI":"10.1038\/s41598-022-24980-2","volume":"12","author":"Y Wang","year":"2022","unstructured":"Wang Y, Aldahdooh J, Hu Y, Yang H, V\u00e4h\u00e4-Koskela M, Tang J, et al. Drugrepo: a novel approach to repurposing drugs based on chemical and genomic features. Sci Rep. 2022;12:20869. https:\/\/doi.org\/10.1038\/s41598-022-24980-2.","journal-title":"Sci Rep"},{"key":"6376_CR30","doi-asserted-by":"publisher","first-page":"015","DOI":"10.1093\/database\/baaa015","volume":"2020","author":"N Queralt-Rosinach","year":"2020","unstructured":"Queralt-Rosinach N, Stupp GS, Li TS, Mayers M, Hoatlin ME, Might M, et al. Structured review for data and knowledge-drive research. Database. 2020;2020:015. https:\/\/doi.org\/10.1093\/database\/baaa015.","journal-title":"Database"},{"key":"6376_CR31","unstructured":"Reep CAT. Automated drug repurposing workflow for rare diseases 2022. https:\/\/theses.liacs.nl\/2302"},{"key":"6376_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.drudis.2022.03.006","volume":"27","author":"C Choudhury","year":"2022","unstructured":"Choudhury C, Murugan NA, Priyakumar UD. Structure-based drug repurposing: traditional and advanced AI\/ML-aided methods. Drug Discov Today. 2022;27:103307. https:\/\/doi.org\/10.1016\/j.drudis.2022.03.006.","journal-title":"Drug Discov Today"},{"key":"6376_CR33","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1038\/s41597-023-01960-3","volume":"10","author":"P Chandak","year":"2023","unstructured":"Chandak P, Huang K, Zitnik M. Building a knowledge graph to enable precision medicine. Sci Data. 2023;10:67. https:\/\/doi.org\/10.1038\/s41597-023-01960-3.","journal-title":"Sci Data"},{"key":"6376_CR34","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1002\/jcc.21334","volume":"31","author":"O Trott","year":"2010","unstructured":"Trott O, Olson AJ. AutoDock Vina: improving the speed and accuracy of docking with a new scoring function, efficient optimization, and multithreading. J Comput Chem. 2010;31:455\u201361. https:\/\/doi.org\/10.1002\/jcc.21334.","journal-title":"J Comput Chem"},{"key":"6376_CR35","doi-asserted-by":"publisher","first-page":"492","DOI":"10.1038\/s41586-024-07487-w","volume":"636","author":"J Abramson","year":"2024","unstructured":"Abramson J, Adler J, Dunger J, Evans R, Green T, Pritzel A, et al. Accurate structure prediction of biomolecular interactions with AlphaFold 3. Nature. 2024;636:492\u2013500. https:\/\/doi.org\/10.1038\/s41586-024-07487-w.","journal-title":"Nature"},{"key":"6376_CR36","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1038\/s41586-021-03819-2","volume":"596","author":"J Jumper","year":"2021","unstructured":"Jumper J, Evans R, Pritzel A, Green T, Figurnov M, Ronneberger O, et al. Highly accurate protein structure prediction with AlphaFold. Nature. 2021;596:583\u20139. https:\/\/doi.org\/10.1038\/s41586-021-03819-2.","journal-title":"Nature"},{"key":"6376_CR37","doi-asserted-by":"publisher","first-page":"1605","DOI":"10.1002\/jcc.20084","volume":"25","author":"EF Pettersen","year":"2004","unstructured":"Pettersen EF, Goddard TD, Huang CC, Couch GS, Greenblatt DM, Meng EC, et al. Ucsf chimera-a visualization system for exploratory research and analysis. J Comput Chem. 2004;25:1605\u201312. https:\/\/doi.org\/10.1002\/jcc.20084.","journal-title":"J Comput Chem"},{"key":"6376_CR38","doi-asserted-by":"publisher","first-page":"1227","DOI":"10.1093\/nar\/gkad1040","volume":"52","author":"M Cannon","year":"2024","unstructured":"Cannon M, Stevenson J, Stahl K, Basu R, Coffman A, Kiwala S, et al. DGIdb 5.0: rebuilding the drug-gene interaction database for precision medicine and drug discovery platforms. Nucleic Acids Res. 2024;52:1227\u201335. https:\/\/doi.org\/10.1093\/nar\/gkad1040.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR39","doi-asserted-by":"publisher","first-page":"1102","DOI":"10.1093\/nar\/gky1033","volume":"47","author":"S Kim","year":"2019","unstructured":"Kim S, Chen J, Cheng T, Gindulyte A, He J, He S, et al. Pubchem 2019 update: improved access to chemical data. Nucleic Acids Res. 2019;47:1102\u20139. https:\/\/doi.org\/10.1093\/nar\/gky1033.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR40","doi-asserted-by":"publisher","first-page":"1180","DOI":"10.1093\/nar\/gkad1004","volume":"52","author":"B Zdrazil","year":"2024","unstructured":"Zdrazil B, Felix E, Hunter F, Manchado UJP, Zhang J, Rule A, et al. The ChEMBL database in 2023: a drug discovery platform spanning multiple bioactivity data types and time periods. Nucleic Acids Res. 2024;52:1180\u201392. https:\/\/doi.org\/10.1093\/nar\/gkad1004.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR41","doi-asserted-by":"publisher","first-page":"672","DOI":"10.1093\/nar\/gkad1025","volume":"52","author":"M Milacic","year":"2024","unstructured":"Milacic M, Haw R, Rothfels K, Wu G, Stein L, D\u2019Eustachio P. The reactome pathway knowledgebase 2024. Nucleic Acids Res. 2024;52:672\u20138. https:\/\/doi.org\/10.1093\/nar\/gkad1025.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR42","doi-asserted-by":"publisher","first-page":"605","DOI":"10.1093\/nar\/gkaa1074","volume":"49","author":"D Szklarczyk","year":"2021","unstructured":"Szklarczyk D, Gable AL, Lyon D, Junge A, Wyder S, Huerta-Cepas J, et al. The string database in 2021: customizable protein-protein networks, and functional characterization of user-uploaded gene\/measurement sets. Nucleic Acids Res. 2021;49:605\u201312. https:\/\/doi.org\/10.1093\/nar\/gkaa1074.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR43","doi-asserted-by":"publisher","first-page":"15545","DOI":"10.1073\/pnas.0506580102","volume":"102","author":"AM Subramanian","year":"2005","unstructured":"Subramanian AM, Tamayo P, Mootha VK, Mukherjee S, Ebert BL, Gillette MA, et al. Gene set enrichment analysis: A knowledge-based approach for interpreting genome-wide expression profiles. Proc Natl Acad Sci. 2005;102:15545\u201350. https:\/\/doi.org\/10.1073\/pnas.0506580102.","journal-title":"Proc Natl Acad Sci"},{"key":"6376_CR44","doi-asserted-by":"publisher","first-page":"452","DOI":"10.1093\/nar\/gkh052","volume":"32","author":"H Hermjakob","year":"2004","unstructured":"Hermjakob H, Montecchi-Palazzi L, Lewington C, Mudali S, Kerrien S, Orchard S, et al. Intact: an open source molecular interaction database. Nucleic Acids Res. 2004;32:452\u20135. https:\/\/doi.org\/10.1093\/nar\/gkh052.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR45","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1093\/nar\/gkw1092","volume":"45","author":"M Kanehisa","year":"2017","unstructured":"Kanehisa M, Furumichi M, Tanabe M, Sato Y, Morishima K. KEGG: new perspectives on genomes, pathways, diseases and drugs. Nucleic Acids Res. 2017;45:353\u201361. https:\/\/doi.org\/10.1093\/nar\/gkw1092.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR46","doi-asserted-by":"publisher","first-page":"2131","DOI":"10.1109\/TCBB.2019.2911071","volume":"17","author":"A Ogunleye","year":"2020","unstructured":"Ogunleye A, Wang Q. Xgboost model for chronic kidney disease diagnosis. IEEE\/ACM Trans Comput Biol Bioinf. 2020;17:2131\u201340. https:\/\/doi.org\/10.1109\/TCBB.2019.2911071.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"key":"6376_CR47","unstructured":"Fey M, Lenssen JE. fast graph representation learning with PyTorch geometric 2019. Preprint at arXiv:1903.02428"},{"key":"6376_CR48","unstructured":"Kipf TN, Welling M. Semi-supervised classification with graph convolutional networks. OpenReview.net. 2017. arXiv:1609.02907"},{"key":"6376_CR49","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1038\/s41392-024-01808-1","volume":"9","author":"Y Xia","year":"2024","unstructured":"Xia Y, Sun M, Huang H, Jin W-L. Drug repurposing for cancer therapy. Signal Transduct Target Ther. 2024;9:92. https:\/\/doi.org\/10.1038\/s41392-024-01808-1.","journal-title":"Signal Transduct Target Ther"},{"key":"6376_CR50","doi-asserted-by":"publisher","DOI":"10.1002\/alz.062169","volume":"18","author":"F Cheng","year":"2022","unstructured":"Cheng F, Fang J, Zhang P, Zhou Y, Chiang C-W, Tan J, et al. Sildenafil (Viagra) is a candidate drug for Alzheimer\u2019s disease. Alzheimer\u2019s Dementia. 2022;18:062169. https:\/\/doi.org\/10.1002\/alz.062169.","journal-title":"Alzheimer\u2019s Dementia"},{"key":"6376_CR51","doi-asserted-by":"publisher","first-page":"1057","DOI":"10.1080\/17460441.2021.1910673","volume":"16","author":"F MacLean","year":"2021","unstructured":"MacLean F. Knowledge graphs and their applications in drug discovery. Expert Opin Drug Discov. 2021;16:1057\u201369. https:\/\/doi.org\/10.1080\/17460441.2021.1910673.","journal-title":"Expert Opin Drug Discov"},{"key":"6376_CR52","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/s13326-024-00310-5","volume":"15","author":"L Vogt","year":"2024","unstructured":"Vogt L, Kuhn T, Hoehndorf R. Semantic units: organizing knowledge graphs into semantically meaningful units of representation. J Biomed Semant. 2024;15:3. https:\/\/doi.org\/10.1186\/s13326-024-00310-5.","journal-title":"J Biomed Semant"},{"key":"6376_CR53","doi-asserted-by":"publisher","first-page":"938","DOI":"10.1093\/nar\/gkad1082","volume":"52","author":"TE Putman","year":"2024","unstructured":"Putman TE, Schaper K, Matentzoglu N, Rubinetti VP, Alquaddoomi FS, Cox C, et al. The monarch initiative in 2024: an analytic platform integrating phenotypes, genes and diseases across species. Nucleic Acids Res. 2024;52:938\u201349. https:\/\/doi.org\/10.1093\/nar\/gkad1082.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR54","doi-asserted-by":"publisher","first-page":"667","DOI":"10.1016\/j.ins.2022.09.024","volume":"613","author":"R Miao","year":"2022","unstructured":"Miao R, Yang Y, Ma Y, Juan X, Xue H, Tang J, et al. Negative samples selecting strategy for graph contrastive learning. Inf Sci. 2022;613:667\u201381. https:\/\/doi.org\/10.1016\/j.ins.2022.09.024.","journal-title":"Inf Sci"},{"key":"6376_CR55","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2024.102563","volume":"102","author":"J Liu","year":"2024","unstructured":"Liu J, Hu F, Zou Q, Tiwari P, Wu H, Ding Y. Drug repositioning by multi-aspect heterogeneous graph contrastive learning and positive-fusion negative sampling strategy. Inf Fusion. 2024;102:102563. https:\/\/doi.org\/10.1016\/j.inffus.2024.102563.","journal-title":"Inf Fusion"},{"key":"6376_CR56","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1007\/978-3-031-60626-7_2","volume":"14664","author":"N Hubert","year":"2024","unstructured":"Hubert N, Monnin P, Brun A, Monticolo D. Treat different negatives differently: Enriching loss functions with domain and range constraints for link prediction. The Semant Web. 2024;14664:18\u201336. https:\/\/doi.org\/10.1007\/978-3-031-60626-7_2.","journal-title":"The Semant Web"},{"key":"6376_CR57","doi-asserted-by":"publisher","first-page":"396","DOI":"10.1093\/nar\/gkt1079","volume":"42","author":"P Blohm","year":"2014","unstructured":"Blohm P, Frishman G, Smialowski P, Goebels F, Wachinger B, Ruepp B, et al. Negatome 2.0: a database of non-interacting proteins derived by literature mining, manual annotation and protein structure analysis. Nucleic Acids Res. 2014;42:396\u2013400. https:\/\/doi.org\/10.1093\/nar\/gkt1079.","journal-title":"Nucleic Acids Res"},{"key":"6376_CR58","doi-asserted-by":"publisher","first-page":"1017","DOI":"10.1093\/bib\/bbw075","volume":"18","author":"D Alvarez-Ponce","year":"2017","unstructured":"Alvarez-Ponce D. Recording negative results of protein-protein interaction assays: an easy way to deal with the biases and errors of interactomic data sets. Brief Bioinform. 2017;18:1017\u201323. https:\/\/doi.org\/10.1093\/bib\/bbw075.","journal-title":"Brief Bioinform"},{"key":"6376_CR59","doi-asserted-by":"publisher","first-page":"2697","DOI":"10.1021\/acs.jcim.0c01489","volume":"61","author":"D Deng","year":"2021","unstructured":"Deng D, Chen X, Zhang R, Lei Z, Wang X, Zhou F. Xgraphboost: extracting graph neural network-based features for a better prediction of molecular properties. J Chem Inf Model. 2021;61:2697\u2013705. https:\/\/doi.org\/10.1021\/acs.jcim.0c01489.","journal-title":"J Chem Inf Model"},{"key":"6376_CR60","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939754","author":"A Grover","year":"2016","unstructured":"Grover A, Leskovec J. node2vec: scalable feature learning for networks. Assoc Comput Mach. 2016. https:\/\/doi.org\/10.1145\/2939672.2939754.","journal-title":"Assoc Comput Mach"},{"key":"6376_CR61","doi-asserted-by":"publisher","first-page":"494","DOI":"10.5195\/jmla.2018.512","volume":"106","author":"J Courneya","year":"2018","unstructured":"Courneya J, Mayo A. High-performance computing service for bioinformatics and data science. J Med Libr Assoc. 2018;106:494\u2013500. https:\/\/doi.org\/10.5195\/jmla.2018.512.","journal-title":"J Med Libr Assoc"},{"key":"6376_CR62","unstructured":"Cohen E. node2vec. GitHub repository. Python implementation of the node2vec algorithm 2020. https:\/\/github.com\/eliorc\/node2vec"},{"key":"6376_CR63","doi-asserted-by":"publisher","unstructured":"Bordes A, Usunier N, Garcia-Duran A, Weston J, Yakhnenko O. Translating embeddings for modeling multi-relational data. Curran Associates Inc. 2013. https:\/\/doi.org\/10.5555\/2999792.2999923","DOI":"10.5555\/2999792.2999923"},{"key":"6376_CR64","unstructured":"Yang B, Yih W, He X, Gao J, Deng L. Embedding Entities and Relations for Learning and Inference in Knowledge Bases 2015. https:\/\/arxiv.org\/abs\/1412.6575"},{"key":"6376_CR65","unstructured":"Trouillon T, Welbl J, Riedel S, Gaussier E, Bouchard G. Complex embeddings for simple link prediction. 2016. https:\/\/arxiv.org\/abs\/1606.06357"},{"key":"6376_CR66","doi-asserted-by":"crossref","unstructured":"Ristoski P, Paulheim H. Rdf2vec: Rdf graph embeddings for data mining. In: The semantic web \u2013 ISWC 2016. Springer; 2016. p. 498\u2013514.","DOI":"10.1007\/978-3-319-46523-4_30"},{"key":"6376_CR67","doi-asserted-by":"publisher","DOI":"10.3389\/fgene.2019.00381","author":"W Nelson","year":"2019","unstructured":"Nelson W, Zitnik M, Wang B, Leskovec J, Goldenberg A, Sharan R. To embed or not: network embedding as a paradigm in computational biology. Front Genet. 2019. https:\/\/doi.org\/10.3389\/fgene.2019.00381.","journal-title":"Front Genet"},{"issue":"4","key":"6376_CR68","doi-asserted-by":"publisher","first-page":"1241","DOI":"10.1093\/bioinformatics\/btz718","volume":"36","author":"X Yue","year":"2019","unstructured":"Yue X, Wang Z, Huang J, Parthasarathy S, Moosavinasab S, Huang Y, et al. Graph embedding on biomedical networks: methods, applications and evaluations. Bioinformatics. 2019;36(4):1241\u201351. https:\/\/doi.org\/10.1093\/bioinformatics\/btz718.","journal-title":"Bioinformatics"},{"key":"6376_CR69","doi-asserted-by":"publisher","first-page":"22829","DOI":"10.1007\/s00521-024-10425-6","volume":"36","author":"T Wallett","year":"2024","unstructured":"Wallett T, Jafari A. A benchmark for graph-based dynamic recommendation systems. Neural Comput Appl. 2024;36:22829\u201344. https:\/\/doi.org\/10.1007\/s00521-024-10425-6.","journal-title":"Neural Comput Appl"},{"key":"6376_CR70","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1007\/s40588-022-00183-1","volume":"9","author":"BF Wasswa","year":"2022","unstructured":"Wasswa BF, Kassaza K, Nielsen K, Bazira J. Minion whole-genome sequencing in resource-limited settings: challenges and opportunities. Curr Clin Microbiol Rep. 2022;9:125\u201335. https:\/\/doi.org\/10.1007\/s40588-022-00183-1.","journal-title":"Curr Clin Microbiol Rep"},{"key":"6376_CR71","doi-asserted-by":"publisher","first-page":"712","DOI":"10.1016\/j.drudis.2017.01.014","volume":"22","author":"B Schmidt","year":"2017","unstructured":"Schmidt B, Hildebrandt A. Next-generation sequencing: big data meets high performance computing. Drug Discov Today. 2017;22:712\u20137. https:\/\/doi.org\/10.1016\/j.drudis.2017.01.014.","journal-title":"Drug Discov Today"},{"key":"6376_CR72","doi-asserted-by":"publisher","first-page":"052","DOI":"10.1093\/gigascience\/giaa052","volume":"9","author":"A Petrini","year":"2020","unstructured":"Petrini A, Mesiti M, Schubach M, Frasca M, Danis D, Re M, et al. parSMURF, a high-performance computing tool for the genome-wide detection of pathogenic variants. Gigascience. 2020;9:052. https:\/\/doi.org\/10.1093\/gigascience\/giaa052.","journal-title":"Gigascience"},{"key":"6376_CR73","unstructured":"Bianchi N. OMIM-converter. GitHub repository. JavaScript tool for OMIM-MONDO data conversion 2024. https:\/\/github.com\/NCMBianchi\/OMIM-converter"},{"key":"6376_CR74","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1186\/s13321-022-00663-y","volume":"14","author":"A Lai","year":"2022","unstructured":"Lai A, Schaub J, Steinbeck C, Schymanski EL. An algorithm to classify homologous series within compound datasets. Journal of Cheminformatics. 2022;14:90. https:\/\/doi.org\/10.1186\/s13321-022-00663-y.","journal-title":"Journal of Cheminformatics"},{"key":"6376_CR75","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1021\/ci100050t","volume":"50","author":"D Rogers","year":"2010","unstructured":"Rogers D, Hahn M. Extended-connectivity fingerprints. J Chem Inf Model. 2010;50:742\u201354. https:\/\/doi.org\/10.1021\/ci100050t.","journal-title":"J Chem Inf Model"},{"issue":"4","key":"6376_CR76","doi-asserted-by":"publisher","first-page":"328","DOI":"10.1093\/bib\/bbae328","volume":"25","author":"A Ianevski","year":"2024","unstructured":"Ianevski A, Kushnir A, Nader K, Miihkinen M, Xhaard H, Aittokallio T, et al. Repurposedrugs: an interactive web-portal and predictive platform for repurposing mono- and combination therapies. Brief Bioinform. 2024;25(4):328. https:\/\/doi.org\/10.1093\/bib\/bbae328.","journal-title":"Brief Bioinform"},{"issue":"2","key":"6376_CR77","doi-asserted-by":"publisher","first-page":"1656","DOI":"10.1093\/bib\/bbaa003","volume":"22","author":"Z Tanoli","year":"2020","unstructured":"Tanoli Z, Seemab U, Scherer A, Wennerberg K, Tang J, V\u00e4h\u00e4-Koskela M. Exploration of databases and methods supporting drug repurposing: a comprehensive survey. Brief Bioinform. 2020;22(2):1656\u201378. https:\/\/doi.org\/10.1093\/bib\/bbaa003.","journal-title":"Brief Bioinform"},{"issue":"1","key":"6376_CR78","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1080\/17460441.2024.2430955","volume":"20","author":"Z Tanoli","year":"2025","unstructured":"Tanoli Z, Schulman A, Aittokallio T. Validation guidelines for drug-target prediction methods. Expert Opin Drug Discov. 2025;20(1):31\u201345. https:\/\/doi.org\/10.1080\/17460441.2024.2430955.","journal-title":"Expert Opin Drug Discov"},{"issue":"8","key":"6376_CR79","doi-asserted-by":"publisher","first-page":"496","DOI":"10.1093\/bioinformatics\/btae496","volume":"40","author":"A Schulman","year":"2024","unstructured":"Schulman A, Rousu J, Aittokallio T, Tanoli Z. Attention-based approach to predict drug\u2013target interactions across seven target superfamilies. Bioinformatics. 2024;40(8):496. https:\/\/doi.org\/10.1093\/bioinformatics\/btae496.","journal-title":"Bioinformatics"},{"issue":"D1","key":"6376_CR80","doi-asserted-by":"publisher","first-page":"1486","DOI":"10.1093\/nar\/gkae1127","volume":"53","author":"TT Duong Nguyen","year":"2024","unstructured":"Duong Nguyen TT, Tanoli Z, Hassan S, \u00d6zcan UO, Caroli J, Kooistra AJ, et al. PGxDB: an interactive web-platform for pharmacogenomics research. Nucleic Acids Res. 2024;53(D1):1486\u201397. https:\/\/doi.org\/10.1093\/nar\/gkae1127.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"6376_CR81","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1093\/bioadv\/vbae106","volume":"4","author":"J Aldahdooh","year":"2024","unstructured":"Aldahdooh J, Tanoli Z, Tang J. Mining drug\u2014target interactions from biomedical literature using chemical and gene descriptions-based ensemble transformer model. Bioinform Adv. 2024;4(1):106. https:\/\/doi.org\/10.1093\/bioadv\/vbae106.","journal-title":"Bioinform Adv"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12859-026-06376-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-026-06376-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-026-06376-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T10:44:55Z","timestamp":1772793895000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s12859-026-06376-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,4]]},"references-count":81,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["6376"],"URL":"https:\/\/doi.org\/10.1186\/s12859-026-06376-5","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,4]]},"assertion":[{"value":"22 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no Conflict of interest.Specifically, Bianchi declares no conflict of interests with Universit\u00e0 degli Studi (Milan, Italy) and Politecnico di Milano (Italy) \u2013where he was enrolled as a MSc student in \"Bioinformatics for Computational Genomics\" at the start of this project\u2013 and prof. Wolstencroft declares no conflict of interests withLeiden University \u2013where she was employed at the beginning of this project.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}],"article-number":"60"}}