{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T19:47:54Z","timestamp":1774554474023,"version":"3.50.1"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2023,8,14]],"date-time":"2023-08-14T00:00:00Z","timestamp":1691971200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2023,8,14]],"date-time":"2023-08-14T00:00:00Z","timestamp":1691971200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["ref. UIDB\/00408\/2020"],"award-info":[{"award-number":["ref. UIDB\/00408\/2020"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["ref. UIDB\/00408\/2020"],"award-info":[{"award-number":["ref. UIDB\/00408\/2020"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["ref. UIDB\/00408\/2020"],"award-info":[{"award-number":["ref. UIDB\/00408\/2020"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]},{"name":"LASIGE Research Unit","award":["ref. UIDP\/00408\/2020"],"award-info":[{"award-number":["ref. UIDP\/00408\/2020"]}]},{"name":"LASIGE Research Unit","award":["ref. UIDP\/00408\/2020"],"award-info":[{"award-number":["ref. UIDP\/00408\/2020"]}]},{"name":"LASIGE Research Unit","award":["ref. UIDP\/00408\/2020"],"award-info":[{"award-number":["ref. UIDP\/00408\/2020"]}]},{"name":"KATY Project with European Union\u2019s Horizon 2020 research","award":["No 101017453"],"award-info":[{"award-number":["No 101017453"]}]},{"name":"KATY Project with European Union\u2019s Horizon 2020 research","award":["No 101017453"],"award-info":[{"award-number":["No 101017453"]}]},{"name":"FCT PhD grant","award":["ref. SFRH\/BD\/145377\/2019"],"award-info":[{"award-number":["ref. SFRH\/BD\/145377\/2019"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Biomed Semant"],"abstract":"<jats:title>Abstract<\/jats:title><jats:sec>\n                <jats:title>Background<\/jats:title>\n                <jats:p>Predicting gene-disease associations typically requires exploring diverse sources of information as well as sophisticated computational approaches. Knowledge graph embeddings can help tackle these challenges by creating representations of genes and diseases based on the scientific knowledge described in ontologies, which can then be explored by machine learning algorithms. However, state-of-the-art knowledge graph embeddings are produced over a single ontology or multiple but disconnected ones, ignoring the impact that considering multiple interconnected domains can have on complex tasks such as gene-disease association prediction.<\/jats:p>\n              <\/jats:sec><jats:sec>\n                <jats:title>Results<\/jats:title>\n                <jats:p>We propose a novel approach to predict gene-disease associations using rich semantic representations based on knowledge graph embeddings over multiple ontologies linked by logical definitions and compound ontology mappings. The experiments showed that considering richer knowledge graphs significantly improves gene-disease prediction and that different knowledge graph embeddings methods benefit more from distinct types of semantic richness.<\/jats:p>\n              <\/jats:sec><jats:sec>\n                <jats:title>Conclusions<\/jats:title>\n                <jats:p>This work demonstrated the potential for knowledge graph embeddings across multiple and interconnected biomedical ontologies to support gene-disease prediction. It also paved the way for considering other ontologies or tackling other tasks where multiple perspectives over the data can be beneficial. All software and data are freely available.<\/jats:p>\n              <\/jats:sec>","DOI":"10.1186\/s13326-023-00291-x","type":"journal-article","created":{"date-parts":[[2023,8,14]],"date-time":"2023-08-14T16:02:12Z","timestamp":1692028932000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":24,"title":["Multi-domain knowledge graph embeddings for gene-disease association prediction"],"prefix":"10.1186","volume":"14","author":[{"given":"Susana","family":"Nunes","sequence":"first","affiliation":[]},{"given":"Rita\u00a0T.","family":"Sousa","sequence":"additional","affiliation":[]},{"given":"Catia","family":"Pesquita","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,8,14]]},"reference":[{"key":"291_CR1","doi-asserted-by":"publisher","unstructured":"Amberger J, Bocchini C, Schiettecatte F, Scott A, Hamosh A. OMIM.org: Online Mendelian Inheritance in Man (OMIM\u00ae), an Online catalog of human genes and genetic disorders. Nucleic Acids Res. 2014;43. https:\/\/doi.org\/10.1093\/nar\/gku1205.","DOI":"10.1093\/nar\/gku1205"},{"issue":"13","key":"291_CR2","doi-asserted-by":"publisher","first-page":"e0208626","DOI":"10.1371\/journal.pone.0208626","volume":"12","author":"M Asif","year":"2018","unstructured":"Asif M, Martiniano H, Couto F. Identifying disease genes using machine learning and gene functional similarities, assessed through Gene Ontology. PLoS ONE. 2018;12(13):e0208626. https:\/\/doi.org\/10.1371\/journal.pone.0208626.","journal-title":"PLoS ONE."},{"key":"291_CR3","doi-asserted-by":"publisher","first-page":"D845","DOI":"10.1093\/nar\/gkz1021","volume":"48","author":"J Pi\u00f1ero","year":"2019","unstructured":"Pi\u00f1ero J, Ram\u00edrez-Anguita JM, Sa\u00fcch-Pitarch J, Ronzano F, Centeno E, Sanz F, et al. The DisGeNET knowledge platform for disease genomics: 2019 update. Nucleic Acids Res. 2019;48:D845\u201355. https:\/\/doi.org\/10.1093\/nar\/gkz1021.","journal-title":"Nucleic Acids Res."},{"issue":"8","key":"291_CR4","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1101\/gr.9.8.677","volume":"9","author":"ST Sherry","year":"1999","unstructured":"Sherry ST, Ward M, Sirotkin K. dbSNP-database for single nucleotide polymorphisms and other classes of minor genetic variation. Genome Res. 1999;9(8):677\u20139.","journal-title":"Genome Res."},{"key":"291_CR5","doi-asserted-by":"publisher","unstructured":"Opap K, Mulder N. Recent advances in predicting gene-disease associations. F1000Research. 2017;6:578. https:\/\/doi.org\/10.12688\/f1000research.10788.1.","DOI":"10.12688\/f1000research.10788.1"},{"issue":"3","key":"291_CR6","doi-asserted-by":"publisher","first-page":"256","DOI":"10.1093\/bib\/bbl027","volume":"7","author":"O Bodenreider","year":"2006","unstructured":"Bodenreider O, Stevens R. Bio-ontologies: current trends and future directions. Brief Bioinforma. 2006;7(3):256\u201374. https:\/\/doi.org\/10.1093\/bib\/bbl027.","journal-title":"Brief Bioinforma."},{"key":"291_CR7","doi-asserted-by":"publisher","first-page":"489","DOI":"10.3233\/SW-160218","volume":"8","author":"H Paulheim","year":"2016","unstructured":"Paulheim H. Knowledge graph refinement: A survey of approaches and evaluation methods. Semantic Web. 2016;8:489\u2013508. https:\/\/doi.org\/10.3233\/SW-160218.","journal-title":"Semantic Web."},{"issue":"1","key":"291_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pcbi.1000641","volume":"6","author":"O Vanunu","year":"2010","unstructured":"Vanunu O, Magger O, Ruppin E, Shlomi T, Sharan R. Associating genes and protein complexes with disease via network propagation. PLoS Comput Biol. 2010;6(1):1\u20139.","journal-title":"PLoS Comput Biol"},{"key":"291_CR9","doi-asserted-by":"publisher","first-page":"i447","DOI":"10.1093\/bioinformatics\/bty289","volume":"34","author":"P Zakeri","year":"2018","unstructured":"Zakeri P, Simm J, Arany A, ElShal S, Moreau Y. Gene prioritization using Bayesian matrix factorization with genomic and phenotypic side information. Bioinformatics. 2018;34:i447\u201356.","journal-title":"Bioinformatics."},{"issue":"2","key":"291_CR10","doi-asserted-by":"publisher","first-page":"340","DOI":"10.1101\/gr.160325.113","volume":"24","author":"P Robinson","year":"2014","unstructured":"Robinson P, K\u00f6hler S, Oellrich A, Genetics S, Wang K, Mungall C, et al. Improved exome prioritization of disease genes through cross-species phenotype comparison. PCR Methods Appl. 2014;24(2):340\u20138. https:\/\/doi.org\/10.1101\/gr.160325.113.","journal-title":"PCR Methods Appl."},{"key":"291_CR11","doi-asserted-by":"publisher","first-page":"270","DOI":"10.3389\/fgene.2019.00270","volume":"10","author":"P Luo","year":"2019","unstructured":"Luo P, Xiao Q, Wei PJ, Liao B, Wu FX. Identifying disease-gene associations with graph-regularized manifold learning. Front Genet. 2019;10:270.","journal-title":"Front Genet"},{"key":"291_CR12","doi-asserted-by":"crossref","unstructured":"Pesquita C, Faria D, Falc\u00e3o A, Lord P, Couto F. Semantic similarity in biomedical ontologies. PLoS Comput Biol. 2009;5(1-12).","DOI":"10.1371\/journal.pcbi.1000443"},{"key":"291_CR13","doi-asserted-by":"publisher","first-page":"2724","DOI":"10.1109\/TKDE.2017.2754499","volume":"29","author":"Q Wang","year":"2017","unstructured":"Wang Q, Mao Z, Wang B, Guo L. Knowledge Graph Embedding: A Survey of Approaches and Applications. IEEE Trans Knowl Data Eng. 2017;29:2724\u201343.","journal-title":"IEEE Trans Knowl Data Eng."},{"issue":"12","key":"291_CR14","doi-asserted-by":"publisher","first-page":"2133","DOI":"10.1093\/bioinformatics\/bty933","volume":"35","author":"FZ Smaili","year":"2019","unstructured":"Smaili FZ, Gao X, Hoehndorf R. OPA2Vec: combining formal and informal content of biomedical ontologies to improve similarity-based prediction. Bioinformatics. 2019;35(12):2133\u201340.","journal-title":"Bioinformatics."},{"issue":"17","key":"291_CR15","doi-asserted-by":"publisher","first-page":"2723","DOI":"10.1093\/bioinformatics\/btx275","volume":"33","author":"M Alshahrani","year":"2017","unstructured":"Alshahrani M, Khan MA, Maddouri O, Kinjo AR, Queralt-Rosinach N, Hoehndorf R. Neuro-symbolic representation learning on biological knowledge graphs. Bioinformatics. 2017;33(17):2723\u201330. https:\/\/doi.org\/10.1093\/bioinformatics\/btx275.","journal-title":"Bioinformatics."},{"key":"291_CR16","doi-asserted-by":"crossref","unstructured":"Vilela J, Asif M, Marques AR, Santos JX, Rasga C, Vicente A, et al. Biomedical knowledge graph embeddings for personalized medicine: Predicting disease-gene associations. Expert Syst. 2022;40:e13181.","DOI":"10.1111\/exsy.13181"},{"key":"291_CR17","unstructured":"Nunes S, Sousa RT, Pesquita C. Predicting gene-disease associations with knowledge graph embeddings over multiple ontologies. Bio-Ontologies COSI (ISMB 2021). arXiv preprint arXiv:2105.04944. 2021."},{"key":"291_CR18","doi-asserted-by":"crossref","unstructured":"Kaufman S, Rosset S, Perlich C. Leakage in data mining: formulation, detection, and avoidance. In: ACM Transactions on Knowledge Discovery from Data (TKDD), volume 6, number 4. New York: ACM; 2012. p. 1\u201321.","DOI":"10.1145\/2382577.2382579"},{"key":"291_CR19","doi-asserted-by":"publisher","first-page":"D506","DOI":"10.1093\/nar\/gky1049","volume":"47","author":"UniProt Consortium","year":"2019","unstructured":"UniProt Consortium. UniProt: a worldwide hub of protein knowledge. Nucleic Acids Res. 2019;47:D506\u201315. https:\/\/doi.org\/10.1093\/nar\/gky1049.","journal-title":"Nucleic Acids Res."},{"key":"291_CR20","doi-asserted-by":"publisher","unstructured":"Wakap S, Lambert D, Olry A, Rodwell C, Gueydan C, Val\u00e9rie L, et\u00a0al. Estimating cumulative point prevalence of rare diseases: analysis of the Orphanet database. Eur J Hum Genet. 2019;28. https:\/\/doi.org\/10.1038\/s41431-019-0508-0.","DOI":"10.1038\/s41431-019-0508-0"},{"key":"291_CR21","doi-asserted-by":"publisher","first-page":"D1207","DOI":"10.1093\/nar\/gkaa1043","volume":"49","author":"S K\u00f6hler","year":"2021","unstructured":"K\u00f6hler S, Gargano MA, Matentzoglu N, Carmody L, Lewis-Smith D, Vasilevsky NA, et al. The Human Phenotype Ontology in 2021. Nucleic Acids Res. 2021;49:D1207\u201317.","journal-title":"Nucleic Acids Res."},{"key":"291_CR22","unstructured":"K\u00f6hler S, Carmody L, Vasilevsky N, Jacobsen J, Danis D, Gourdine JP, et al. Expansion of the Human Phenotype Ontology (HPO) knowledge base and resources. Nucleic Acids Res. 2019;47(D1018\u2013D1027)."},{"issue":"D1","key":"291_CR23","doi-asserted-by":"publisher","first-page":"D325","DOI":"10.1093\/nar\/gkaa1113","volume":"49","author":"Consortium TGO","year":"2020","unstructured":"Consortium TGO. The Gene Ontology resource: enriching a GOld mine. Nucleic Acids Res. 2020;49(D1):D325\u201334. https:\/\/doi.org\/10.1093\/nar\/gkaa1113.","journal-title":"Nucleic Acids Res."},{"key":"291_CR24","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"MM Ashburner","year":"2000","unstructured":"Ashburner MM, Ball CAC, Blake J, Botstein D, Butler H, Cherry JMJ, et al. Gene Ontology: tool for the unification of biology. The Gene Ontology Consortium. Nat Genet. 2000;25:25\u20139.","journal-title":"Nat Genet."},{"key":"291_CR25","doi-asserted-by":"publisher","first-page":"418","DOI":"10.1186\/1471-2105-12-418","volume":"12","author":"S K\u00f6hler","year":"2011","unstructured":"K\u00f6hler S, Bauer S, Mungall CJ, Carletti GON, Smith CL, Schofield PN, et al. Improving ontologies by automatic reasoning and evaluation of logical definitions. BMC Bioinformatics. 2011;12:418\u2013418.","journal-title":"BMC Bioinformatics."},{"key":"291_CR26","doi-asserted-by":"publisher","unstructured":"Oliveira D, Pesquita C. Improving the interoperability of biomedical ontologies with compound alignments. J Biomed Semant. 2018;9. https:\/\/doi.org\/10.1186\/s13326-017-0171-8.","DOI":"10.1186\/s13326-017-0171-8"},{"key":"291_CR27","unstructured":"Faria D, Pesquita C, Santos E, Cruz IF, Couto FM. AgreementMakerLight results for OAEI 2013. In: Shvaiko P, Euzenat J, Srinivas K, Mao M, Jim\u00e9nez-Ruiz E, editors. Proceedings of the 8th International Workshop on Ontology Matching, volume 1111 of CEUR Workshop Proceedings; 2013. p. 101\u20138."},{"key":"291_CR28","doi-asserted-by":"crossref","unstructured":"Faria D, Pesquita C, Santos E, Palmonari M, Cruz IF, Couto FM. The agreementmakerlight ontology matching system. In: OTM Confederated International Conferences \u201cOn the Move to Meaningful Internet Systems\u201d. Springer; 2013. p. 527\u2013541.","DOI":"10.1007\/978-3-642-41030-7_38"},{"key":"291_CR29","doi-asserted-by":"publisher","unstructured":"Kulmanov M, Smaili FZ, Gao X, Hoehndorf R. Semantic similarity and machine learning with ontologies. Brief Bioinforma. 2020;22. https:\/\/doi.org\/10.1093\/bib\/bbaa199.","DOI":"10.1093\/bib\/bbaa199"},{"key":"291_CR30","unstructured":"Bordes A, Usunier N, Garc\u00eda-Dur\u00e1n A, Weston J, Yakhnenko O. Translating embeddings for modeling multi-relational data. In: Advances in Neural Information Processing Systems (NIPS), volume 26: Curran Associates, Inc.; 2013."},{"key":"291_CR31","doi-asserted-by":"publisher","unstructured":"Zhang Z, Cai J, Zhang Y, Wang J. Learning hierarchy-aware knowledge graph embeddings for link prediction. Proceedings of the AAAI Conference on Artificial Intelligence. 2020;34(03):3065\u201372. https:\/\/doi.org\/10.1609\/aaai.v34i03.5701.","DOI":"10.1609\/aaai.v34i03.5701"},{"key":"291_CR32","unstructured":"Yang B, Yih SWt, He X, Gao J, Deng L. Embedding Entities and Relations for Learning and Inference in Knowledge Bases. In: Proceedings of the International Conference on Learning Representations (ICLR) 2015. 2015. https:\/\/www.microsoft.com\/en-us\/research\/publication\/embedding-entities-and-relations-for-learning-and-inference-in-knowledge-bases\/."},{"key":"291_CR33","doi-asserted-by":"publisher","unstructured":"Ristoski P, Paulheim H. RDF2Vec: RDF graph embeddings for data mining. In: Groth P, editor. The Semantic Web - ISWC 2016 : 15th International Semantic Web Conference, Kobe, Japan, October 17-21, 2016, Proceedings, Part I. vol. 9981. Cham: Springer International Publishing; 2016. p. 498\u2013514. https:\/\/doi.org\/10.1007\/978-3-319-46523-4_30.","DOI":"10.1007\/978-3-319-46523-4_30"},{"key":"291_CR34","doi-asserted-by":"crossref","unstructured":"Chen J, Hu P, Jimenez-Ruiz E, Holter OM, Antonyrajah D, Horrocks I. OWL2Vec*: embedding of OWL ontologies. Mach Learn. 2021;110(7):1813\u201345.","DOI":"10.1007\/s10994-021-05997-6"},{"key":"291_CR35","doi-asserted-by":"crossref","unstructured":"Grover A, Leskovec J. node2vec: Scalable Feature Learning for Networks. Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. 2016.","DOI":"10.1145\/2939672.2939754"},{"key":"291_CR36","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L. Machine Learning, Volume 45, Number 1 - SpringerLink. Mach Learn. 2001;45:5\u201332. https:\/\/doi.org\/10.1023\/A:1010933404324.","journal-title":"Mach Learn."},{"key":"291_CR37","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C. XGBoost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD '16. New York: Association for Computing Machinery; 2016. p. 785\u201394.","DOI":"10.1145\/2939672.2939785"}],"container-title":["Journal of Biomedical Semantics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13326-023-00291-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13326-023-00291-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13326-023-00291-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,17]],"date-time":"2023-11-17T13:39:19Z","timestamp":1700228359000},"score":1,"resource":{"primary":{"URL":"https:\/\/jbiomedsem.biomedcentral.com\/articles\/10.1186\/s13326-023-00291-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,14]]},"references-count":37,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2023,12]]}},"alternative-id":["291"],"URL":"https:\/\/doi.org\/10.1186\/s13326-023-00291-x","relation":{},"ISSN":["2041-1480"],"issn-type":[{"value":"2041-1480","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,8,14]]},"assertion":[{"value":"5 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 July 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 August 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"11"}}