{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T19:02:02Z","timestamp":1779217322432,"version":"3.51.4"},"reference-count":37,"publisher":"Oxford University Press (OUP)","issue":"2","license":[{"start":{"date-parts":[[2025,1,29]],"date-time":"2025-01-29T00:00:00Z","timestamp":1738108800000},"content-version":"vor","delay-in-days":1,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001691","name":"Society for the Promotion of Science","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001691","name":"Grants-in-Aid for Scientific Research","doi-asserted-by":"crossref","award":["21H04915"],"award-info":[{"award-number":["21H04915"]}],"id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/100009619","name":"Japan Agency for Medical Research and Development","doi-asserted-by":"publisher","award":["JP18km0405209"],"award-info":[{"award-number":["JP18km0405209"]}],"id":[{"id":"10.13039\/100009619","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,2,4]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>Identifying effective therapeutic targets poses a challenge in drug discovery, especially for uncharacterized diseases without known therapeutic targets (e.g. rare diseases, intractable diseases).<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>This study presents a novel machine learning approach using multimodal vector-quantized variational autoencoders (VQ-VAEs) for predicting therapeutic target molecules across diseases. To address the lack of known therapeutic target\u2013disease associations, we incorporate the information on uncharacterized diseases without known targets or uncharacterized proteins without known indications (applicable diseases) in the semi-supervised learning (SSL) framework. The method integrates disease-specific and protein perturbation profiles with genetic perturbations (e.g. gene knockdowns and gene overexpressions) at the transcriptome level. Cross-cell representation learning, facilitated by VQ-VAEs, was performed to extract informative features from protein perturbation profiles across diverse human cell types. Concurrently, cross-disease representation learning was performed, leveraging VQ-VAE, to extract informative features reflecting disease states from disease-specific profiles. The model\u2019s applicability to uncharacterized diseases or proteins is enhanced by considering the consistency between disease-specific and patient-specific signatures. The efficacy of the method is demonstrated across three practical scenarios for 79 diseases: target repositioning for target\u2013disease pairs, new target prediction for uncharacterized diseases, and new indication prediction for uncharacterized proteins. This method is expected to be valuable for identifying therapeutic targets across various diseases.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>Code: github.com\/YamanishiLab\/SSL-VQ and Data: 10.5281\/zenodo.14644837.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btaf039","type":"journal-article","created":{"date-parts":[[2025,1,30]],"date-time":"2025-01-30T00:18:56Z","timestamp":1738196336000},"source":"Crossref","is-referenced-by-count":1,"title":["SSL-VQ: vector-quantized variational autoencoders for semi-supervised prediction of therapeutic targets across diverse diseases"],"prefix":"10.1093","volume":"41","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1873-8639","authenticated-orcid":false,"given":"Satoko","family":"Namba","sequence":"first","affiliation":[{"name":"Department of Bioscience and Bioinformatics, Faculty of Computer Science and Systems Engineering, Kyushu Institute of Technology , Kawazu , Iizuka, Fukuoka, 820-8502,","place":["Japan"]},{"name":"Department of Complex Systems Science, Graduate School of Informatics, Nagoya University , Chikusa , Nagoya, Aichi, 464-8601,","place":["Japan"]}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chen","family":"Li","sequence":"additional","affiliation":[{"name":"Department of Bioscience and Bioinformatics, Faculty of Computer Science and Systems Engineering, Kyushu Institute of Technology , Kawazu , Iizuka, Fukuoka, 820-8502,","place":["Japan"]},{"name":"Department of Complex Systems Science, Graduate School of Informatics, Nagoya University , Chikusa , Nagoya, Aichi, 464-8601,","place":["Japan"]}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Noriko","family":"Yuyama Otani","sequence":"additional","affiliation":[{"name":"Department of Bioscience and Bioinformatics, Faculty of Computer Science and Systems Engineering, Kyushu Institute of Technology , Kawazu , Iizuka, Fukuoka, 820-8502,","place":["Japan"]},{"name":"Department of Complex Systems Science, Graduate School of Informatics, Nagoya University , Chikusa , Nagoya, Aichi, 464-8601,","place":["Japan"]}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yoshihiro","family":"Yamanishi","sequence":"additional","affiliation":[{"name":"Department of Bioscience and Bioinformatics, Faculty of Computer Science and Systems Engineering, Kyushu Institute of Technology , Kawazu , Iizuka, Fukuoka, 820-8502,","place":["Japan"]},{"name":"Department of Complex Systems Science, Graduate School of Informatics, Nagoya University , Chikusa , Nagoya, Aichi, 464-8601,","place":["Japan"]}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2025,1,28]]},"reference":[{"key":"2025030422240803200_btaf039-B1","doi-asserted-by":"crossref","first-page":"1438","DOI":"10.1093\/hmg\/ddq018","article-title":"Transcriptional changes in Huntington disease identified using genome-wide expression profiling and cross-platform analysis","volume":"19","author":"Becanovic","year":"2010","journal-title":"Hum Mol Genet"},{"key":"2025030422240803200_btaf039-B2","doi-asserted-by":"crossref","first-page":"6306","DOI":"10.1038\/s41467-021-26674-1","article-title":"Network analysis reveals rare disease signatures across multiple levels of biological organization","volume":"12","author":"Buphamalai","year":"2021","journal-title":"Nat Commun"},{"key":"2025030422240803200_btaf039-B3","doi-asserted-by":"crossref","first-page":"1696","DOI":"10.1101\/gad.267286.115","article-title":"ALS mutations in TLS\/FUS disrupt target gene expression","volume":"29","author":"Coady","year":"2015","journal-title":"Genes Dev"},{"key":"2025030422240803200_btaf039-B4","doi-asserted-by":"crossref","first-page":"2899","DOI":"10.1093\/hmg\/dds116","article-title":"Evaluating the role of the FUS\/TLS-related gene EWSR1 in amyotrophic lateral sclerosis","volume":"21","author":"Couthouis","year":"2012","journal-title":"Hum Mol Genet"},{"key":"2025030422240803200_btaf039-B5","doi-asserted-by":"crossref","first-page":"103329","DOI":"10.1016\/j.ebiom.2021.103329","article-title":"Evaluation of anti-TNF therapeutic response in patients with inflammatory bowel disease: current and novel biomarkers","volume":"66","author":"Cui","year":"2021","journal-title":"eBioMedicine"},{"key":"2025030422240803200_btaf039-B6","doi-asserted-by":"crossref","first-page":"64","DOI":"10.1038\/s41573-020-0087-3","article-title":"Improving target assessment in biomedical research: the GOT-IT recommendations","volume":"20","author":"Emmerich","year":"2021","journal-title":"Nat Rev Drug Discov"},{"key":"2025030422240803200_btaf039-B7","doi-asserted-by":"crossref","first-page":"939","DOI":"10.1021\/acscentsci.0c00229","article-title":"Deep docking: a deep learning platform for augmentation of structure based drug discovery","volume":"6","author":"Gentile","year":"2020","journal-title":"ACS Cent Sci"},{"key":"2025030422240803200_btaf039-B8","doi-asserted-by":"crossref","first-page":"76","DOI":"10.1038\/s41588-018-0286-6","article-title":"Discovery of common and rare genetic risk variants for colorectal cancer","volume":"51","author":"Huyghe","year":"2019","journal-title":"Nat Genet"},{"key":"2025030422240803200_btaf039-B9","doi-asserted-by":"crossref","first-page":"i191","DOI":"10.1093\/bioinformatics\/btz313","article-title":"Predicting drug-induced transcriptome responses of a wide range of human cell lines by a novel tensor-train decomposition algorithm","volume":"35","author":"Iwata","year":"2019","journal-title":"Bioinformatics"},{"key":"2025030422240803200_btaf039-B10","volume-title":"Encyclopedia of Molecular Targeting Therapies for Allergy and Autoimmune Diseases","author":"Kawai","year":"2013"},{"key":"2025030422240803200_btaf039-B11","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1093\/function\/zqad034","article-title":"Structure and function of RhoBTB1 required for substrate specificity and cullin-3 ubiquitination","volume":"4","author":"Kumar","year":"2023","journal-title":"Function"},{"key":"2025030422240803200_btaf039-B12","author":"Laine","year":"2016"},{"key":"2025030422240803200_btaf039-B13","doi-asserted-by":"crossref","first-page":"421624","DOI":"10.1155\/2015\/421624","article-title":"Cytokine dysregulation in MECP2- and CDKL5-Related rett syndrome: relationships with aberrant redox homeostasis, inflammation, and \u03c9-3 PUFAs","volume":"2015","author":"Leoncini","year":"2015","journal-title":"Oxid Med Cell Longev"},{"key":"2025030422240803200_btaf039-B14","doi-asserted-by":"crossref","first-page":"580","DOI":"10.1038\/ng.2653","article-title":"The Genotype-Tissue Expression (GTEx) project","volume":"45","author":"Lonsdale","year":"2013","journal-title":"Nat Genet"},{"key":"2025030422240803200_btaf039-B15","doi-asserted-by":"crossref","first-page":"i68","DOI":"10.1093\/bioinformatics\/btac240","article-title":"From drug repositioning to target repositioning: prediction of therapeutic targets using genetically perturbed transcriptomic signatures","volume":"38","author":"Namba","year":"2022","journal-title":"Bioinformatics"},{"key":"2025030422240803200_btaf039-B16","doi-asserted-by":"crossref","first-page":"46","DOI":"10.1186\/s12859-016-0890-3","article-title":"A multiple kernel learning algorithm for drug\u2013target interaction prediction","volume":"17","author":"Nascimento","year":"2016","journal-title":"BMC Bioinformatics"},{"key":"2025030422240803200_btaf039-B17","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1186\/s13059-022-02752-5","article-title":"Abnormal molecular signatures of inflammation, energy metabolism, and vesicle biology in human Huntington disease peripheral tissues","volume":"23","author":"Neueder","year":"2022","journal-title":"Genome Biol"},{"key":"2025030422240803200_btaf039-B18","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1007\/s00401-019-02093-x","article-title":"Proteomics in cerebrospinal fluid and spinal cord suggests UCHL1, MAP2 and GPNMB as biomarkers and underpins importance of transcriptional pathways in amyotrophic lateral sclerosis","volume":"139","author":"Oeckl","year":"2020","journal-title":"Acta Neuropathol"},{"key":"2025030422240803200_btaf039-B19","first-page":"142","author":"Omura","year":"2015"},{"key":"2025030422240803200_btaf039-B20","author":"Oshitani","year":"2016"},{"key":"2025030422240803200_btaf039-B21","volume-title":"Current Medical Diagnosis and Treatment 2014","author":"Papadakis","year":"2014"},{"key":"2025030422240803200_btaf039-B22","first-page":"1","article-title":"Polyp segmentation with consistency training and continuous update of pseudo-label","volume":"2022","author":"Park","year":"2022","journal-title":"Sci Rep"},{"key":"2025030422240803200_btaf039-B23","doi-asserted-by":"crossref","first-page":"180","DOI":"10.1016\/j.cyto.2015.10.002","article-title":"Cytokines profile and peripheral blood mononuclear cells morphology in Rett and autistic patients","volume":"77","author":"Pecorelli","year":"2016","journal-title":"Cytokine"},{"key":"2025030422240803200_btaf039-B24","doi-asserted-by":"crossref","first-page":"462","DOI":"10.1038\/sj.bjc.6605511","article-title":"Gene expression profiling identifies Fibronectin 1 and CXCL9 as candidate biomarkers for breast cancer screening","volume":"102","author":"Ruiz-Garcia","year":"2010","journal-title":"Br J Cancer"},{"key":"2025030422240803200_btaf039-B25","doi-asserted-by":"crossref","first-page":"15","DOI":"10.1016\/j.trsl.2016.10.009","article-title":"Using GWAS to identify novel therapeutic targets for osteoporosis","volume":"181","author":"Sabik","year":"2017","journal-title":"Transl Res"},{"key":"2025030422240803200_btaf039-B26","doi-asserted-by":"crossref","first-page":"290","DOI":"10.4103\/0975-7406.72128","article-title":"Orphan drug: development trends and strategies","volume":"2","author":"Sharma","year":"2010","journal-title":"J Pharm Bioallied Sci"},{"key":"2025030422240803200_btaf039-B27","doi-asserted-by":"crossref","first-page":"871","DOI":"10.1007\/s10038-007-0200-z","article-title":"SNPs in disease gene mapping, medicinal drug development and evolution","volume":"52","author":"Shastry","year":"2007","journal-title":"J Hum Genet"},{"key":"2025030422240803200_btaf039-B28","doi-asserted-by":"crossref","first-page":"1437","DOI":"10.1016\/j.cell.2017.10.049","article-title":"A next generation connectivity map: L1000 platform and the first 1,000,000 profiles","volume":"171","author":"Subramanian","year":"2017","journal-title":"Cell"},{"key":"2025030422240803200_btaf039-B29","doi-asserted-by":"crossref","first-page":"3049","DOI":"10.1016\/j.apsb.2022.02.002","article-title":"Why 90% of clinical drug development fails and how to improve it?","volume":"12","author":"Sun","year":"2022","journal-title":"Acta Pharm Sin B"},{"key":"2025030422240803200_btaf039-B30","first-page":"20987","article-title":"SQ-VAE: variational bayes on discrete representation with self-annealed stochastic quantization","volume":"162","author":"Takida","year":"2022","journal-title":"Proc Mach Learn Res"},{"key":"2025030422240803200_btaf039-B31","first-page":"6309","author":"Van Den Oord","year":"2017"},{"key":"2025030422240803200_btaf039-B32","doi-asserted-by":"crossref","first-page":"12846","DOI":"10.1038\/ncomms12846","article-title":"Extraction and analysis of signatures from the gene expression omnibus by the crowd","volume":"7","author":"Wang","year":"2016","journal-title":"Nat Commun"},{"key":"2025030422240803200_btaf039-B33","doi-asserted-by":"crossref","first-page":"1826","DOI":"10.1038\/s41467-017-01261-5","article-title":"Functional mapping and annotation of genetic associations with FUMA","volume":"8","author":"Watanabe","year":"2017","journal-title":"Nat Commun"},{"key":"2025030422240803200_btaf039-B34","first-page":"4067","article-title":"Increased expression of hub gene CXCL10 in peripheral blood mononuclear cells of patients with systemic lupus erythematosus","volume":"18","author":"Zhang","year":"2019","journal-title":"Exp Ther Med"},{"key":"2025030422240803200_btaf039-B35","first-page":"1","article-title":"Targeting the Wnt\/\u03b2-catenin signaling pathway in cancer","volume":"2020","author":"Zhang","year":"2020","journal-title":"J. Hematol. Oncol"},{"key":"2025030422240803200_btaf039-B36","doi-asserted-by":"crossref","first-page":"1208","DOI":"10.1161\/CIRCRESAHA.116.308544","article-title":"Loss of adult cardiac myocyte GSK-3 leads to mitotic catastrophe resulting in fatal dilated cardiomyopathy","volume":"118","author":"Zhou","year":"2016","journal-title":"Circ Res"},{"key":"2025030422240803200_btaf039-B37","first-page":"1","article-title":"Optimization of molecules via","volume":"9","author":"Zh","year":"2019","journal-title":"Deep Reinforcement Learn Sci Rep"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btaf039\/61686012\/btaf039.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/2\/btaf039\/61686012\/btaf039.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/2\/btaf039\/61686012\/btaf039.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,4]],"date-time":"2025-03-04T22:25:04Z","timestamp":1741127104000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btaf039\/7989445"}},"subtitle":[],"editor":[{"given":"Anthony","family":"Mathelier","sequence":"additional","affiliation":[],"role":[{"role":"editor","vocabulary":"crossref"}]}],"short-title":[],"issued":{"date-parts":[[2025,1,28]]},"references-count":37,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2025,2,4]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btaf039","relation":{},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2025,2]]},"published":{"date-parts":[[2025,1,28]]},"article-number":"btaf039"}}