{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T22:34:44Z","timestamp":1781822084597,"version":"3.54.5"},"reference-count":33,"publisher":"Oxford University Press (OUP)","issue":"Supplement_1","license":[{"start":{"date-parts":[[2025,7,15]],"date-time":"2025-07-15T00:00:00Z","timestamp":1752537600000},"content-version":"vor","delay-in-days":14,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100003725","name":"National Research Foundation of Korea","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003725","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100014188","name":"Ministry of Science and ICT","doi-asserted-by":"publisher","award":["RS-2021-NR061451"],"award-info":[{"award-number":["RS-2021-NR061451"]}],"id":[{"id":"10.13039\/501100014188","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100014188","name":"Ministry of Science and ICT","doi-asserted-by":"publisher","award":["RS-2022-NR067277"],"award-info":[{"award-number":["RS-2022-NR067277"]}],"id":[{"id":"10.13039\/501100014188","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009122","name":"Ministry of Education","doi-asserted-by":"publisher","award":["RS-2021-NR060140"],"award-info":[{"award-number":["RS-2021-NR060140"]}],"id":[{"id":"10.13039\/100009122","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,7,1]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>T cell receptors (TCRs) are fundamental components of the adaptive immune system, recognizing specific antigens for targeted immune responses. Understanding their sequence patterns is crucial for designing effective vaccines and immunotherapies. However, the vast diversity of TCR sequences and complex binding mechanisms pose significant challenges in generating TCRs that are specific to a particular epitope.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>Here, we propose TCR-epiDiff, a diffusion-based deep learning model for generating epitope-specific TCRs and predicting TCR\u2013epitope binding. TCR-epiDiff integrates epitope information during TCR sequence embedding using ProtT5-XL and employs a denoising diffusion probabilistic model for sequence generation. Using external validation datasets, we demonstrate the ability to generate biologically plausible, epitope-specific TCRs. Furthermore, we leverage the model\u2019s encoder to develop a TCR\u2013epitope binding predictor that shows robust performance on the external validation data. Our approach provides a comprehensive solution for both de novo generation of epitope-specific TCRs and TCR\u2013epitope binding prediction. This capability provides valuable insights into immune diversity and has the potential to advance targeted immunotherapies.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>The data and source codes for our experiments are available at: https:\/\/github.com\/seoseyeon\/TCR-epiDiff.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btaf202","type":"journal-article","created":{"date-parts":[[2025,7,15]],"date-time":"2025-07-15T13:02:05Z","timestamp":1752584525000},"page":"i125-i132","source":"Crossref","is-referenced-by-count":3,"title":["TCR-epiDiff: solving dual challenges of TCR generation and binding prediction"],"prefix":"10.1093","volume":"41","author":[{"given":"Se Yeon","family":"Seo","sequence":"first","affiliation":[{"name":"Department of Bioinformatics & Life Science, Soongsil University , Seoul 06978,","place":["Korea"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4811-8895","authenticated-orcid":false,"given":"Je-Keun","family":"Rhee","sequence":"additional","affiliation":[{"name":"Department of Bioinformatics & Life Science, Soongsil University , Seoul 06978,","place":["Korea"]}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"286","published-online":{"date-parts":[[2025,7,15]]},"reference":[{"key":"2025071509015742500_btaf202-B1","doi-asserted-by":"crossref","first-page":"D1057","DOI":"10.1093\/nar\/gkz874","article-title":"VDJdb in 2019: database extension, new analysis infrastructure and a T-cell receptor motif compendium","volume":"48","author":"Bagaev","year":"2020","journal-title":"Nucleic Acids Res"},{"key":"2025071509015742500_btaf202-B2","doi-asserted-by":"crossref","first-page":"848","DOI":"10.1038\/s41590-022-01224-z","article-title":"Epigenetic regulation of t cell exhaustion","volume":"23","author":"Belk","year":"2022","journal-title":"Nat Immunol"},{"key":"2025071509015742500_btaf202-B3","doi-asserted-by":"crossref","first-page":"663","DOI":"10.3390\/cancers15030663","article-title":"CAR-T: what is next?","volume":"15","author":"Chen","year":"2023","journal-title":"Cancers (Basel)"},{"key":"2025071509015742500_btaf202-B4","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1038\/334395a0","article-title":"T-cell antigen receptor genes and T-cell recognition","volume":"334","author":"Davis","year":"1988","journal-title":"Nature"},{"key":"2025071509015742500_btaf202-B5","doi-asserted-by":"crossref","first-page":"119265","DOI":"10.1016\/j.biomaterials.2019.119265","article-title":"T cell immunotherapy enhanced by designer biomaterials","volume":"217","author":"Dunn","year":"2019","journal-title":"Biomaterials"},{"key":"2025071509015742500_btaf202-B6","doi-asserted-by":"crossref","first-page":"1725","DOI":"10.1093\/intimm\/10.11.1725","article-title":"Conserved sequence motifs of CDR3 loops of TCR specific for two major epitopes of the grass pollen allergen Phl p 1","volume":"10","author":"Friedl-Hajek","year":"1998","journal-title":"Int Immunol"},{"key":"2025071509015742500_btaf202-B7","doi-asserted-by":"crossref","first-page":"236","DOI":"10.1038\/s42256-023-00619-3","article-title":"Pan-peptide meta learning for T-cell receptor\u2013antigen binding recognition","volume":"5","author":"Gao","year":"2023","journal-title":"Nat Mach Intell"},{"key":"2025071509015742500_btaf202-B8","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1038\/s41580-021-00407-0","article-title":"A guide to machine learning for biologists","volume":"23","author":"Greener","year":"2022","journal-title":"Nat Rev Mol Cell Biol"},{"key":"2025071509015742500_btaf202-B9","doi-asserted-by":"crossref","first-page":"136","DOI":"10.1038\/s44222-023-00114-9","article-title":"Diffusion models in bioinformatics and computational biology","volume":"2","author":"Guo","year":"2024","journal-title":"Nat Rev Bioeng"},{"key":"2025071509015742500_btaf202-B10","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume":"33","author":"Ho","year":"2020","journal-title":"Adv Neural Inf Process Syst"},{"key":"2025071509015742500_btaf202-B11","doi-asserted-by":"crossref","first-page":"1194","DOI":"10.1038\/s41587-020-0505-4","article-title":"Analyzing the Mycobacterium tuberculosis immune response by T-cell receptor clustering with GLIPH2 and genome-wide antigen screening","volume":"38","author":"Huang","year":"2020","journal-title":"Nat Biotechnol"},{"key":"2025071509015742500_btaf202-B12","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1038\/nri.2015.16","article-title":"T cell migration, search strategies and mechanisms","volume":"16","author":"Krummel","year":"2016","journal-title":"Nat Rev Immunol"},{"key":"2025071509015742500_btaf202-B13","doi-asserted-by":"crossref","first-page":"202","DOI":"10.1016\/j.immuni.2018.01.007","article-title":"Human T cell development, localization, and function throughout life","volume":"48","author":"Kumar","year":"2018","journal-title":"Immunity"},{"key":"2025071509015742500_btaf202-B14","doi-asserted-by":"crossref","first-page":"4271","DOI":"10.1038\/s41467-024-48198-0","article-title":"Designing meaningful continuous representations of T cell receptor sequences with deep generative models","volume":"15","author":"Leary","year":"2024","journal-title":"Nat Commun"},{"key":"2025071509015742500_btaf202-B15","doi-asserted-by":"crossref","first-page":"794183","DOI":"10.3389\/fonc.2021.794183","article-title":"TCR-T immunotherapy: the challenges and solutions","volume":"11","author":"Liu","year":"2021","journal-title":"Front Oncol"},{"key":"2025071509015742500_btaf202-B16","doi-asserted-by":"crossref","first-page":"864","DOI":"10.1038\/s42256-021-00383-2","article-title":"Deep learning-based prediction of the T cell receptor\u2013antigen binding specificity","volume":"3","author":"Lu","year":"2021","journal-title":"Nat Mach Intell"},{"key":"2025071509015742500_btaf202-B17","doi-asserted-by":"crossref","first-page":"1073","DOI":"10.1126\/science.3317824","article-title":"The T cell receptor","volume":"238","author":"Marrack","year":"1987","journal-title":"Science"},{"key":"2025071509015742500_btaf202-B18","doi-asserted-by":"crossref","first-page":"1060","DOI":"10.1038\/s42003-021-02610-3","article-title":"NetTCR-2.0 enables accurate prediction of TCR-peptide binding by using paired TCR\u03b1 and \u03b2 sequence data","volume":"4","author":"Montemurro","year":"2021","journal-title":"Commun Biol"},{"key":"2025071509015742500_btaf202-B19","doi-asserted-by":"crossref","first-page":"btad284","DOI":"10.1093\/bioinformatics\/btad284","article-title":"epiTCR: a highly sensitive predictor for TCR\u2013peptide binding","volume":"39","author":"Pham","year":"2023","journal-title":"Bioinformatics"},{"key":"2025071509015742500_btaf202-B20","doi-asserted-by":"crossref","first-page":"16933","DOI":"10.1038\/s41598-022-21366-2","article-title":"Improving protein succinylation sites prediction using embeddings from protein language model","volume":"12","author":"Pokharel","year":"2022","journal-title":"Sci Rep"},{"key":"2025071509015742500_btaf202-B21","doi-asserted-by":"crossref","first-page":"1728","DOI":"10.1038\/s41467-022-29268-7","article-title":"Current progress and open challenges for applying deep learning across the biosciences","volume":"13","author":"Sapoval","year":"2022","journal-title":"Nat Commun"},{"key":"2025071509015742500_btaf202-B22","first-page":"372","article-title":"Mechanisms of resistance to CAR T cell therapy","volume":"16","author":"Shah","year":"2019","journal-title":"Nat Rev Clin Oncol"},{"key":"2025071509015742500_btaf202-B23","doi-asserted-by":"crossref","first-page":"3559","DOI":"10.1109\/TMI.2024.3418652","article-title":"Blind CT image quality assessment using DDPM-derived content and transformer-based evaluator","volume":"43","author":"Shi","year":"2024","journal-title":"IEEE Trans Med Imaging"},{"key":"2025071509015742500_btaf202-B24","doi-asserted-by":"crossref","first-page":"D419","DOI":"10.1093\/nar\/gkx760","article-title":"VDJdb: a curated database of T-cell receptor sequences with known antigen specificity","volume":"46","author":"Shugay","year":"2018","journal-title":"Nucleic Acids Res"},{"key":"2025071509015742500_btaf202-B25","doi-asserted-by":"crossref","first-page":"664514","DOI":"10.3389\/fimmu.2021.664514","article-title":"Contribution of T cell receptor alpha and beta CDR3, MHC typing, V and J genes to peptide binding prediction","volume":"12","author":"Springer","year":"2021","journal-title":"Front Immunol"},{"key":"2025071509015742500_btaf202-B26","doi-asserted-by":"crossref","first-page":"2924","DOI":"10.1093\/bioinformatics\/btx286","article-title":"McPAS-TCR: a manually curated catalogue of pathology-associated T cell receptor sequences","volume":"33","author":"Tickotsky","year":"2017","journal-title":"Bioinformatics"},{"key":"2025071509015742500_btaf202-B27","volume-title":"Advances in Neural Information Processing Systems","author":"Vaswani"},{"key":"2025071509015742500_btaf202-B28","author":"Yim","year":"2023"},{"key":"2025071509015742500_btaf202-B29","doi-asserted-by":"crossref","first-page":"nwae343","DOI":"10.1093\/nsr\/nwae343","article-title":"Artificial intelligence-guided strategies for next-generation biological sequence design","volume":"11","author":"Zhang","year":"2024","journal-title":"Natl Sci Rev"},{"key":"2025071509015742500_btaf202-B30","first-page":"663","article-title":"The recent advancement of tcr-t cell therapies for cancer treatment","volume":"56","author":"Zhao","year":"2024","journal-title":"Acta Biochim Biophys Sin (Shanghai)"},{"key":"2025071509015742500_btaf202-B31","first-page":"1","article-title":"Cancer incidence and mortality in China, 2016","volume":"2","author":"Zheng","year":"2022","journal-title":"J Natl Cancer Cent"},{"key":"2025071509015742500_btaf202-B32","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1038\/s41421-024-00728-2","article-title":"A conditional protein diffusion model generates artificial programmable endonuclease sequences with enhanced activity","volume":"10","author":"Zhou","year":"2024","journal-title":"Cell Discov"},{"key":"2025071509015742500_btaf202-B33","doi-asserted-by":"crossref","DOI":"10.1093\/gpbjnl\/qzae010","article-title":"NeoTCR: an immunoinformatic database of experimentally-supported functional neoantigen-specific TCR sequences","author":"Zhou","year":"2024","journal-title":"Genom Proteom Bioinformatics"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/Supplement_1\/i125\/63745521\/btaf202.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/Supplement_1\/i125\/63745521\/btaf202.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,15]],"date-time":"2025-07-15T13:02:09Z","timestamp":1752584529000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/41\/Supplement_1\/i125\/8199382"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,1]]},"references-count":33,"journal-issue":{"issue":"Supplement_1","published-print":{"date-parts":[[2025,7,1]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btaf202","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2025,7]]},"published":{"date-parts":[[2025,7,1]]}}}