{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T21:59:03Z","timestamp":1772056743882,"version":"3.50.1"},"reference-count":53,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2023YFB2804701"],"award-info":[{"award-number":["2023YFB2804701"]}]},{"name":"Natural Science Foundation of China Project","award":["62525102"],"award-info":[{"award-number":["62525102"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE J. Sel. Areas Commun."],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/jsac.2026.3655643","type":"journal-article","created":{"date-parts":[[2026,1,19]],"date-time":"2026-01-19T20:55:17Z","timestamp":1768856117000},"page":"3349-3364","source":"Crossref","is-referenced-by-count":0,"title":["You Only Transmit Once: Unified Generation and Comprehension for Efficient Semantic Communication"],"prefix":"10.1109","volume":"44","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-2351-2455","authenticated-orcid":false,"given":"Li","family":"Yao","sequence":"first","affiliation":[{"name":"Key Laboratory for Information Science of Electromagnetic Waves (MoE), College of Future Information Technology, Fudan University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-2647-2688","authenticated-orcid":false,"given":"Yuan","family":"Wei","sequence":"additional","affiliation":[{"name":"Key Laboratory for Information Science of Electromagnetic Waves (MoE), College of Future Information Technology, Fudan University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-6367-7324","authenticated-orcid":false,"given":"Yuning","family":"Zhou","sequence":"additional","affiliation":[{"name":"Key Laboratory for Information Science of Electromagnetic Waves (MoE), College of Future Information Technology, Fudan University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9179-3995","authenticated-orcid":false,"given":"Ziwei","family":"Li","sequence":"additional","affiliation":[{"name":"Key Laboratory for Information Science of Electromagnetic Waves (MoE), College of Future Information Technology, Fudan University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4966-3844","authenticated-orcid":false,"given":"Nan","family":"Chi","sequence":"additional","affiliation":[{"name":"Key Laboratory for Information Science of Electromagnetic Waves (MoE), College of Future Information Technology, Fudan University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7521-0078","authenticated-orcid":false,"given":"Kai-Kit","family":"Wong","sequence":"additional","affiliation":[{"name":"Department of Electronic and Electrical Engineering, University College London, London, U.K."}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2001239"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2200099"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/NSW.2011.6004632"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.101.2100269"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2024.3435524"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.005.2200829"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM52923.2024.10901192"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01268"},{"key":"ref9","first-page":"6306","article-title":"Neural discrete representation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"van den Oord"},{"key":"ref10","first-page":"31798","article-title":"SpeechTokenizer: Unified speech tokenizer for speech language models","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Zhang"},{"key":"ref11","first-page":"55371","article-title":"Libra: Building decoupled vision system on large language models","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Xu"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2024.3364990"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2022.3221952"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2300575"},{"key":"ref15","first-page":"39308","article-title":"Auto-encoding morph-tokens for multimodal LLM","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Pan"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2022.3221999"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM48099.2022.10000901"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.807"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3295748"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2024.3523524"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2025.3531461"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2025.3538850"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2983926"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2023.3255221"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00695"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP49359.2023.10222853"},{"key":"ref27","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","volume":"139","author":"Radford"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/SiPS47522.2019.9020494"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1162"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46454-1_24"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1437"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v8i1.14550"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.52202\/079017-3273"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72649-1_13"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01213"},{"key":"ref36","first-page":"1","article-title":"Density modeling of images using a generalized normalization transformation","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Ball\u00e9"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2000804"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2024.3424842"},{"key":"ref39","article-title":"Once-for-all: Controllable generative image compression with dynamic granularity adaptation","author":"Li","year":"2024","journal-title":"arXiv:2406.00758"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2364537"},{"key":"ref41","first-page":"1","article-title":"Categorical reparameterization with gumbel-softmax","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Jang"},{"key":"ref42","first-page":"19730","article-title":"BLIP-2: Bootstrapping language-image pre-training with frozen image encoders and large language models","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Li"},{"key":"ref43","first-page":"11525","article-title":"Object-centric learning with slot attention","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Locatello"},{"key":"ref44","first-page":"3","article-title":"LoRA: Low-rank adaptation of large language models","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Hu"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-022-01653-1"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25360"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.52202\/079017-4433"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01857"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ADICS58448.2024.10533619"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10475"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2021.3071210"},{"key":"ref53","article-title":"ClipCap: CLIP prefix for image captioning","author":"Mokady","year":"2021","journal-title":"arXiv:2111.09734"}],"container-title":["IEEE Journal on Selected Areas in Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/49\/11372474\/11358967.pdf?arnumber=11358967","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T20:57:31Z","timestamp":1772053051000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11358967\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":53,"URL":"https:\/\/doi.org\/10.1109\/jsac.2026.3655643","relation":{},"ISSN":["1558-0008","0733-8716"],"issn-type":[{"value":"1558-0008","type":"electronic"},{"value":"0733-8716","type":"print"}],"subject":[],"published":{"date-parts":[[2026]]}}}