{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T21:04:45Z","timestamp":1780434285084,"version":"3.54.1"},"reference-count":71,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Shenzhen Science and Technology Research and Development Fund","award":["KJZD20240903102802003"],"award-info":[{"award-number":["KJZD20240903102802003"]}]},{"name":"Shenzhen Science and Technology Research and Development Fund","award":["GXWD20231128103819001"],"award-info":[{"award-number":["GXWD20231128103819001"]}]},{"name":"Guangdong Provincial Key Laboratory","award":["2023B1212060076"],"award-info":[{"award-number":["2023B1212060076"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Affective Comput."],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1109\/taffc.2026.3660288","type":"journal-article","created":{"date-parts":[[2026,2,2]],"date-time":"2026-02-02T20:44:43Z","timestamp":1770065083000},"page":"2091-2104","source":"Crossref","is-referenced-by-count":0,"title":["Toward Multimodal Sentiment Analysis via Contrastive Cross-Modal Retrieval Augmentation and Hierachical Prompts"],"prefix":"10.1109","volume":"17","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5482-3895","authenticated-orcid":false,"given":"Xianbing","family":"Zhao","sequence":"first","affiliation":[{"name":"School of Artificial Intelligence and Computer Science, Jiangnan University, Wuxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shengzun","family":"Yang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0271-8246","authenticated-orcid":false,"given":"Buzhou","family":"Tang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5023-1259","authenticated-orcid":false,"given":"Ronghuan","family":"Jiang","sequence":"additional","affiliation":[{"name":"Chinese People&#x2019;s Liberation Army General Hospital, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/taffc.2025.3614159"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/taffc.2025.3612369"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/taffc.2025.3613302"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2022.3233070"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2024.3396144"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1656"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.214"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.79"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00258"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3462244.3479919"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i12.17289"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3547754"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3543507.3583406"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00641"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.421"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2023.102031"},{"issue":"1","key":"ref17","article-title":"Retrieval-augmented generation for large language models: A survey","volume":"2","author":"Gao","year":"2023"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00683"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00605"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.52202\/068431-1114"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-emnlp.11"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICAIIC.2019.8669073"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3151098"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2023.3315754"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.723"},{"key":"ref26","article-title":"Learning factorized multimodal representations","volume-title":"Proc. Int. Conf. Representation Learn.","author":"Tsai"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3136755.3136801"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3611974"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1115"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1209"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2025.3529732"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2022.11.003"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.860"},{"key":"ref34","first-page":"4611","article-title":"Modal feature optimization network with prompt for multimodal sentiment analysis","volume-title":"Proc. 31st Int. Conf. Comput. Linguistics","author":"Zhang"},{"key":"ref35","first-page":"2834","article-title":"t-HNE: A text-guided hierarchical noise eliminator for multimodal sentiment analysis","volume-title":"Proc. 31st Int. Conf. Comput. Linguistics","author":"Li"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2024.3430045"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3672758.3672824"},{"key":"ref38","article-title":"Mixtral of experts","year":"2023"},{"key":"ref39","article-title":"Gemma - Google\u2019s new open LLM","year":"2024"},{"key":"ref40","article-title":"ChatGPT: Large-scale language model fine-tuned for conversational applications","year":"2023"},{"key":"ref41","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"ref42","article-title":"Gemini: Our largest and most capable AI model","year":"2023"},{"key":"ref43","article-title":"BLIP-2: Bootstrapping language-image pre-training with frozen image encoders and large language models","author":"Li","year":"2023"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107479"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.495"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/3539618.3592085"},{"key":"ref47","first-page":"9459","article-title":"Retrieval-augmented generation for knowledge-intensive NLP tasks","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Lewis"},{"key":"ref48","article-title":"Vendi-RAG: Adaptively trading-off diversity and quality significantly improves retrieval augmented generation with LLMs","author":"Rezaei","year":"2025"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49660.2025.10889933"},{"issue":"140","key":"ref50","first-page":"1","article-title":"Exploring the limits of transfer learning with a unified text-to-text transformer","volume":"21","author":"Raffel","year":"2020","journal-title":"J. Mach. Learn. Res."},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/FG.2018.00020"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3122291"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413678"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.94"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref57","article-title":"MOSI: Multimodal corpus of sentiment intensity and subjectivity analysis in online opinion videos","author":"Zadeh","year":"2016"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1208"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2022.3178231"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2024\/724"},{"key":"ref61","article-title":"Qwen2.5-VL","author":"Team","year":"2025"},{"key":"ref62","article-title":"Scaling instruction-finetuned language models","author":"Chung","year":"2022"},{"key":"ref63","article-title":"Gemma 3","author":"Team","year":"2025"},{"key":"ref64","article-title":"Qwen3 technical report","author":"Team","year":"2025"},{"key":"ref65","article-title":"SpinQuant: LLM quantization with learned rotations","author":"Liu","year":"2024"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2022.3148714"},{"key":"ref67","article-title":"GPT-4V(ision) system card","year":"2023"},{"key":"ref68","article-title":"Meet claude","year":"2024"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2025.103204"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00393"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00975"}],"container-title":["IEEE Transactions on Affective Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/5165369\/11540045\/11370533.pdf?arnumber=11370533","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T20:07:36Z","timestamp":1780430856000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11370533\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":71,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/taffc.2026.3660288","relation":{},"ISSN":["1949-3045","2371-9850"],"issn-type":[{"value":"1949-3045","type":"electronic"},{"value":"2371-9850","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]}}}