{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T21:55:56Z","timestamp":1781819756502,"version":"3.54.5"},"reference-count":33,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,4,20]],"date-time":"2026-04-20T00:00:00Z","timestamp":1776643200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Array"],"published-print":{"date-parts":[[2026,7]]},"DOI":"10.1016\/j.array.2026.100849","type":"journal-article","created":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T16:13:15Z","timestamp":1776874395000},"page":"100849","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["GCR-TE: Grounded generative counterfactual rewriting for text enhanced multimodal sentiment analysis"],"prefix":"10.1016","volume":"30","author":[{"given":"Shibo","family":"Ji","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Bo","family":"Yang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"issue":"8","key":"10.1016\/j.array.2026.100849_b1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s40747-025-01931-8","article-title":"EMVAS: end-to-end multimodal emotion visualization analysis system","volume":"11","author":"Zhu","year":"2025","journal-title":"Complex Intell Syst"},{"issue":"4","key":"10.1016\/j.array.2026.100849_b2","doi-asserted-by":"crossref","first-page":"1504","DOI":"10.1007\/s12559-024-10287-z","article-title":"A review of key technologies for emotion analysis using multimodal information","volume":"16","author":"Zhu","year":"2024","journal-title":"Cogn Comput"},{"issue":"5","key":"10.1016\/j.array.2026.100849_b3","doi-asserted-by":"crossref","first-page":"62","DOI":"10.1109\/MIS.2025.3597120","article-title":"A generative random modality dropout framework for robust multimodal emotion recognition","volume":"40","author":"Zhang","year":"2025","journal-title":"IEEE Intell Syst"},{"issue":"4","key":"10.1016\/j.array.2026.100849_b4","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1007\/s10462-023-10685-z","article-title":"Multi-level textual-visual alignment and fusion network for multimodal aspect-based sentiment analysis","volume":"57","author":"Li","year":"2024","journal-title":"Artif Intell Rev"},{"key":"10.1016\/j.array.2026.100849_b5","doi-asserted-by":"crossref","unstructured":"Sun T, Ni J, Wang W, Jing L, Wei Y, Nie L. General debiasing for multimodal sentiment analysis. In: Proceedings of the 31st ACM international conference on multimedia. 2023, p. 5861\u20139.","DOI":"10.1145\/3581783.3612051"},{"key":"10.1016\/j.array.2026.100849_b6","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2023.101973","article-title":"Modality translation-based multimodal sentiment analysis under uncertain missing modalities","volume":"101","author":"Liu","year":"2024","journal-title":"Inf Fusion"},{"issue":"13s","key":"10.1016\/j.array.2026.100849_b7","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3586075","article-title":"Multimodal sentiment analysis: a survey of methods, trends, and challenges","volume":"55","author":"Das","year":"2023","journal-title":"ACM Comput Surv"},{"key":"10.1016\/j.array.2026.100849_b8","article-title":"MulDeF: A model-agnostic debiasing framework for robust multimodal sentiment analysis","author":"Huan","year":"2024","journal-title":"IEEE Trans Multimed"},{"issue":"11","key":"10.1016\/j.array.2026.100849_b9","article-title":"Causality aware multimodal reasoning network in human emotion identification and sentiment understanding","volume":"16","author":"Thakre","year":"2025","journal-title":"Int J Adv Comput Sci Appl"},{"key":"10.1016\/j.array.2026.100849_b10","doi-asserted-by":"crossref","unstructured":"Ge X, Chen F, Xu S, Tao F, Jose JM. Cross-modal semantic enhanced interaction for image-sentence retrieval. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision. 2023, p. 1022\u201331.","DOI":"10.1109\/WACV56688.2023.00108"},{"key":"10.1016\/j.array.2026.100849_b11","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2024.102747","article-title":"Multimodal dual perception fusion framework for multimodal affective analysis","volume":"115","author":"Lu","year":"2025","journal-title":"Inf Fusion"},{"key":"10.1016\/j.array.2026.100849_b12","series-title":"2025 34th IEEE international conference on robot and human interactive communication","first-page":"1049","article-title":"Fusion in context: A multimodal approach to affective state recognition","author":"Mohamed","year":"2025"},{"key":"10.1016\/j.array.2026.100849_b13","series-title":"ICASSP 2025-2025 IEEE international conference on acoustics, speech and signal processing","first-page":"1","article-title":"LDGNet: LLMs debate-guided network for multimodal sarcasm detection","author":"Zhou","year":"2025"},{"issue":"1","key":"10.1016\/j.array.2026.100849_b14","doi-asserted-by":"crossref","first-page":"460","DOI":"10.1109\/TITS.2025.3626770","article-title":"Causality-driven explainable multimodal fusion with visual-text parallel computing for cloth-changing pedestrian re-identification","volume":"27","author":"Yin","year":"2025","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"10.1016\/j.array.2026.100849_b15","unstructured":"Peng J, Ballard JL, Zhang M, Yun S, Xin J, Long Q, Zhang Y, Chen T. Modalities Contribute Unequally: Enhancing Medical Multi-modal Learning through Adaptive Modality Token Re-balancing. In: Forty-second international conference on machine learning."},{"key":"10.1016\/j.array.2026.100849_b16","article-title":"Causality-inspired graph neural networks for cross-modal retrieval","author":"Li","year":"2026","journal-title":"IEEE Trans Multimed"},{"key":"10.1016\/j.array.2026.100849_b17","series-title":"TextAugLLMEdge: A text augmentation framework using localized large language models for resource-constrained edge","author":"Ray","year":"2025"},{"key":"10.1016\/j.array.2026.100849_b18","series-title":"Interpretable concept-based deep learning framework for multimodal human behavior modeling","author":"Li","year":"2025"},{"key":"10.1016\/j.array.2026.100849_b19","unstructured":"Lu S, Chai J, Wang X. Mitigating Spurious Correlations in Zero-Shot Multimodal Models. In: The thirteenth international conference on learning representations. 2025."},{"key":"10.1016\/j.array.2026.100849_b20","first-page":"1601","article-title":"Enriching multimodal sentiment analysis through textual emotional descriptions of visual-audio content","volume":"vol. 39","author":"Wu","year":"2025"},{"key":"10.1016\/j.array.2026.100849_b21","doi-asserted-by":"crossref","unstructured":"Zhang X, Li J, Chu W, Xu R, Yang Y, Guan S, Xu J, Jing L, Cui P, et al. On the Out-Of-Distribution Generalization of Large Multimodal Models. In: Proceedings of the computer vision and pattern recognition conference. 2025, p. 10315\u201326.","DOI":"10.1109\/CVPR52734.2025.00965"},{"key":"10.1016\/j.array.2026.100849_b22","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2025.112277","article-title":"Multimodal sentiment analysis based on label semantic guidance under social links","volume":"171","author":"Liu","year":"2026","journal-title":"Pattern Recognit"},{"key":"10.1016\/j.array.2026.100849_b23","unstructured":"Li T, Liu D. MPID: A Modality-Preserving and Interaction-Driven Fusion Network for Multimodal Sentiment Analysis. In: Proceedings of the 31st international conference on computational linguistics. 2025, p. 4313\u201322."},{"issue":"3","key":"10.1016\/j.array.2026.100849_b24","doi-asserted-by":"crossref","first-page":"171","DOI":"10.1007\/s10489-024-06113-6","article-title":"UEFN: Efficient uncertainty estimation fusion network for reliable multimodal sentiment analysis","volume":"55","author":"Wang","year":"2025","journal-title":"Appl Intell"},{"issue":"4","key":"10.1016\/j.array.2026.100849_b25","doi-asserted-by":"crossref","first-page":"196","DOI":"10.1007\/s40747-025-01806-y","article-title":"H 2 CAN: heterogeneous hypergraph attention network with counterfactual learning for multimodal sentiment analysis","volume":"11","author":"Huang","year":"2025","journal-title":"Complex Intell Syst"},{"key":"10.1016\/j.array.2026.100849_b26","series-title":"2024 IEEE international conference on big data (bigData)","first-page":"1243","article-title":"Zero-shot LLM-guided counterfactual generation: A case study on NLP model evaluation","author":"Bhattacharjee","year":"2024"},{"key":"10.1016\/j.array.2026.100849_b27","series-title":"Mosi: multimodal corpus of sentiment intensity and subjectivity analysis in online opinion videos","author":"Zadeh","year":"2016"},{"key":"10.1016\/j.array.2026.100849_b28","doi-asserted-by":"crossref","unstructured":"Zadeh AB, Liang PP, Poria S, Cambria E, Morency L-P. Multimodal language analysis in the wild: Cmu-mosei dataset and interpretable dynamic fusion graph. In: Proceedings of the 56th annual meeting of the association for computational linguistics (volume 1: long papers). 2018, p. 2236\u201346.","DOI":"10.18653\/v1\/P18-1208"},{"key":"10.1016\/j.array.2026.100849_b29","doi-asserted-by":"crossref","DOI":"10.1109\/ACCESS.2024.3473314","article-title":"MAG-BERT-ARL for fair automated video interview assessment","author":"Putra","year":"2024","journal-title":"IEEE Access"},{"key":"10.1016\/j.array.2026.100849_b30","doi-asserted-by":"crossref","unstructured":"Hazarika D, Zimmermann R, Poria S. Misa: Modality-invariant and-specific representations for multimodal sentiment analysis. In: Proceedings of the 28th ACM international conference on multimedia. 2020, p. 1122\u201331.","DOI":"10.1145\/3394171.3413678"},{"issue":"4","key":"10.1016\/j.array.2026.100849_b31","doi-asserted-by":"crossref","first-page":"307","DOI":"10.1007\/s00530-025-01868-5","article-title":"Self-attention mechanism prior to modality fusion for multimodal sentiment analysis","volume":"31","author":"Chen","year":"2025","journal-title":"Multimedia Syst"},{"key":"10.1016\/j.array.2026.100849_b32","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2023.110502","article-title":"TeFNA: Text-centered fusion network with crossmodal attention for multimodal sentiment analysis","volume":"269","author":"Huang","year":"2023","journal-title":"Knowl-Based Syst"},{"key":"10.1016\/j.array.2026.100849_b33","doi-asserted-by":"crossref","unstructured":"Yang J, Yu Y, Niu D, Guo W, Xu Y. Confede: Contrastive feature decomposition for multimodal sentiment analysis. In: Proceedings of the 61st annual meeting of the association for computational linguistics (volume 1: long papers). 2023, p. 7617\u201330.","DOI":"10.18653\/v1\/2023.acl-long.421"}],"container-title":["Array"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2590005626001724?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2590005626001724?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T21:09:29Z","timestamp":1781816969000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S2590005626001724"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,7]]},"references-count":33,"alternative-id":["S2590005626001724"],"URL":"https:\/\/doi.org\/10.1016\/j.array.2026.100849","relation":{},"ISSN":["2590-0056"],"issn-type":[{"value":"2590-0056","type":"print"}],"subject":[],"published":{"date-parts":[[2026,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"GCR-TE: Grounded generative counterfactual rewriting for text enhanced multimodal sentiment analysis","name":"articletitle","label":"Article Title"},{"value":"Array","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.array.2026.100849","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 The Authors. Published by Elsevier Inc.","name":"copyright","label":"Copyright"}],"article-number":"100849"}}