{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:54:59Z","timestamp":1781538899813,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":57,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"National Natural Science Foundation of China","award":["U24A20250"],"award-info":[{"award-number":["U24A20250"]}]},{"name":"Sichuan Provincial Natural Science Foundation","award":["2024YFG0006"],"award-info":[{"award-number":["2024YFG0006"]}]},{"name":"Sichuan Provincial Natural Science Foundation","award":["2025ZNSFSC1487"],"award-info":[{"award-number":["2025ZNSFSC1487"]}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["ZYGX2024J022"],"award-info":[{"award-number":["ZYGX2024J022"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["ZYGX2024Z005"],"award-info":[{"award-number":["ZYGX2024Z005"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810693","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"1355-1364","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["ReNoRD: Learning from Relations under Noisy Pseudo Labels via Relational Distillation for Multimodal Sentiment"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-3742-0352","authenticated-orcid":false,"given":"Tiantai","family":"Zhai","sequence":"first","affiliation":[{"name":"University of Electronic Science and Technology of China, Chengdu, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7444-3275","authenticated-orcid":false,"given":"Yan","family":"Zhuang","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China, Chengdu, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0602-8250","authenticated-orcid":false,"given":"Fuji","family":"Ren","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China, Chengdu, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4222-7986","authenticated-orcid":false,"given":"Jiawen","family":"Deng","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China, Chengdu, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4860-9184","authenticated-orcid":false,"given":"Liang","family":"Luo","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China, Chengdu, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","unstructured":"Alexander\u00a0A. Alemi Ian Fischer Joshua\u00a0V. Dillon and Kevin Murphy. 2019. Deep Variational Information Bottleneck. arxiv:https:\/\/arXiv.org\/abs\/1612.00410\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/1612.00410"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1208"},{"key":"e_1_3_3_1_4_2","unstructured":"David Berthelot Nicholas Carlini Ian Goodfellow Nicolas Papernot Avital Oliver and Colin\u00a0A Raffel. 2019. Mixmatch: A holistic approach to semi-supervised learning. Advances in neural information processing systems 32 (2019)."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"crossref","unstructured":"Zhe Cao Tao Qin Tie\u00a0Yan Liu Ming\u00a0Feng Tsai and Hang Li. 2007. Learning to rank: From pairwise approach to listwise approach. ACM (2007).","DOI":"10.1145\/1273496.1273513"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Baixu Chen Junguang Jiang Ximei Wang Pengfei Wan Jianmin Wang and Mingsheng Long. 2022. Debiased self-training for semi-supervised learning. Advances in Neural Information Processing Systems 35 (2022) 32424\u201332437.","DOI":"10.52202\/068431-2349"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","unstructured":"Chen Chen Hansheng Hong Jie Guo and Bin Song. 2023. Inter-Intra Modal Representation Augmentation With Trimodal Collaborative Disentanglement Network for Multimodal Sentiment Analysis. IEEE\/ACM Transactions on Audio Speech and Language Processing 31 (2023) 1476\u20131488. 10.1109\/TASLP.2023.3263801","DOI":"10.1109\/TASLP.2023.3263801"},{"key":"e_1_3_3_1_8_2","unstructured":"Rewon Child Scott Gray Alec Radford and Ilya Sutskever. 2019. Generating Long Sequences with Sparse Transformers. arxiv:https:\/\/arXiv.org\/abs\/1904.10509\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/1904.10509"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","unstructured":"Weihang Dai Xiaomeng Li and Kwang-Ting Cheng. 2023. Semi-Supervised Deep Regression with Uncertainty Consistency and Variational Model Ensembling via Bayesian Neural Networks. Proceedings of the AAAI Conference on Artificial Intelligence 37 6 (June 2023) 7304\u20137313. 10.1609\/aaai.v37i6.25890","DOI":"10.1609\/aaai.v37i6.25890"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","unstructured":"Cunhang Fan Kang Zhu Jianhua Tao Guofeng Yi Jun Xue and Zhao Lv. 2025. Multi-Level Contrastive Learning: Hierarchical Alleviation of Heterogeneity in Multimodal Sentiment Analysis. IEEE Transactions on Affective Computing 16 1 (2025) 207\u2013222. 10.1109\/TAFFC.2024.3423671","DOI":"10.1109\/TAFFC.2024.3423671"},{"key":"e_1_3_3_1_11_2","volume-title":"Advances in Neural Information Processing Systems","author":"Grandvalet Yves","year":"2004","unstructured":"Yves Grandvalet and Yoshua Bengio. 2004. Semi-supervised Learning by Entropy Minimization. In Advances in Neural Information Processing Systems , L.\u00a0Saul, Y.\u00a0Weiss, and L.\u00a0Bottou (Eds.), Vol.\u00a017. MIT Press. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2004\/file\/96f2b50b5d3613adf9c27049b2a888c7-Paper.pdf"},{"key":"e_1_3_3_1_12_2","unstructured":"Devamanyu Hazarika Roger Zimmermann and Soujanya Poria. 2020. MISA: Modality-Invariant and-Specific Representations for Multimodal Sentiment Analysis. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2005.03545 (2020)."},{"key":"e_1_3_3_1_13_2","unstructured":"Marzi Heidari and Yuhong Guo. 2025. Bi-Level Optimization for Pseudo-Labeling Based Semi-Supervised Learning. (2025)."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"crossref","unstructured":"Wei-Ning Hsu Benjamin Bolte Yao-Hung\u00a0Hubert Tsai Kushal Lakhotia Ruslan Salakhutdinov and Abdelrahman Mohamed. 2021. Hubert: Self-supervised speech representation learning by masked prediction of hidden units. IEEE\/ACM transactions on audio speech and language processing 29 (2021) 3451\u20133460.","DOI":"10.1109\/TASLP.2021.3122291"},{"key":"e_1_3_3_1_15_2","volume-title":"The Thirty-eighth Annual Conference on Neural Information Processing Systems (NeurIPS)","author":"Huang Pin-Yen","year":"2024","unstructured":"Pin-Yen Huang, Szu-Wei Fu, and Yu Tsao. 2024. RankUp: Boosting Semi-Supervised Regression with an Auxiliary Ranking Classifier. In The Thirty-eighth Annual Conference on Neural Information Processing Systems (NeurIPS). https:\/\/openreview.net\/forum?id=d2lPM1Aczs"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"crossref","unstructured":"Yongwon Jo Hyungu Kahng and Seoung\u00a0Bum Kim. 2024. Deep semi-supervised regression via pseudo-label filtering and calibration. Applied Soft Computing 161 (2024) 111670.","DOI":"10.1016\/j.asoc.2024.111670"},{"key":"e_1_3_3_1_17_2","unstructured":"Samuli Laine and Timo Aila. 2016. Temporal ensembling for semi-supervised learning. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1610.02242 (2016)."},{"key":"e_1_3_3_1_18_2","first-page":"896","volume-title":"Workshop on challenges in representation learning, ICML","author":"Lee Dong-Hyun","year":"2013","unstructured":"Dong-Hyun Lee et\u00a0al. 2013. Pseudo-label: The simple and efficient semi-supervised learning method for deep neural networks. In Workshop on challenges in representation learning, ICML , Vol.\u00a03. Atlanta, 896."},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/3731715.3733388"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","unstructured":"Shuzhen Li Tong Zhang and C.\u00a0L.\u00a0Philip Chen. 2024. SIA-Net: Sparse Interactive Attention Network for Multimodal Emotion Recognition. IEEE Transactions on Computational Social Systems 11 5 (2024) 6782\u20136794. 10.1109\/TCSS.2024.3409715","DOI":"10.1109\/TCSS.2024.3409715"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.52202\/079017-1910"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00641"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"crossref","unstructured":"Zheng Lian Bin Liu and Jianhua Tao. 2022. Smin: Semi-supervised multi-modal interaction network for conversational emotion recognition. IEEE Transactions on Affective Computing 14 3 (2022) 2415\u20132429.","DOI":"10.1109\/TAFFC.2022.3141237"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612836"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i2.32131"},{"key":"e_1_3_3_1_26_2","unstructured":"Yinhan Liu Myle Ott Naman Goyal Jingfei Du Mandar Joshi Danqi Chen Omer Levy Mike Lewis Luke Zettlemoyer and Veselin Stoyanov. 2019. Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1907.11692 (2019)."},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","unstructured":"Yihe Liu Ziqi Yuan Huisheng Mao Zhiyun Liang Wanqiuyue Yang Yuanzhe Qiu Tie Cheng Xiaoteng Li Hua Xu and Kai Gao. 2022. Make Acoustic and Visual Cues Matter: CH-SIMS v2.0 Dataset and AV-Mixup Consistent Module(ICMI \u201922). Association for Computing Machinery New York NY USA 247\u2013258. 10.1145\/3536221.3556630","DOI":"10.1145\/3536221.3556630"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3746027.3755591"},{"key":"e_1_3_3_1_29_2","unstructured":"Yuanyi Luo Wei Liu Qiang Sun Sirui Li Jichunyang Li Rui Wu and Xianglong Tang. 2025. TriagedMSA: Triaging sentimental disagreement in multimodal sentiment analysis. IEEE Transactions on Affective Computing (2025)."},{"key":"e_1_3_3_1_30_2","first-page":"1614","volume-title":"International conference on machine learning","author":"Martins Andre","year":"2016","unstructured":"Andre Martins and Ramon Astudillo. 2016. From softmax to sparsemax: A sparse model of attention and multi-label classification. In International conference on machine learning. PMLR, 1614\u20131623."},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","unstructured":"Takeru Miyato Shin-Ichi Maeda Masanori Koyama and Shin Ishii. 2019. Virtual Adversarial Training: A Regularization Method for Supervised and Semi-Supervised Learning. IEEE Transactions on Pattern Analysis and Machine Intelligence 41 8 (2019) 1979\u20131993. 10.1109\/TPAMI.2018.2858821","DOI":"10.1109\/TPAMI.2018.2858821"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00409"},{"key":"e_1_3_3_1_33_2","unstructured":"Ben Peters Vlad Niculae and Andr\u00e9\u00a0FT Martins. 2019. Sparse sequence-to-sequence models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1905.05702 (2019)."},{"key":"e_1_3_3_1_34_2","first-page":"8748","volume-title":"International conference on machine learning","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong\u00a0Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et\u00a0al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PmLR, 8748\u20138763."},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.214"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","DOI":"10.5555\/3157096.3157227"},{"key":"e_1_3_3_1_37_2","first-page":"596","volume-title":"Advances in Neural Information Processing Systems","author":"Sohn Kihyuk","year":"2020","unstructured":"Kihyuk Sohn, David Berthelot, Nicholas Carlini, Zizhao Zhang, Han Zhang, Colin\u00a0A Raffel, Ekin\u00a0Dogus Cubuk, Alexey Kurakin, and Chun-Liang Li. 2020. FixMatch: Simplifying Semi-Supervised Learning with Consistency and Confidence. In Advances in Neural Information Processing Systems , H.\u00a0Larochelle, M.\u00a0Ranzato, R.\u00a0Hadsell, M.F. Balcan, and H.\u00a0Lin (Eds.), Vol.\u00a033. Curran Associates, Inc., 596\u2013608. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2020\/file\/06964dce9addb1c5cb5d6e3d9838f733-Paper.pdf"},{"key":"e_1_3_3_1_38_2","unstructured":"Xueqing Sun Renzhen Wang Quanziang Wang Yichen Wu Xixi Jia and Deyu Meng. 2025. Semi-Supervised Regression with Heteroscedastic Pseudo-Labels. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.15266 (2025)."},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3731715.3733356"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","unstructured":"Chuanqi Tao Jiaming Li Tianzi Zang and Peng Gao. 2025. A Multi-Focus-Driven Multi-Branch Network for Robust Multimodal Sentiment Analysis. Proceedings of the AAAI Conference on Artificial Intelligence 39 2 (Apr. 2025) 1547\u20131555. 10.1609\/aaai.v39i2.32146","DOI":"10.1609\/aaai.v39i2.32146"},{"key":"e_1_3_3_1_41_2","series-title":"(NIPS\u201917)","first-page":"1195","volume-title":"Proceedings of the 31st International Conference on Neural Information Processing Systems","author":"Tarvainen Antti","year":"2017","unstructured":"Antti Tarvainen and Harri Valpola. 2017. Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results. In Proceedings of the 31st International Conference on Neural Information Processing Systems (Long Beach, California, USA) (NIPS\u201917). Curran Associates Inc., Red Hook, NY, USA, 1195\u20131204."},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1656"},{"key":"e_1_3_3_1_43_2","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N Gomez \u0141ukasz Kaiser and Illia Polosukhin. 2017. Attention is all you need. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"crossref","unstructured":"C Vinola and K Vimaladevi. 2015. A survey on human emotion recognition approaches databases and applications. ELCVIA Electronic Letters on Computer Vision and Image Analysis 14 2 (2015) 24\u201344.","DOI":"10.5565\/rev\/elcvia.795"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i20.35416"},{"key":"e_1_3_3_1_46_2","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Wang Yikai","year":"2020","unstructured":"Yikai Wang, Wenbing Huang, Fuchun Sun, Tingyang Xu, Yu Rong, and Junzhou Huang. 2020. Deep Multimodal Fusion by Channel Exchanging. In Advances in Neural Information Processing Systems (NeurIPS)."},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/3731715.3733355"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"publisher","unstructured":"Sheng Wu Dongxiao He Xiaobao Wang Longbiao Wang and Jianwu Dang. 2025. Enriching Multimodal Sentiment Analysis Through Textual Emotional Descriptions of Visual-Audio Content. Proceedings of the AAAI Conference on Artificial Intelligence 39 2 (Apr. 2025) 1601\u20131609. 10.1609\/aaai.v39i2.32152","DOI":"10.1609\/aaai.v39i2.32152"},{"key":"e_1_3_3_1_49_2","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2024\/724"},{"key":"e_1_3_3_1_50_2","unstructured":"Qizhe Xie Zihang Dai Eduard Hovy Thang Luong and Quoc Le. 2020. Unsupervised data augmentation for consistency training. Advances in neural information processing systems 33 (2020) 6256\u20136268."},{"key":"e_1_3_3_1_51_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.343"},{"key":"e_1_3_3_1_52_2","doi-asserted-by":"publisher","DOI":"10.1609\/AAAI.V35I12.17289"},{"key":"e_1_3_3_1_53_2","doi-asserted-by":"publisher","unstructured":"Ziqi Yuan Jingliang Fang Hua Xu and Kai Gao. 2024. Multimodal Consistency-Based Teacher for Semi-Supervised Multimodal Sentiment Analysis. IEEE\/ACM Trans. Audio Speech and Lang. Proc. 32 (July 2024) 3669\u20133683. 10.1109\/TASLP.2024.3430543","DOI":"10.1109\/TASLP.2024.3430543"},{"key":"e_1_3_3_1_54_2","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2016.94"},{"key":"e_1_3_3_1_55_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1115"},{"key":"e_1_3_3_1_56_2","doi-asserted-by":"crossref","unstructured":"Amir Zadeh Paul\u00a0Pu Liang Navonil Mazumder Soujanya Poria Erik Cambria and Louis-Philippe Morency. 2018. Memory Fusion Network for Multi-view Sequential Learning. Proceedings of the Thirty-Second AAAI Conference on Artificial Intelligence (2018).","DOI":"10.1609\/aaai.v32i1.12021"},{"key":"e_1_3_3_1_57_2","doi-asserted-by":"crossref","unstructured":"Haoyu Zhang Yu Wang Guanghao Yin Kejun Liu Yuanyuan Liu and Tianshu Yu. 2023. Learning language-guided adaptive hyper-modality representation for multimodal sentiment analysis. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2310.05804 (2023).","DOI":"10.18653\/v1\/2023.emnlp-main.49"},{"key":"e_1_3_3_1_58_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.859"}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:08:54Z","timestamp":1781536134000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810693"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":57,"alternative-id":["10.1145\/3805622.3810693","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810693","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}