{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T15:33:55Z","timestamp":1775230435644,"version":"3.50.1"},"reference-count":66,"publisher":"Springer Science and Business Media LLC","issue":"13","license":[{"start":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T00:00:00Z","timestamp":1716854400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T00:00:00Z","timestamp":1716854400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-19433-z","type":"journal-article","created":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T04:01:50Z","timestamp":1716868910000},"page":"12013-12035","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["NRAFN: a non-text reinforcement and adaptive fusion network for multimodal sentiment analysis"],"prefix":"10.1007","volume":"84","author":[{"given":"Jinlong","family":"Wei","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinhui","family":"Shao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,5,28]]},"reference":[{"key":"19433_CR1","first-page":"pp 1","volume-title":"32nd Conference on Neural Information Processing Systems","author":"SH Dumpala","year":"2019","unstructured":"Dumpala SH, Sheikh I, Chakraborty R, Kopparapu SK (2019) Audio-visual fusion for sentiment classification using cross-modal autoencoder. 32nd Conference on Neural Information Processing Systems. p pp 1-4"},{"key":"19433_CR2","doi-asserted-by":"publisher","first-page":"100744","DOI":"10.1016\/j.dib.2021.107044","volume":"36","author":"B Hassan","year":"2021","unstructured":"Hassan B, Rashid T, Mirjalili S (2021) Performance evaluation results of evolutionary clustering algorithm star for clustering heterogeneous datasets. Data Brief 36:100744","journal-title":"Data Brief"},{"key":"19433_CR3","doi-asserted-by":"publisher","first-page":"pp 873","DOI":"10.18653\/v1\/P17-1081","volume-title":"Proceedings of the 55th annual meeting of the association for computational linguistics\u00a0(volume 1: Long papers)","author":"S Poria","year":"2017","unstructured":"Poria S, Cambria E, Hazarika D, Majumder N, Zadeh A, Morency LP (2017) Context-dependent sentiment analysis in user-generated videos. Proceedings of the 55th annual meeting of the association for computational linguistics\u00a0(volume 1: Long papers). p pp 873-883"},{"issue":"3","key":"19433_CR4","doi-asserted-by":"publisher","first-page":"281","DOI":"10.1007\/s10115-007-0107-1","volume":"16","author":"T Peng","year":"2008","unstructured":"Peng T, Zuo W, He F (2008) Svm based adaptive learning method for text classification from positive and unlabeled documents. Knowl Inf Syst 16(3):281\u2013301","journal-title":"Knowl Inf Syst"},{"issue":"4","key":"19433_CR5","doi-asserted-by":"publisher","first-page":"855","DOI":"10.1134\/S1054661817040228","volume":"27","author":"Z Qiao","year":"2017","unstructured":"Qiao Z, Kewen X, Panpan W, Wang H (2017) Lung nodule classification using curvelet transform, LDA algorithm and BAT-SVM algorithm. Pattern Recognit Image Anal 27(4):855\u2013862","journal-title":"Pattern Recognit Image Anal"},{"issue":"6","key":"19433_CR6","doi-asserted-by":"publisher","first-page":"1777","DOI":"10.1007\/s00521-018-3656-1","volume":"32","author":"S Afifi","year":"2020","unstructured":"Afifi S, GholamHosseini H, Sinha R (2020) Dynamic hardware system for cascade SVM classification of melanoma. Neural Comput Appl 32(6):1777\u20131788","journal-title":"Neural Comput Appl"},{"issue":"12","key":"19433_CR7","doi-asserted-by":"publisher","first-page":"8749","DOI":"10.1007\/s00521-018-3939-6","volume":"31","author":"P Kaur","year":"2019","unstructured":"Kaur P, Pannu HS, Malhi AK (2019) Plant disease recognition using fractional-order Zernike moments and SVM classifier. Neural Comput Appl 31(12):8749\u20138768","journal-title":"Neural Comput Appl"},{"key":"19433_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.artmed.2022.102348","volume":"131","author":"M Abdulkhaleq","year":"2022","unstructured":"Abdulkhaleq M, Rashid T, Alsadoon A, Hassan B, Mohammadi M, Abdullah J, Chhabra A, Ali S, Othman R, Hasan H, Azad S, Mahmood N, Abdalrahman S, Rasul H, Bacanin N, Vimal S (2022) Harmony search: current studies and uses on healthcare systems. Artif Intell Med 131:102348","journal-title":"Artif Intell Med"},{"key":"19433_CR9","doi-asserted-by":"publisher","first-page":"7011","DOI":"10.1007\/s00521-020-05474-6","volume":"33","author":"B Hassan","year":"2021","unstructured":"Hassan B (2021) CSCF: a chaotic sine cosine firefly algorithm for practical application problems. Neural Comput Applic 33:7011\u20137030","journal-title":"Neural Comput Applic"},{"issue":"6","key":"19433_CR10","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1109\/MIS.2018.2882362","volume":"33","author":"S Poria","year":"2018","unstructured":"Poria S, Majumder N, Hazarika D, Cambria E, Gelbukh A, Hussain A (2018) Multimodal sentiment analysis: addressing key issues and setting up the baselines. IEEE Intell Syst 33(6):17\u201325","journal-title":"IEEE Intell Syst"},{"key":"19433_CR11","first-page":"19","volume-title":"2019 IEEE International Conference on Big Data","author":"A Agarwal","year":"2019","unstructured":"Agarwal A, Yadav A, Vishwakarma DK (2019) Multimodal sentiment analysis via RNN variants. 2019 IEEE International Conference on Big Data. Cloud Computing, Data Science & Engineering. IEEE, pp 19\u201323"},{"key":"19433_CR12","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1016\/j.knosys.2018.07.041","volume":"161","author":"N Majumder","year":"2018","unstructured":"Majumder N, Hazarika D, Gelbukh A, Cambria E, Poria S (2018) Multimodal sentiment analysis using hierarchical fusion with context modeling. Knowl-Based Syst 161:124\u2013133","journal-title":"Knowl-Based Syst"},{"key":"19433_CR13","doi-asserted-by":"publisher","first-page":"pp 34","DOI":"10.1145\/3380688.3380693","volume-title":"Proceedings of the 4th International Conference on Machine Learning and Soft Computing","author":"C Xi","year":"2020","unstructured":"Xi C, Lu G, Yan J (2020) Multimodal sentiment analysis based on multi-head attention mechanism. Proceedings of the 4th International Conference on Machine Learning and Soft Computing. p pp 34-39"},{"key":"19433_CR14","doi-asserted-by":"publisher","first-page":"10987","DOI":"10.1007\/s00521-020-05649-1","volume":"33","author":"B Hassan","year":"2021","unstructured":"Hassan B, Rashid T (2021) A multidisciplinary ensemble algorithm for clustering heterogeneous datasets. Neural Comput Applic 33:10987\u201311010","journal-title":"Neural Comput Applic"},{"key":"19433_CR15","doi-asserted-by":"publisher","first-page":"2383","DOI":"10.1007\/s40747-021-00422-w","volume":"7","author":"B Hassan","year":"2021","unstructured":"Hassan B, Rashid T, Mirjalili S (2021) Formal context reduction in deriving concept hierarchies from corpora using adaptive evolutionary clustering algorithm star. Complex Intell Syst 7:2383\u20132398","journal-title":"Complex Intell Syst"},{"key":"19433_CR16","first-page":"2514","volume":"2020","author":"Z Wang","year":"2020","unstructured":"Wang Z, Wan Z, Wan X (2020) Transmodality: an end2end fusion method with transformer for multimodal sentiment analysis. Proc Web Conf 2020:2514\u20132520","journal-title":"Proc Web Conf"},{"key":"19433_CR17","first-page":"pp 949","volume-title":"2017 IEEE International Conference on Multimedia and Expo. IEEE, pp 949\u2013954","author":"H Wang","year":"2017","unstructured":"Wang H, Meghawat A, Morency LP, Xing EP (2017) Select-additive learning: Improving generalization in multimodal sentiment analysis. 2017 IEEE International Conference on Multimedia and Expo. IEEE, pp 949\u2013954. p pp 949-954"},{"key":"19433_CR18","first-page":"pp 1033","volume-title":"2017 IEEE International Conference on Data Mining. IEEE","author":"S Poria","year":"2017","unstructured":"Poria S, Cambria E, Hazarika D, Mazumder N, Zadeh A, Morency L-P (2017) Multi-level multiple attentions for contextual multimodal sentiment analysis. 2017 IEEE International Conference on Data Mining. IEEE. p pp 1033-1038"},{"key":"19433_CR19","first-page":"pp 1103","volume-title":"Proceedings of the 2017 conference on empirical methods in natural language processing","author":"A Zadeh","year":"2017","unstructured":"Zadeh A, Chen M, Poria S, Cambria E, Morency L-P (2017) Tensor fusion network for multimodal sentiment analysis. Proceedings of the 2017 conference on empirical methods in natural language processing. p pp 1103-1114"},{"key":"19433_CR20","doi-asserted-by":"publisher","first-page":"pp 2247","DOI":"10.18653\/v1\/P18-1209","volume-title":"Proceedings of the 56th annual meeting of the association for computational linguistics (Volume 1: Long Papers)","author":"Z Liu","year":"2018","unstructured":"Liu Z, Shen Y, Lakshminarasimhan VB, Liang PP, Zadeh AB, Morency L-P (2018) Efficient low-rank multimodal fusion with modality-specific factors. Proceedings of the 56th annual meeting of the association for computational linguistics (Volume 1: Long Papers). p pp 2247-2256"},{"key":"19433_CR21","first-page":"pp 29","volume-title":"Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics","author":"S Sahay","year":"2020","unstructured":"Sahay S, Okur E, Kumar SH, Nachman L (2020) Low rank fusion based transformers for multimodal sequences. Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics. pp 29-34"},{"key":"19433_CR22","doi-asserted-by":"publisher","first-page":"pp 6558","DOI":"10.18653\/v1\/P19-1656","volume-title":"Proceedings of the 57th annual meeting of the association for computational linguistics","author":"Y-HH Tsai","year":"2019","unstructured":"Tsai Y-HH, Bai S, Liang PP, Kolter JZ, Morency L-P, Salakhutdinov R (2019) Multimodal transformer for unaligned multimodal language sequences. Proceedings of the 57th annual meeting of the association for computational linguistics. pp 6558-6569"},{"key":"19433_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2021.104866","volume":"138","author":"B Hassan","year":"2021","unstructured":"Hassan B, Rashid T, Hamarashid H (2021) A novel cluster detection of COVID-19 patients and medical disease conditions using improved evolutionary clustering algorithm star. Comput Biol Med 138:104866","journal-title":"Comput Biol Med"},{"key":"19433_CR24","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1016\/j.neucom.2022.12.022","volume":"523","author":"C Xu","year":"2022","unstructured":"Xu C, Wu X, Wang M, Qiu F, Liu Y, Ren J (2022) Improving dynamic gesture recognition in untrimmed videos by an online lightweight framework and a new gesture dataset ZJUGesture. Neurocomputing 523:58\u201368","journal-title":"Neurocomputing"},{"issue":"30","key":"19433_CR25","doi-asserted-by":"publisher","first-page":"44059","DOI":"10.1007\/s11042-022-13260-w","volume":"81","author":"S Qader","year":"2022","unstructured":"Qader S, Hassan B, Rashid T (2022) An improved deep convolutional neural network by using hybrid optimization algorithms to detect and classify brain tumor using augmented MRI images. Multimed Tools Appl 81(30):44059\u201344086","journal-title":"Multimed Tools Appl"},{"key":"19433_CR26","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1007\/s10844-023-00811-2","volume":"62","author":"J Feng","year":"2023","unstructured":"Feng J, Li H, Yu Z (2023) Enhancing aspect-based sentiment analysis with dependency-attention GCN and mutual assistance mechanism. J Intell Inform Syst 62:163\u2013189","journal-title":"J Intell Inform Syst"},{"key":"19433_CR27","doi-asserted-by":"publisher","first-page":"8041","DOI":"10.1007\/s11063-023-11296-z","volume":"55","author":"P Yang","year":"2023","unstructured":"Yang P, Zhang P, Li B, Ji S, Yi M (2023) Aspect-based sentiment analysis using adversarial BERT with capsule networks. Neural Process Lett 55:8041\u20138058","journal-title":"Neural Process Lett"},{"key":"19433_CR28","doi-asserted-by":"publisher","first-page":"1973","DOI":"10.1007\/s12559-023-10164-1","volume":"15","author":"Y Li","year":"2023","unstructured":"Li Y, Lin Z, Lin Y, Yin J, Chang L (2023) Learning sentiment-enhanced word representations by fusing external hybrid sentiment knowledge. Cogn Comput 15:1973\u20131987","journal-title":"Cogn Comput"},{"key":"19433_CR29","doi-asserted-by":"publisher","first-page":"15907","DOI":"10.1007\/s00521-023-08576-z","volume":"35","author":"Z Wang","year":"2023","unstructured":"Wang Z, Hu Z, Ho SB, Cambria E, Tan AH (2023) MiMuSA\u2014mimicking human language understanding for fine-grained multi-class sentiment analysis. Neural Comput Applic 35:15907\u201315921","journal-title":"Neural Comput Applic"},{"key":"19433_CR30","doi-asserted-by":"publisher","first-page":"21463","DOI":"10.1007\/s00521-023-08470-8","volume":"35","author":"P Hajek","year":"2023","unstructured":"Hajek P, Munk M (2023) Speech emotion recognition and text sentiment analysis for financial distress prediction. Neural Comput Applic 35:21463\u201321477","journal-title":"Neural Comput Applic"},{"key":"19433_CR31","first-page":"pp 439","volume-title":"2016 IEEE international conference on data mining. IEEE","author":"S Poria","year":"2016","unstructured":"Poria S, Chaturvedi I, Cambria E, Hussain A (2016) Convolutional MKL based multimodal emotion recognition and sentiment analysis. 2016 IEEE international conference on data mining. IEEE. p pp 439-448"},{"key":"19433_CR32","first-page":"pp 5634","volume-title":"Proceedings of the 32nd AAAI Conference on Artificial Intelligence","author":"A Zadeh","year":"2018","unstructured":"Zadeh A, Liang PP, Mazumder N, Poria S, Cambria E, Morency L-P (2018) Memory fusion network for multi-view sequential learning. Proceedings of the 32nd AAAI Conference on Artificial Intelligence. p pp 5634-5641"},{"key":"19433_CR33","first-page":"pp 5642","volume-title":"Proceedings of the 32nd AAAI conference on artificial intelligence","author":"A Zadeh","year":"2018","unstructured":"Zadeh A, Liang PP, Vij P, Poria S, Cambria E, Morency L-P (2018) Multi-attention recurrent network for human communication comprehension. Proceedings of the 32nd AAAI conference on artificial intelligence. p pp 5642-5649"},{"key":"19433_CR34","first-page":"pp 606","volume-title":"Proceedings of the 56th annual meeting of the association for computational linguistics","author":"O Kampman","year":"2018","unstructured":"Kampman O, Barezi EJ, BERTero D, Fung P (2018) Investigating audio, visual, and text fusion methods for end-to-end automatic personality prediction. Proceedings of the 56th annual meeting of the association for computational linguistics. p pp 606-611"},{"key":"19433_CR35","doi-asserted-by":"publisher","first-page":"pp 521","DOI":"10.1145\/3462244.3479931","volume-title":"Proceedings of the 2021 International Conference on Multimodal Interaction","author":"J Wu","year":"2021","unstructured":"Wu J, Mai S, Hu H (2021) Graph capsule aggregation for unaligned multimodal sequences. Proceedings of the 2021 International Conference on Multimodal Interaction. p pp 521-529"},{"key":"19433_CR36","doi-asserted-by":"publisher","first-page":"pp 2236","DOI":"10.18653\/v1\/P18-1208","volume-title":"Proceedings of the 56th annual meeting of the association for computational linguistics (Volume 1: Long Papers)","author":"A Zadeh","year":"2018","unstructured":"Zadeh A, Liang PP, Vanbriesen J, Poria S, Cambria E, Tong E, Cambria E, Chen M, Morency L-P (2018) Multimodal language analysis in the wild: Cmu-mosei dataset and interpretable dynamic fusion graph. Proceedings of the 56th annual meeting of the association for computational linguistics (Volume 1: Long Papers). p pp 2236-2246"},{"key":"19433_CR37","first-page":"pp 6892","volume-title":"Proceedings of the 33rd AAAI Conference on Artificial Intelligence","author":"H Pham","year":"2019","unstructured":"Pham H, Liang PP, Manzini T, Morency L-P, Poczos B (2019) Found in translation: Learning robust joint representations by cyclic translations between modalities. Proceedings of the 33rd AAAI Conference on Artificial Intelligence. p pp 6892-6899"},{"key":"19433_CR38","doi-asserted-by":"publisher","first-page":"131671","DOI":"10.1109\/ACCESS.2022.3219200","volume":"10","author":"M Xu","year":"2022","unstructured":"Xu M, Liang F, Su X, Fang C (2022) CMJRT: cross-modal joint representation transformer for multimodal sentiment analysis. IEEE Access 10:131671\u2013131679","journal-title":"IEEE Access"},{"key":"19433_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107676","volume":"235","author":"T Wu","year":"2022","unstructured":"Wu T, Peng J, Zhang W, Zhang H, Tan S, Yi F, Ma C, Huang Y (2022) Video sentiment analysis with bimodal information-augmented multi-head attention. Knowl-Based Syst 235:107676","journal-title":"Knowl-Based Syst"},{"key":"19433_CR40","doi-asserted-by":"publisher","first-page":"1943","DOI":"10.1007\/s11063-021-10713-5","volume":"54","author":"X Zhuang","year":"2022","unstructured":"Zhuang X, Liu F, Hou J, Hao J, Cai X (2022) Transformer-based interactive multi-modal attention network for video sentiment detection. Neural Process Lett 54:1943\u20131960","journal-title":"Neural Process Lett"},{"key":"19433_CR41","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1007\/s12559-022-10073-9","volume":"15","author":"F Wang","year":"2023","unstructured":"Wang F, Tian S, Yu L, Liu J, Wang J, Li K, Wang Y (2023) TEDT: transformer\u2013based encoding\u2013decoding translation network. Cogn Comput 15:289\u2013303","journal-title":"Cogn Comput"},{"key":"19433_CR42","first-page":"pp 8992","volume-title":"Proceedings of the 34th AAAI Conference on Artificial Intelligence","author":"Z Sun","year":"2020","unstructured":"Sun Z, Sarma P, Sethares W, Liang Y (2020) Learning relationships between text, audio, and video via deep canonical correlation for multimodal language analysis. Proceedings of the 34th AAAI Conference on Artificial Intelligence. p pp 8992-8999"},{"key":"19433_CR43","doi-asserted-by":"publisher","first-page":"pp 2359","DOI":"10.18653\/v1\/2020.acl-main.214","volume-title":"Proceedings of the 58th annual meeting of the association for computational linguistics","author":"W Rahman","year":"2020","unstructured":"Rahman W, Hasan MK, Lee S, Zadeh A, Mao C, Morency L-P, Hoque E (2020) Integrating multimodal information in large pre-trained transformers. Proceedings of the 58th annual meeting of the association for computational linguistics. p pp 2359-2369"},{"key":"19433_CR44","doi-asserted-by":"publisher","first-page":"pp 3722","DOI":"10.1145\/3503161.3548025","volume-title":"Proceedings of the 30th ACM international conference on multimedia","author":"H Sun","year":"2022","unstructured":"Sun H, Wang H, Liu J, Chen Y-W, Lin L (2022) CubeMLP: An MLP-based model for multimodal sentiment analysis and depression estimation. Proceedings of the 30th ACM international conference on multimedia. p pp 3722-3729"},{"key":"19433_CR45","doi-asserted-by":"publisher","first-page":"pp 9180","DOI":"10.18653\/v1\/2021.emnlp-main.723","volume-title":"Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing","author":"W Han","year":"2021","unstructured":"Han W, Chen H, Poria S (2021) Improving multimodal fusion with hierarchical mutual information maximization for multimodal sentiment analysis. Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing. p pp 9180-9192"},{"key":"19433_CR46","doi-asserted-by":"publisher","first-page":"pp 1122","DOI":"10.1145\/3394171.3413678","volume-title":"Proceedings of the 28th ACM International Conference on Multimedia","author":"D Hazarika","year":"2020","unstructured":"Hazarika D, Zimmermann R, Poria S (2020) MISA: Modality-invariant and -specific representations for multimodal sentiment analysis. Proceedings of the 28th ACM International Conference on Multimedia. p pp 1122-1131"},{"key":"19433_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2022.103229","volume":"60","author":"H Lin","year":"2023","unstructured":"Lin H, Zhang P, Ling J, Yang Z, Lee L, Liu W (2023) PS-Mixer: a polar-vector and strength-vector mixer model for multimodal sentiment analysis. Inf Process Manage 60:103229","journal-title":"Inf Process Manage"},{"key":"19433_CR48","first-page":"pp 5998","volume-title":"Advances in Neural Information Processing Systems","author":"A Vaswani","year":"2017","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser L, Polosukhin I (2017) Attention is all you need. Advances in Neural Information Processing Systems. p pp 5998-6008"},{"key":"19433_CR49","doi-asserted-by":"publisher","first-page":"pp 5027","DOI":"10.18653\/v1\/D18-1548","volume-title":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","author":"E Strubell","year":"2018","unstructured":"Strubell E, Verga P, Andor D, Weiss D, McCallum A (2018) Linguistically-informed self-attention for semantic role labeling. Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing. p pp 5027-5038"},{"key":"19433_CR50","volume-title":"Adaptive input representations for neural language modeling","author":"A Baevski","year":"2018","unstructured":"Baevski A, Auli M (2018) Adaptive input representations for neural language modeling arXiv: 1809.10853"},{"key":"19433_CR51","first-page":"pp 213","volume-title":"European Conference on Computer Vision","author":"N Carion","year":"2020","unstructured":"Carion N, Massa F, Synnaeve G, Usunier N, Kirillov A, Zagoruyko S (2020) End-to-end object detection with transformers. European Conference on Computer Vision. Springer, p pp 213-229"},{"key":"19433_CR52","first-page":"pp 5904","volume-title":"2021 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE","author":"X Chen","year":"2021","unstructured":"Chen X, Wu Y, Wang Z, Liu S, Li J (2021) Developing real-time streaming transformer transducer for speech recognition on large scale dataset. 2021 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE. p pp 5904-5908"},{"key":"19433_CR53","volume-title":"BERT: pre-training of deep bidirectional transformers for language understanding","author":"J Devlin","year":"2018","unstructured":"Devlin J, Chang MW, Lee K, Toutanova K (2018) BERT: pre-training of deep bidirectional transformers for language understanding arXiv:1810.04805"},{"key":"19433_CR54","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.109259","volume":"136","author":"D Wang","year":"2023","unstructured":"Wang D, Guo X, Tian Y, Liu J, He L, Luo X (2023) TETFN: a text enhanced transformer fusion network for multimodal sentiment analysis. Pattern Recognit 136:109259","journal-title":"Pattern Recognit"},{"key":"19433_CR55","first-page":"pp 4753","volume-title":"2022 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE","author":"X Zhao","year":"2022","unstructured":"Zhao X, Chen Y, Li W, Gao L, Tang B (2022) MAG+: An extended multimodal adaptation gate for multimodal sentiment analysis. 2022 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE. p pp 4753-4757"},{"key":"19433_CR56","first-page":"pp 3707","volume-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","author":"W Liu","year":"2015","unstructured":"Liu W, Mei T, Zhang Y, Che C, Luo J (2015) Multi-task deep visual-semantic embedding for video thumbnail selection. Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. p pp 3707-3715"},{"key":"19433_CR57","first-page":"pp 1475","volume-title":"21st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","author":"W Zhang","year":"2015","unstructured":"Zhang W, Li R, Zeng T, Sun Q, Kumar S, Ye J, Ji S (2015) Deep model based transfer and multi-task learning for biological image analysis. 21st ACM SIGKDD Conference on Knowledge Discovery and Data Mining. p pp 1475-1484"},{"key":"19433_CR58","first-page":"pp 370","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, vol 1 (Long and Short Papers)","author":"MS Akhtar","year":"2019","unstructured":"Akhtar MS, Chauhan D, Ghosal D, Poria S, Ekbal A, Bhattacharyya P (2019) Multi-task learning for multi-modal emotion recognition and sentiment analysis. Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, vol 1 (Long and Short Papers). p pp 370-379"},{"key":"19433_CR59","first-page":"pp 10790","volume-title":"Proceedings of the 35th AAAI Conference Onartificial Intelligence","author":"W Yu","year":"2021","unstructured":"Yu W, Xu H, Yuan Z, Wu J (2021) Learning modality-specific representations with self-supervised multi-task learning for multimodal sentiment analysis. Proceedings of the 35th AAAI Conference Onartificial Intelligence. p pp 10790-10797"},{"key":"19433_CR60","doi-asserted-by":"publisher","first-page":"pp 3718","DOI":"10.18653\/v1\/2020.acl-main.343","volume-title":"Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics","author":"W Yu","year":"2020","unstructured":"Yu W, Xu H, Meng F, Zhu Y, Wu J, Zou J, Yang K (2020) Ch-sims: a Chinese multimodal sentiment analysis dataset with fine-grained annotation of modality. Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics. p pp 3718-3727"},{"key":"19433_CR61","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1109\/TETCI.2022.3224929","volume":"7","author":"S Zhang","year":"2023","unstructured":"Zhang S, Yin C, Yin Z (2023) Multimodal sentiment recognition with multi-task learning. IEEE Trans Emerg Top Comp Intell 7:200\u2013209","journal-title":"IEEE Trans Emerg Top Comp Intell"},{"key":"19433_CR62","doi-asserted-by":"publisher","first-page":"16332","DOI":"10.1007\/s10489-022-03343-4","volume":"53","author":"Q Zhang","year":"2022","unstructured":"Zhang Q, Shi L, Liu P, Zhu Z, Xu L (2022) ICDN: integrating consistency and difference networks by transformer for multimodal sentiment analysis. Appl Intell 53:16332\u201316345","journal-title":"Appl Intell"},{"key":"19433_CR63","first-page":"pp 960","volume-title":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE","author":"G Degottex","year":"2014","unstructured":"Degottex G, Kane J, Drugman T, Raitio T, Scherer S (2014) Covarep\u2013a collaborative voice analysis repository for speech technologies. 2014 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE. p pp 960-964"},{"key":"19433_CR64","first-page":"pp 1","volume-title":"IEEE Winter Conference on Applications of Computer Vision. IEEE","author":"T Baltru Aitis","year":"2016","unstructured":"Baltru Aitis T, Robinson P, Morency LP (2016) OpenFace: An open source facial behavior analysis toolkit. IEEE Winter Conference on Applications of Computer Vision. IEEE. p pp 1-10"},{"key":"19433_CR65","volume-title":"Mosi: multimodal corpus of sentiment intensity and subjectivity analysis in online opinion videos","author":"A Zadeh","year":"2016","unstructured":"Zadeh A, Zellers R, Pincus E, Morency L-P (2016) Mosi: multimodal corpus of sentiment intensity and subjectivity analysis in online opinion videos arXiv:1606.06259"},{"key":"19433_CR66","first-page":"35","volume":"2023","author":"Y Hwang","year":"2023","unstructured":"Hwang Y, Kim JH (2023) Self-supervised unimodal label generation strategy using recalibrated modality representations for multimodal sentiment analysis. Findings of the Association for Computational Linguistics: EACL 2023:35\u201346","journal-title":"Findings of the Association for Computational Linguistics: EACL"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-19433-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-19433-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-19433-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,6]],"date-time":"2025-05-06T08:38:51Z","timestamp":1746520731000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-19433-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,28]]},"references-count":66,"journal-issue":{"issue":"13","published-online":{"date-parts":[[2025,4]]}},"alternative-id":["19433"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-19433-z","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,5,28]]},"assertion":[{"value":"29 July 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 March 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 May 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 May 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This manuscript does not contain any study performed with humans or animals.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"The authors declare that they have no conflict of interest.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}