{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,8]],"date-time":"2025-02-08T05:09:30Z","timestamp":1738991370739,"version":"3.37.0"},"reference-count":58,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T00:00:00Z","timestamp":1738886400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T00:00:00Z","timestamp":1738886400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2023D01C176","2023D01C176","2023D01C176","2023D01C176","2023D01C176"],"award-info":[{"award-number":["2023D01C176","2023D01C176","2023D01C176","2023D01C176","2023D01C176"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Xinjiang Uygur Autonomous Region Universities Fundamental Research Funds Scientific Research Project","award":["XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018"],"award-info":[{"award-number":["XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018","XJEDU2 022P018"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"DOI":"10.1007\/s11227-025-06958-9","type":"journal-article","created":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T06:56:01Z","timestamp":1738911361000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["SFVE: visual information enhancement metaphor detection with multimodal splitting fusion"],"prefix":"10.1007","volume":"81","author":[{"given":"Qimeng","family":"Yang","sequence":"first","affiliation":[]},{"given":"Hao","family":"Meng","sequence":"additional","affiliation":[]},{"given":"Yuanbo","family":"Yan","sequence":"additional","affiliation":[]},{"given":"Shisong","family":"Guo","sequence":"additional","affiliation":[]},{"given":"Qixing","family":"Wei","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,7]]},"reference":[{"key":"6958_CR1","unstructured":"Campbell G (1988) The philosophy of rhetoric. SIU Press"},{"issue":"4","key":"6958_CR2","doi-asserted-by":"publisher","first-page":"579","DOI":"10.1162\/COLI_a_00233","volume":"41","author":"S Ekaterina","year":"2015","unstructured":"Ekaterina S (2015) Design and evaluation of metaphor processing systems. Comput Linguistics 41(4):579\u2013623","journal-title":"Comput Linguistics"},{"key":"6958_CR3","doi-asserted-by":"crossref","unstructured":"Steen G et al (2010) A method for linguistic metaphor identification from MIP to MIPVU preface, Method for linguistic metaphor identification: from MIP To MIPVU 14 pp.IX\u2013+","DOI":"10.1075\/celcr.14"},{"key":"6958_CR4","doi-asserted-by":"crossref","unstructured":"Dan A et al (2013) Why \"dark thoughts\u201d aren\u2019t really dark: a novel algorithm for metaphor identification. In: IEEE Symposium on Computational Intelligence, Cognitive Algorithms, Mind, and Brain (CCMB). IEEE. 2013:60\u201365","DOI":"10.1109\/CCMB.2013.6609166"},{"key":"6958_CR5","doi-asserted-by":"crossref","unstructured":"Bizzoni Y, Chatzikyriakidis S, Ghanimifard M (2017) \"deep\u201d learning: detecting metaphoricity in adjective-noun pairs. In: Proceedings of the Workshop on Stylistic Variation. pp.43\u201352","DOI":"10.18653\/v1\/W17-4906"},{"key":"6958_CR6","unstructured":"Lakoff G, Johnson M (2008) Metaphors we live by. University of Chicago press"},{"key":"6958_CR7","doi-asserted-by":"crossref","unstructured":"Wang S et al. (2023) Metaphor detection with effective context denoising. arXiv preprint arXiv:2302.05611","DOI":"10.18653\/v1\/2023.eacl-main.102"},{"key":"6958_CR8","unstructured":"Turney P et al. (2011) Literal and Metaphorical Sense Identification Through Concrete and Abstract Context. In: Proceedings of the 2011 Conference on Empirical Methods in Natural Language Processing. pp.680\u2013690"},{"key":"6958_CR9","doi-asserted-by":"crossref","unstructured":"Li L, Sporleder C (2009) Classifier Combination for Contextual Idiom Detection Without Labelled Data. In: Proceedings of the 2009 conference on empirical methods in natural language processing. pp.315\u2013323","DOI":"10.3115\/1699510.1699552"},{"key":"6958_CR10","unstructured":"Shutova E, Sun L, Korhonen A (2010) Metaphor Identification Using Verb and Noun Clustering. In: Proceedings of the 23rd International Conference on Computational Linguistics (Coling 2010). pp.1002\u20131010"},{"key":"6958_CR11","doi-asserted-by":"crossref","unstructured":"Ding Y et al. (2024) Clothes-Eraser: clothing-aware controllable disentanglement for clothes-changing person re-identification. In: Signal, Image and Video Processing. pp. 1\u201312","DOI":"10.1007\/s11760-024-03076-6"},{"key":"6958_CR12","doi-asserted-by":"crossref","unstructured":"Ding Y, Wang A, Zhang L (2024) Multidimensional semantic disentanglement network for clothes-changing person re-identification. In: Proceedings of the 2024 International Conference on Multimedia Retrieval. pp. 1025\u20131033","DOI":"10.1145\/3652583.3658037"},{"key":"6958_CR13","doi-asserted-by":"crossref","unstructured":"Do Dinh E-L, Gurevych I (2016) Token-level metaphor detection using neural networks. Proceedings of the Fourth Workshop on Metaphor in NLP. pp.28\u201333","DOI":"10.18653\/v1\/W16-1104"},{"key":"6958_CR14","doi-asserted-by":"crossref","unstructured":"Mykowiecka A, Wawer A, Marciniak M (2018) Detecting figurative word occurrences using recurrent neural networks. In: Proceedings of the Workshop on Figurative Language Processing. pp.124\u2013127","DOI":"10.18653\/v1\/W18-0916"},{"key":"6958_CR15","doi-asserted-by":"crossref","unstructured":"Song W et al (2021) Verb metaphor detection via contextual relation learning. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Vol 1: Long Papers). pp.4240\u20134251","DOI":"10.18653\/v1\/2021.acl-long.327"},{"key":"6958_CR16","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1016\/j.inffus.2022.06.002","volume":"86","author":"R Mao","year":"2022","unstructured":"Mao R et al (2022) MetaPro: a computational metaphor processing model for text pre-processing. Inform Fusion 86:30\u201343","journal-title":"Inform Fusion"},{"key":"6958_CR17","unstructured":"Zhang S, Liu Y (2022) Metaphor detection via linguistics enhanced Siamese network. In: Proceedings of the 29th International Conference on Computational Linguistics. pp.4149\u20134159"},{"key":"6958_CR18","doi-asserted-by":"crossref","unstructured":"Fu C et al (2020) Beyond literal visual modeling: Understanding image metaphor based on literal-implied concept mapping. In: MultiMedia Modeling: 26th International Conference, MMM 2020, Daejeon, South Korea, January 5\u20138, 2020, Proceedings, Part I 26. Springer. pp.111\u2013123","DOI":"10.1007\/978-3-030-37731-1_10"},{"key":"6958_CR19","doi-asserted-by":"crossref","unstructured":"Akula AR et al (2023) Metaclue: Towards comprehensive visual metaphors research. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp.23201\u201323211","DOI":"10.1109\/CVPR52729.2023.02222"},{"key":"6958_CR20","doi-asserted-by":"crossref","unstructured":"He T et al (2024) Balanced active sampling for person re-identification. In: 2024 IEEE International Conference on Multimedia and Expo (ICME). IEEE. pp.1\u20136","DOI":"10.1109\/ICME57554.2024.10688230"},{"key":"6958_CR21","doi-asserted-by":"crossref","unstructured":"Shutova E, Kiela D, Maillard J (2016) Black holes and white rabbits: metaphor identification with visual features. In: Proceedings of the 2016 conference of the North American chapter of the association for computational linguistics: Human language technologies. pp.160\u2013170","DOI":"10.18653\/v1\/N16-1020"},{"key":"6958_CR22","unstructured":"Kehat G, Pustejovsky J (2020) Improving neural metaphor detection with visual datasets. In: Proceedings of the Twelfth Language Resources and Evaluation Conference. pp.5928\u20135933"},{"key":"6958_CR23","doi-asserted-by":"publisher","first-page":"166","DOI":"10.1016\/j.neucom.2020.11.051","volume":"429","author":"S Chang","year":"2021","unstructured":"Chang S et al (2021) Multimodal metaphor detection based on distinguishing concreteness. Neurocomputing 429:166\u2013173","journal-title":"Neurocomputing"},{"key":"6958_CR24","doi-asserted-by":"crossref","unstructured":"Zhang D et al (2021) In Your Face: Sentiment Analysis of Metaphor with Facial Expressive Features. In: 2021 International Joint Conference on Neural Networks (IJCNN). IEEE. pp.1\u20138","DOI":"10.1109\/IJCNN52387.2021.9533972"},{"key":"6958_CR25","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s40747-024-01660-4","volume":"11","author":"D Yongkang","year":"2025","unstructured":"Yongkang D et al (2025) Attention-enhanced multimodal feature fusion network for clothes-changing person re-identification. Complex Intell Syst 11:1\u201315","journal-title":"Complex Intell Syst"},{"key":"6958_CR26","unstructured":"Li W et al (2024) rLLM: Relational table learning with LLMs. arXiv preprint arXiv:2407.20157"},{"key":"6958_CR27","doi-asserted-by":"crossref","unstructured":"Wang Z et al (2024) From cluster assumption to graph convolution: Graph-based semi-supervised learning revisited. In: IEEE Transactions on Neural Networks and Learning Systems","DOI":"10.1109\/TNNLS.2024.3454710"},{"key":"6958_CR28","doi-asserted-by":"crossref","unstructured":"Wang Z et al (2021) Zero-shot node classification with decomposed graph prototype network. In: Proceedings of the 27th ACM SIGKDD conference on knowledge discovery & data mining. pp.1769\u20131779","DOI":"10.1145\/3447548.3467230"},{"issue":"11","key":"6958_CR29","first-page":"3634","volume":"33","author":"W Zheng","year":"2020","unstructured":"Zheng W et al (2020) Network embedding with completely-imbalanced labels. IEEE Trans Knowledge Data Eng 33(11):3634\u20133647","journal-title":"IEEE Trans Knowledge Data Eng"},{"key":"6958_CR30","doi-asserted-by":"crossref","unstructured":"Wang Z et al (2017) Multiple source detection without knowing the underlying propagation model. In: Proceedings of the AAAI Conference on Artificial Intelligence","DOI":"10.1609\/aaai.v31i1.10477"},{"key":"6958_CR31","doi-asserted-by":"crossref","unstructured":"Alnajjar K , H\u00e4m\u00e4l\u00e4inen M, Zhang S (2022) Ring that bell: A corpus and method for multimodal metaphor detection in videos. arXiv preprint arXiv:2301.01134","DOI":"10.18653\/v1\/2022.flp-1.4"},{"key":"6958_CR32","doi-asserted-by":"crossref","unstructured":"Zhang D et al (2021) MultiMET: a multimodal dataset for metaphor understanding. In: Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 1: Long Papers). pp.3214\u20133225","DOI":"10.18653\/v1\/2021.acl-long.249"},{"key":"6958_CR33","doi-asserted-by":"crossref","unstructured":"Xu B et al (2022) Met-meme: a multimodal meme dataset rich in metaphors. In: Proceedings of the 45th international ACM SIGIR conference on research and development in information retrieval. pp.2887\u20132899","DOI":"10.1145\/3477495.3532019"},{"key":"6958_CR34","unstructured":"Kim J (2022) BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding"},{"issue":"7","key":"6958_CR35","doi-asserted-by":"publisher","first-page":"9277","DOI":"10.1007\/s11042-021-11549-w","volume":"81","author":"Z Liming","year":"2022","unstructured":"Liming Z et al (2022) An infrared and visible image fusion algorithm based on ResNet-152. Multimed Tools Appl 81(7):9277\u20139287","journal-title":"Multimed Tools Appl"},{"key":"6958_CR36","doi-asserted-by":"crossref","unstructured":"Zhou B et al (2016) Learning deep features for discriminative localization. Proceedings of the IEEE conference on computer vision and pattern recognition. pp.2921\u20132929","DOI":"10.1109\/CVPR.2016.319"},{"key":"6958_CR37","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. Proceedings of the IEEE conference on computer vision and pattern recognition. pp.7132\u20137141","DOI":"10.1109\/CVPR.2018.00745"},{"key":"6958_CR38","unstructured":"Zagoruyko S, Komodakis N (2016) Paying more attention to attention: Improving the performance of convolutional neural networks via attention transfer. arXiv preprint arXiv:1612.03928"},{"key":"6958_CR39","unstructured":"Joze HRV et al (2020) MMTM: multimodal transfer module for CNN fusion. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp.13289\u201313299"},{"key":"6958_CR40","doi-asserted-by":"crossref","unstructured":"Cai Y, Cai H, Wan X (2019) Multi-modal sarcasm detection in twitter with hierarchical fusion model. In: Proceedings of the 57th annual meeting of the association for computational linguistics. pp.2506\u20132515","DOI":"10.18653\/v1\/P19-1239"},{"key":"6958_CR41","doi-asserted-by":"crossref","unstructured":"Lewis M et al (2019) Bart: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. arXiv preprint arXiv:1910.13461","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"6958_CR42","doi-asserted-by":"crossref","unstructured":"Qassim H, Verma A, Feinzimer D (2018) Compressed residual-VGG16 CNN model for big data places image recognition. In: IEEE 8th annual computing and communication workshop and conference (CCWC). IEEE. 2018:169\u2013175","DOI":"10.1109\/CCWC.2018.8301729"},{"key":"6958_CR43","doi-asserted-by":"crossref","unstructured":"He K et al (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp.770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"6958_CR44","doi-asserted-by":"crossref","unstructured":"Pan H et al (2020) Modeling intra and inter-modality incongruity for multi-modal sarcasm detection. In: Findings of the Association for Computational Linguistics: EMNLP 2020. pp.1383\u20131392","DOI":"10.18653\/v1\/2020.findings-emnlp.124"},{"key":"6958_CR45","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1016\/j.neucom.2021.09.041","volume":"467","author":"B Yang","year":"2022","unstructured":"Yang B et al (2022) Multimodal sentiment analysis with unidirectional modality translation. Neurocomputing 467:130\u2013137","journal-title":"Neurocomputing"},{"key":"6958_CR46","doi-asserted-by":"crossref","unstructured":"de Toledo GL, Marcacini RM (2022) Transfer learning with joint fine-tuning for multimodal sentiment analysis. arXiv preprint arXiv:2210.05790","DOI":"10.52591\/lxai202207173"},{"key":"6958_CR47","doi-asserted-by":"crossref","unstructured":"Chen X et al (2022) Hybrid transformer with multi-level fusion for multimodal knowledge graph completion. In: Proceedings of the 45th international ACM SIGIR conference on research and development in information retrieval. pp.904\u2013915","DOI":"10.1145\/3477495.3531992"},{"issue":"1","key":"6958_CR48","first-page":"309","volume":"15","author":"S Licai","year":"2023","unstructured":"Licai S et al (2023) Efficient multimodal transformer with dual-level feature restoration for robust multimodal sentiment analysis. IEEE Trans Affect Comput 15(1):309\u2013325","journal-title":"IEEE Trans Affect Comput"},{"issue":"3","key":"6958_CR49","doi-asserted-by":"publisher","first-page":"103652","DOI":"10.1016\/j.ipm.2024.103652","volume":"61","author":"H Xiaoyu","year":"2024","unstructured":"Xiaoyu H et al (2024) VIEMF: multimodal metaphor detection via visual information enhancement with multimodal fusion. Inform Process Manage 61(3):103652","journal-title":"Inform Process Manage"},{"key":"6958_CR50","doi-asserted-by":"crossref","unstructured":"Xu N, Zeng Z, Mao W (2020) Reasoning with multimodal sarcastic tweets via modeling cross-modality contrast and semantic association. In: Proceedings of the 58th annual meeting of the association for computational linguistics. pp.3777\u20133786","DOI":"10.18653\/v1\/2020.acl-main.349"},{"key":"6958_CR51","doi-asserted-by":"crossref","unstructured":"Lou C et al (2021) Affective dependency graph for sarcasm detection. In: Proceedings of the 44th international ACM SIGIR conference on research and development in information retrieval. pp.1844\u20131849","DOI":"10.1145\/3404835.3463061"},{"key":"6958_CR52","doi-asserted-by":"crossref","unstructured":"Liang B et al (2022) Multi-modal sarcasm detection via cross-modal graph convolutional network. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers). Association for Computational Linguistics. pp.1767\u20131777","DOI":"10.18653\/v1\/2022.acl-long.124"},{"key":"6958_CR53","doi-asserted-by":"publisher","first-page":"101921","DOI":"10.1016\/j.inffus.2023.101921","volume":"100","author":"Y Tan","year":"2023","unstructured":"Tan Y et al (2023) KnowleNet: knowledge fusion network for multimodal sarcasm detection. Inform Fusion 100:101921","journal-title":"Inform Fusion"},{"key":"6958_CR54","unstructured":"Clark K (2020) Electra: Pre-training text encoders as discriminators rather than generators, arXiv preprint arXiv:2003.10555"},{"key":"6958_CR55","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1016\/j.inffus.2020.01.008","volume":"59","author":"H Cai","year":"2020","unstructured":"Cai H et al (2020) Feature-level fusion approaches based on multimodal EEG data for depression recognition. Inform Fusion 59:127\u2013138","journal-title":"Inform Fusion"},{"key":"6958_CR56","doi-asserted-by":"publisher","first-page":"625","DOI":"10.1007\/s00521-018-3882-6","volume":"32","author":"MKA Ghani","year":"2020","unstructured":"Ghani MKA et al (2020) Decision-level fusion scheme for nasopharyngeal carcinoma identification using machine learning techniques. Neural Comput Appl 32:625\u2013638","journal-title":"Neural Comput Appl"},{"key":"6958_CR57","doi-asserted-by":"publisher","first-page":"108580","DOI":"10.1016\/j.knosys.2022.108580","volume":"244","author":"MA Iqbal","year":"2022","unstructured":"Iqbal MA, Baibhav N, Sarbani R (2022) Deep learning based multimodal emotion recognition using model-level fusion of audio-visual modalities. Knowledge-Based Syst 244:108580","journal-title":"Knowledge-Based Syst"},{"key":"6958_CR58","doi-asserted-by":"crossref","unstructured":"Selvaraju RR et al (2017) Grad-cam: visual explanations from deep networks via gradient-based localization. Proceedings of the IEEE international conference on computer vision. pp.618\u2013626","DOI":"10.1109\/ICCV.2017.74"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-06958-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-025-06958-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-06958-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T06:56:22Z","timestamp":1738911382000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-025-06958-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,7]]},"references-count":58,"journal-issue":{"issue":"3","published-online":{"date-parts":[[2025,2]]}},"alternative-id":["6958"],"URL":"https:\/\/doi.org\/10.1007\/s11227-025-06958-9","relation":{},"ISSN":["1573-0484"],"issn-type":[{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,7]]},"assertion":[{"value":"15 January 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 February 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interests"}}],"article-number":"467"}}