{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T12:57:04Z","timestamp":1761397024396,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":19,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,12,13]],"date-time":"2024-12-13T00:00:00Z","timestamp":1734048000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,12,13]]},"DOI":"10.1145\/3711542.3711551","type":"proceedings-article","created":{"date-parts":[[2025,4,14]],"date-time":"2025-04-14T04:46:56Z","timestamp":1744606016000},"page":"310-316","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Enhancing Multimodal Tweet Analysis Accuracy through Integration of CLIP Model and Multi-layer Attention Mechanism"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-7549-0575","authenticated-orcid":false,"given":"Yupu","family":"Liu","sequence":"first","affiliation":[{"name":"Trustworthy Multimodal Affective Intelligence and Knowledge Engineering Lab, Tokushima University, Tokushima, Tokushima, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9820-1470","authenticated-orcid":false,"given":"Kazuyuki","family":"Matsumoto","sequence":"additional","affiliation":[{"name":"Trustworthy Multimodal Affective Intelligence and Knowledge Engineering Lab, Tokushima University, Tokushima, Tokushima, Japan"}]}],"member":"320","published-online":{"date-parts":[[2025,4,13]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"crossref","unstructured":"Peng Zhang Xufei Wang Baoxin Li \u201cOn Predicting Twitter Trend: Factors and Models \u201d IEEE\/ACM International Conference on Advances in Social Networks Analysis and Mining pp.1427-1429 2013.","DOI":"10.1145\/2492517.2492576"},{"key":"e_1_3_3_1_3_2","unstructured":"Shouqiang S. U. N. and L. I. Qingqing. \"Multimodal negative sentiment recognition in online public opinion during public health emergencies based on fusion strategy.\" Journal of the China Society for Scientific and Technical Information 42.5 (2023): 611-622."},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"crossref","unstructured":"Shi Yifeng et al. \"Open-transmind: A new baseline and benchmark for 1st foundation model challenge of intelligent transportation.\" Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2023.","DOI":"10.1109\/CVPRW59228.2023.00673"},{"key":"e_1_3_3_1_5_2","unstructured":"Liu Nanqing et al. \"CLIP-guided Source-free Object Detection in Aerial Images.\" arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2401.05168 (2024)."},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Agarwal Ayush Ashima Yadav and Dinesh Kumar Vishwakarma. \"Multimodal sentiment analysis via RNN variants.\" 2019 IEEE International Conference on Big Data Cloud Computing Data Science & Engineering (BCD). IEEE 2019.","DOI":"10.1109\/BCD.2019.8885108"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"crossref","unstructured":"Huang Feiran et al. \"Image\u2013text sentiment analysis via deep multimodal attentive fusion.\" Knowledge-Based Systems 167 (2019): 26-37.","DOI":"10.1016\/j.knosys.2019.01.019"},{"key":"e_1_3_3_1_8_2","unstructured":"Xu Kelvin et al. \"Show attend and tell: Neural image caption generation with visual attention.\" International conference on machine learning. PMLR 2015."},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"Lu Jiasen et al. \"Knowing when to look: Adaptive attention via a visual sentinel for image captioning.\" Proceedings of the IEEE conference on computer vision and pattern recognition. 2017.","DOI":"10.1109\/CVPR.2017.345"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"crossref","unstructured":"Song Jifei et al. \"Deep spatial-semantic attention for fine-grained sketch-based image retrieval.\" Proceedings of the IEEE international conference on computer vision. 2017.","DOI":"10.1109\/ICCV.2017.592"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"He Kaiming et al. \"Deep residual learning for image recognition.\" Proceedings of the IEEE conference on computer vision and pattern recognition. 2016.","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"crossref","unstructured":"Ueda Nobuhiro Daisuke Kawahara and Sadao Kurohashi. \"BERT-based cohesion analysis of Japanese texts.\" Proceedings of the 28th International Conference on Computational Linguistics. 2020.","DOI":"10.18653\/v1\/2020.coling-main.114"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"crossref","unstructured":"Moro Gianluca Stefano Salvatori and Giacomo Frisoni. \"Efficient text-image semantic search: A multi-modal vision-language approach for fashion retrieval.\" Neurocomputing 538 (2023): 126196.","DOI":"10.1016\/j.neucom.2023.03.057"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"crossref","unstructured":"Liu Ze et al. \"Swin transformer: Hierarchical vision transformer using shifted windows.\" Proceedings of the IEEE\/CVF international conference on computer vision. 2021.","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"crossref","unstructured":"Yu Jianfei and Jing Jiang. \"Adapting BERT for target-oriented multimodal sentiment classification.\" IJCAI 2019.","DOI":"10.24963\/ijcai.2019\/751"},{"key":"e_1_3_3_1_16_2","unstructured":"Socher Richard et al. \"Zero-shot learning through cross-modal transfer.\" Advances in neural information processing systems 26 (2013)."},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"crossref","unstructured":"Shi Yifeng et al. \"Open-transmind: A new baseline and benchmark for 1st foundation model challenge of intelligent transportation.\" Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2023.","DOI":"10.1109\/CVPRW59228.2023.00673"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"crossref","unstructured":"Sangeeta and Nasib Singh Gill \"Review of Factors Affecting Efficiency of Twitter Data Sentiment Analysis \" International Journal of Computer Theory and Engineering vol. 12 no. 2 pp. 53-58 2020.","DOI":"10.7763\/IJCTE.2020.V12.1263"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"Xiaorui Shao Chang-So Kim and Kwak Dong Ryul \"A Study on Customers\u2019 Sentiment Analysis Based on Big Data Using Twitter Data \" International Journal of Computer Theory and Engineering vol. 11 no. 1 pp. 11-14 2019.","DOI":"10.7763\/IJCTE.2019.V11.1232"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"crossref","unstructured":"Susan Mathew K Deborah Alex Nidhi Deshpande Richa Sharma Arti Arya and D. P. Balendra \"Multilevel Troll Classification of Twitter Data Using Machine Learning Techniques \"International Journal of Computer Theory and Engineering vol. 16 no. 1 pp. 21-28 2024.","DOI":"10.7763\/IJCTE.2024.V16.1350"}],"event":{"name":"NLPIR 2024: 2024 8th International Conference on Natural Language Processing and Information Retrieval","acronym":"NLPIR 2024","location":"Okayama Japan"},"container-title":["Proceedings of the 2024 8th International Conference on Natural Language Processing and Information Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711542.3711551","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3711542.3711551","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:29Z","timestamp":1750295909000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711542.3711551"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,13]]},"references-count":19,"alternative-id":["10.1145\/3711542.3711551","10.1145\/3711542"],"URL":"https:\/\/doi.org\/10.1145\/3711542.3711551","relation":{},"subject":[],"published":{"date-parts":[[2024,12,13]]},"assertion":[{"value":"2025-04-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}