{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T12:31:46Z","timestamp":1781008306175,"version":"3.54.1"},"reference-count":75,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2020,5,25]],"date-time":"2020-05-25T00:00:00Z","timestamp":1590364800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,5,25]],"date-time":"2020-05-25T00:00:00Z","timestamp":1590364800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2020,8]]},"DOI":"10.1007\/s00530-020-00656-7","type":"journal-article","created":{"date-parts":[[2020,5,25]],"date-time":"2020-05-25T12:02:42Z","timestamp":1590408162000},"page":"431-451","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":50,"title":["A deep learning architecture of RA-DLNet for visual sentiment analysis"],"prefix":"10.1007","volume":"26","author":[{"given":"Ashima","family":"Yadav","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1026-0047","authenticated-orcid":false,"given":"Dinesh Kumar","family":"Vishwakarma","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2020,5,25]]},"reference":[{"key":"656_CR1","doi-asserted-by":"crossref","unstructured":"You, Q., Luo, J., Jin, H., Yang, J.: Robust image sentiment analysis using progressively trained and domain transferred deep networks. In: Twenty-Ninth AAAI Conference on Artificial Intelligence, pp. 381\u2013388. USA (2015)","DOI":"10.1609\/aaai.v29i1.9179"},{"key":"656_CR2","doi-asserted-by":"publisher","first-page":"557","DOI":"10.1016\/j.patcog.2016.06.002","volume":"61","author":"E Ohn-bar","year":"2016","unstructured":"Ohn-bar, E., Trivedi, M.M.: Multi-scale volumes for deep object detection and localization. Pattern Recogn. 61, 557\u2013572 (2016)","journal-title":"Pattern Recogn."},{"issue":"1","key":"656_CR3","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1109\/TPAMI.2015.2437384","volume":"38","author":"R Girshick","year":"2016","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Region-based convolutional networks for accurate object detection and segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 38(1), 142\u2013158 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"656_CR4","doi-asserted-by":"crossref","unstructured":"Oquab, M., Bottou, L.: Learning and transferring mid-level image representations using convolutional neural networks. In: IEEE Conference on Computer Vision and Pattern Recognition Learning,\u00a0pp. 1717\u20131724. Columbus, OH (2014)","DOI":"10.1109\/CVPR.2014.222"},{"key":"656_CR5","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L., Li, K., Fei-fei, L.: ImageNet: a large-scale hierarchical image database. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 248\u2013255. Florida (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"656_CR6","first-page":"435","volume-title":"European Conference on Computer Vision","author":"B Chu","year":"2016","unstructured":"Chu, B., Madhavan, V., Beijbom, O., Hoffman, J., Darrell, T.: Best practices for fine-tuning visual classifiers to new domains. In: Hua, G., J\u00e9gou, H. (eds.) European Conference on Computer Vision, pp. 435\u2013442. Springer, Amsterdam (2016)"},{"key":"656_CR7","doi-asserted-by":"crossref","unstructured":"Borth, D., Ji, R., Chen, T., Breuel, T., Chang, S.-F.: Large-scale visual sentiment ontology and detectors using adjective noun pairs. In: 21st ACM International Conference on Multimedia,\u00a0pp. 223\u2013232 (2013)","DOI":"10.1145\/2502081.2502282"},{"key":"656_CR8","doi-asserted-by":"crossref","unstructured":"Siersdorfer, S., Minack, E., Deng, F., Hare, J.: Analyzing and predicting sentiment of images on the social web. In: 18th ACM International Conference on Multimedia,\u00a0pp. 715\u2013718 (2010)","DOI":"10.1145\/1873951.1874060"},{"key":"656_CR9","doi-asserted-by":"crossref","unstructured":"Vonikakis, V., Winkler, S.: Emotion-based sequence of family photos. In: Proceedings of the 20th ACM International conference on Multimedia,\u00a0pp. 1371\u20131372 (2012)","DOI":"10.1145\/2393347.2396490"},{"key":"656_CR10","doi-asserted-by":"crossref","unstructured":"Jia, J., Wu, S., Wang, X., Hu, P., Cai, L., Tang, J.: Can we understand van gogh\u2019s mood? Learning to infer affects from images in social networks. In: 20th ACM International Conference on Multimedia,\u00a0pp. 857\u2013860 (2012)","DOI":"10.1145\/2393347.2396330"},{"key":"656_CR11","doi-asserted-by":"crossref","unstructured":"Li, B., Feng, S., Xiong, W., Hu, W.: Scaring or pleasing: exploit emotional impact of an image. In: 20th ACM International Conference on Multimedia,\u00a0pp. 1365\u20131366 (2012)","DOI":"10.1145\/2393347.2396487"},{"issue":"12","key":"656_CR12","doi-asserted-by":"publisher","first-page":"2185","DOI":"10.1109\/TMM.2015.2484966","volume":"17","author":"S Wang","year":"2015","unstructured":"Wang, S., Wang, J., Wang, Z., Ji, Q.: Multiple emotion tagging for multimedia data by exploiting high-order dependencies among emotions. IEEE Trans. Multimedia 17(12), 2185\u20132197 (2015)","journal-title":"IEEE Trans. Multimedia"},{"key":"656_CR13","doi-asserted-by":"crossref","unstructured":"Yuan, J., You, Q., Mcdonough, S., Luo, J.: Sentribute: image sentiment analysis from a mid-level perspective. In: Second International Workshop on Issues of Sentiment Discovery and Opinion Mining,\u00a0pp. 1\u20138. Chicago (2013)","DOI":"10.1145\/2502069.2502079"},{"key":"656_CR14","doi-asserted-by":"crossref","unstructured":"Zhao, S., Gao, Y., Jiang, X., Yao, H., Chua, T., Sun, X.: Exploring principles-of-art features for image emotion recognition. In: 22nd ACM International Conference on Multimedia,\u00a0pp. 47\u201356. Florida (2014)","DOI":"10.1145\/2647868.2654930"},{"issue":"3","key":"656_CR15","doi-asserted-by":"publisher","first-page":"298","DOI":"10.1109\/TAFFC.2014.2388370","volume":"6","author":"Y Chen","year":"2015","unstructured":"Chen, Y., Chen, T., Liu, T., Liao, H.Y.M., Chang, S.: Assistive image comment robot\u2014a novel mid-level concept-based representation. IEEE Trans. Affect. Comput. 6(3), 298\u2013311 (2015)","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"4","key":"656_CR16","doi-asserted-by":"publisher","first-page":"997","DOI":"10.1109\/TMM.2017.2757769","volume":"20","author":"F Chen","year":"2018","unstructured":"Chen, F., Ji, R., Su, J., Cao, D., Gao, Y.: Predicting microblog sentiments via weakly supervised multimodal deep learning. IEEE Trans. Multimedia 20(4), 997\u20131007 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"656_CR17","doi-asserted-by":"publisher","first-page":"2513","DOI":"10.1109\/TMM.2018.2803520","volume":"20","author":"J Yang","year":"2018","unstructured":"Yang, J., She, D., Sun, M., Cheng, M.-M., Rosin, P.L., Wang, L.: Visual sentiment prediction based on automatic discovery of affective regions. IEEE Trans. Multimedia 20, 2513\u20132525 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"656_CR18","first-page":"1","volume":"30","author":"H Xiong","year":"2019","unstructured":"Xiong, H., Liu, Q., Song, S., Cai, Y.: Region-based convolutional neural network using group sparse regularization for image sentiment classification. EURASIP J. Image Video Process. 30, 1\u20139 (2019)","journal-title":"EURASIP J. Image Video Process."},{"issue":"6","key":"656_CR19","doi-asserted-by":"publisher","first-page":"1245","DOI":"10.1109\/TMM.2017.2648498","volume":"19","author":"B Zhao","year":"2017","unstructured":"Zhao, B., Wu, X., Feng, J., Peng, Q., Yan, S.: Diversified visual attention networks for fine-grained object classification. IEEE Trans. Multimedia 19(6), 1245\u20131256 (2017)","journal-title":"IEEE Trans. Multimedia"},{"key":"656_CR20","doi-asserted-by":"crossref","unstructured":"Zoph, B., Vasudevan, V., Shlens, J., Le, Q.V.: Learning transferable architectures for scalable image recognition. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 8697\u20138710. Utah (2018)","DOI":"10.1109\/CVPR.2018.00907"},{"key":"656_CR21","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. In: International Conference on Learning Representations. California (2015)"},{"key":"656_CR22","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Shlens, J., Wojna, Z.: Rethinking the inception architecture for computer vision. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 2818\u20132826 (2015)","DOI":"10.1109\/CVPR.2016.308"},{"key":"656_CR23","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate. In: International Conference on Learning Representations. California (2015)"},{"key":"656_CR24","doi-asserted-by":"crossref","unstructured":"Wang, F., Jiang, M., Qian, C., Yang, S., Li, C., Zhang, H., Wang, X., Tang, X.: Residual attention network for image classification. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 3156\u20133164 (2017)","DOI":"10.1109\/CVPR.2017.683"},{"key":"656_CR25","doi-asserted-by":"crossref","unstructured":"Campos, V., Salvador, A., Jou, B., Gir\u00f3-i-nieto, X.: Diving deep into sentiment: understanding fine-tuned CNNs for visual sentiment prediction. In: 1st International Workshop on Affect & Sentiment in Multimedia,\u00a0pp. 57\u201362 (2015)","DOI":"10.1145\/2813524.2813530"},{"key":"656_CR26","unstructured":"Wang, J., Fu, J., Xu, Y., Mei, T.: Beyond object recognition: visual sentiment analysis with deep coupled adjective and noun neural networks. In: Twenty-Fifth International Joint Conference on Artificial Intelligence,\u00a0pp. 3484\u20133490. New York (2016)"},{"key":"656_CR27","doi-asserted-by":"publisher","first-page":"218","DOI":"10.1016\/j.neucom.2018.05.104","volume":"312","author":"K Song","year":"2018","unstructured":"Song, K., Yao, T., Ling, Q., Mei, T.: Boosting image sentiment analysis with visual attention. Neurocomputing 312, 218\u2013228 (2018)","journal-title":"Neurocomputing"},{"key":"656_CR28","doi-asserted-by":"crossref","unstructured":"Islam, J., Zhang, Y.: Visual sentiment analysis for social images using transfer learning approach. In: IEEE International Conferences on Big Data and Cloud Computing (BDCloud), Social Computing and Networking (SocialCom), Sustainable Computing and Communications (SustainCom),\u00a0pp. 124\u2013130. Atlanta (2016)","DOI":"10.1109\/BDCloud-SocialCom-SustainCom.2016.29"},{"key":"656_CR29","doi-asserted-by":"crossref","unstructured":"Fan, S., Jiang, M., Shen, Z., Koenig, B.L., Kankanhalli, M.S., Zhao, Q.: The role of visual attention in sentiment prediction. In: 25th ACM International Conference on Multimedia,\u00a0pp. 217\u2013225. California (2017)","DOI":"10.1145\/3123266.3123445"},{"key":"656_CR30","doi-asserted-by":"crossref","unstructured":"Sharma, R., Tan, L.N., Sadat, F.: Multimodal sentiment analysis using deep learning. In: 17th IEEE International Conference on Machine Learning and Applications,\u00a0pp. 1475\u20131478 (2018)","DOI":"10.1109\/ICMLA.2018.00240"},{"issue":"10","key":"656_CR31","doi-asserted-by":"publisher","first-page":"2693","DOI":"10.1109\/TMM.2018.2815998","volume":"20","author":"Z Li","year":"2018","unstructured":"Li, Z., Jiao, Y., Yang, X., Zhang, T., Huang, S.: 3D attention-based deep ranking model for video highlight detection. IEEE Trans. Multimedia 20(10), 2693\u20132705 (2018)","journal-title":"IEEE Trans. Multimedia"},{"key":"656_CR32","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Ioffe, S., Vanhoucke, V., Alemi, A.: Inception-v4, inception-ResNet and the impact of residual connections on learning. In: 31st AAAI Conference on Artificial Intelligence,\u00a0pp. 4278\u20134284. Arizona (2016)","DOI":"10.1609\/aaai.v31i1.11231"},{"issue":"1","key":"656_CR33","doi-asserted-by":"publisher","first-page":"1115","DOI":"10.1007\/s11042-016-4310-5","volume":"77","author":"Z Li","year":"2017","unstructured":"Li, Z., Fan, Y., Liu, W., Wang, F.: Image sentiment prediction based on textual descriptions with adjective noun pairs. Multimedia Tools Appl. 77(1), 1115\u20131132 (2017)","journal-title":"Multimedia Tools Appl."},{"key":"656_CR34","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patcog.2018.07.028","volume":"85","author":"H Yang","year":"2019","unstructured":"Yang, H., Yuan, C., Li, B., Du, Y., Xing, J.: Asymmetric 3D convolutional neural networks for action recognition. Pattern Recogn. 85, 1\u201312 (2019)","journal-title":"Pattern Recogn."},{"key":"656_CR35","doi-asserted-by":"crossref","unstructured":"Chollet, F.: Xception: deep learning with depthwise separable convolutions. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 1251\u20131258. Honolulu\u00a0(2017)","DOI":"10.1109\/CVPR.2017.195"},{"key":"656_CR36","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778. Las Vegas (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"656_CR37","doi-asserted-by":"crossref","unstructured":"Xiao, T., Li, H., Ouyang, W., Wang, X.: Learning deep feature representations with domain guided dropout for person re-identification. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 1249\u20131258. Las Vegas (2016)","DOI":"10.1109\/CVPR.2016.140"},{"key":"656_CR38","doi-asserted-by":"crossref","unstructured":"Toshev, A., Szegedy, C.: DeepPose: human pose estimation via deep neural networks. In: IEEE Conference on Computer Vision and Pattern Recognition, Columbus, pp. 1653\u20131660. Ohio (2014)","DOI":"10.1109\/CVPR.2014.214"},{"key":"656_CR39","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: IEEE Conference on Computer Vision and Pattern Recognition,\u00a0pp. 580\u2013587. Columbus, Ohio (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"656_CR40","unstructured":"Schulman, J., Wolski, F., Dhariwal, P., Radford, A., Klimov, O.: Proximal policy optimization algorithms (2017). arXiv preprint arXiv:1707.06347"},{"key":"656_CR41","doi-asserted-by":"crossref","unstructured":"Machajdik, J., Hanbury, A.: Affective image classification using features inspired by psychology and art theory. In: ACM International Conference on Multimedia,\u00a0pp. 83\u201392 (2010)","DOI":"10.1145\/1873951.1873965"},{"key":"656_CR42","doi-asserted-by":"crossref","unstructured":"Wang, X., Jia, J., Yin, J., Cai, L.: Interpretable aesthetic features for affective image classification. In: IEEE International Conference on Image Processing,\u00a0pp. 3230\u20133234 (2013)","DOI":"10.1109\/ICIP.2013.6738665"},{"key":"656_CR43","doi-asserted-by":"crossref","unstructured":"Rao, T., Xu, M., Liu, H., Wang, J., Burnett, I.: Multi-scale blocks based image emotion classification using multiple instance learning. In: IEEE International Conference on Image Processing (ICIP),\u00a0pp. 634\u2013638. Arizona (2016)","DOI":"10.1109\/ICIP.2016.7532434"},{"issue":"13","key":"656_CR44","doi-asserted-by":"publisher","first-page":"17247","DOI":"10.1007\/s11042-017-5289-2","volume":"77","author":"T Rao","year":"2018","unstructured":"Rao, T., Xu, M., Liu, H.: Generating affective maps for images. Multimedia Tools Appl. 77(13), 17247\u201317267 (2018)","journal-title":"Multimedia Tools Appl."},{"key":"656_CR45","doi-asserted-by":"publisher","first-page":"576","DOI":"10.1016\/j.jvcir.2018.12.032","volume":"58","author":"X Liu","year":"2019","unstructured":"Liu, X., Li, N., Xia, Y.: Affective image classification by jointly using interpretable art features. J. Vis. Commun. Image Represent. 58, 576\u2013588 (2019)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"656_CR46","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/j.imavis.2017.01.011","volume":"65","author":"V Campos","year":"2017","unstructured":"Campos, V., Jou, B., Giro-i-Nieto, X.: From pixels to sentiment: fine-tuning CNNs for visual sentiment prediction. Image Vis. Comput. 65, 15\u201322 (2017)","journal-title":"Image Vis. Comput."},{"key":"656_CR47","unstructured":"Zoph, B., Le, Q.V.: Neural architecture search with reinforcement learning. In: International Conference on Learning representations (2017)"},{"key":"656_CR48","unstructured":"Yadav, A., Vishwakarma, D.K.: Sentiment analysis using deep learning architectures: a review. Artificial Intelligence Review, pp. 1\u201351 (2019)"},{"issue":"5","key":"656_CR49","doi-asserted-by":"publisher","first-page":"1358","DOI":"10.1109\/TMM.2019.2939744","volume":"22","author":"D She","year":"2019","unstructured":"She, D., Yang, J., Cheng, M.M., Lai, Y.K., Rosin, P.L., Wang, L.: WSCNet: weakly supervised coupled networks for visual sentiment classification and detection. IEEE Trans. Multimedia. 22(5), 1358\u20131371 (2019)","journal-title":"IEEE Trans. Multimedia."},{"key":"656_CR50","doi-asserted-by":"crossref","unstructured":"Fan, S., Jiang, M., Koenig, B.L., Xu, J., Kankanhalli, M.S., Zhao, Q.: Emotional attention: a study of image sentiment and visual attention. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition,\u00a0pp. 7521\u20137531. Salt Lake (2018)","DOI":"10.1109\/CVPR.2018.00785"},{"key":"656_CR51","doi-asserted-by":"crossref","unstructured":"Lee, J., Kim, S., Kim, S., Park, J., Sohn, K.: Context-aware emotion recognition networks. In: Proceedings of the IEEE International Conference on Computer Vision,\u00a0pp. 10143\u201310152. Seoul (2019)","DOI":"10.1109\/ICCV.2019.01024"},{"issue":"12","key":"656_CR52","doi-asserted-by":"publisher","first-page":"9061","DOI":"10.1007\/s00521-018-3867-5","volume":"31","author":"VS Bawa","year":"2018","unstructured":"Bawa, V.S., Kumar, V.: \"Emotional sentiment analysis for a group of people based on transfer learning with a multi-modal system. Neural Comput. Appl. 31(12), 9061\u20139072 (2018)","journal-title":"Neural Comput. Appl."},{"key":"656_CR53","doi-asserted-by":"crossref","unstructured":"Yang, J., She, D., Sun, M.: Joint image emotion classification and distribution learning via deep convolutional neural network. In: Proceedings of the Twenty-Sixth International Joint Conference on Artificial Intelligence (IJCAI-17),\u00a0pp. 3266\u20133272 (2017)","DOI":"10.24963\/ijcai.2017\/456"},{"key":"656_CR54","doi-asserted-by":"crossref","unstructured":"Zhu, X., Li, L., Zhang, W., Rao, T., Xu, M., Huang, Q., Xu, D.: Dependency exploitation: a unified CNN-RNN approach for visual emotion recognition. In: Proceedings of the Twenty-Sixth International Joint Conference on Artificial Intelligence,\u00a0pp. 3595\u20133601 (2017)","DOI":"10.24963\/ijcai.2017\/503"},{"key":"656_CR55","doi-asserted-by":"crossref","unstructured":"Yang, J., She, D., Lai, Y.K., Yang, M.H.: Retrieving and classifying affective images via deep metric learning. In: The Thirty-Second AAAI Conference on Artificial Intelligence (AAAI-18), pp. 491\u2013498. Louisiana (2018)","DOI":"10.1609\/aaai.v32i1.11275"},{"key":"656_CR56","doi-asserted-by":"crossref","unstructured":"Zhao, S., Lin, C., Xu, P., Zhao, S., Guo, Y., Krishna, R., Ding, G., Keutzer, K.: CycleEmotionGAN: emotional semantic consistency preserved CycleGAN for adapting image emotions. In: The Thirty-Third AAAI Conference on Artificial Intelligence (AAAI-19),\u00a0pp. 2620\u20132627. Hawaii (2019)","DOI":"10.1609\/aaai.v33i01.33012620"},{"issue":"2","key":"656_CR57","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TMM.2019.2928998","volume":"22","author":"W Zhang","year":"2019","unstructured":"Zhang, W., He, X., Lu, W.: Exploring discriminative representations for image emotion recognition with CNNs. IEEE Trans. Multimed. 22(2), 515\u2013523 (2019)","journal-title":"IEEE Trans. Multimed."},{"key":"656_CR58","unstructured":"Chen, T., Borth, D., Darrell, T., Chang, S.F.: Deepsentibank: Visual sentiment concept classification with deep convolutional neural networks (2014). arXiv preprint arXiv:1410.8586"},{"key":"656_CR59","doi-asserted-by":"crossref","unstructured":"Katsurai, M., Satoh, S.: Image sentiment analysis using latent correlations among visual, textual, and sentiment views. In: IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP),\u00a0pp. 2837\u20132841 (2016)","DOI":"10.1109\/ICASSP.2016.7472195"},{"key":"656_CR60","doi-asserted-by":"crossref","unstructured":"He, X., Zhang, H., Li, N., Feng, L., Zheng, F.: A multi-attentive pyramidal model for visual sentiment analysis. In: International Joint Conference on Neural Networks, pp. 1\u20138 (2019)","DOI":"10.1109\/IJCNN.2019.8852317"},{"key":"656_CR61","doi-asserted-by":"crossref","unstructured":"Yang, J., She, D., Lai, Y.K., Rosin, P.L., Yang, M.H.: Weakly supervised coupled networks for visual sentiment analysis. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition,\u00a0pp. 7584\u20137592. Salt Lake City (2018)","DOI":"10.1109\/CVPR.2018.00791"},{"key":"656_CR62","unstructured":"Zadeh, A., Zellers, R., Pincus, E., Morency, L.P.: MOSI: multimodal corpus of sentiment intensity and subjectivity analysis in online opinion videos (2016). arXiv preprint arXiv:1606.06259"},{"key":"656_CR63","unstructured":"Zadeh, A., Liang, P.P., Vanbriesen, J., Poria, S., Tong, E., Cambria, E., Chen, M., Morency, L.P.: Multimodal language analysis in the wild: Cmu-mosei dataset and interpretable dynamic fusion graph. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics, vol. 1, pp. 2236\u20132246 (2018)"},{"key":"656_CR64","doi-asserted-by":"crossref","unstructured":"You, Q., Luo, J., Jin, H., Yang, J.: Building a large scale dataset for image emotion recognition: the fine print and the benchmark. In: Proceedings of the Thirtieth AAAI Conference on Artificial Intelligence (AAAI-16),\u00a0pp. 308\u2013314. Arizona (2016)","DOI":"10.1609\/aaai.v30i1.9987"},{"key":"656_CR65","doi-asserted-by":"crossref","unstructured":"Dumpala, S.H., Sheikh, I., Chakraborty, R., Kopparapu, S.K.: Sentiment classification on erroneous ASR transcripts: a multi view learning approach. In: IEEE Spoken Language Technology Workshop (SLT 2018), pp. 807\u2013814. Greece (2018)","DOI":"10.1109\/SLT.2018.8639665"},{"key":"656_CR66","unstructured":"Dumpala, S.H., Sheikh, I., Chakraborty, R., Kopparapu, S.K.: Audio-visual fusion for sentiment classification using cross-modal autoencoder. In: 32nd Conference on Neural Information Processing Systems (NIPS 2018),\u00a0pp. 1\u20134. Canada (2018)"},{"key":"656_CR67","doi-asserted-by":"crossref","unstructured":"Chauhan, D.S., Akhtar, M.S., Ekbal, A., Bhattacharyya, P.: Context-aware interactive attention for multi-modal sentiment and emotion analysis. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing, pp. 5646\u20135656 (2019)","DOI":"10.18653\/v1\/D19-1566"},{"key":"656_CR68","doi-asserted-by":"crossref","unstructured":"Akhtar, M.S., Chauhan, D.S., Ghosal, D., Poria, S., Ekbal, A., Bhattacharyya, P.: Multi-task learning for multi-modal emotion recognition and sentiment analysis. In: Proceedings of 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, vol. 1, pp. 370\u2013379. Minnesota (2019)","DOI":"10.18653\/v1\/N19-1034"},{"key":"656_CR69","doi-asserted-by":"crossref","unstructured":"Sun, Z., Sarma, P.K., Sethares, W.A., Liang, Y.: Learning relationships between text, audio, and video via deep canonical correlation for multimodal language analysis. In: AAAI Conference on Artificial Intelligence (AAAI) (2019)","DOI":"10.1609\/aaai.v34i05.6431"},{"key":"656_CR70","doi-asserted-by":"crossref","unstructured":"Zadeh, A., Chen, M., Poria, S., Cambria, E., Morency, L.P.: Tensor fusion network for multimodal sentiment analysis. In: Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing,\u00a0pp. 1103\u20131114 (2017)","DOI":"10.18653\/v1\/D17-1115"},{"key":"656_CR71","doi-asserted-by":"crossref","unstructured":"Chen, M., Wang,S., Liang, P.P., Baltru\u0161aitis, T., Zadeh, A., Morency, L.P.: Multimodal sentiment analysis with word-level fusion and reinforcement learning. In: Proceedings of the 19th ACM International Conference on Multimodal Interaction (ICMI),\u00a0pp. 163\u2013171 (2017)","DOI":"10.1145\/3136755.3136801"},{"key":"656_CR72","doi-asserted-by":"crossref","unstructured":"Li, H., Xu, H.: Video-based sentiment analysis with hvnLBP-TOP feature and bi-LSTM. In: The Thirty-Third AAAI Conference on Artificial Intelligence (AAAI-19),\u00a0pp. 9963\u20139964. Hawaii (2019)","DOI":"10.1609\/aaai.v33i01.33019963"},{"key":"656_CR73","doi-asserted-by":"crossref","unstructured":"Zadeh, A., Liang, P.P., Poria, S., Vij, P., Cambria, E., Morency, L.P.: Multi-attention recurrent network for human communication comprehension. In: Thirty-Second AAAI Conference on Artificial Intelligence,\u00a0pp. 5642\u20135649. Louisiana (2018)","DOI":"10.1609\/aaai.v32i1.12024"},{"key":"656_CR74","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-020-03062-w","author":"A Yadav","year":"2020","unstructured":"Yadav, A., Vishwakarma, D.K.: A comparative study on bio-inspired algorithms for sentiment analysis. Cluster Comput. (2020). https:\/\/doi.org\/10.1007\/s10586-020-03062-w","journal-title":"Cluster Comput."},{"key":"656_CR75","doi-asserted-by":"crossref","unstructured":"Sun, Z., Sarma, P.K., Sethares, W., Bucy, E.P.: Multi-modal sentiment analysis using deep canonical correlation analysis. In: The 20th Annual Conference of the International Speech Communication Association (INTERSPEECH), pp. 1323\u20131327 (2019)","DOI":"10.21437\/Interspeech.2019-2482"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-020-00656-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-020-00656-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-020-00656-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,10,24]],"date-time":"2022-10-24T20:09:38Z","timestamp":1666642178000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-020-00656-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5,25]]},"references-count":75,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2020,8]]}},"alternative-id":["656"],"URL":"https:\/\/doi.org\/10.1007\/s00530-020-00656-7","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,5,25]]},"assertion":[{"value":"6 November 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 May 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 May 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}