{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,5]],"date-time":"2026-02-05T10:52:46Z","timestamp":1770288766280,"version":"3.49.0"},"reference-count":20,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2022,4,1]],"date-time":"2022-04-01T00:00:00Z","timestamp":1648771200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,4,1]],"date-time":"2022-04-01T00:00:00Z","timestamp":1648771200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,4,1]],"date-time":"2022-04-01T00:00:00Z","timestamp":1648771200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key R&#x0026;D Program of China","award":["2018YFB1305200"],"award-info":[{"award-number":["2018YFB1305200"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62176182"],"award-info":[{"award-number":["62176182"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61976216"],"award-info":[{"award-number":["61976216"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Tianjin Municipal Science and Technology","award":["19ZXZNGX00030"],"award-info":[{"award-number":["19ZXZNGX00030"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE MultiMedia"],"published-print":{"date-parts":[[2022,4,1]]},"DOI":"10.1109\/mmul.2022.3161411","type":"journal-article","created":{"date-parts":[[2022,3,23]],"date-time":"2022-03-23T19:28:10Z","timestamp":1648063690000},"page":"94-103","source":"Crossref","is-referenced-by-count":22,"title":["Emotion Recognition With Multimodal Transformer Fusion Framework Based on Acoustic and Lexical Information"],"prefix":"10.1109","volume":"29","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5526-0980","authenticated-orcid":false,"given":"Lili","family":"Guo","sequence":"first","affiliation":[{"name":"School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8094-6861","authenticated-orcid":false,"given":"Longbiao","family":"Wang","sequence":"additional","affiliation":[{"name":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9237-4821","authenticated-orcid":false,"given":"Jianwu","family":"Dang","sequence":"additional","affiliation":[{"name":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8379-5993","authenticated-orcid":false,"given":"Yahui","family":"Fu","sequence":"additional","affiliation":[{"name":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9691-8470","authenticated-orcid":false,"given":"Jiaxing","family":"Liu","sequence":"additional","affiliation":[{"name":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1391-2717","authenticated-orcid":false,"given":"Shifei","family":"Ding","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","first-page":"6000","article-title":"Attention is your need","author":"vaswani","year":"0"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053762"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3049898"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.3390\/s21144913"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.306"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2010-739"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874246"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-008-9076-6"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1050"},{"key":"ref19","article-title":"Multimodal speech emotion recognition and ambiguity resolution","author":"sahu","year":"2019"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178872"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3133944.3133946"},{"key":"ref6","article-title":"Multimodal emotion recognition on IEMOCAP dataset using deep learning","author":"tripathi","year":"2019"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953274"},{"key":"ref8","first-page":"5079","article-title":"Deep multimodal learning for emotion recognition in spoken language","author":"gu","year":"0","journal-title":"Proc IEEE Int Conf Acoust Speech Signal Process"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2019.102185"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683077"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1080\/08839510590910174"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2466"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1181"}],"container-title":["IEEE MultiMedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/93\/9830637\/09740502.pdf?arnumber=9740502","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,29]],"date-time":"2022-08-29T21:24:25Z","timestamp":1661808265000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9740502\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,4,1]]},"references-count":20,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/mmul.2022.3161411","relation":{},"ISSN":["1070-986X","1941-0166"],"issn-type":[{"value":"1070-986X","type":"print"},{"value":"1941-0166","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,4,1]]}}}