{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T04:50:07Z","timestamp":1774759807070,"version":"3.50.1"},"reference-count":181,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Hainan Provincial Natural Science Foundation of China","award":["623QN266"],"award-info":[{"award-number":["623QN266"]}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["233110002"],"award-info":[{"award-number":["233110002"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Key R&amp;D Program of China","award":["2018AAA0101500"],"award-info":[{"award-number":["2018AAA0101500"]}]},{"name":"National Key R&amp;D Program of China","award":["2022YFB4703700"],"award-info":[{"award-number":["2022YFB4703700"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Affective Comput."],"published-print":{"date-parts":[[2023,10,1]]},"DOI":"10.1109\/taffc.2023.3282704","type":"journal-article","created":{"date-parts":[[2023,6,5]],"date-time":"2023-06-05T13:53:22Z","timestamp":1685973202000},"page":"2595-2613","source":"Crossref","is-referenced-by-count":49,"title":["Two Birds With One Stone: Knowledge-Embedded Temporal Convolutional Transformer for Depression Detection and Emotion Recognition"],"prefix":"10.1109","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9732-3217","authenticated-orcid":false,"given":"Wenbo","family":"Zheng","sequence":"first","affiliation":[{"name":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6452-9649","authenticated-orcid":false,"given":"Lan","family":"Yan","sequence":"additional","affiliation":[{"name":"College of Information Science and Engineering, Hunan University, Changsha, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9185-3989","authenticated-orcid":false,"given":"Fei-Yue","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/icme46284.2020.9102872"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2017.4531228"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/mis.2021.3093659"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1038\/s41562-021-01130-8"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/MSPEC.2021.9423818"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3340555.3353762"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3382507.3420055"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-99736-6_35"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2018.2882362"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2019.2904691"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3512527.3531385"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2020.2992799"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-25075-0_42"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/taffc.2022.3170428"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3097983.3098126"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01187"},{"key":"ref17","first-page":"813","article-title":"Is space-time attention all you need for video understanding?","volume-title":"Proc. 38th Int. Conf. Mach. Learn.","author":"Bertasius"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00320"},{"key":"ref19","first-page":"1","article-title":"Measuring depression symptom severity from spoken language and 3D facial expressions","volume-title":"Proc. Mach. Learn. Health Workshop NeurIPS","author":"Haque"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.2100463"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/BIBM52615.2021.9669546"},{"key":"ref22","first-page":"1438","article-title":"Into the wild: Transitioning from recognizing mood in clinical interactions to personal conversations for individuals with bipolar disorder","volume-title":"Proc. Annu. Conf. Int. Speech Commun. Assoc.","author":"Matton"},{"issue":"1","key":"ref23","doi-asserted-by":"crossref","DOI":"10.1186\/s40359-018-0255-y","article-title":"Emotion regulation and its relation to symptoms of anxiety and depression in children aged 8\u201312 years: Does parental gender play a differentiating role?","volume":"6","author":"Loevaas","year":"2018","journal-title":"BMC Psychol."},{"key":"ref24","volume-title":"Cognitive Therapy and the Emotional Disorders","author":"Beck","year":"1979"},{"issue":"1","key":"ref25","doi-asserted-by":"crossref","DOI":"10.1038\/s41398-022-01927-9","article-title":"The relationship between emotional regulation and hemispheric lateralization in depression: A systematic review and a meta-analysis","volume":"12","author":"Horato","year":"2022","journal-title":"Transl. Psychiatry"},{"key":"ref26","article-title":"The dark triad and depressive symptoms among chinese adolescents: Moderated mediation models of age and emotion regulation strategies","volume-title":"Curr. Psychol.","author":"Shen","year":"2022"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/MIS.2016.31"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/2661806.2661819"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2016.2634527"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3133944.3133945"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2020.3021467"},{"issue":"13","key":"ref32","doi-asserted-by":"crossref","first-page":"10 309","DOI":"10.1007\/s00521-021-06208-y","article-title":"Suicidal ideation and mental disorder detection with attentive relation networks","volume":"34","author":"Ji","year":"2022","journal-title":"Neural Comput. Appl."},{"key":"ref33","first-page":"94","article-title":"Hierarchical attention network for explainable depression detection on Twitter aided by metaphor concept mappings","volume-title":"Proc. 29th Int. Conf. Comput. Linguistics","author":"Han"},{"key":"ref34","first-page":"45","article-title":"Multi-modal emotion recognition from speech and text","volume-title":"Proc. Int. J. Comput. Linguistics Chin. Lang. Process.","author":"Chuang"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.126262"},{"key":"ref36","first-page":"6818","article-title":"DialogueRNN: An attentive RNN for emotion detection in conversations","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Majumder"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CIHLI.2013.6613272"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2021.3072412"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3475957.3484451"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2020.3005660"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/AVSS.2019.8909841"},{"key":"ref42","article-title":"Temporal convolutional attention-based network for sequence modeling","author":"Hao","year":"2020"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.2995273"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3152247"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00009"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref47","first-page":"1","article-title":"Layer normalization","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"LeiBa"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref49","volume-title":"Deep Learning","author":"Goodfellow","year":"2016"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref51","article-title":"An empirical evaluation of generic convolutional and recurrent networks for sequence modeling","author":"Bai","year":"2018"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1609.03499"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.05.015"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.07.009"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.12.003"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-022-10166-9"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-55130-8_12"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2020.2987728"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2020.2969791"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1007\/s11280-020-00811-0"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ICTAI50040.2020.00153"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00532"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-16-6054-2"},{"key":"ref65","first-page":"1","article-title":"Semi-supervised classification with graph convolutional networks","volume-title":"Proc. 5th Int. Conf. Learn. Representations","author":"Kipf"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1201\/9781003170082"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00010"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240523"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00380"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1038\/s41576-019-0122-6"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1007\/s11633-022-1369-5"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-022-01211-x"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2021.684037"},{"key":"ref74","first-page":"3123","article-title":"The distress analysis interview corpus of human and computer interviews","volume-title":"Proc. 9th Int. Conf. Lang. Resour. Eval.","author":"Gratch"},{"key":"ref75","first-page":"1061","article-title":"SimSensei kiosk: A virtual human interviewer for healthcare decision support","volume-title":"Proc. Int. Conf. Auton. Agents Multi-Agent Syst.","author":"DeVault"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1145\/3133944.3133953"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1145\/3347320.3357688"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i11.21483"},{"issue":"1","key":"ref79","doi-asserted-by":"crossref","DOI":"10.1038\/s41597-020-00630-y","article-title":"K-EmoCon, a multimodal sensor dataset for continuous emotion recognition in naturalistic conversations","volume":"7","author":"Park","year":"2020","journal-title":"Sci. Data"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/TAMD.2015.2431497"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/NER.2013.6695876"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2020.2994159"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2018.2797176"},{"key":"ref84","first-page":"527","article-title":"MELD: A multimodal multi-party dataset for emotion recognition in conversations","volume-title":"Proc. 57th Annu. Meeting Assoc. Comput. Linguistics","author":"Poria"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0196391"},{"key":"ref86","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1016\/j.patrec.2022.07.012","article-title":"ERANNs: Efficient residual audio neural networks for audio pattern recognition","volume":"161","author":"Verbitskiy","year":"2022","journal-title":"Pattern Recognit. Lett."},{"key":"ref87","first-page":"4441","article-title":"MEISD: A multimodal multi-label emotion, intensity and sentiment dialogue dataset for emotion recognition and sentiment analysis in conversations","volume-title":"Proc. 28th Int. Conf. Comput. Linguistics","author":"Firdaus"},{"key":"ref88","article-title":"BIOS: An algorithmically generated biomedical knowledge graph","author":"Yu","year":"2022"},{"key":"ref89","article-title":"Answering visual-relational queries in web-extracted knowledge graphs","volume-title":"Proc. 1st Conf. Automated Knowl. Base Construction","author":"O\u00f1oro-Rubio"},{"key":"ref90","first-page":"4816","article-title":"Learning sequence encoders for temporal knowledge graph completion","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Garc\u00eda-Dur\u00e1n"},{"key":"ref91","article-title":"Very deep convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00291"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.634"},{"key":"ref96","first-page":"6105","article-title":"EfficientNet: Rethinking model scaling for convolutional neural networks","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tan"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2010.11929"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref99","first-page":"10 347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"Proc. 38th Int. Conf. Mach. Learn.","author":"Touvron"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01054"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19803-8_5"},{"key":"ref103","first-page":"4278","article-title":"Inception-v4, inception-ResNet and the impact of residual connections on learning","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Szegedy"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1145\/2988257.2988267"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/FG.2018.00032"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1145\/2988257.2988263"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2522"},{"key":"ref108","article-title":"Text-based depression detection: What triggers an alert","author":"Dinkel","year":"2019"},{"key":"ref109","article-title":"Decoupled weight decay regularization","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Loshchilov"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1126\/science.132.3434.1115"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1023\/a:1007614523901"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-84858-7"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2017.8037103"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/78.650093"},{"key":"ref115","first-page":"1103","article-title":"Tensor fusion network for multimodal sentiment analysis","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Zadeh"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC46164.2021.9630252"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2016.2625250"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1145\/3460421.3480427"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2016.2587290"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2017.2788081"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2817622"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2885474"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2020.2999337"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2019.2922912"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2010.2091281"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.368"},{"issue":"62","key":"ref127","first-page":"1687","article-title":"Large scale transductive SVMs","volume":"7","author":"Collobert","year":"2006","journal-title":"J. Mach. Learn. Res."},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-04221-9_36"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.3389\/fnins.2021.778488"},{"key":"ref130","article-title":"A novel transfer learning framework with prototypical representation based pairwise learning for cross-subject cross-session EEG-based emotion recognition","author":"Zhou","year":"2022"},{"key":"ref131","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2022.108819","article-title":"Horizontal and vertical features fusion network based on different brain regions for emotion recognition","volume":"247","author":"Guo","year":"2022","journal-title":"Knowl.-Based Syst."},{"key":"ref132","first-page":"13 789","article-title":"DialogXL: All-in-one XLNet for multi-party conversation emotion recognition","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Shen"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00511"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.3390\/app10134447"},{"key":"ref135","first-page":"5669","article-title":"CoMPM: Context modeling with speakers pre-trained memory tracking for emotion recognition in conversation","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics: Hum. Lang. Technol.","author":"Lee"},{"key":"ref136","first-page":"4190","article-title":"HiTrans: A transformer-based context- and speaker-sensitive model for emotion detection in conversations","volume-title":"Proc. 28th Int. Conf. Comput. Linguistics","author":"Li"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746464"},{"key":"ref138","article-title":"Multi-task learning with auxiliary speaker identification for conversational emotion recognition","author":"Li","year":"2020"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.239"},{"key":"ref140","first-page":"247","article-title":"Static and dynamic speaker modeling based on graph neural network for emotion recognition in conversation","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics: Hum. Lang. Technol.: Student Res. Workshop","author":"Saxena"},{"key":"ref141","first-page":"7360","article-title":"Relation-aware graph attention networks with relational position encodings for emotion recognition in conversations","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Ishiwatari"},{"key":"ref142","article-title":"EmoBERTa: Speaker-aware emotion recognition in conversation with RoBERTa","author":"Kim","year":"2021"},{"key":"ref143","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1016\/j.neucom.2021.09.057","article-title":"BiERU: Bidirectional emotional recurrent unit for conversational sentiment analysis","volume":"467","author":"Li","year":"2022","journal-title":"Neurocomputing"},{"key":"ref144","first-page":"1571","article-title":"Topic-driven and knowledge-aware transformer for dialogue emotion detection","volume-title":"Proc. 59th Annu. Meeting Assoc. Comput. Linguistics 11th Int. Joint Conf. Natural Lang. Process.","author":"Zhu"},{"key":"ref145","first-page":"4078","article-title":"An iterative emotion interaction network for emotion recognition in conversations","volume-title":"Proc. 28th Int. Conf. Comput. Linguistics","author":"Lu"},{"key":"ref146","first-page":"443","article-title":"Graph based network with contextualized representations of turns in dialogue","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Lee"},{"key":"ref147","first-page":"2470","article-title":"COSMIC: COmmonSense knowledge for eMotion identification in conversations","volume-title":"Proc. Findings Assoc. Comput. Linguistics","author":"Ghosal"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747397"},{"key":"ref149","first-page":"1204","article-title":"Past, present, and future: Conversational emotion recognition through structural modeling of psychological knowledge","volume-title":"Proc. Findings Assoc. Comput. Linguistics","author":"Li"},{"key":"ref150","first-page":"4153","article-title":"Summarize before aggregate: A global-to-local heterogeneous graph inference network for conversational emotion recognition","volume-title":"Proc. 28th Int. Conf. Comput. Linguistics","author":"Sheng"},{"key":"ref151","first-page":"7042","article-title":"DialogueCRN: Contextual reasoning networks for emotion recognition in conversations","volume-title":"Proc. 59th Annu. Meeting Assoc. Comput. Linguistics 11th Int. Joint Conf. Natural Lang. Process.","author":"Hu"},{"key":"ref152","first-page":"11 002","article-title":"Contrast and generation make bart a good dialogue emotion recognizer","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Li"},{"key":"ref153","first-page":"186","article-title":"Contextualized emotion recognition in conversation as sequence tagging","volume-title":"Proc. 21th Annu. Meeting Special Int. Group Discourse Dialogue","author":"Wang"},{"key":"ref154","first-page":"2949","article-title":"A discourse-aware graph neural network for emotion recognition in multi-party conversation","volume-title":"Proc. Findings Assoc. Comput. Linguistics","author":"Sun"},{"key":"ref155","first-page":"165","article-title":"Knowledge-enriched transformer for emotion detection in textual conversations","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process. 9th Int. Joint Conf. Natural Lang. Process.","author":"Zhong"},{"key":"ref156","first-page":"1610","article-title":"EmoCaps: Emotion capsule based model for conversational emotion recognition","volume-title":"Proc. Findings Assoc. Comput. Linguistics","author":"Li"},{"key":"ref157","first-page":"154","article-title":"DialogueGCN: A graph convolutional neural network for emotion recognition in conversation","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process. 9th Int. Joint Conf. Natural Lang. Process.","author":"Ghosal"},{"key":"ref158","first-page":"1551","article-title":"Directed acyclic graph network for conversational emotion recognition","volume-title":"Proc. 59th Annu. Meeting Assoc. Comput. Linguistics 11th Int. Joint Conf. Natural Lang. Process.","author":"Shen"},{"key":"ref159","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/752"},{"key":"ref160","article-title":"S+ PAGE: A speaker and position-aware graph neural network model for emotion recognition in conversation","author":"Liang","year":"2021"},{"key":"ref161","first-page":"2879","article-title":"Knowledge-interactive network with sentiment polarity intensity-aware multi-task learning for emotion recognition in conversations","volume-title":"Proc. Conf. Findings Assoc. Comput. Linguistics","author":"Xie"},{"key":"ref162","first-page":"873","article-title":"Context-dependent sentiment analysis in user-generated videos","volume-title":"Proc. 55th Annu. Meeting Assoc. Comput. Linguistics","author":"Poria"},{"key":"ref163","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2019.8925444"},{"key":"ref164","article-title":"MSAF: Multimodal split attention fusion","author":"Su","year":"2020"},{"key":"ref165","article-title":"A cross-modal fusion network based on self-attention and residual structure for multimodal emotion recognition","author":"Fu","year":"2021"},{"issue":"22","key":"ref166","doi-asserted-by":"crossref","DOI":"10.3390\/s21227665","article-title":"Multimodal emotion recognition on RAVDESS dataset using transfer learning","volume":"21","author":"Luna-Jim\u00e9nez","year":"2021","journal-title":"Sensors"},{"key":"ref167","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2022.108580","article-title":"Deep learning based multimodal emotion recognition using model-level fusion of audio\u2013visual modalities","volume":"244","author":"Middya","year":"2022","journal-title":"Knowl.-Based Syst."},{"key":"ref168","doi-asserted-by":"publisher","DOI":"10.1109\/IVMSP54334.2022.9816349"},{"key":"ref169","first-page":"1746","article-title":"Convolutional neural networks for sentence classification","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Kim"},{"key":"ref170","article-title":"Trellis networks for sequence modeling","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Bai"},{"key":"ref171","article-title":"Temporal convolutional attention-based network for sequence modeling","author":"Hao","year":"2020"},{"key":"ref172","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00286"},{"key":"ref173","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2983686"},{"key":"ref174","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref175","first-page":"4444","article-title":"ConceptNet 5.5: An open multilingual graph of general knowledge","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Speer"},{"key":"ref176","first-page":"225","article-title":"Affective and contextual embedding for sarcasm detection","volume-title":"Proc. 28th Int. Conf. Comput. Linguistics","author":"Babanejad"},{"key":"ref177","article-title":"Enriching BERT with knowledge graph embeddings for document classification","author":"Ostendorff","year":"2019"},{"key":"ref178","doi-asserted-by":"crossref","DOI":"10.1016\/j.csl.2021.101257","article-title":"Joint emotion label space modeling for affect lexica","volume":"71","author":"De Bruyne","year":"2022","journal-title":"Comput. Speech Lang."},{"key":"ref179","doi-asserted-by":"publisher","DOI":"10.1109\/ACII52823.2021.9597390"},{"key":"ref180","first-page":"1208","article-title":"UPB at SemEval-2020 task 8: Joint textual and visual modeling in a multi-task learning architecture for memotion analysis","volume-title":"Proc. 14th Workshop Semantic Eval.","author":"Vlad"},{"key":"ref181","first-page":"370","article-title":"Multi-task learning for multi-modal emotion recognition and sentiment analysis","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics: Hum. Lang. Technol.","author":"Akhtar"}],"container-title":["IEEE Transactions on Affective Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5165369\/10330166\/10143696.pdf?arnumber=10143696","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,20]],"date-time":"2025-10-20T17:50:13Z","timestamp":1760982613000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10143696\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,1]]},"references-count":181,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/taffc.2023.3282704","relation":{},"ISSN":["1949-3045","2371-9850"],"issn-type":[{"value":"1949-3045","type":"electronic"},{"value":"2371-9850","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,10,1]]}}}