{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T18:06:06Z","timestamp":1747159566837,"version":"3.37.3"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,7,5]],"date-time":"2021-07-05T00:00:00Z","timestamp":1625443200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,7,5]],"date-time":"2021-07-05T00:00:00Z","timestamp":1625443200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,7,5]]},"DOI":"10.1109\/icme51207.2021.9428327","type":"proceedings-article","created":{"date-parts":[[2021,6,9]],"date-time":"2021-06-09T21:14:21Z","timestamp":1623273261000},"page":"1-6","source":"Crossref","is-referenced-by-count":7,"title":["Dual-Waveform Emotion Recognition Model for Conversations"],"prefix":"10.1109","author":[{"given":"Jiayi","family":"Zhang","sequence":"first","affiliation":[{"name":"Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Telecommunications Software and Multimedia,Beijing,China,100876"}]},{"given":"Zihe","family":"Liu","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Telecommunications Software and Multimedia,Beijing,China,100876"}]},{"given":"Peihang","family":"Liu","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Telecommunications Software and Multimedia,Beijing,China,100876"}]},{"given":"Bin","family":"Wu","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Telecommunications Software and Multimedia,Beijing,China,100876"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461368"},{"key":"ref11","first-page":"3165","article-title":"Fastspeech: Fast, robust and controllable text to speech","author":"ren","year":"2019","journal-title":"NeurIPS"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref13","article-title":"AL-BERT: A lite BERT for self-supervised learning of language representations","author":"lan","year":"2020","journal-title":"ICLRE"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683713"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1037\/0022-3514.76.6.893"},{"key":"ref16","first-page":"469","article-title":"Mirroring facial expressions and emotions in dyadic conversations","author":"navarretta","year":"2016","journal-title":"LREC"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-008-9076-6"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/T-AFFC.2011.20"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1115"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1015"},{"key":"ref3","first-page":"5642","article-title":"Multi-attention recurrent network for human communication comprehension","author":"zadeh","year":"2018","journal-title":"AAAI"},{"key":"ref6","first-page":"5634","article-title":"Memory fusion network for multi-view sequential learning","author":"zadeh","year":"2018","journal-title":"AAAI"},{"key":"ref5","first-page":"873","article-title":"Context-dependent sentiment analysis in user-generated videos","author":"poria","year":"2017","journal-title":"ACL"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33016818"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1193"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2017.2764438"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"year":"0","key":"ref9","article-title":"Gentle: A robust yet lenient forced aligner built on kaldi"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1280"}],"event":{"name":"2021 IEEE International Conference on Multimedia and Expo (ICME)","start":{"date-parts":[[2021,7,5]]},"location":"Shenzhen, China","end":{"date-parts":[[2021,7,9]]}},"container-title":["2021 IEEE International Conference on Multimedia and Expo (ICME)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9428049\/9428068\/09428327.pdf?arnumber=9428327","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T21:28:36Z","timestamp":1656365316000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9428327\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,5]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/icme51207.2021.9428327","relation":{},"subject":[],"published":{"date-parts":[[2021,7,5]]}}}