{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,7]],"date-time":"2025-10-07T08:43:54Z","timestamp":1759826634915,"version":"3.28.0"},"reference-count":29,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,12,10]],"date-time":"2023-12-10T00:00:00Z","timestamp":1702166400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,10]],"date-time":"2023-12-10T00:00:00Z","timestamp":1702166400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,12,10]]},"DOI":"10.1109\/cvmi59935.2023.10464855","type":"proceedings-article","created":{"date-parts":[[2024,3,20]],"date-time":"2024-03-20T18:12:20Z","timestamp":1710958340000},"page":"1-6","source":"Crossref","is-referenced-by-count":1,"title":["Enhancing Emotion Classification Through Speech and Correlated Emotional Sounds via a Variational Auto-Encoder Model with Prosodic Regularization"],"prefix":"10.1109","author":[{"given":"Andrea Veronica","family":"Porco","sequence":"first","affiliation":[{"name":"University of The Ryukyus,Dept. Information Engineering,Nishihara,Japan"}]},{"given":"Dongshik","family":"Kang","sequence":"additional","affiliation":[{"name":"University of The Ryukyus,Dept. Information Engineering,Nishihara,Japan"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1520"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2022.11.005"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1016\/j.specom.2020.11.005","article-title":"Acoustic differences in emotional speech of people with dysarthria","volume":"126","author":"Alhinti","year":"2021","journal-title":"Speech Communication"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2022.3188223"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2858255"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2019.8903014"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.3390\/app9122470"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2018-1568"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-1183"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/taslp.2023.3268571"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ISCSLP49672.2021.9362098"},{"journal-title":"Variational autoencoders for Learning latent representations of speech emotion","year":"2017","author":"Siddique","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.14569\/ijacsa.2021.0121096"},{"key":"ref14","article-title":"Auto-encoding variational Bayes","volume-title":"Proc. 2nd International Conference on Learning Representations","author":"Kingma","year":"2014"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/access.2019.2936124"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0196391"},{"key":"ref17","first-page":"1","article-title":"Emotion Intensity and its control for emotional voice conversion","author":"Zhou","year":"2022","journal-title":"arXiv preprint"},{"key":"ref18","article-title":"Vaw-gan for the disentanglement and recomposition of emotional elements in speech","author":"Zhou","year":"2020","journal-title":"arXiv preprint"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053571"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462018"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2017.8268911"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s12559-017-9533-x"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2236"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683704"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1820"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2018.07.041"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2034771"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2103"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1113"}],"event":{"name":"2023 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","start":{"date-parts":[[2023,12,10]]},"location":"Gwalior, India","end":{"date-parts":[[2023,12,11]]}},"container-title":["2023 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10464390\/10464398\/10464855.pdf?arnumber=10464855","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,26]],"date-time":"2024-03-26T19:43:26Z","timestamp":1711482206000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10464855\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,10]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/cvmi59935.2023.10464855","relation":{},"subject":[],"published":{"date-parts":[[2023,12,10]]}}}