{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,13]],"date-time":"2026-05-13T17:45:43Z","timestamp":1778694343685,"version":"3.51.4"},"publisher-location":"ISCA","reference-count":0,"publisher":"ISCA","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.21437\/interspeech.2024-2350","type":"proceedings-article","created":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T07:10:12Z","timestamp":1725174612000},"page":"3724-3728","source":"Crossref","is-referenced-by-count":9,"title":["Multimodal Fusion of Music Theory-Inspired and Self-Supervised Representations for Improved Emotion Recognition"],"prefix":"10.21437","author":[{"given":"Xiaohan","family":"Shi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xingfeng","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tomoki","family":"Toda","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"8866","published-online":{"date-parts":[[2024,9,1]]},"event":{"name":"Interspeech 2024","acronym":"interspeech_2024"},"container-title":["Interspeech 2024"],"original-title":[],"deposited":{"date-parts":[[2024,11,8]],"date-time":"2024-11-08T20:29:47Z","timestamp":1731097787000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.isca-archive.org\/interspeech_2024\/shi24i_interspeech.html"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,1]]},"references-count":0,"URL":"https:\/\/doi.org\/10.21437\/interspeech.2024-2350","relation":{},"subject":[],"published":{"date-parts":[[2024,9,1]]}}}