{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T07:05:40Z","timestamp":1775199940823,"version":"3.50.1"},"reference-count":13,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,12,6]]},"DOI":"10.1109\/asru65441.2025.11434694","type":"proceedings-article","created":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T19:48:04Z","timestamp":1775159284000},"page":"1-4","source":"Crossref","is-referenced-by-count":0,"title":["Audio Aesthetics Prediction System QAM16k Based on Pre-trained Audio Encoder"],"prefix":"10.1109","author":[{"given":"Linping","family":"Xu","sequence":"first","affiliation":[{"name":"ByteDance,MMLab,Beijing,China"}]},{"given":"Ziqian","family":"Wu","sequence":"additional","affiliation":[{"name":"ByteDance,MMLab,Beijing,China"}]},{"given":"Dejun","family":"Zhang","sequence":"additional","affiliation":[{"name":"ByteDance,MMLab,Beijing,China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2001.941023"},{"issue":"6","key":"ref2","first-page":"366","article-title":"Perceptual objective listening quality assessment (POLQA), the third generation itu-t standard for end-to-end speech quality measurement part i-temporal alignment","volume":"61","author":"Beerends","year":"2013","journal-title":"journal of the audio engineering society"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681688"},{"key":"ref4","article-title":"Analyzable chain-of-musical-thought prompting for high-fidelity music generation","author":"Lam","year":"2025","journal-title":"arXiv preprint arXiv:2503.19611"},{"key":"ref5","article-title":"Seed-music: A unified framework for high quality and controlled music generation","author":"Bai","year":"2024","journal-title":"arXiv preprint arXiv:2409.09214"},{"key":"ref6","article-title":"Meta audiobox aesthetics: Unified automatic quality assessment for speech, music, and sound","author":"Tjandra","year":"2025","journal-title":"arXiv preprint arXiv:2502.05139"},{"key":"ref7","volume-title":"AudioMOS challenge"},{"key":"ref8","article-title":"Songeval: A benchmark dataset for song aesthetics evaluation","author":"Yao","year":"2025","journal-title":"arXiv preprint arXiv:2505.10793"},{"key":"ref9","first-page":"1298","article-title":"Data2vec: A general framework for self-supervised learning in speech, vision and language","volume-title":"International conference on machine learning.","author":"Baevski"},{"key":"ref10","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International conference on machine learning.","author":"Radford"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2024-246"},{"key":"ref12","article-title":"Qwen2-audio technical report","volume-title":"arXiv preprint arXiv:2407.10759","author":"Chu","year":"2024"},{"key":"ref13","article-title":"High fidelity neural audio compression","author":"D\u00e9fossez","year":"2022","journal-title":"arXiv preprint arXiv:2210.13438"}],"event":{"name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,12,6]]},"end":{"date-parts":[[2025,12,10]]}},"container-title":["2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11434577\/11433836\/11434694.pdf?arnumber=11434694","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T04:58:25Z","timestamp":1775192305000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11434694\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,6]]},"references-count":13,"URL":"https:\/\/doi.org\/10.1109\/asru65441.2025.11434694","relation":{},"subject":[],"published":{"date-parts":[[2025,12,6]]}}}