{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T17:29:50Z","timestamp":1772040590975,"version":"3.50.1"},"publisher-location":"ISCA","reference-count":0,"publisher":"ISCA","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.21437\/interspeech.2025-1137","type":"proceedings-article","created":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T11:47:41Z","timestamp":1761133661000},"page":"4233-4237","source":"Crossref","is-referenced-by-count":6,"title":["EzAudio: Enhancing Text-to-Audio Generation with Efficient Diffusion Transformer"],"prefix":"10.21437","author":[{"given":"Jiarui","family":"Hai","sequence":"first","affiliation":[]},{"given":"Yong","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Hao","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Chenxing","family":"Li","sequence":"additional","affiliation":[]},{"given":"Helin","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Mounya","family":"Elhilali","sequence":"additional","affiliation":[]},{"given":"Dong","family":"Yu","sequence":"additional","affiliation":[]}],"member":"8866","published-online":{"date-parts":[[2025,8,17]]},"event":{"name":"Interspeech 2025","acronym":"interspeech_2025"},"container-title":["Interspeech 2025"],"original-title":[],"deposited":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T11:49:01Z","timestamp":1761133741000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.isca-archive.org\/interspeech_2025\/hai25_interspeech.html"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,17]]},"references-count":0,"URL":"https:\/\/doi.org\/10.21437\/interspeech.2025-1137","relation":{},"subject":[],"published":{"date-parts":[[2025,8,17]]}}}