{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T14:52:44Z","timestamp":1777733564251,"version":"3.51.4"},"publisher-location":"ISCA","reference-count":0,"publisher":"ISCA","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.21437\/interspeech.2025-1032","type":"proceedings-article","created":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T11:47:41Z","timestamp":1761133661000},"page":"1243-1247","source":"Crossref","is-referenced-by-count":4,"title":["Audiobox TTA-RAG: Improving Zero-Shot and Few-Shot Text-To-Audio with Retrieval-Augmented Generation"],"prefix":"10.21437","author":[{"given":"Mu","family":"Yang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bowen","family":"Shi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Matthew","family":"Le","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei-Ning","family":"Hsu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andros","family":"Tjandra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"8866","published-online":{"date-parts":[[2025,8,17]]},"event":{"name":"Interspeech 2025","acronym":"interspeech_2025"},"container-title":["Interspeech 2025"],"original-title":[],"deposited":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T11:48:52Z","timestamp":1761133732000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.isca-archive.org\/interspeech_2025\/yang25h_interspeech.html"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,17]]},"references-count":0,"URL":"https:\/\/doi.org\/10.21437\/interspeech.2025-1032","relation":{},"subject":[],"published":{"date-parts":[[2025,8,17]]}}}