{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,27]],"date-time":"2025-07-27T07:20:18Z","timestamp":1753600818089,"version":"3.33.0"},"reference-count":47,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T00:00:00Z","timestamp":1733097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T00:00:00Z","timestamp":1733097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006785","name":"Google","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006785","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100015591","name":"Rose Hills Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100015591","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,2]]},"DOI":"10.1109\/slt61566.2024.10832354","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:27Z","timestamp":1737052287000},"page":"711-718","source":"Crossref","is-referenced-by-count":1,"title":["Fast, High-Quality and Parameter-Efficient Articulatory Synthesis Using Differentiable DSP"],"prefix":"10.1109","author":[{"given":"Yisi","family":"Liu","sequence":"first","affiliation":[{"name":"UC Berkeley"}]},{"given":"Bohan","family":"Yu","sequence":"additional","affiliation":[{"name":"UC Berkeley"}]},{"given":"Drake","family":"Lin","sequence":"additional","affiliation":[{"name":"UC Berkeley"}]},{"given":"Peter","family":"Wu","sequence":"additional","affiliation":[{"name":"UC Berkeley"}]},{"given":"Cheol Jun","family":"Cho","sequence":"additional","affiliation":[{"name":"UC Berkeley"}]},{"given":"Gopala Krishna","family":"Anumanchipalli","sequence":"additional","affiliation":[{"name":"UC Berkeley"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1159\/000261913"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10892"},{"key":"ref3","article-title":"Articulatory encodec: Vocal tract kinematics as a codec for speech","author":"Cho","year":"2024","journal-title":"arXiv preprint arXiv:2406.12998"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS51556.2021.9401485"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054233"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-019-1119-1"},{"article-title":"Ddsp: Differentiable digital signal processing","volume-title":"International Conference on Learning Representations","author":"Engel","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.3389\/frsip.2023.1284100"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/S0016-0032(39)90816-1"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1121\/1.1907169"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6393(82)90017-6"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0060603"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1587\/transinf.2015EDP7457"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2484"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2018-999"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053795"},{"key":"ref17","first-page":"17022","article-title":"Hifigan: Generative adversarial networks for efficient and high fidelity speech synthesis","volume":"33","author":"Kong","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095404"},{"key":"ref19","article-title":"Chunked autoregressive gan for conditional waveform synthesis","author":"Morrison","year":"2022","journal-title":"ICLR"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2956145"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447948"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-3188"},{"key":"ref23","article-title":"Differentiable world synthesizerbased neural vocoder with application to end-to-end audio style transfer","author":"Nercessian","year":"2022","journal-title":"arXiv preprint arXiv:2208.07282"},{"article-title":"Speech synthesis and control using differentiable dsp","year":"2020","author":"Fabbro","key":"ref24"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA52581.2021.9632754"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/icassp40776.2020.9053047"},{"article-title":"Hierarchical timbre-painting and articulation generation","volume-title":"International Society for Music Information Retrieval Conference","author":"Michelashvili","key":"ref27"},{"key":"ref28","article-title":"Neural waveshaping synthesis","author":"Hayes","year":"2021","journal-title":"arXiv preprint arXiv:2107.05050"},{"key":"ref29","article-title":"Latent space explorations of singing voice synthesis using ddsp","author":"Alonso","year":"2021","journal-title":"arXiv preprint arXiv:2103.07197"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10094872"},{"article-title":"Midi-ddsp: Detailed control of musical performance via hierarchical modeling","volume-title":"International Conference on Learning Representations","author":"Wu","key":"ref31"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref33","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.11671","article-title":"Film: Visual reasoning with a general conditioning layer","volume-title":"AAAI Conference on Artificial Intelligence","author":"Perez"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1016"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.304"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2011-316"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461329"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.31527\/analesafa.2018.29.2.51"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1121\/10.0009844"},{"article-title":"The 1 j speech dataset","year":"2017","author":"Ito","key":"ref40"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10094711"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447345"},{"key":"ref43","article-title":"Weight normalization: A simple reparameterization to accelerate training of deep neural networks","volume":"29","author":"Salimans","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref44","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International Conference on Machine Learning","author":"Radford"},{"article-title":"auraloss: Audio focused loss functions in PyTorch","volume-title":"Digital Music Research Network One-day Workshop (DMRN+15)","author":"Steinmetz","key":"ref45"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2001.941023"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-439"}],"event":{"name":"2024 IEEE Spoken Language Technology Workshop (SLT)","start":{"date-parts":[[2024,12,2]]},"location":"Macao","end":{"date-parts":[[2024,12,5]]}},"container-title":["2024 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10830790\/10830793\/10832354.pdf?arnumber=10832354","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T07:50:48Z","timestamp":1737100248000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10832354\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,2]]},"references-count":47,"URL":"https:\/\/doi.org\/10.1109\/slt61566.2024.10832354","relation":{},"subject":[],"published":{"date-parts":[[2024,12,2]]}}}