{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T20:10:08Z","timestamp":1736971808069,"version":"3.33.0"},"reference-count":35,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,11,7]],"date-time":"2024-11-07T00:00:00Z","timestamp":1730937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,11,7]],"date-time":"2024-11-07T00:00:00Z","timestamp":1730937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,7]]},"DOI":"10.1109\/iscslp63861.2024.10799994","type":"proceedings-article","created":{"date-parts":[[2024,12,23]],"date-time":"2024-12-23T19:11:17Z","timestamp":1734981077000},"page":"581-585","source":"Crossref","is-referenced-by-count":0,"title":["TF-DiffuSE: Time-Frequency Prior-Conditioned Diffusion Model for Speech Enhancement"],"prefix":"10.1109","author":[{"given":"Wenjun","family":"Ding","sequence":"first","affiliation":[{"name":"School of Computer Science and Communication Engineering, Jiangsu University"}]},{"given":"Xinsheng","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Communication Engineering, Jiangsu University"}]},{"given":"Lijian","family":"Gao","sequence":"additional","affiliation":[{"name":"School of Computer Science and Communication Engineering, Jiangsu University"}]},{"given":"Qirong","family":"Mao","sequence":"additional","affiliation":[{"name":"School of Computer Science and Communication Engineering, Jiangsu University"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1984.1164453"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2024.3407511"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2024.3369536"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-2537"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-11269"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746901"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i11.26597"},{"key":"ref8","article-title":"Dose: Dif-fusion dropout with adaptive prior for speech enhancement","volume":"36","author":"Tai","year":"2024","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref9","first-page":"2031","article-title":"Metricgan: Gen-erative adversarial networks based black-box metric scores optimization for speech enhancement","volume-title":"International Conference on Machine Learning","author":"Fu"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683799"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/icassp.2018.8461530"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413999"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2023.3285241"},{"key":"ref14","first-page":"8780","article-title":"Diffusion models beat gans on image synthesis","volume-title":"Advances in neural information processing systems","volume":"34","author":"Dhariwal","year":"2021"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref16","article-title":"Dif-fwave: A versatile diffusion model for audio synthesis","volume-title":"arXiv preprint","author":"Kong","year":"2020"},{"key":"ref17","first-page":"8599","article-title":"Grad-tts: A diffusion probabilistic model for text-to-speech","volume-title":"International Conference on Machine Learning","author":"Popov"},{"key":"ref18","first-page":"6840","article-title":"Denoising diffusion probabilis-tic models","volume":"33","author":"Ho","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-46"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746454"},{"key":"ref21","first-page":"02502","article-title":"Denoising diffusion implicit models","author":"Song","year":"2020","journal-title":"arXiv preprint"},{"key":"ref22","article-title":"Dpm-solver++: Fast solver for guided sampling of diffusion probabilis-tic models","author":"Lu","year":"2022","journal-title":"arXiv preprint"},{"key":"ref23","article-title":"Score-based generative modeling through stochas-tic differential equations","author":"Song","year":"2020","journal-title":"arXiv preprint"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683855"},{"key":"ref25","article-title":"Denoising diffusion bridge models","author":"Zhou","year":"2023","journal-title":"arXiv preprint"},{"key":"ref26","first-page":"26565","article-title":"Elucidating the design space of diffusion-based generative models","volume":"35","author":"Karras","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.21437\/SSW.2016-24"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.6028\/nist.ir.4930"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6393(93)90095-3"},{"key":"ref30","first-page":"659","article-title":"A study on speech enhancement based on diffusion probabilistic model","volume-title":"Asia-Pacific Sig-nal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","author":"Lu"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095046"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096064"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICME55011.2023.00294"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095850"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2023.3294692"}],"event":{"name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","start":{"date-parts":[[2024,11,7]]},"location":"Beijing, China","end":{"date-parts":[[2024,11,10]]}},"container-title":["2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10799944\/10799969\/10799994.pdf?arnumber=10799994","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T19:28:45Z","timestamp":1736969325000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10799994\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,7]]},"references-count":35,"URL":"https:\/\/doi.org\/10.1109\/iscslp63861.2024.10799994","relation":{},"subject":[],"published":{"date-parts":[[2024,11,7]]}}}