{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T05:41:02Z","timestamp":1764222062143,"version":"3.46.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/sped67700.2025.11251799","type":"proceedings-article","created":{"date-parts":[[2025,11,26]],"date-time":"2025-11-26T19:00:27Z","timestamp":1764183627000},"page":"120-124","source":"Crossref","is-referenced-by-count":0,"title":["ADNAC: Audio Denoiser using Neural Audio Codec"],"prefix":"10.1109","author":[{"given":"Daniel","family":"Jimon","sequence":"first","affiliation":[{"name":"Technical University of Cluj-Napoca,Romania"}]},{"given":"Mircea","family":"Vaida","sequence":"additional","affiliation":[{"name":"Technical University of Cluj-Napoca,Romania"}]},{"given":"Adriana","family":"Stan","sequence":"additional","affiliation":[{"name":"Technical University of Cluj-Napoca,Romania"}]}],"member":"263","reference":[{"volume-title":"Learning to Denoise Historical Music","year":"2020","author":"Li","key":"ref1"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0146790"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.3390\/app12094161"},{"key":"ref4","article-title":"Audio Denoiser Using U-NET Architecture (accepted for publication)","author":"Jimon","year":"2025","journal-title":"Acta Technica Napocensis \u2013 Electronic\u0103 \u015fi Telecomunica\u0163ii-Electronics and Telecommunications"},{"volume-title":"High-Fidelity Audio Compression with Improved RVQGAN","year":"2023","author":"Kumar","key":"ref5"},{"volume-title":"Improved Speech Enhancement with the Wave-U-Net","year":"2018","author":"Craig Macartney","key":"ref6"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-22482-4_11"},{"key":"ref8","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2013-130","article-title":"Speech enhancement based on deep denoising Auto-Encoder","author":"Lu","year":"2013","journal-title":"Interspeech 2013"},{"article-title":"CMGAN: Conformer-based Metric GAN for Speech Enhancement","volume-title":"Interspeech 2022, ISCA","author":"Ruizhe","key":"ref9"},{"volume-title":"DPT-FSNet: Dual-path Transformer Based Full-band and Sub-band Fusion Network for Speech Enhancement","year":"2021","author":"Dang","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2024.3445871"},{"volume-title":"Speech Enhancement and Dereverberation with Diffusion-based Generative Models","year":"2022","author":"Richter","key":"ref12"},{"volume-title":"SoundStream: An End-to-End Neural Audio Codec","year":"2021","author":"Zeghidour","key":"ref13"},{"journal-title":"GitHub","article-title":"EnCodec: High Fidelity Neural Audio Compression","year":"2023","key":"ref14"},{"article-title":"IRMAS: a dataset for instrument recognition in musical audio signals (1.0) [Data set]","volume-title":"13th International Society for Music Information Retrieval Conference (ISMIR 2012)","author":"Bosch","key":"ref15"},{"journal-title":"GitHub","key":"ref16","article-title":"MusicECAN: Automatic Recorded Music Denoising Network with Efficient Channel Attention"},{"key":"ref17","article-title":"MUSAN: A Music, Speech, and Noise Corpus","author":"Povey","year":"2015","journal-title":"arXiv:1510.08484v1"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2655045"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/taslp.2021.3133208"},{"journal-title":"github","key":"ref20","article-title":"pedalboard"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2019.2917582"},{"journal-title":"GitHub","key":"ref22","article-title":"descript-audio-codec"},{"volume-title":"Descript Audio Codec (DAC)","key":"ref23"},{"key":"ref24","article-title":"U-Net: Convolutional Networks for Biomedical Image Segmentation","author":"Ronnenberg","year":"2015","journal-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI"},{"key":"ref25","article-title":"SDR - half-baked or well done?","author":"Le Roux","year":"2018","journal-title":"arXiv"},{"key":"ref26","article-title":"Decoupled Weight Decay Regularization","author":"Loshchilov","year":"2017","journal-title":"arXiv"},{"volume-title":"ReduceLROnPlateau","key":"ref27"},{"journal-title":"ITU-T P.862","year":"2001","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495701"},{"journal-title":"BS. 1534: Method for the subjective assessment of intermediate quality level of audio systems","year":"2015","key":"ref30"}],"event":{"name":"2025 International Conference on Speech Technology and Human-Computer Dialogue (SpeD)","start":{"date-parts":[[2025,10,19]]},"location":"Cluj-Napoca, Romania","end":{"date-parts":[[2025,10,22]]}},"container-title":["2025 International Conference on Speech Technology and Human-Computer Dialogue (SpeD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11251505\/11251597\/11251799.pdf?arnumber=11251799","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T05:37:32Z","timestamp":1764221852000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11251799\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/sped67700.2025.11251799","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}