{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T12:47:32Z","timestamp":1761396452298,"version":"3.28.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,1,9]]},"DOI":"10.1109\/slt54892.2023.10023356","type":"proceedings-article","created":{"date-parts":[[2023,1,27]],"date-time":"2023-01-27T18:54:03Z","timestamp":1674845643000},"page":"451-457","source":"Crossref","is-referenced-by-count":14,"title":["Exploring WavLM on Speech Enhancement"],"prefix":"10.1109","author":[{"given":"Hyungchan","family":"Song","sequence":"first","affiliation":[{"name":"Gwanju Institute of Science and Technology,Republic of Korea"}]},{"given":"Sanyuan","family":"Chen","sequence":"additional","affiliation":[{"name":"Microsoft,China"}]},{"given":"Zhuo","family":"Chen","sequence":"additional","affiliation":[{"name":"Microsoft,USA"}]},{"given":"Yu","family":"Wu","sequence":"additional","affiliation":[{"name":"Microsoft,China"}]},{"given":"Takuya","family":"Yoshioka","sequence":"additional","affiliation":[{"name":"Microsoft,USA"}]},{"given":"Min","family":"Tang","sequence":"additional","affiliation":[{"name":"Microsoft,USA"}]},{"given":"Jong Won","family":"Shin","sequence":"additional","affiliation":[{"name":"Gwanju Institute of Science and Technology,Republic of Korea"}]},{"given":"Shujie","family":"Liu","sequence":"additional","affiliation":[{"name":"Microsoft,China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2019-1873"},{"article-title":"vq-wav2vec: Self-supervised learning of discrete speech representations","volume-title":"International Conference on Learning Repre-sentations","author":"Baevski","key":"ref2"},{"key":"ref3","first-page":"12449","article-title":"wav2vec 2.0: A framework for self-supervised learning of speech representations","volume":"33","author":"Baevski","year":"2020","journal-title":"Advances in Neural Infor-mation Processing Systems"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3122291"},{"key":"ref5","first-page":"10937","article-title":"Unispeech: Unified speech representation learning with labeled and unla-beled data","volume-title":"International Conference on Machine Learning. PMLR","author":"Wang"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU51503.2021.9688253"},{"key":"ref7","article-title":"Unispeech at scale: An empirical study of pre-training method on large-scale speech recognition dataset","author":"Wang","year":"2021","journal-title":"arXiv preprint"},{"key":"ref8","first-page":"4171","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proceedings of NAACL-HLT","author":"Kenton"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053925"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-734"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3181782"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747077"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3188113"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1775"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1609"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.427"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413580"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413423"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TSP52935.2021.9522648"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2409"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-2207"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2537"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1482"},{"key":"ref25","article-title":"Real-time monau-ral speech enhancement with short-time discrete cosine transform","author":"Li","year":"2021","journal-title":"arXiv preprint"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3200911"},{"journal-title":"International Society for Music Information Retrieval (ISMIR)","article-title":"Free sound datasets: a platform for the creation of open audio datasets","author":"Fonseca","key":"ref27"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746108"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9052942"},{"key":"ref30","article-title":"Self-supervised learning for speech enhancement","author":"Wang","year":"2020","journal-title":"ar Xiv preprint"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.2997118"},{"key":"ref32","first-page":"3846","article-title":"Unsupervised sound separation using mixture invariant training","volume":"33","author":"Wisdom","year":"2020","journal-title":"Advances in Neural In-formation Processing Systems"}],"event":{"name":"2022 IEEE Spoken Language Technology Workshop (SLT)","start":{"date-parts":[[2023,1,9]]},"location":"Doha, Qatar","end":{"date-parts":[[2023,1,12]]}},"container-title":["2022 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10022052\/10022330\/10023356.pdf?arnumber=10023356","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,13]],"date-time":"2024-02-13T06:42:24Z","timestamp":1707806544000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10023356\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,9]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/slt54892.2023.10023356","relation":{},"subject":[],"published":{"date-parts":[[2023,1,9]]}}}