{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T20:38:33Z","timestamp":1778359113442,"version":"3.51.4"},"reference-count":34,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T00:00:00Z","timestamp":1733097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,2]],"date-time":"2024-12-02T00:00:00Z","timestamp":1733097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100005289","name":"National Institute of Justice","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100005289","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,2]]},"DOI":"10.1109\/slt61566.2024.10832284","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:27Z","timestamp":1737052287000},"page":"782-787","source":"Crossref","is-referenced-by-count":14,"title":["SVDD 2024: The Inaugural Singing Voice Deepfake Detection Challenge"],"prefix":"10.1109","author":[{"given":"You","family":"Zhang","sequence":"first","affiliation":[{"name":"University of Rochester,Rochester,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yongyi","family":"Zang","sequence":"additional","affiliation":[{"name":"University of Rochester,Rochester,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiatong","family":"Shi","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,Pittsburgh,PA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ryuichi","family":"Yamamoto","sequence":"additional","affiliation":[{"name":"Nagoya University,Nagoya,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tomoki","family":"Toda","sequence":"additional","affiliation":[{"name":"Nagoya University,Nagoya,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhiyao","family":"Duan","sequence":"additional","affiliation":[{"name":"University of Rochester,Rochester,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.5334\/tismir.100"},{"key":"ref2","article-title":"Avoiding an AI-imposed taylor\u2019s version of all music history","author":"Collins","year":"2024","journal-title":"arXiv preprint arXiv:2402.14589"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10448184"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10446271"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2024-1185"},{"key":"ref6","article-title":"Detecting music deepfakes is easy but actually hard","author":"Afchar","year":"2024","journal-title":"arXiv preprint arXiv:2405.04181"},{"key":"ref7","article-title":"SVDD challenge, 2024: A singing voice deepfake detection challenge evaluation plan","author":"Zhang","year":"2024","journal-title":"arXiv preprint arXiv:2405.05244"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2024-2242"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-48"},{"key":"ref10","article-title":"M4singer: A multi-style, multi-singer and musical score provided mandarin singing corpus","volume-title":"Proc. NeurIPS (Dataset and Benchmarks Track)","author":"Zhang"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2024-33"},{"key":"ref12","article-title":"ACE Studio"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1250\/ast.42.140"},{"key":"ref14","article-title":"JVS-MuSiC: Japanese multispeaker singing-voice corpus","author":"Tamaru","year":"2020","journal-title":"arXiv preprint arXiv:2001.07044"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10039"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096239"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i10.21350"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU57964.2023.10389779"},{"issue":"198","key":"ref19","first-page":"1","article-title":"Codalab competitions: An open source platform to organize scientific challenges","volume":"24","author":"Pavao","year":"2023","journal-title":"J M L R"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747766"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-143"},{"key":"ref22","article-title":"Automatic speaker verification spoofing and deepfake detection using wav 2 vec 2.0 and data augmentation","volume-title":"Proc. Odyssey","author":"Tak"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TBIOM.2021.3059479"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1599"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475437"},{"key":"ref26","article-title":"Children\u2019s song dataset for singing voice research","volume-title":"Proc. ISMIR","author":"Choi"},{"key":"ref27","first-page":"487","article-title":"PJS: Phoneme-balanced japanese singing-voice corpus","volume-title":"Proc. APSIPA. IEEE","author":"Koguchi"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.5334\/tismir.108"},{"key":"ref29","first-page":"1180","article-title":"Unsupervised domain adaptation by backpropagation","volume-title":"Proc. ICML. PMLR","author":"Ganin"},{"key":"ref30","first-page":"17022","article-title":"HiFi-GAN: Generative adversarial networks for efficient and high fidelity speech synthesis","volume-title":"Proc. NeurIPS","volume":"33","author":"Kong"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2024-1472"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/SLT61566.2024.10832226"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681345"},{"key":"ref34","article-title":"Singsong: Generating musical accompaniments from singing","volume-title":"Proc. ICML","author":"Donahue"}],"event":{"name":"2024 IEEE Spoken Language Technology Workshop (SLT)","location":"Macao","start":{"date-parts":[[2024,12,2]]},"end":{"date-parts":[[2024,12,5]]}},"container-title":["2024 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10830790\/10830793\/10832284.pdf?arnumber=10832284","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T07:50:18Z","timestamp":1737100218000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10832284\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,2]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/slt61566.2024.10832284","relation":{},"subject":[],"published":{"date-parts":[[2024,12,2]]}}}