{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T16:24:21Z","timestamp":1761582261580,"version":"3.28.0"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,12,7]],"date-time":"2022-12-07T00:00:00Z","timestamp":1670371200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,12,7]],"date-time":"2022-12-07T00:00:00Z","timestamp":1670371200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,12,7]]},"DOI":"10.1109\/snpd54884.2022.10051811","type":"proceedings-article","created":{"date-parts":[[2023,3,6]],"date-time":"2023-03-06T18:37:15Z","timestamp":1678127835000},"page":"235-239","source":"Crossref","is-referenced-by-count":2,"title":["StyleFormerGAN-VC:Improving Effect of few shot Cross-Lingual Voice Conversion Using VAE-StarGAN and Attention-AdaIN"],"prefix":"10.1109","author":[{"given":"Dengfeng","family":"Ke","sequence":"first","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]},{"given":"Wenhan","family":"Yao","sequence":"additional","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]},{"given":"Ruixin","family":"Hu","sequence":"additional","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]},{"given":"Liangjie","family":"Huang","sequence":"additional","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]},{"given":"Qi","family":"Luo","sequence":"additional","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]},{"given":"Wentao","family":"Shu","sequence":"additional","affiliation":[{"name":"School of Information Science, Beijing Language and Culture University,Beijing,China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2019-2663"},{"key":"ref2","first-page":"7836","article-title":"Unsupervised speech decomposition via triple information bottleneck","volume-title":"International Conference on Machine Learning","author":"Qian","year":"2020"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747763"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-571"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8682897"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/icassp39728.2021.9414851"},{"journal-title":"arXiv preprint","article-title":"Stargan-vc2: Rethinking conditional methods for stargan-based voice conversion","year":"2019","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-319"},{"key":"ref9","article-title":"Efficient non-autoregressive gan voice conversion using vqwav2vec features and dynamic convolution","author":"Chen","year":"2022","journal-title":"arXiv preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003798"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414788"},{"key":"ref12","article-title":"Voice conversion challenge 2020: Intralingual semi-parallel and cross-lingual voice conversion","author":"Zhao","year":"2020","journal-title":"arXiv preprint"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2018.8639535"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2307"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9415042"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref17","article-title":"Parallel-data-free voice conversion using cycle-consistent adversarial networks","author":"Kaneko","year":"2017","journal-title":"arXiv preprint"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33016706"},{"key":"ref19","article-title":"Fastspeech 2: Fast and high-quality end-to-end text to speech","author":"Ren","year":"2020","journal-title":"arXiv preprint"},{"key":"ref20","article-title":"Weight normalization: A simple reparameterization to accelerate training of deep neural networks","volume":"29","author":"Salimans","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref21","article-title":"Variational dropout and the local reparameterization trick","volume":"28","author":"Kingma","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-755"},{"key":"ref23","article-title":"Cstr vctk corpus: English multi-speaker corpus for cstr voice cloning toolkit","author":"Christophe","year":"2016","journal-title":"The Centre for Speech Technology Research (CSTR)"},{"key":"ref24","first-page":"17022","article-title":"Hifi-gan: Generative adversarial networks for efficient and high fidelity speech synthesis","volume":"33","author":"Kong","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref25","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2014","journal-title":"arXiv preprint"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.29007\/wc97"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413959"}],"event":{"name":"2022 IEEE\/ACIS 23rd International Conference on Software Engineering, Artificial Intelligence, Networking and Parallel\/Distributed Computing (SNPD)","start":{"date-parts":[[2022,12,7]]},"location":"Taichung, Taiwan","end":{"date-parts":[[2022,12,9]]}},"container-title":["2022 IEEE\/ACIS 23rd International Conference on Software Engineering, Artificial Intelligence, Networking and Parallel\/Distributed Computing (SNPD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10051724\/10051766\/10051811.pdf?arnumber=10051811","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,13]],"date-time":"2024-02-13T15:10:55Z","timestamp":1707837055000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10051811\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,12,7]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/snpd54884.2022.10051811","relation":{},"subject":[],"published":{"date-parts":[[2022,12,7]]}}}