{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T07:24:26Z","timestamp":1730273066195,"version":"3.28.0"},"reference-count":33,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.1109\/iscslp.2018.8706660","type":"proceedings-article","created":{"date-parts":[[2019,5,20]],"date-time":"2019-05-20T22:58:35Z","timestamp":1558393115000},"page":"56-60","source":"Crossref","is-referenced-by-count":0,"title":["Frame Selection in SI-DNN Phonetic Space with WaveNet Vocoder for Voice Conversion without Parallel Training Data"],"prefix":"10.1109","author":[{"given":"Feng-Long","family":"Xie","sequence":"first","affiliation":[]},{"given":"Frank K.","family":"Soong","sequence":"additional","affiliation":[]},{"given":"Xi","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Lei","family":"He","sequence":"additional","affiliation":[]},{"given":"Li","family":"Haifeng","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","first-page":"357","article-title":"The design for the Wall Street Journalbased CSR corpus","author":"paul","year":"1992","journal-title":"Proc DARPA SLS Workshop"},{"journal-title":"The CMU ARCTIC databases for speech synthesis","year":"2003","author":"kominek","key":"ref32"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2000.861820"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177729694"},{"key":"ref10","article-title":"A first step towards text-independent voice conversion","author":"sundermann","year":"2004","journal-title":"Proc ICSLP"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2006.1659962"},{"key":"ref12","article-title":"Voice conversion for unkown speakers","author":"ye","year":"2004","journal-title":"Proc ICSLP"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2038669"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2041688"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6855140"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-116"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472732"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2016.7552917"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462258"},{"key":"ref28","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2017-1672","article-title":"Speech enhancement using bayesian WaveNet","author":"qian","year":"2017","journal-title":"Proc INTERSPEECH"},{"key":"ref4","first-page":"3053","article-title":"Joint spectral distribution modeling using restricted Boltzmann machines for voice conversion","author":"chen","year":"2013","journal-title":"Proc INTERSPEECH"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461368"},{"key":"ref3","first-page":"2283","article-title":"Sequence error(SE) minimization training of neural network for voice conversion","author":"xie","year":"2014","journal-title":"Proc INTERSPEECH"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472664"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1984.1172448"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"1506","DOI":"10.1109\/TASLP.2014.2333242","article-title":"Exemplar-based sparse representation with residual compensation for voice conversion","volume":"22","author":"wu","year":"2014","journal-title":"IEEE Trans on Audio Speech and Language Processing"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-970"},{"key":"ref7","first-page":"4869","article-title":"Voice conversion using deep bidirectional long short-term memory Based recurrent neural networks","author":"sun","year":"2016","journal-title":"Proc ICASSP"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2047683"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2353991"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.907344"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"3364","DOI":"10.21437\/Interspeech.2017-63","article-title":"Voice conversion from unaligned corpora using variational autoencoding Wasserstein generative adversarial networks","author":"hsu","year":"2017","journal-title":"Proc INTERSPEECH"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-247"},{"key":"ref21","first-page":"677","article-title":"Sparse representation of phonetic features for voice conversion with and without parallel data","author":"iman","year":"2017","journal-title":"Proc ASRU"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"1118","DOI":"10.21437\/Interspeech.2017-314","article-title":"Speaker-dependent WaveNet vocoder","author":"tamamori","year":"2017","journal-title":"Proc INTERSPEECH"},{"journal-title":"WaveNet A Generative Model for Raw Audio","year":"2016","author":"van den oord","key":"ref23"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461332"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"1138","DOI":"10.21437\/Interspeech.2017-986","article-title":"Statistical voice conversion with WaveNet-based waveform generation","author":"kobayashi","year":"2017","journal-title":"Proc INTERSPEECH"}],"event":{"name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","start":{"date-parts":[[2018,11,26]]},"location":"Taipei City, Taiwan","end":{"date-parts":[[2018,11,29]]}},"container-title":["2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8701133\/8706262\/08706660.pdf?arnumber=8706660","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,23]],"date-time":"2020-08-23T23:10:50Z","timestamp":1598224250000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8706660\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/iscslp.2018.8706660","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}