{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T21:13:42Z","timestamp":1740172422187,"version":"3.37.3"},"reference-count":41,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2018,12,1]],"date-time":"2018-12-01T00:00:00Z","timestamp":1543622400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R15","DC016383"],"award-info":[{"award-number":["R15","DC016383"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE\/ACM Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1109\/taslp.2018.2860682","type":"journal-article","created":{"date-parts":[[2018,7,27]],"date-time":"2018-07-27T19:03:29Z","timestamp":1532718209000},"page":"2267-2276","source":"Crossref","is-referenced-by-count":7,"title":["Structured Sparse Spectral Transforms and Structural Measures for Voice Conversion"],"prefix":"10.1109","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5511-3692","authenticated-orcid":false,"given":"Yunxin","family":"Zhao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7900-2364","authenticated-orcid":false,"given":"Mili","family":"Kuruvilla-Dugdale","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Minguang","family":"Song","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","first-page":"314","author":"huang","year":"2001","journal-title":"Spoken Language Processing A Guide to Theory Algorithm and System Development"},{"year":"2016","key":"ref38"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/PROC.1972.8727"},{"journal-title":"Fundamental of Speech Recognition","year":"1993","author":"rabiner","key":"ref32"},{"article-title":"CMU ARCTIC database for speech synthesis","year":"2003","author":"kominek","key":"ref31"},{"key":"ref30","first-page":"556","article-title":"Algorithm for nonnegative matrix factorization","author":"lee","year":"0","journal-title":"Proc 13th Int Conf Neural Inf Process Syst"},{"key":"ref37","first-page":"3933","article-title":"TANDEM STRAIGHT: A temporally stable power\n spectral representation for periodic signals and applications to interference-free spectrum, F0, and aperiodicity\n estimation","author":"kawahara","year":"0","journal-title":"Proc Int Conf Acoust Speech Signal Process"},{"key":"ref36","first-page":"111","article-title":"Development of exploratory research tools\n based on TANDEM-STRAIGHT","author":"kawahara","year":"0","journal-title":"Proc Asia Pac Signal Inf Process Assoc Annu Summit Conf"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953212"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2012.2227735"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"1506","DOI":"10.1109\/TASLP.2014.2333242","article-title":"Examplar based sparse representation with residue\n compensation for voice conversion","volume":"22","author":"wu","year":"2014","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1121\/1.1919184"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6855137"},{"key":"ref12","first-page":"5175","article-title":"Examplar-based sparse representation on timbre and prosody for voice conversion","author":"ming","year":"0","journal-title":"Proc Int Conf Acoust Speech Signal Process"},{"key":"ref13","first-page":"3057","article-title":"Examplar-based unit selection for voice conversion utilizing temporal\n information","author":"wu","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472761"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960478"},{"key":"ref16","first-page":"369","article-title":"Voice conversion in high-order eigen\n space using deep belief nets","author":"nakashika","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref17","first-page":"2283","article-title":"Sequence error minimization error training of neural network for\n voice conversion","author":"xie","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2016.7552917"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1992.225951"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2114881"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2049685"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1121\/1.1804628"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.907344"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6288922"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960576"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1988.196671"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2038663"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2041699"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.674423"},{"key":"ref9","first-page":"841","article-title":"Voice conversion algorithm based on Gaussian micture model with dynamic frequency warping of STRAIGHT\n spectrum","author":"toda","year":"0","journal-title":"Proc Int Conf Acoust Speech Signal Process"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/89.661472"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-1066"},{"key":"ref22","first-page":"669","article-title":"Voice conversion using GMM with enhanced global variance","author":"benisty","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref21","first-page":"1637","article-title":"Analysis\n of the voice conversion challeng 2016 evaluation results","author":"wester","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2723721"},{"article-title":"Concepts and applications of inferential statistics","year":"2011","author":"richard","key":"ref41"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ISCSLP.2014.6936725"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2003.819861"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1198\/106186006X113430"}],"container-title":["IEEE\/ACM Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6570655\/8440863\/08421612.pdf?arnumber=8421612","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T15:21:15Z","timestamp":1643210475000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8421612\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,12]]},"references-count":41,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/taslp.2018.2860682","relation":{},"ISSN":["2329-9290","2329-9304"],"issn-type":[{"type":"print","value":"2329-9290"},{"type":"electronic","value":"2329-9304"}],"subject":[],"published":{"date-parts":[[2018,12]]}}}