{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T16:45:06Z","timestamp":1762101906229,"version":"build-2065373602"},"reference-count":27,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,6]]},"DOI":"10.1109\/icis.2016.7550889","type":"proceedings-article","created":{"date-parts":[[2016,8,25]],"date-time":"2016-08-25T16:57:40Z","timestamp":1472144260000},"page":"1-5","source":"Crossref","is-referenced-by-count":25,"title":["Emotional voice conversion using deep neural networks with MCC and F0 features"],"prefix":"10.1109","author":[{"given":"Zhaojie","family":"Luo","sequence":"first","affiliation":[]},{"given":"Tetsuya","family":"Takiguchi","sequence":"additional","affiliation":[]},{"given":"Yasuo","family":"Ariki","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2041699"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960478"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ChinaSIP.2013.6625307"},{"key":"ref13","first-page":"369","article-title":"Voice conversion in high-order eigen space using deep belief nets","author":"nakashika","year":"2013","journal-title":"INTER-SPEECH"},{"key":"ref14","article-title":"Approaching automatic recognition of emotion from voice: a rough benchmark","author":"mcgilloway","year":"2000","journal-title":"ISCA Tutorial and Research Workshop (ITRW) on Speech and Emotion"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"1145","DOI":"10.1109\/TASL.2006.876113","article-title":"Prosody conversion from neutral speech to emotional speech","volume":"14","author":"tao","year":"2006","journal-title":"Audio Speech and Language Processing IEEE Transactions on"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.5923\/j.ajsp.20120205.06"},{"key":"ref17","article-title":"Minimum trajectory error training for deep neural networks, combined with stacked bottleneck features","author":"wu","year":"2015","journal-title":"Sixteenth Annual Conference of the International Speech Communication Association"},{"article-title":"F0 discontinuity as a marker of prosodic boundary strength in lombard speech","year":"2015","author":"be?u\u0161","key":"ref18"},{"key":"ref19","article-title":"Using f0 contours to assess nativeness in a sentence repeat task","author":"ma","year":"2015","journal-title":"Sixteenth Annual Conference of the International Speech Communication Association"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1515\/lp-2013-0003"},{"key":"ref27","article-title":"Architectures for deep neural network based acoustic models defined over windowed speech waveforms","author":"bhargava","year":"2015","journal-title":"Sixteenth Annual Conference of the InternationalSpeech Communication Association"},{"key":"ref3","first-page":"29","article-title":"Individuality-preserving voice conversion for articulation disorders using dictionary selective nonnegative matrix factorization","author":"aihara","year":"2014","journal-title":"ACL 2014"},{"key":"ref6","article-title":"Frequency warping based on mapping formant parameters","author":"shuang","year":"2006","journal-title":"Ninth International Conference on Spoken Language Processing"},{"key":"ref5","article-title":"Phase perception of the glottal excitation of vocoded speech","author":"raitio","year":"2015","journal-title":"Sixteenth Annual Conference of the InternationalSpeech Communication Association"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1992.225953"},{"key":"ref7","first-page":"1965","article-title":"Weighted frequency warping for voice conversion","author":"erro","year":"2007","journal-title":"InterSpeech"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2006.262725"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.907344"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.674423"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1250\/ast.27.349"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2009.04.004"},{"key":"ref21","first-page":"191","article-title":"Comparative evaluation of various mfcc implementations on the speaker verification task","volume":"1","author":"ganchev","year":"2005","journal-title":"Proceedings of the SPECOM"},{"key":"ref24","first-page":"2401","article-title":"Gmm-based voice conversion applied to emotional speech synthesis","volume":"7","author":"kawanami","year":"2003","journal-title":"IEEE Trans Speech Audio Proc"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/FSKD.2007.347"},{"key":"ref26","article-title":"Learning the speech front-end with raw waveform cldnns","author":"sainath","year":"2015","journal-title":"Sixteenth Annual Conference of the InternationalSpeech Communication Association"},{"key":"ref25","article-title":"High-order sequence modeling using speaker-dependent recurrent temporal restricted boltzmann machines for voice conversion","author":"nakashika","year":"2014","journal-title":"Fifteenth Annual Conference of the InternationalSpeech Communication Association"}],"event":{"name":"2016 IEEE\/ACIS 15th International Conference on Computer and Information Science (ICIS)","start":{"date-parts":[[2016,6,26]]},"location":"Okayama, Japan","end":{"date-parts":[[2016,6,29]]}},"container-title":["2016 IEEE\/ACIS 15th International Conference on Computer and Information Science (ICIS)"],"original-title":[],"link":[{"URL":"http:\/\/ieeexplore.ieee.org\/iel7\/7537873\/7550716\/07550889.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7537873\/7550716\/07550889.pdf?arnumber=7550889","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T17:23:57Z","timestamp":1498325037000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7550889\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,6]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icis.2016.7550889","relation":{},"subject":[],"published":{"date-parts":[[2016,6]]}}}