{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T16:28:32Z","timestamp":1762100912798,"version":"3.37.0"},"reference-count":38,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"8","license":[{"start":{"date-parts":[[2009,11,1]],"date-time":"2009-11-01T00:00:00Z","timestamp":1257033600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2009,11]]},"DOI":"10.1109\/tasl.2009.2023161","type":"journal-article","created":{"date-parts":[[2009,5,19]],"date-time":"2009-05-19T20:01:24Z","timestamp":1242763284000},"page":"1567-1576","source":"Crossref","is-referenced-by-count":13,"title":["Modeling the Expressivity of Input Text Semantics for Chinese Text-to-Speech Synthesis in a Spoken Dialog System"],"prefix":"10.1109","volume":"17","author":[{"family":"Zhiyong Wu","sequence":"first","affiliation":[]},{"given":"H.M.","family":"Meng","sequence":"additional","affiliation":[]},{"family":"Hongwu Yang","sequence":"additional","affiliation":[]},{"family":"Lianhong Cai","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref38","article-title":"aperiodicity extraction and control using mixed mode excitation and group delay manipulation for a high quality speech analysis, modification and synthesis system straight","author":"kawahara","year":"2001","journal-title":"Proc Int Workshop Models and Analysis of Vocal Emissions for Biomedical Applications"},{"journal-title":"Discover Hong Kong","year":"0","key":"ref33"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/11939993_63"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1145\/1082473.1082478","article-title":"alma: a layered model of affect","author":"gebhard","year":"2005","journal-title":"Proc Int Joint Conf Autonomous Agents and Multiagent Systems"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1177\/001316447803800431"},{"journal-title":"A Grammar of Spoken Chinese","year":"1968","author":"chao","key":"ref37"},{"key":"ref36","first-page":"417","author":"tseng","year":"2004","journal-title":"From Traditional Phonology To Modern Speech Processing"},{"journal-title":"Prosodic Phonol","year":"1986","author":"nespor","key":"ref35"},{"journal-title":"Dialog Acts in VERBMOBIL-2","year":"0","author":"alexandersson","key":"ref34"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1121\/1.405558"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(02)00084-5"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/11550617_34"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"37","DOI":"10.21437\/Eurospeech.2003-10","article-title":"isca special session: hot topics in speech synthesis","author":"bailly","year":"2003","journal-title":"Proc EUROSPEECH"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.876118"},{"key":"ref15","first-page":"217","article-title":"accounting for voice-quality variation","author":"campbell","year":"2004","journal-title":"Proc 3rd Int Conf Speech Prosody"},{"key":"ref16","first-page":"2417","article-title":"voice quality: the 4th prosodic dimension","author":"campbell","year":"2003","journal-title":"Proc Congr Phon Sci"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2005.02.016"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(02)00070-5"},{"key":"ref19","first-page":"60","article-title":"automated extraction of tobi annotation data from the reading\/leeds emotional speech corpus","author":"stibbard","year":"2000","journal-title":"Proc ISCA workshop Speech Emotion"},{"key":"ref28","first-page":"339","article-title":"framework for a comprehensive description and measurement of emotional states","volume":"121","author":"mehrabian","year":"1995","journal-title":"Genetic Social Gen Psychol Monographs"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"1637","DOI":"10.21437\/Eurospeech.2003-470","article-title":"towards synthesizing expressive speech: designing and collecting expressive speech data","author":"campbell","year":"2003","journal-title":"Proc EUROSPEECH"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2005.02.017"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2003.817141"},{"key":"ref6","first-page":"175","author":"bulut","year":"2004","journal-title":"Text to Speech Synthesis New Paradigms and Advances"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/0092-6566(77)90037-X"},{"key":"ref5","first-page":"2577","article-title":"the ibm expressive speech synthesis system","author":"hamza","year":"2004","journal-title":"Proc ICSLP"},{"key":"ref8","first-page":"1","article-title":"the generation of affect in synthesized speech","volume":"8","author":"cahn","year":"1990","journal-title":"J American Voice I\/O Society"},{"key":"ref7","first-page":"1185","article-title":"constructing emotional speech synthesizers with limited speech database","author":"tsuzuki","year":"2004","journal-title":"Proc ICSLP"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/AFGR.2002.1004186"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICSLP.1996.607983"},{"key":"ref1","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/1140.001.0001","author":"picard","year":"1997","journal-title":"Affective Computing"},{"key":"ref20","first-page":"39","article-title":"a new emotion database: considerations, sources and scope","author":"douglas-cowie","year":"2000","journal-title":"Proc ISCA workshop Speech Emotion"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"1649","DOI":"10.21437\/Eurospeech.2003-473","article-title":"unit selection and emotion speech","author":"black","year":"2003","journal-title":"Proc EUROSPEECH"},{"key":"ref21","first-page":"61","article-title":"the jst\/crest esp projecta midterm progress report","author":"campbell","year":"2003","journal-title":"Proc Int Workshop Expressive Speech Process"},{"key":"ref24","article-title":"expressive speech synthesis using a concatenative synthesizer","author":"bulut","year":"2002","journal-title":"Proc ICSLP"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(02)00081-X"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.876113"},{"key":"ref25","article-title":"investigating the role of phoneme-level modifications in emotional speech resynthesis","author":"bulut","year":"2005","journal-title":"Proc EUROSPEECH"}],"container-title":["IEEE Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/10376\/5200684\/04926212.pdf?arnumber=4926212","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,9]],"date-time":"2025-02-09T15:55:34Z","timestamp":1739116534000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/4926212\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,11]]},"references-count":38,"journal-issue":{"issue":"8"},"URL":"https:\/\/doi.org\/10.1109\/tasl.2009.2023161","relation":{},"ISSN":["1558-7916"],"issn-type":[{"type":"print","value":"1558-7916"}],"subject":[],"published":{"date-parts":[[2009,11]]}}}