{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,31]],"date-time":"2025-10-31T07:43:23Z","timestamp":1761896603244,"version":"3.37.3"},"reference-count":52,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"name":"European Union's Horizon 2020 research and innovation programme under the Marie Sklodowska-Curie","award":["655764"],"award-info":[{"award-number":["655764"]}]},{"DOI":"10.13039\/501100000266","name":"EPSRC","doi-asserted-by":"publisher","award":["EP\/I031022\/1"],"award-info":[{"award-number":["EP\/I031022\/1"]}],"id":[{"id":"10.13039\/501100000266","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE\/ACM Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2018,1]]},"DOI":"10.1109\/taslp.2017.2761546","type":"journal-article","created":{"date-parts":[[2017,10,9]],"date-time":"2017-10-09T18:11:18Z","timestamp":1507572678000},"page":"57-70","source":"Crossref","is-referenced-by-count":14,"title":["A Log Domain Pulse Model for Parametric Speech Synthesis"],"prefix":"10.1109","volume":"26","author":[{"given":"Gilles","family":"Degottex","sequence":"first","affiliation":[]},{"given":"Pierre","family":"Lanchantin","sequence":"additional","affiliation":[]},{"given":"Mark","family":"Gales","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/78.382394"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2016.08.002"},{"key":"ref33","first-page":"1653","article-title":"The importance of phase on voice\n quality assessment","author":"koutsogiannaki","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref32","first-page":"1633","article-title":"Phase distortion statistics as a representation of the glottal source: Application to the\n classification of voice qualities","author":"degottex","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"article-title":"REAPER: Robust Epoch And Pitch EstimatoR","year":"2015","author":"talkin","key":"ref31"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495142"},{"key":"ref37","first-page":"2316","article-title":"HMM-based synthesis of creaky voice","author":"raitio","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2014.03.002"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2013.2266772"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1986.1164910"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1250\/ast.28.140"},{"key":"ref27","first-page":"89","article-title":"Intelligibility of degraded speech from\n smeared STRAIGHT spectrum","author":"kawahara","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref29","first-page":"1735","article-title":"Parameterization of vocal fry in\n HMM-based speech synthesis","author":"sil\u00e9n","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1093\/ietisy\/e90-d.5.825"},{"key":"ref1","first-page":"967","article-title":"Using\n HMM-based speech synthesis to reconstruct the voice of individuals with degenerative speech disorders","author":"veaux","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"article-title":"Harmonic plus noise models for speech combined with statistical\n methods, for speech and speaker modification","year":"1996","author":"stylianou","key":"ref20"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/29.1651"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-66286-7"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6393(96)00038-6"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.21437\/SSW.2016-35"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1121\/1.4777797"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1121\/1.421421"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178814"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1992.225953"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1093\/ietisy\/e90-1.1.325"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2076805"},{"key":"ref11","first-page":"1082","article-title":"Uniform concatenative excitation model for synthesising speech\n without voiced\/unvoiced classification","author":"cabral","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"article-title":"A unified theory of time-frequency reassignment","year":"2009","author":"fitz","key":"ref40"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1186\/s13636-014-0038-1"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(98)00085-5"},{"key":"ref14","article-title":"Aperiodicity extraction and control using mixed mode excitation and group delay manipulation for a high quality speech\n analysis, modification and synthesis system STRAIGHT","author":"kawahara","year":"0","journal-title":"Proc 7th Int Workshop Models Anal Vocal Emissions Biomed Appl"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2169787"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2012.08.010"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2013.2283471"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178768"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5947410"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/SSW.2016-33"},{"key":"ref3","first-page":"5140","article-title":"Investigating gated recurrent neural networks for speech synthesis","volume":"1","author":"wu","year":"0","journal-title":"Proc IEEE Int Conf Acoustics Speech and Signal Process (ICASSP)"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1989.266409"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1996.541110"},{"key":"ref8","first-page":"1504","article-title":"Measuring the perceptual effects of modelling assumptions in\n speech synthesis using stimuli constructed from repeated natural speech","author":"henter","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"year":"2016","key":"ref7","article-title":"The Blizzard Challenge 2016"},{"key":"ref49","first-page":"136","article-title":"Evaluating\n speech synthesis intelligibility using Amazon Mechanical Turk","author":"wolters","year":"0","journal-title":"Proc 7th ISCA Speech Synthesis Workshop"},{"key":"ref9","first-page":"1068","article-title":"WaveNet: A generative model for raw audio","volume":"43","author":"van den oord","year":"1995","journal-title":"Trans Signal Process"},{"key":"ref46","first-page":"3552","article-title":"Intelligibility enhancing speech modifications: The hurricane challenge","author":"cooke","year":"0","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref45","first-page":"223","article-title":"The CMU ARCTIC speech databases","author":"kominek","year":"0","journal-title":"Proc ISCA Speech Synthesis Workshop"},{"key":"ref48","first-page":"1","article-title":"Creating speech and language data with amazons mechanical turk","author":"callison-burch","year":"0","journal-title":"NAACL HLT Workshop on Creating Speech and Language Data with Amazon's Mechanical Turk"},{"year":"2003","key":"ref47","article-title":"En-general methods for the subjective assessment of sound\n quality"},{"journal-title":"Digital Signal Processing","year":"1978","author":"oppenheim","key":"ref42"},{"journal-title":"Image Analysis and Mathematical Morphology","year":"1983","author":"serra","key":"ref41"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6393(90)90021-Z"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1992.225951"}],"container-title":["IEEE\/ACM Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6570655\/8124117\/08063442.pdf?arnumber=8063442","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T16:24:16Z","timestamp":1642004656000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/8063442\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,1]]},"references-count":52,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/taslp.2017.2761546","relation":{},"ISSN":["2329-9290","2329-9304"],"issn-type":[{"type":"print","value":"2329-9290"},{"type":"electronic","value":"2329-9304"}],"subject":[],"published":{"date-parts":[[2018,1]]}}}