{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:14:52Z","timestamp":1740100492339,"version":"3.37.3"},"reference-count":34,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,11,18]],"date-time":"2021-11-18T00:00:00Z","timestamp":1637193600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,11,18]],"date-time":"2021-11-18T00:00:00Z","timestamp":1637193600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,11,18]],"date-time":"2021-11-18T00:00:00Z","timestamp":1637193600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006203","name":"JSC","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006203","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,11,18]]},"DOI":"10.1109\/o-cocosda202152914.2021.9660445","type":"proceedings-article","created":{"date-parts":[[2022,1,3]],"date-time":"2022-01-03T20:19:17Z","timestamp":1641241157000},"page":"199-205","source":"Crossref","is-referenced-by-count":1,"title":["A Study on Neural-Network-Based Text-to-Speech Adaptation Techniques for Vietnamese"],"prefix":"10.1109","author":[{"given":"Pham Ngoc","family":"Phuong","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chung Tran","family":"Quang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Quoc Truong","family":"Do","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mai 
Chi","family":"Luong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","first-page":"19","article-title":"Improving prosodic phrasing of vietnamese text-to-speech systems","author":"ngoc","year":"0","journal-title":"Proceedings of the 7th International Workshop on Vietnamese Language and Speech Processing"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1745"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683862"},{"key":"ref30","article-title":"Sample efficient adaptive text-to-speech","author":"yutian","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref34","article-title":"Synthesizer voice quality of new languages calibrated with mean mel cepstral distortion","author":"kominek","year":"2008","journal-title":"Spoken Language Technologies for Under-resourced Languages"},{"key":"ref10","article-title":"Glow-tts: A generative flow for text-to-speech via monotonic alignment search","author":"kim","year":"2020","journal-title":"arXiv preprint"},{"key":"ref11","article-title":"Adaptation techniques for speech synthesis in under-resourced languages","author":"anumanchipalli","year":"2010","journal-title":"Spoken Languages Technologies for Under-Resourced Languages"},{"key":"ref12","article-title":"A survey on neural speech synthesis","author":"tan","year":"2021","journal-title":"arXiv preprint"},{"key":"ref13","article-title":"Adadurian: Few-shot adaptation for neural text-to-speech with durian","author":"zhang","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1705"},{"key":"ref15","first-page":"7639","article-title":"Boffin tts: Few-shot speaker adaptation by bayesian optimization","author":"henry","year":"0","journal-title":"ICASSP 2020\u20132020 IEEE International Conference on Acoustics Speech and Signal Processing 
(ICASSP)"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2096"},{"key":"ref17","article-title":"Adaspeech: Adaptive text to speech for custom voice","author":"chen","year":"2021","journal-title":"arXiv preprint"},{"key":"ref18","article-title":"Meta-stylespeech: Multi-speaker adaptive text-to-speech generation","author":"min","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref19","first-page":"35","article-title":"Vietnamese text-to-speech shared task vlsp 2020: Remaining problems with state-of-the-art techniques","author":"nguyen","year":"0","journal-title":"Proceedings of the 7th International Workshop on Vietnamese Language and Speech Processing"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2016.04.046"},{"key":"ref4","first-page":"4779","article-title":"Natural tts synthesis by conditioning wavenet on mel spectrogram predictions","author":"jonathan","year":"0","journal-title":"2018 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP)"},{"key":"ref27","first-page":"3145","article-title":"An efficient algorithm to search for a minimum sentence set for collecting speech database","author":"zhang","year":"0","journal-title":"Proc ICPhS"},{"key":"ref3","article-title":"Tacotron: Towards end-to-end speech synthesis","author":"wang","year":"2017","journal-title":"ArXiv Preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33016706"},{"key":"ref29","article-title":"Transfer learning from speaker verification to multispeaker text-to-speech synthesis","author":"ye","year":"2018","journal-title":"ArXiv Preprint"},{"journal-title":"Deep voice 3 2000-speaker neural text-to-speech","year":"2017","author":"ping","key":"ref5"},{"key":"ref8","first-page":"7586","article-title":"Non-autoregressive neural text-to-speech","author":"peng","year":"0","journal-title":"International Conference on Machine Learning"},{"key":"ref7","article-title":"Fastspeech: Fast, 
robust and controllable text to speech","author":"ren","year":"2019","journal-title":"arXiv preprint"},{"key":"ref2","article-title":"Wavenet: A generative model for raw audio","author":"van den oord","year":"2016","journal-title":"ArXiv Preprint"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054484"},{"key":"ref1","first-page":"7962","article-title":"Statistical parametric speech synthesis using deep neural networks","author":"ze","year":"0","journal-title":"2013 IEEE International Conference on Acoustics Speech and Signal Processing"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414872"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.3034994"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053371"},{"key":"ref24","article-title":"Using ipa-based tacotron for data efficient cross-lingual speaker adaptation and pronunciation enhancement","author":"hemati","year":"2020","journal-title":"arXiv preprint"},{"key":"ref23","first-page":"52","article-title":"Exploring transfer learning for low resource emotional tts","author":"tits","year":"0","journal-title":"Proceedings of SAI Intelligent Systems Conference"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.15625\/1813-9663\/34\/4\/13165"},{"key":"ref25","article-title":"A high quality and phonetic balanced speech corpus for vietnamese","author":"phuong","year":"2019","journal-title":"ArXiv Preprint"}],"event":{"name":"2021 24th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","start":{"date-parts":[[2021,11,18]]},"location":"Singapore, Singapore","end":{"date-parts":[[2021,11,20]]}},"container-title":["2021 24th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques 
(O-COCOSDA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9660212\/9660400\/09660445.pdf?arnumber=9660445","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T16:56:38Z","timestamp":1652201798000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9660445\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,11,18]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/o-cocosda202152914.2021.9660445","relation":{},"subject":[],"published":{"date-parts":[[2021,11,18]]}}}