{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T13:52:04Z","timestamp":1725889924806},"publisher-location":"Berlin, Heidelberg","reference-count":16,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642327896"},{"type":"electronic","value":"9783642327902"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-32790-2_55","type":"book-chapter","created":{"date-parts":[[2012,8,6]],"date-time":"2012-08-06T07:45:48Z","timestamp":1344239148000},"page":"456-463","source":"Crossref","is-referenced-by-count":6,"title":["On the Impact of Annotation Errors on\u00a0Unit-Selection\u00a0Speech\u00a0Synthesis"],"prefix":"10.1007","author":[{"given":"Jind\u0159ich","family":"Matou\u0161ek","sequence":"first","affiliation":[]},{"given":"Daniel","family":"Tihelka","sequence":"additional","affiliation":[]},{"given":"Lubo\u0161","family":"\u0160m\u00eddl","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"55_CR1","doi-asserted-by":"crossref","unstructured":"Tihelka, D., Kala, J., Matou\u0161ek, J.: Enhancements of Viterbi Search for Fast Unit Selection Synthesis. In: Proc. Interspeech, Makuhari, Japan, pp. 174\u2013177 (2010)","DOI":"10.21437\/Interspeech.2010-78"},{"key":"55_CR2","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1007\/978-3-642-15760-8_37","volume-title":"Text, Speech and Dialogue","author":"Z. Hanzl\u00ed\u010dek","year":"2010","unstructured":"Hanzl\u00ed\u010dek, Z.: Czech HMM-Based Speech Synthesis. In: Sojka, P., Hor\u00e1k, A., Kope\u010dek, I., Pala, K. (eds.) TSD 2010. LNCS, vol.\u00a06231, pp. 291\u2013298. 
Springer, Heidelberg (2010)"},{"key":"55_CR3","doi-asserted-by":"crossref","unstructured":"Cox, S., Brady, R., Jackson, P.: Techniques for Accurate Automatic Annotation of Speech Waveforms. In: Proc. ICSLP, Sydney, Australia (1998)","DOI":"10.21437\/ICSLP.1998-22"},{"key":"55_CR4","doi-asserted-by":"crossref","unstructured":"Tachibana, R., Nagano, T., Kurata, G., Nishimura, M., Babaguchi, N.: Preliminary Experiments Toward Automatic Generation of New TTS Voices from Recorded Speech Alone. In: Proc. Interspeech, Antwerp, Belgium, pp. 1917\u20131920 (2007)","DOI":"10.21437\/Interspeech.2007-532"},{"key":"55_CR5","doi-asserted-by":"crossref","unstructured":"Aylett, M.P., King, S., Yamagishi, J.: Speech Synthesis Without a Phone Inventory. In: Proc. Interspeech, Brighton, England, pp. 2087\u20132090 (2009)","DOI":"10.21437\/Interspeech.2009-598"},{"key":"55_CR6","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"326","DOI":"10.1007\/978-3-540-74628-7_43","volume-title":"Text, Speech and Dialogue","author":"J. Matou\u0161ek","year":"2007","unstructured":"Matou\u0161ek, J., Romportl, J.: Recording and Annotation of Speech Corpus for Czech Unit Selection Speech Synthesis. In: Matou\u0161ek, V., Mautner, P. (eds.) TSD 2007. LNCS (LNAI), vol.\u00a04629, pp. 326\u2013333. Springer, Heidelberg (2007)"},{"key":"55_CR7","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1007\/978-3-540-39398-6_41","volume-title":"Text, Speech and Dialogue","author":"J. Matou\u0161ek","year":"2003","unstructured":"Matou\u0161ek, J., Tihelka, D., Psutka, J.V.: Experiments with Automatic Segmentation for Czech Speech Synthesis. In: Matou\u0161ek, V., Mautner, P. (eds.) TSD 2003. LNCS (LNAI), vol.\u00a02807, pp. 287\u2013294. 
Springer, Heidelberg (2003)"},{"key":"55_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"568","DOI":"10.1007\/978-3-642-15760-8_72","volume-title":"Text, Speech and Dialogue","author":"J. \u0160vec","year":"2010","unstructured":"\u0160vec, J., \u0160m\u00eddl, L.: Prototype of Czech Spoken Dialog System with Mixed Initiative for Railway Information Service. In: Sojka, P., Hor\u00e1k, A., Kope\u010dek, I., Pala, K. (eds.) TSD 2010. LNCS, vol.\u00a06231, pp. 568\u2013575. Springer, Heidelberg (2010)"},{"key":"55_CR9","doi-asserted-by":"publisher","first-page":"3657","DOI":"10.1016\/j.sigpro.2006.02.039","volume":"12","author":"M. \u017delezn\u00fd","year":"2006","unstructured":"\u017delezn\u00fd, M., Kr\u0148oul, Z., C\u00edsa\u0159, P., Matou\u0161ek, J.: Design, Implementation and Evaluation of the Czech Realistic Audio-Visual Speech Synthesis. Signal Processing\u00a012, 3657\u20133673 (2006)","journal-title":"Signal Processing"},{"key":"55_CR10","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1007\/3-540-45323-7_44","volume-title":"Text, Speech and Dialogue","author":"L. M\u00fcller","year":"2000","unstructured":"M\u00fcller, L., Psutka, J.V., \u0160m\u00eddl, L.: Design of Speech Recognition Engine. In: Sojka, P., Kope\u010dek, I., Pala, K. (eds.) TSD 2000. LNCS (LNAI), vol.\u00a01902, pp. 259\u2013264. Springer, Heidelberg (2000)"},{"key":"55_CR11","first-page":"49","volume-title":"Recent Advances in Signals and Systems","author":"L. \u0160m\u00eddl","year":"2009","unstructured":"\u0160m\u00eddl, L., Trmal, J.: Keyword Spotting Result Post-processing to Reduce False Alarms. In: Recent Advances in Signals and Systems, vol.\u00a09, pp. 49\u201352. WSEAS Press, Budapest (2009)"},{"key":"55_CR12","doi-asserted-by":"publisher","first-page":"503","DOI":"10.1016\/S0167-6393(02)00131-0","volume":"40","author":"F. 
Malfrere","year":"2003","unstructured":"Malfrere, F., Deroo, O., Dutoit, T., Ris, C.: Phonetic Alignment: Speech Synthesis-Based Vs. Viterbi-Based. Speech Communication\u00a040, 503\u2013515 (2003)","journal-title":"Speech Communication"},{"key":"55_CR13","doi-asserted-by":"crossref","unstructured":"Lu, H., Wei, S., Dai, L., Wang, R.-H.: Automatic Error Detection for Unit Selection Speech Synthesis Using Log Likelihood Ratio Based SVM Classifier. In: Proc. Interspeech, Makuhari, Japan, pp. 162\u2013165 (2010)","DOI":"10.21437\/Interspeech.2010-75"},{"key":"55_CR14","doi-asserted-by":"crossref","unstructured":"Gr\u016fber, M.: Acoustic Analysis of Czech Expressive Recordings from a Single Speaker in Terms of Various Communicative Functions. In: Proc. ISSPIT, Bilbao, Spain, pp. 267\u2013272 (2011)","DOI":"10.1109\/ISSPIT.2011.6151576"},{"key":"55_CR15","doi-asserted-by":"publisher","first-page":"72","DOI":"10.2478\/v10048-010-0017-3","volume":"10","author":"J. P\u0159ibil","year":"2010","unstructured":"P\u0159ibil, J., P\u0159ibilov\u00e1, A.: An Experiment with Evaluation of Emotional Speech Conversion by Spectrograms. Measurement Science Review\u00a010, 72\u201377 (2010)","journal-title":"Measurement Science Review"},{"key":"55_CR16","doi-asserted-by":"crossref","unstructured":"Matou\u0161ek, J., Skarnitzl, R., Macha\u010d, P., Trmal, J.: Identification and Automatic Detection of Parasitic Speech Sounds. In: Proc. Interspeech, Brighton, England, pp. 
876\u2013879 (2009)","DOI":"10.21437\/Interspeech.2009-265"}],"container-title":["Lecture Notes in Computer Science","Text, Speech and Dialogue"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-32790-2_55.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,25]],"date-time":"2023-06-25T05:25:11Z","timestamp":1687670711000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-32790-2_55"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642327896","9783642327902"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-32790-2_55","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}