{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:40:33Z","timestamp":1742913633107,"version":"3.40.3"},"publisher-location":"Cham","reference-count":16,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030878016"},{"type":"electronic","value":"9783030878023"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-87802-3_43","type":"book-chapter","created":{"date-parts":[[2021,9,21]],"date-time":"2021-09-21T23:36:52Z","timestamp":1632267412000},"page":"472-482","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Explicit Control of the Level of Expressiveness in DNN-Based Speech Synthesis by Embedding Interpolation"],"prefix":"10.1007","author":[{"given":"Tijana","family":"Nosek","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sini\u0161a","family":"Suzi\u0107","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mia","family":"Vujovi\u0107","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Darko","family":"Pekar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Milan","family":"Se\u010dujski","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vlado","family":"Deli\u0107","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,9,22]]},"reference":[{"key":"43_CR1","unstructured":"Gong, L., Nass, C., Simard, C., Takhteyev, Y.: Usability Evaluation and Interface Design: Cognitive Engineering, Intelligent Agents, and Virtual Reality, When non-human is better than semi-human: Consistency in speech interfaces, vol.\u00a03, pp.\u00a0390\u2013394 (2001)"},{"key":"43_CR2","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1007\/978-3-319-99582-3_5","volume-title":"Interactive Collaborative Robotics","author":"V Deli\u0107","year":"2018","unstructured":"Deli\u0107, V., et al.: Toward more expressive speech communication in human-robot interaction. In: Ronzhin, A., Rigoll, G., Meshcheryakov, R. (eds.) ICR 2018. LNCS (LNAI), vol. 11097, pp. 44\u201351. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-99582-3_5"},{"key":"43_CR3","volume-title":"Emotion in Human-Computer Interaction, the Human-Computer Interaction Handbook: Fundamentals, Evolving Technologies and Emerging Applications","author":"S Brave","year":"2002","unstructured":"Brave, S., Clifford, N.: Emotion in Human-Computer Interaction, the Human-Computer Interaction Handbook: Fundamentals, Evolving Technologies and Emerging Applications. CRC Press, Boca Raton (2002)"},{"key":"43_CR4","doi-asserted-by":"crossref","unstructured":"Hamacher, A., Bianchi-Berthouze, N., Pipe, A.G., Eder, K.: Believing in BERT: Using expressive communication to enhance trust and counteract operational error in physical Human-Robot Interaction. In: Robot and Human Interactive Communication (2016)","DOI":"10.1109\/ROMAN.2016.7745163"},{"key":"43_CR5","doi-asserted-by":"crossref","unstructured":"Suzi\u0107, S., Deli\u0107, T., Jovanovi\u0107, V., Se\u010dujski, M., Pekar, D., Deli\u0107, V.: A comparison of multi-style DNN-based TTS approaches using small datasets. In: MATEC Web of Conferences, vol.\u00a0161, P.\u00a003005, EDP Sciences (2018)","DOI":"10.1051\/matecconf\/201816103005"},{"key":"43_CR6","doi-asserted-by":"crossref","unstructured":"Tachibana, M., Yamagishi, J., Onishi, K., Masuko, T., Kobayashi, T.: HMM-based speech synthesis with various speaking styles using model interpolation. In: Speech Prosody 2004, International Conference (2004)","DOI":"10.21437\/SpeechProsody.2004-94"},{"key":"43_CR7","doi-asserted-by":"crossref","unstructured":"Masuko, T., Kobayashi, T., Miyanaga, K.: A style control technique for HMM-based speech synthesis. In: Eighth International Conference on Spoken Language Processing (2004)","DOI":"10.21437\/Interspeech.2004-551"},{"issue":"2","key":"43_CR8","doi-asserted-by":"publisher","first-page":"347","DOI":"10.1016\/j.specom.2012.09.003","volume":"55","author":"T Nose","year":"2013","unstructured":"Nose, T., Kobayashi, T.: An intuitive style control technique in HMM-based expressive speech synthesis using subjective style intensity and multiple-regression global variance model. Speech Commun. 55(2), 347\u2013357 (2013)","journal-title":"Speech Commun."},{"key":"43_CR9","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1016\/j.specom.2018.03.002","volume":"99","author":"J Lorenzo-Trueba","year":"2018","unstructured":"Lorenzo-Trueba, J., Henter, G.E., Takaki, S., Yamagishi, J., Morino, Y., Ochiai, Y.: Investigating different representations for modeling and controlling multiple emotions in DNN-based speech synthesis. Speech Commun. 99, 135\u2013143 (2018)","journal-title":"Speech Commun."},{"key":"43_CR10","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1016\/j.cogsys.2019.09.009","volume":"59","author":"X Zhu","year":"2020","unstructured":"Zhu, X., Xue, L.: Building a controllable expressive speech synthesis system with multiple emotion strengths. Cogn. Syst. Res. 59, 151\u2013159 (2020)","journal-title":"Cogn. Syst. Res."},{"key":"43_CR11","first-page":"2579","volume":"9","author":"L van der Maaten","year":"2008","unstructured":"van der Maaten, L., Hinton, G.: Visualizing data using t-SNE. J. Mach. Learn. Res. 9, 2579\u20132605 (2008)","journal-title":"J. Mach. Learn. Res."},{"issue":"4","key":"43_CR12","doi-asserted-by":"publisher","first-page":"434","DOI":"10.3897\/jucs.2020.023","volume":"26","author":"M Se\u010dujski","year":"2020","unstructured":"Se\u010dujski, M., Pekar, D., Suzi\u0107, S., Smirnov, A., Nosek, T.: Speaker\/style-dependent neural network speech synthesis based on speaker\/style embedding. J. Univers. Comput. Sci. 26(4), 434\u2013453 (2020)","journal-title":"J. Univers. Comput. Sci."},{"key":"43_CR13","doi-asserted-by":"crossref","unstructured":"Wu, Z., Watts, O., King, S.: Merlin: An Open Source Neural Network Speech Synthesis System. In: Proc. 9th ISCA Speech Synthesis Workshop (2016)","DOI":"10.21437\/SSW.2016-33"},{"key":"43_CR14","unstructured":"Abadi, M., et al.: A System for Large-scale Machine Learning. In: 12th USENIX symposium on operating systems design and implementation (OSDI 16), pp.\u00a0265\u2013283 (2016)"},{"issue":"7","key":"43_CR15","doi-asserted-by":"publisher","first-page":"1877","DOI":"10.1587\/transinf.2015EDP7457","volume":"99","author":"WM Morise","year":"2016","unstructured":"Morise, W.M., Yokomori, F., Ozawa, K.: WORLD: a vocoder-based high-quality speech synthesis system for real-time applications. IEICE Trans. Inf. Syst. 99(7), 1877\u20131884 (2016)","journal-title":"IEICE Trans. Inf. Syst."},{"key":"43_CR16","doi-asserted-by":"publisher","first-page":"1162","DOI":"10.1016\/j.specom.2006.04.003","volume":"48","author":"D Ververidis","year":"2006","unstructured":"Ververidis, D., Kotropoulos, C.: Emotional speech recognition: resources, features and methods. Speech Commun. 48, 1162\u20131181 (2006)","journal-title":"Speech Commun."}],"container-title":["Lecture Notes in Computer Science","Speech and Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-87802-3_43","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T17:39:39Z","timestamp":1725817179000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-87802-3_43"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030878016","9783030878023"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-87802-3_43","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"22 September 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"SPECOM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Speech and Computer","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"St Petersburg","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Russia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 September 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"specom2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/specom.nw.ru\/2021\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"163","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"74","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"45% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.5","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5.5","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held online due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}