{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T04:35:17Z","timestamp":1774931717888,"version":"3.50.1"},"publisher-location":"Cham","reference-count":35,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031708787","type":"print"},{"value":"9783031708794","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-70879-4_4","type":"book-chapter","created":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T19:02:20Z","timestamp":1725476540000},"page":"66-84","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Resilience of\u00a0Voice Assistants to\u00a0Synthetic Speech"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9009-2193","authenticated-orcid":false,"given":"Kamil","family":"Malinka","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4717-1910","authenticated-orcid":false,"given":"Anton","family":"Firc","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Petr","family":"Ka\u0161ka","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tom\u00e1\u0161","family":"Lap\u0161ansk\u00fd","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Oskar","family":"\u0160andor","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0790-0875","authenticated-orcid":false,"given":"Ivan","family":"Homoliak","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,9,5]]},"reference":[{"key":"4_CR1","unstructured":"Bixby Developers \u2014 bixbydevelopers.com. https:\/\/bixbydevelopers.com\/dev\/docs\/bhs-dev-guide. Accessed 29 Nov 2023"},{"key":"4_CR2","unstructured":"Google Assistant for Android\u2014Documentation \u2014 Android Developers \u2014 developer.android.com. https:\/\/developer.android.com\/guide\/app-actions\/overview. Accessed 29 Nov 2023"},{"key":"4_CR3","unstructured":"SiriKit \u2014 Apple Developer Documentation \u2014 developer.apple.com. https:\/\/developer.apple.com\/documentation\/sirikit\/. Accessed 29 Nov 2023"},{"key":"4_CR4","unstructured":"Ahmed, M.E., Kwak, I.Y., Huh, J.H., Kim, I., Oh, T., Kim, H.: Void: a fast and light voice liveness detection system. In: 29th USENIX Security Symposium (USENIX Security 2020), pp. 2685\u20132702. USENIX Association, August 2020. https:\/\/www.usenix.org\/conference\/usenixsecurity20\/presentation\/ahmed-muhammad"},{"key":"4_CR5","unstructured":"Alegre, F., Janicki, A., Evans, N.: Re-assessing the threat of replay spoofing attacks against automatic speaker verification. In: Proceedings of the Conference Name. EURECOM and Warsaw University of Technology, Sophia Antipolis, France and Warsaw, Poland (2023)"},{"key":"4_CR6","doi-asserted-by":"publisher","first-page":"17841","DOI":"10.1109\/ACCESS.2017.2730220","volume":"5","author":"E Alepis","year":"2017","unstructured":"Alepis, E., Patsakis, C.: Monkey says, monkey does: security and privacy on voice assistants. IEEE Access 5, 17841\u201317851 (2017). https:\/\/doi.org\/10.1109\/ACCESS.2017.2730220","journal-title":"IEEE Access"},{"key":"4_CR7","unstructured":"Bateman, J.: Deepfakes and synthetic media in the financial system: assessing threat scenarios. Technical report, Carnegie Endowment for International Peace (2020). http:\/\/www.jstor.org\/stable\/resrep25783.1"},{"key":"4_CR8","unstructured":"Betker, J.: Better speech synthesis through scaling (2023)"},{"key":"4_CR9","doi-asserted-by":"publisher","unstructured":"Bilika, D., Michopoulou, N., Alepis, E., Patsakis, C.: Hello me, meet the real me: voice synthesis attacks on voice assistants. Comput. Secur. 137, 103617 (2024). https:\/\/doi.org\/10.1016\/j.cose.2023.103617. https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0167404823005278","DOI":"10.1016\/j.cose.2023.103617"},{"key":"4_CR10","doi-asserted-by":"publisher","unstructured":"Boddy, C.R.: Sample size for qualitative research. Qual. Market Res. Int. J. 19(4), 426\u2013432 (2016). https:\/\/doi.org\/10.1108\/qmr-06-2016-0053. http:\/\/dx.doi.org\/10.1108\/QMR-06-2016-0053","DOI":"10.1108\/qmr-06-2016-0053"},{"key":"4_CR11","unstructured":"BotPenguin: which are the 7 best voice assistants of 2023? November 2023. https:\/\/botpenguin.com\/blogs\/which-are-the-7-best-voice-assistants-of-2023"},{"key":"4_CR12","unstructured":"Casanova, E., Weber, J., Shulby, C., Junior, A.C., G\u00f6lge, E., Ponti, M.A.: YourTTS: towards zero-shot multi-speaker TTS and zero-shot voice conversion for everyone (2023)"},{"key":"4_CR13","doi-asserted-by":"publisher","unstructured":"Combs, M., Hazelwood, C., Joyce, R.: Are you listening? \u2013 an observational wake word privacy study. Organ. Cybersecur. J. Pract. Process People 2(2), 113\u2013123 (2022). https:\/\/doi.org\/10.1108\/ocj-12-2021-0036. http:\/\/dx.doi.org\/10.1108\/OCJ-12-2021-0036","DOI":"10.1108\/ocj-12-2021-0036"},{"key":"4_CR14","unstructured":"Daniel Ruby: 65 Voice Search Statistics for 2023 (Updated Data) (2023). https:\/\/www.demandsage.com\/voice-search-statistics\/"},{"key":"4_CR15","doi-asserted-by":"publisher","unstructured":"Evans, N., Kinnunen, T., Yamagishi, J.: Spoofing and countermeasures for automatic speaker verification. In: Proceedings of INTERSPEECH 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 2013. https:\/\/doi.org\/10.21437\/Interspeech.2013-288","DOI":"10.21437\/Interspeech.2013-288"},{"key":"4_CR16","doi-asserted-by":"publisher","unstructured":"Firc, A., Malinka, K.: The dawn of a text-dependent society: deepfakes as a threat to speech verification systems, pp. 1646\u20131655 (2022). https:\/\/doi.org\/10.1145\/3477314.3507013, cited by: 2","DOI":"10.1145\/3477314.3507013"},{"issue":"4","key":"4_CR17","doi-asserted-by":"publisher","DOI":"10.1016\/j.heliyon.2023.e15090","volume":"9","author":"A Firc","year":"2023","unstructured":"Firc, A., Malinka, K., Han\u00e1\u010dek, P.: Deepfakes as a threat to a speaker and facial recognition: an overview of tools and attack vectors. Heliyon 9(4), e15090 (2023). https:\/\/doi.org\/10.1016\/j.heliyon.2023.e15090","journal-title":"Heliyon"},{"key":"4_CR18","unstructured":"Gupta, P., Gupta, S., Patil, H.: Voice liveness detection using bump wavelet with CNN. In: 9th International Conference on Pattern Recognition and Machine Intelligence, Kolkata, India, December 2021. https:\/\/hal.science\/hal-03690065"},{"key":"4_CR19","doi-asserted-by":"publisher","unstructured":"Hoy, M.B.: Alexa, siri, cortana, and more: an introduction to voice assistants. Med. Ref. Serv. Q. 37(1), 81\u201388 (2018). https:\/\/doi.org\/10.1080\/02763869.2018.1404391","DOI":"10.1080\/02763869.2018.1404391"},{"key":"4_CR20","unstructured":"Wakefield, J.: Burger King advert sabotaged on Wikipedia (2017). https:\/\/www.bbc.com\/news\/technology-39589013"},{"key":"4_CR21","unstructured":"Kim, J., Kong, J., Son, J.: Conditional variational autoencoder with adversarial learning for end-to-end text-to-speech (2021)"},{"key":"4_CR22","doi-asserted-by":"publisher","unstructured":"Lien, J., Al\u00a0Momin, M.A., Yuan, X.: Attacks on Voice Assistant Systems, pp. 61\u201377. IGI Global (2022). https:\/\/doi.org\/10.4018\/978-1-7998-7323-5.ch004. http:\/\/dx.doi.org\/10.4018\/978-1-7998-7323-5.ch004","DOI":"10.4018\/978-1-7998-7323-5.ch004"},{"key":"4_CR23","doi-asserted-by":"publisher","unstructured":"Liu, X., et al.: Asvspoof 2021: towards spoofed and deepfake speech detection in the wild. IEEE\/ACM Trans. Audio Speech Lang. Process. 31, 2507\u20132522 (2023). https:\/\/doi.org\/10.1109\/TASLP.2023.3285283","DOI":"10.1109\/TASLP.2023.3285283"},{"key":"4_CR24","doi-asserted-by":"publisher","first-page":"4169","DOI":"10.1109\/ACCESS.2021.3139508","volume":"10","author":"I Lopez-Espejo","year":"2022","unstructured":"Lopez-Espejo, I., Tan, Z.H., Hansen, J.H.L., Jensen, J.: Deep spoken keyword spotting: an overview. IEEE Access 10, 4169\u20134199 (2022). https:\/\/doi.org\/10.1109\/ACCESS.2021.3139508","journal-title":"IEEE Access"},{"key":"4_CR25","unstructured":"Memey-McMemeFace: Alexa what is my current location (2020). https:\/\/www.reddit.com\/r\/WatchPeopleDieInside\/comments\/iky0qd\/alexa_what_is_my_current_location. Accessed 14 Dec 2023"},{"key":"4_CR26","series-title":"LNNS","doi-asserted-by":"publisher","first-page":"413","DOI":"10.1007\/978-3-031-21333-5_41","volume-title":"UCAm I 2022","author":"E Nacimiento-Garc\u00eda","year":"2023","unstructured":"Nacimiento-Garc\u00eda, E., Caballero-Gil, C., Nacimiento-Garc\u00eda, A., Gonz\u00e1lez-Gonz\u00e1lez, C.: Alexa, do what i want to. Implementing a voice spoofing attack tool for virtual voice assistants. In: Bravo, J., Ochoa, S., Favela, J. (eds.) UCAm I 2022. LNNS, vol. 594, pp. 413\u2013418. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-21333-5_41"},{"key":"4_CR27","doi-asserted-by":"publisher","unstructured":"Poushneh, A.: Humanizing voice assistant: the impact of voice assistant personality on consumers\u2019 attitudes and behaviors. J. Retail. Consum. Serv. 58, 102283 (2021). https:\/\/doi.org\/10.1016\/j.jretconser.2020.102283. https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0969698920312911","DOI":"10.1016\/j.jretconser.2020.102283"},{"key":"4_CR28","unstructured":"Qualcomm: Getting personal with on-device AI (2023). https:\/\/www.qualcomm.com\/news\/onq\/2023\/10\/getting-personal-with-on-device-ai"},{"key":"4_CR29","unstructured":"Seymour, J., Aqil, A.: Your voice is my passport (2018). https:\/\/www.blackhat.com\/us-18\/briefings\/schedule\/#your-voice-is-my-passport-11395"},{"key":"4_CR30","unstructured":"Simmons, D.: BBC news, May 2017. https:\/\/www.bbc.com\/news\/technology-39965545"},{"key":"4_CR31","unstructured":"Staff, R.: The best voice assistant, September 2021. https:\/\/www.zdnet.com\/home-and-office\/smart-home\/the-best-voice-assistant\/"},{"key":"4_CR32","unstructured":"Ubert, J.: Fake it: attacking privacy through exploiting digital assistants using voice deepfakes. Ph.D. thesis (2023). https:\/\/www.proquest.com\/dissertations-theses\/fake-attacking-privacy-through-exploiting-digital\/docview\/2811176534\/se-2. Copyright - Database copyright ProQuest LLC; ProQuest does not claim copyright in the individual underlying works; Last updated - 2023-05-18"},{"key":"4_CR33","doi-asserted-by":"publisher","unstructured":"Wang, Y., Cai, W., Gu, T., Shao, W., Li, Y., Yu, Y.: Secure your voice: an oral airflow-based continuous liveness detection for voice assistants. Proc. ACM Interact. Mob. Wearable Ubiquitous Technol. 3(4) (2020). https:\/\/doi.org\/10.1145\/3369811","DOI":"10.1145\/3369811"},{"key":"4_CR34","unstructured":"Wu, Z., Gao, S., Chng, E.S., Li, H.: A study on replay attack and anti-spoofing for text-dependent speaker verification. In: Proceedings of the Conference Name. Centre for Speech Technology Research, University of Edinburgh, United Kingdom and Human Language Technology Department, Institute for Infocomm Research, Singapore and School of Computer Engineering, Nanyang Technological University, Singapore (2021)"},{"key":"4_CR35","doi-asserted-by":"crossref","unstructured":"Zhang, R., Chen, X., Lu, J., Wen, S., Nepal, S., Xiang, Y.: Using AI to hack IA: a new stealthy spyware against voice assistance functions in smart phones. arXiv preprint arXiv:1805.06187 (2018)","DOI":"10.1109\/ACCESS.2019.2945791"}],"container-title":["Lecture Notes in Computer Science","Computer Security \u2013 ESORICS 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-70879-4_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T19:02:58Z","timestamp":1725476578000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-70879-4_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031708787","9783031708794"],"references-count":35,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-70879-4_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"5 September 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ESORICS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Symposium on Research in Computer Security","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bydgoszcz","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Poland","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"esorics2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/esorics2024.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}