{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T00:46:16Z","timestamp":1777941976248,"version":"3.51.4"},"reference-count":111,"publisher":"Springer Science and Business Media LLC","issue":"S1","license":[{"start":{"date-parts":[[2023,6,28]],"date-time":"2023-06-28T00:00:00Z","timestamp":1687910400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,6,28]],"date-time":"2023-06-28T00:00:00Z","timestamp":1687910400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2023,10]]},"DOI":"10.1007\/s10462-023-10539-8","type":"journal-article","created":{"date-parts":[[2023,6,28]],"date-time":"2023-06-28T13:02:01Z","timestamp":1687957321000},"page":"513-566","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":35,"title":["Battling voice spoofing: a review, comparative analysis, and generalizability evaluation of state-of-the-art voice spoofing counter measures"],"prefix":"10.1007","volume":"56","author":[{"given":"Awais","family":"Khan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Khalid Mahmood","family":"Malik","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"James","family":"Ryan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mikul","family":"Saravanan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,6,28]]},"reference":[{"key":"10539_CR1","doi-asserted-by":"crossref","unstructured":"Alegre F, Amehraye A, Evans N (2013) Spoofing counter measures to protect automatic speaker verification from voice conversion. In: 2013 IEEE international conference on acoustics, speech and signal processing, pp. 3068\u20133072. IEEE","DOI":"10.1109\/ICASSP.2013.6638222"},{"key":"10539_CR2","doi-asserted-by":"publisher","first-page":"3524","DOI":"10.1109\/TIFS.2021.3082303","volume":"16","author":"M Aljasem","year":"2021","unstructured":"Aljasem M, Irtaza A, Malik H, Saba N, Javed A, Malik KM, Meharmohammadi M (2021) Secure automatic speaker verification (sasv) system through sm-altp features and asymmetric bagging. IEEE Trans Inf Forensics Secur 16:3524\u20133537. https:\/\/doi.org\/10.1109\/TIFS.2021.3082303","journal-title":"IEEE Trans Inf Forensics Secur"},{"issue":"5","key":"10539_CR3","doi-asserted-by":"publisher","first-page":"155","DOI":"10.3390\/a15050155","volume":"15","author":"Z Almutairi","year":"2022","unstructured":"Almutairi Z, Elgibreen H (2022) A review of modern audio deepfake detection methods: challenges and future directions. Algorithms 15(5):155","journal-title":"Algorithms"},{"key":"10539_CR4","unstructured":"Aravind P, Nechiyil U, Paramparambath N, et al (2020) Audio spoofing verification using deep convolutional neural networks by transfer learning. arXiv preprint arXiv:2008.03464"},{"key":"10539_CR5","doi-asserted-by":"publisher","first-page":"162857","DOI":"10.1109\/ACCESS.2021.3133134","volume":"9","author":"T Arif","year":"2021","unstructured":"Arif T, Javed A, Alhameed M, Jeribi F, Tahir A (2021) Voice spoofing countermeasure for logical access attacks detection. IEEE Access 9:162857\u2013162868. https:\/\/doi.org\/10.1109\/ACCESS.2021.3133134","journal-title":"IEEE Access"},{"key":"10539_CR6","doi-asserted-by":"crossref","unstructured":"Ba Z, Wen Q, Cheng P, Wang Y, Lin F, Lu L, Liu Z (2023) Transferring audio deepfake detection capability across languages. In: Proceedings of the ACM web conference 2023, pp. 2033\u20132044","DOI":"10.1145\/3543507.3583222"},{"key":"10539_CR7","doi-asserted-by":"publisher","first-page":"84229","DOI":"10.1109\/ACCESS.2019.2923806","volume":"7","author":"B Balamurali","year":"2019","unstructured":"Balamurali B, Lin KE, Lui S, Chen J-M, Herremans D (2019) Toward robust audio spoofing detection: a detailed comparison of traditional and learned features. IEEE Access 7:84229\u201384241","journal-title":"IEEE Access"},{"key":"10539_CR8","doi-asserted-by":"publisher","first-page":"84229","DOI":"10.1109\/ACCESS.2019.2923806","volume":"7","author":"BT Balamurali","year":"2019","unstructured":"Balamurali BT, Lin KE, Lui S, Chen J-M, Herremans D (2019) Toward robust audio spoofing detection: a detailed comparison of traditional and learned features. IEEE Access 7:84229\u201384241. https:\/\/doi.org\/10.1109\/ACCESS.2019.2923806","journal-title":"IEEE Access"},{"key":"10539_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2020.101132","volume":"65","author":"R Baumann","year":"2021","unstructured":"Baumann R, Malik KM, Javed A, Ball A, Kujawa B, Malik H (2021) Voice spoofing detection corpus for single and multi-order audio replays. Comput Speech Lang 65:101132","journal-title":"Comput Speech Lang"},{"key":"10539_CR10","doi-asserted-by":"crossref","unstructured":"Cai W, Cai D, Liu W, Li G, Li M (2017) counter measures for automatic speaker verification replay spoofing attack: on data augmentation, feature representation, classification and fusion. In INTERSPEECH, pp. 17\u201321","DOI":"10.21437\/Interspeech.2017-906"},{"key":"10539_CR11","unstructured":"Cai W, Doshi A, Valle R (2018) Attacking speaker recognition with deep generative models. CoRR abs\/1801.02384arXiv:1801.02384"},{"issue":"1","key":"10539_CR12","first-page":"11","volume":"5","author":"S Chakroborty","year":"2009","unstructured":"Chakroborty S, Saha G (2009) Improved text-independent speaker identification using fused mfcc & imfcc feature sets based on gaussian filter. Int J Signal Process 5(1):11\u201319","journal-title":"Int J Signal Process"},{"key":"10539_CR13","doi-asserted-by":"crossref","unstructured":"Chen N, Qian Y, Dinkel H, Chen B, Yu K (2015) Robust deep feature for spoofing detection\u2013the sjtu system for asvspoof 2015 challenge. In: Sixteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2015-474"},{"key":"10539_CR15","doi-asserted-by":"publisher","unstructured":"Chen Z, Xie Z, Zhang W, Xu X (2017) ResNet and model fusion for automatic spoofing detection. Interspeech 2017: 102\u2013106. https:\/\/doi.org\/10.21437\/Interspeech.2017-1085","DOI":"10.21437\/Interspeech.2017-1085"},{"key":"10539_CR14","doi-asserted-by":"publisher","unstructured":"Chen X, Zhang Y, Zhu G, Duan Z (2021) UR channel-robust synthetic speech detection system for ASVspoof 2021. In: Proc. 2021 edition of the automatic speaker verification and spoofing counter measures challenge, pp. 75\u201382. https:\/\/doi.org\/10.21437\/ASVSPOOF.2021-12","DOI":"10.21437\/ASVSPOOF.2021-12"},{"key":"10539_CR16","doi-asserted-by":"publisher","unstructured":"Chen F, Deng S, Zheng T, He Y, Han J (2023) Graph-based spectro-temporal dependency modeling for anti-spoofing. In: ICASSP 2023\u20132023 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 1\u20135. https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10096741","DOI":"10.1109\/ICASSP49357.2023.10096741"},{"key":"10539_CR17","doi-asserted-by":"crossref","unstructured":"Chettri B, Kinnunen T, Benetos E (2020) Deep generative variational autoencoding for replay spoof detection in automatic speaker verification","DOI":"10.21437\/Odyssey.2020-48"},{"key":"10539_CR18","doi-asserted-by":"crossref","unstructured":"Chung JS, Nagrani A, Zisserman A (2018) Voxceleb2: Deep speaker recognition. arXiv preprint arXiv:1806.05622","DOI":"10.21437\/Interspeech.2018-1929"},{"key":"10539_CR20","doi-asserted-by":"crossref","unstructured":"Delgado H, Todisco M, Sahidullah M, Evans N, Kinnunen T, Lee KA, Yamagishi J (2018) Asvspoof 2017 version 2.0: meta-data analysis and baseline enhancements. In: Odyssey 2018-The Speaker and Language Recognition Workshop","DOI":"10.21437\/Odyssey.2018-42"},{"key":"10539_CR19","unstructured":"Delgado H, Evans N, Kinnunen T, Lee KA, Liu X, Nautsch A, Patino J, Sahidullah M, Todisco M, Wang X, et al (2021) Asvspoof 2021: automatic speaker verification spoofing and counter measures challenge evaluation plan. arXiv preprint arXiv:2109.00535"},{"key":"10539_CR21","doi-asserted-by":"publisher","unstructured":"Ding S, Zhang Y, Duan Z (2023) Samo: Speaker attractor multi-center one-class learning for voice anti-spoofing. In: ICASSP 2023\u20132023 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 1\u20135. https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10094704","DOI":"10.1109\/ICASSP49357.2023.10094704"},{"key":"10539_CR22","doi-asserted-by":"crossref","unstructured":"Dinkel H, Chen N, Qian Y, Yu K (2017) End-to-end spoofing detection with raw waveform cldnns. In: 2017 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 4860\u20134864","DOI":"10.1109\/ICASSP.2017.7953080"},{"key":"10539_CR23","doi-asserted-by":"crossref","unstructured":"Erg\u00fcnay SK, Khoury E, Lazaridis A, Marcel S (2015) On the vulnerability of speaker verification to realistic voice spoofing. In: 2015 IEEE 7th international conference on biometrics theory, applications and systems (BTAS), pp. 1\u20136. IEEE","DOI":"10.1109\/BTAS.2015.7358783"},{"key":"10539_CR24","doi-asserted-by":"crossref","unstructured":"Font R, Esp\u00edn JM, Cano MJ (2017) Experimental analysis of features for replay attack detection-results on the asvspoof 2017 challenge. In: Interspeech, pp. 7\u201311","DOI":"10.21437\/Interspeech.2017-450"},{"key":"10539_CR25","doi-asserted-by":"publisher","unstructured":"Gerlings J, Shollo A, Constantiou I (2020) Reviewing the need for explainable artificial iintelligence (xAI). arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2012.01007. arXiv:2012.01007","DOI":"10.48550\/ARXIV.2012.01007"},{"key":"10539_CR111","unstructured":"grandviewresearch: voice biometrics market forecast. https:\/\/www.grandviewresearch.com\/industry-analysis\/us-voice-recognition-market. Accessed: May 25 2023"},{"key":"10539_CR26","doi-asserted-by":"publisher","unstructured":"Gunendradasan T, Wickramasinghe B, Le P, Ambikairajah E, Epps J (2018) Detection of replay-spoofing attacks using frequency modulation features. In INTERSPEECH, pp. 636\u2013640. https:\/\/doi.org\/10.21437\/Interspeech.2018-1473","DOI":"10.21437\/Interspeech.2018-1473"},{"key":"10539_CR27","doi-asserted-by":"publisher","unstructured":"Gunendradasan T, Irtza S, Ambikairajah E, Epps J (2019) Transmission line cochlear model based am-fm features for replay attack detection. In: ICASSP 2019 - 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 6136\u20136140. https:\/\/doi.org\/10.1109\/ICASSP.2019.8682771","DOI":"10.1109\/ICASSP.2019.8682771"},{"key":"10539_CR28","doi-asserted-by":"publisher","unstructured":"Hassan F, Javed A (2021) Voice spoofing countermeasure for synthetic speech detection. In: 2021 International conference on artificial intelligence (ICAI), pp. 209\u2013212. https:\/\/doi.org\/10.1109\/ICAI52203.2021.9445238","DOI":"10.1109\/ICAI52203.2021.9445238"},{"key":"10539_CR29","doi-asserted-by":"publisher","first-page":"1813","DOI":"10.1109\/TASLP.2020.2998870","volume":"28","author":"L Huang","year":"2020","unstructured":"Huang L, Pun C-M (2020) Audio replay spoof attack detection by joint segment-based linear filter bank feature extraction and attention-enhanced densenet-bilstm network. IEEE\/ACM Trans Audio Speech Lang Process 28:1813\u20131825","journal-title":"IEEE\/ACM Trans Audio Speech Lang Process"},{"key":"10539_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2021.101199","volume":"68","author":"A Jati","year":"2021","unstructured":"Jati A, Hsu C-C, Pal M, Peri R, AbdAlmageed W, Narayanan S (2021) Adversarial attack and defense strategies for deep speaker recognition systems. Comput Speech Lang 68:101199. https:\/\/doi.org\/10.1016\/j.csl.2021.101199","journal-title":"Comput Speech Lang"},{"key":"10539_CR31","doi-asserted-by":"publisher","DOI":"10.1016\/j.apacoust.2021.108283","volume":"183","author":"A Javed","year":"2021","unstructured":"Javed A, Malik KM, Irtaza A, Malik H (2021) Towards protecting cyber-physical and IoT systems from single-and multi-order voice spoofing attacks. Appl Acoust 183:108283","journal-title":"Appl Acoust"},{"key":"10539_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.116770","volume":"198","author":"A Javed","year":"2022","unstructured":"Javed A, Malik KM, Malik H, Irtaza A (2022) Voice spoofing detector: a unified anti-spoofing framework. Expert Syst Appl 198:116770","journal-title":"Expert Syst Appl"},{"key":"10539_CR33","doi-asserted-by":"crossref","unstructured":"Ji Z, Li Z-Y, Li P, An M, Gao S, Wu D, Zhao F (2017) Ensemble learning for countermeasure of audio replay spoofing attack in asvspoof2017. In: Interspeech, pp. 87\u201391","DOI":"10.21437\/Interspeech.2017-1246"},{"key":"10539_CR34","doi-asserted-by":"crossref","unstructured":"Jose A, Joseph J, Devadhas G, Shinu MM (2018) Influence of filter bank structure on the statistical significance of coefficients in cepstral analysis for acoustic signals. In: Thampi, S.M., Krishnan, S.r., Corchado\u00a0Rodriguez, J.M., Das, S., Wozniak, M., Al-Jumeily, D. (eds.) Advances in signal processing and intelligent recognition systems, Springer, Cham, pp. 91\u2013104","DOI":"10.1007\/978-3-319-67934-1_9"},{"key":"10539_CR38","doi-asserted-by":"crossref","unstructured":"Jung J-w, Shim H-j, Heo H-S, Yu H-J (2019) Replay attack detection with complementary high-resolution information using end-to-end dnn for the asvspoof 2019 challenge. arXiv preprint arXiv:1904.10134","DOI":"10.21437\/Interspeech.2019-1991"},{"key":"10539_CR36","doi-asserted-by":"publisher","unstructured":"Jung J-w, Heo H-S, Tak H, Shim H-j, Chung JS, Lee B-J, Yu H-J, Evans N (2021) AASIST: Audio anti-spoofing using integrated spectro-temporal graph attention networks. arXiv . https:\/\/doi.org\/10.48550\/ARXIV.2110.01200. arXiv:2110.01200","DOI":"10.48550\/ARXIV.2110.01200"},{"key":"10539_CR35","doi-asserted-by":"crossref","unstructured":"Jung J-w, Heo H-S, Tak H, Shim H-j, Chung JS, Lee B-J, Yu H-J, Evans N (2022) Aasist: audio anti-spoofing using integrated spectro-temporal graph attention networks. In: ICASSP 2022-2022 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 6367\u20136371. IEEE","DOI":"10.1109\/ICASSP43922.2022.9747766"},{"key":"10539_CR37","doi-asserted-by":"crossref","unstructured":"Jung J-w, Tak H, Shim H-j, Heo H-S, Lee B-J, Chung S-W, Yu H-J, Evans N, Kinnunen T (2022) Sasv 2022: The first spoofing-aware speaker verification challenge. arXiv preprint arXiv:2203.14732","DOI":"10.21437\/Interspeech.2022-11270"},{"key":"10539_CR39","doi-asserted-by":"publisher","DOI":"10.1017\/ATSIP.2019.21","volume":"9","author":"MR Kamble","year":"2020","unstructured":"Kamble MR, Sailor HB, Patil HA, Li H (2020) Advances in anti-spoofing: from the perspective of asvspoof challenges. APSIPA Trans Signal and Inf Process 9:e2","journal-title":"APSIPA Trans Signal and Inf Process"},{"key":"10539_CR40","doi-asserted-by":"publisher","unstructured":"Kinnunen T, Sahidullah M, Delgado H, Todisco M, Evans N, Yamagishi J, Lee KA (2017a)The asvspoof 2017 challenge: Assessing the limits of replay spoofing attack detection. In: INTERSPEECH. https:\/\/doi.org\/10.21437\/Interspeech.2017-1111","DOI":"10.21437\/Interspeech.2017-1111"},{"key":"10539_CR41","doi-asserted-by":"crossref","unstructured":"Kinnunen TH, Sahidullah M, Falcone M, Costantini L, Hautam\u00e4ki RG, Thomsen DAL, Sarkar AK, Tan Z, Delgado H, Todisco M, Evans NWD, Hautam\u00e4ki V, Lee K-A (2017b) Reddots replayed: a new replay spoofing attack corpus for text-dependent speaker verification research. 2017 IEEE international conference on acoustics, speech and signal processing (ICASSP), 5395\u20135399","DOI":"10.1109\/ICASSP.2017.7953187"},{"key":"10539_CR42","doi-asserted-by":"crossref","unstructured":"Kinnunen T, Sahidullah M, Delgado H, Todisco M, Evans N, Yamagishi J, Lee KA (2017c) The asvspoof 2017 challenge: assessing the limits of replay spoofing attack detection","DOI":"10.21437\/Interspeech.2017-1111"},{"key":"10539_CR43","doi-asserted-by":"crossref","unstructured":"Kinnunen T, Lee KA, Delgado H, Evans N, Todisco M, Sahidullah M, Yamagishi J, Reynolds DA (2018) t-dcf: a detection cost function for the tandem assessment of spoofing counter measures and automatic speaker verification. arXiv preprint arXiv:1804.09618","DOI":"10.21437\/Odyssey.2018-44"},{"key":"10539_CR44","doi-asserted-by":"crossref","unstructured":"Korshunov P, Marcel S, Muckenhirn H, Gon\u00e7alves AR, Mello AS, Violato RV, Simoes FO, Neto MU, de Assis\u00a0Angeloni M, Stuchi JA, et al (2016) Overview of btas 2016 speaker anti-spoofing competition. In: 2016 IEEE 8th international conference on biometrics theory, applications and systems (BTAS), pp. 1\u20136. IEEE","DOI":"10.1109\/BTAS.2016.7791200"},{"key":"10539_CR45","doi-asserted-by":"crossref","unstructured":"Korshunov P, Gon\u00e7alves AR, Violato RP, Sim\u00f5es FO, Marcel S (2018) On the use of convolutional neural networks for speech presentation attack detection. In: 2018 IEEE 4th international conference on identity, security, and behavior analysis (ISBA), pp. 1\u20138. IEEE","DOI":"10.1109\/ISBA.2018.8311474"},{"key":"10539_CR46","doi-asserted-by":"crossref","unstructured":"Kreuk F, Adi Y, Cisse M, Keshet J (2018) Fooling end-to-end speaker verification with adversarial examples. In: 2018 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 1962\u20131966. IEEE","DOI":"10.1109\/ICASSP.2018.8462693"},{"key":"10539_CR47","unstructured":"Kua JMK, Thiruvaran T, Nosratighods M, Ambikairajah E, Epps J (2010) Investigation of spectral centroid magnitude and frequency for speaker recognition. In: Odyssey, p. 7"},{"key":"10539_CR48","doi-asserted-by":"publisher","first-page":"49140","DOI":"10.1109\/ACCESS.2023.3275790","volume":"11","author":"I-Y Kwak","year":"2023","unstructured":"Kwak I-Y, Kwag S, Lee J, Jeon Y, Hwang J, Choi H-J, Yang J-H, Han S-Y, Huh JH, Lee C-H, Yoon JW (2023) Voice spoofing detection through residual network, max feature map, and depthwise separable convolution. IEEE Access 11:49140\u201349152. https:\/\/doi.org\/10.1109\/ACCESS.2023.3275790","journal-title":"IEEE Access"},{"key":"10539_CR49","doi-asserted-by":"crossref","unstructured":"Kwon H, Lee K, Ryu J, Lee J (2023) Audio adversarial example detection using the audio style transfer learning method. IEEE Access","DOI":"10.1109\/ACCESS.2022.3216075"},{"key":"10539_CR50","doi-asserted-by":"crossref","unstructured":"Lai C-I, Abad A, Richmond K, Yamagishi J, Dehak N, King S (2019) Attentive filtering networks for audio replay attack detection. In: ICASSP 2019-2019 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 6316\u20136320. IEEE","DOI":"10.1109\/ICASSP.2019.8682640"},{"key":"10539_CR51","doi-asserted-by":"crossref","unstructured":"Lai C-I, Chen N, Villalba J, Dehak N (2019) Assert: Anti-spoofing with squeeze-excitation and residual networks. arXiv preprint arXiv:1904.01120","DOI":"10.21437\/Interspeech.2019-1794"},{"key":"10539_CR52","doi-asserted-by":"crossref","unstructured":"Lee K-A, Larcher A, Wang G, Kenny P, Br\u00fcmmer N, van Leeuwen DA, Aronowitz H, Kockmann M, Vaquero C, Ma B, Li H, Stafylakis T, Alam MJ, Swart A, P\u00e9rez J (2015) The reddots data collection for speaker recognition. In INTERSPEECH","DOI":"10.21437\/Interspeech.2015-95"},{"key":"10539_CR54","doi-asserted-by":"crossref","unstructured":"Li Z, Shi C, Xie Y, Liu J, Yuan B, Chen Y (2020) Practical adversarial attacks against speaker recognition systems. In: Proceedings of the 21st international workshop on mobile computing systems and applications, pp. 9\u201314","DOI":"10.1145\/3376897.3377856"},{"key":"10539_CR53","doi-asserted-by":"crossref","unstructured":"Li X, Li N, Weng C, Liu X, Su D, Yu D, Meng H (2021) Replay and synthetic speech detection with res2net architecture. In: ICASSP 2021-2021 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 6354\u20136358. IEEE","DOI":"10.1109\/ICASSP39728.2021.9413828"},{"key":"10539_CR55","doi-asserted-by":"publisher","first-page":"141170","DOI":"10.1109\/ACCESS.2020.3013066","volume":"8","author":"L Liu","year":"2020","unstructured":"Liu L, Yang J (2020) Study on feature complementarity of statistics, energy, and principal information for spoofing detection. IEEE Access 8:141170\u2013141181. https:\/\/doi.org\/10.1109\/ACCESS.2020.3013066","journal-title":"IEEE Access"},{"key":"10539_CR56","doi-asserted-by":"crossref","unstructured":"Liu X, Sahidullah M, Kinnunen T (2022) Spoofing-aware speaker verification with unsupervised domain adaptation. arXiv preprint arXiv:2203.10992","DOI":"10.21437\/Odyssey.2022-12"},{"key":"10539_CR57","doi-asserted-by":"publisher","unstructured":"Ma Y, Ren Z, Xu S (2021) RW-Resnet: a novel speech anti-spoofing model using raw waveform. arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2108.05684. arXiv:2108.05684","DOI":"10.48550\/ARXIV.2108.05684"},{"issue":"5","key":"10539_CR58","doi-asserted-by":"publisher","first-page":"982","DOI":"10.1109\/JSTSP.2020.2999828","volume":"14","author":"KM Malik","year":"2020","unstructured":"Malik KM, Javed A, Malik H, Irtaza A (2020) A light-weight replay detection framework for voice controlled IoT devices. IEEE J Sel Top Signal Processing 14(5):982\u2013996","journal-title":"IEEE J Sel Top Signal Processing"},{"issue":"5","key":"10539_CR59","doi-asserted-by":"publisher","first-page":"982","DOI":"10.1109\/JSTSP.2020.2999828","volume":"14","author":"KM Malik","year":"2020","unstructured":"Malik KM, Javed A, Malik H, Irtaza A (2020) A light-weight replay detection framework for voice controlled IoT devices. IEEE J Sel Top Signal Process 14(5):982\u2013996. https:\/\/doi.org\/10.1109\/JSTSP.2020.2999828","journal-title":"IEEE J Sel Top Signal Process"},{"key":"10539_CR60","first-page":"1","volume":"25","author":"A Mittal","year":"2021","unstructured":"Mittal A, Dua M (2021) Automatic speaker verification systems and spoof detection techniques: review and analysis. Int J Speech Technol 25:1\u201330","journal-title":"Int J Speech Technol"},{"key":"10539_CR61","unstructured":"Muda L, Begam M, Elamvazuthi I (2010) Voice recognition algorithms using mel frequency cepstral coefficient (mfcc) and dynamic time warping (dtw) techniques. arXiv preprint arXiv:1003.4083"},{"key":"10539_CR62","doi-asserted-by":"crossref","unstructured":"Nagarsheth P, el Khoury E, Patil K, Garland M (2017) Replay attack detection using dnn for channel discrimination. In INTERSPEECH","DOI":"10.21437\/Interspeech.2017-1377"},{"key":"10539_CR63","doi-asserted-by":"crossref","unstructured":"Nagrani A, Chung JS, Zisserman A (2017) Voxceleb: a large-scale speaker identification dataset. arXiv preprint arXiv:1706.08612","DOI":"10.21437\/Interspeech.2017-950"},{"key":"10539_CR64","doi-asserted-by":"publisher","first-page":"603","DOI":"10.1007\/978-981-10-7245-1_59","volume-title":"Intelligent Computing and Information and Communication","author":"R Naika","year":"2018","unstructured":"Naika R (2018) An overview of automatic speaker verification system. Intelligent computing and information and communication. Springer, Cham, pp 603\u2013610"},{"key":"10539_CR65","doi-asserted-by":"crossref","unstructured":"Novoselov S, Kozlov A, Lavrentyeva G, Simonchik K, Shchemelinin V (2016) Stc anti-spoofing systems for the asvspoof 2015 challenge. In: 2016 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 5475\u20135479. IEEE","DOI":"10.1109\/ICASSP.2016.7472724"},{"key":"10539_CR66","doi-asserted-by":"crossref","unstructured":"Patil HA, Kamble MR (2018) A survey on replay attack detection for automatic speaker verification (asv) system. In: 2018 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC), pp. 1047\u20131053. IEEE","DOI":"10.23919\/APSIPA.2018.8659666"},{"key":"10539_CR67","doi-asserted-by":"crossref","unstructured":"Paul D, Pal M, Saha G (2015) Novel speech features for improved detection of spoofing attacks. In: 2015 annual IEEE India conference (INDICON), pp. 1\u20136. IEEE","DOI":"10.1109\/INDICON.2015.7443805"},{"key":"10539_CR68","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V, Vanderplas J, Passos A, Cournapeau D, Brucher M, Perrot M, Duchesnay E (2011) Scikit-learn: machine learning in Python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"10539_CR69","doi-asserted-by":"publisher","first-page":"686","DOI":"10.1016\/j.jcp.2018.10.045","volume":"378","author":"M Raissi","year":"2019","unstructured":"Raissi M, Perdikaris P, Karniadakis GE (2019) Physics-informed neural networks: a deep learning framework for solving forward and inverse problems involving nonlinear partial differential equations. J Comput phys 378:686\u2013707","journal-title":"J Comput phys"},{"key":"10539_CR70","doi-asserted-by":"crossref","unstructured":"Rajan P, Kinnunen T, Hanilci C, Pohjalainen J, Alku P (2013) Using group delay functions from all-pole models for speaker recognition. In INTERSPEECH, pp. 2489\u20132493. Citeseer","DOI":"10.21437\/Interspeech.2013-416"},{"key":"10539_CR71","unstructured":"Research EM (2023) Voice biometrics market forecast. https:\/\/www.expertmarketresearch.com\/reports\/voice-assistant-application-market. Accessed: May 25 2023"},{"key":"10539_CR72","unstructured":"Rostami AM, Homayounpour MM, Nickabadi A (2021) Efficient attention branch network with combined loss function for automatic speaker verification spoof detection. arXiv preprint arXiv:2109.02051"},{"key":"10539_CR74","doi-asserted-by":"crossref","unstructured":"Sahidullah M, Delgado H, Todisco M, Yu H, Kinnunen T, Evans N, Tan Z-H (2016) Integrated spoofing counter measures and automatic speaker verification: an evaluation on asvspoof 2015","DOI":"10.21437\/Interspeech.2016-1280"},{"key":"10539_CR73","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1007\/978-3-319-92627-8_15","volume-title":"Handbook of biometric anti-spoofing","author":"M Sahidullah","year":"2019","unstructured":"Sahidullah M, Delgado H, Todisco M, Kinnunen T, Evans N, Yamagishi J, Lee K-A (2019) Introduction to voice presentation attack detection and recent advances. Handbook of biometric anti-spoofing. Springer, New York, pp 321\u2013361"},{"issue":"1","key":"10539_CR75","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1109\/TASLP.2017.2761547","volume":"26","author":"Y Saito","year":"2018","unstructured":"Saito Y, Takamichi S, Saruwatari H (2018) Statistical parametric speech synthesis incorporating generative adversarial networks. IEEE\/ACM Trans Audio Speech Lang Process 26(1):84\u201396. https:\/\/doi.org\/10.1109\/TASLP.2017.2761547","journal-title":"IEEE\/ACM Trans Audio Speech Lang Process"},{"key":"10539_CR76","doi-asserted-by":"publisher","unstructured":"Saranya MS, Padmanabhan R, Murthy HA (2018) Replay attack detection in speaker verification using non-voiced segments and decision level feature switching. In: 2018 International conference on signal processing and communications (SPCOM), pp. 332\u2013336. https:\/\/doi.org\/10.1109\/SPCOM.2018.8724469","DOI":"10.1109\/SPCOM.2018.8724469"},{"key":"10539_CR77","doi-asserted-by":"publisher","unstructured":"Saratxaga I, Hern\u00e1ez I, Pucher M, Sainz I (2012) Perceptual importance of the phase related information in speech. In: INTERSPEECH, vol. 2. https:\/\/doi.org\/10.21437\/Interspeech.2012-411","DOI":"10.21437\/Interspeech.2012-411"},{"key":"10539_CR78","doi-asserted-by":"publisher","unstructured":"Suthokumar G, Sriskandaraja K, Sethu V, Wijenayake C, Ambikairajah E (2019) Phoneme specific modelling and scoring techniques for anti spoofing system. In: ICASSP 2019 - 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 6106\u20136110. https:\/\/doi.org\/10.1109\/ICASSP.2019.8682411","DOI":"10.1109\/ICASSP.2019.8682411"},{"key":"10539_CR79","unstructured":"Szegedy C, Zaremba W, Sutskever I, Bruna J, Erhan D, Goodfellow I, Fergus R (2014) Intriguing properties of neural networks"},{"key":"10539_CR80","doi-asserted-by":"publisher","unstructured":"Tak H, Kamble M, Patino J, Todisco M, Evans N (2021) RawBoost: a raw data boosting and augmentation method applied to automatic speaker verification anti-spoofing. arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2111.04433. arXiv:2111.04433","DOI":"10.48550\/ARXIV.2111.04433"},{"key":"10539_CR81","doi-asserted-by":"publisher","unstructured":"Tak H, Jung J-w, Patino J, Kamble M, Todisco M, Evans N (2021) End-to-end spectro-temporal graph attention networks for speaker verification anti-spoofing and speech deepfake detection. arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2107.12710. arXiv:2107.12710","DOI":"10.48550\/ARXIV.2107.12710"},{"key":"10539_CR82","doi-asserted-by":"publisher","unstructured":"Tak H, Jung J-w, Patino J, Todisco M, Evans N (2021) Graph attention networks for anti-spoofing. arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2104.03654. arXiv:2104.03654","DOI":"10.48550\/ARXIV.2104.03654"},{"issue":"21","key":"10539_CR83","doi-asserted-by":"publisher","first-page":"32725","DOI":"10.1007\/s11042-021-11235-x","volume":"80","author":"CB Tan","year":"2021","unstructured":"Tan CB, Hijazi MHA, Khamis N, Zainol Z, Coenen F, Gani A et al (2021) A survey on presentation attack detection for automatic speaker verification systems: state-of-the-art, taxonomy, issues and future direction. Multimed Tools Appl 80(21):32725\u201332762","journal-title":"Multimed Tools Appl"},{"key":"10539_CR84","doi-asserted-by":"crossref","unstructured":"Tapkir PA, Patil HA (2018) Significance of teager energy operator phase for replay spoof detection. In: 2018 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC), pp. 1951\u20131956. IEEE","DOI":"10.23919\/APSIPA.2018.8659664"},{"key":"10539_CR85","doi-asserted-by":"crossref","unstructured":"Tapkir PA, Patil AT, Shah N, Patil HA (2018) Novel spectral root cepstral features for replay spoof detection. In: 2018 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC), pp. 1945\u20131950. IEEE","DOI":"10.23919\/APSIPA.2018.8659746"},{"key":"10539_CR86","doi-asserted-by":"crossref","unstructured":"Teng Z, Fu Q, White J, Powell ME, Schmidt DC (2022) Sa-sasv: An end-to-end spoof-aggregated spoofing-aware speaker verification system. arXiv preprint arXiv:2203.06517","DOI":"10.21437\/Interspeech.2022-11029"},{"key":"10539_CR87","doi-asserted-by":"publisher","first-page":"516","DOI":"10.1016\/j.csl.2017.01.001","volume":"45","author":"M Todisco","year":"2017","unstructured":"Todisco M, Delgado H, Evans NWD (2017) Constant q cepstral coefficients: a spoofing countermeasure for automatic speaker verification. Comput Speech Lang 45:516\u2013535","journal-title":"Comput Speech Lang"},{"key":"10539_CR88","doi-asserted-by":"crossref","unstructured":"Todisco M, Wang X, Vestman V, Sahidullah M, Delgado H, Nautsch A, Yamagishi J, Evans N, Kinnunen T, Lee KA (2019) Asvspoof 2019: future horizons in spoofed and fake audio detection. arXiv preprint arXiv:1904.05441","DOI":"10.21437\/Interspeech.2019-2249"},{"issue":"6","key":"10539_CR89","doi-asserted-by":"publisher","first-page":"1684","DOI":"10.1109\/TMM.2012.2199972","volume":"14","author":"X Valero","year":"2012","unstructured":"Valero X, Alias F (2012) Gammatone cepstral coefficients: biologically inspired features for non-speech audio classification. IEEE Trans Multimedia 14(6):1684\u20131689","journal-title":"IEEE Trans Multimedia"},{"key":"10539_CR91","doi-asserted-by":"publisher","unstructured":"Wang Q, Lin X, Zhou M, Chen Y, Wang C, Li Q, Luo X (2019) Voicepop: a pop noise based anti-spoofing system for voice authentication on smartphones. In: IEEE INFOCOM 2019\u2014IEEE conference on computer communications, pp. 2062\u20132070. https:\/\/doi.org\/10.1109\/INFOCOM.2019.8737422","DOI":"10.1109\/INFOCOM.2019.8737422"},{"key":"10539_CR90","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2020.101114","volume":"64","author":"X Wang","year":"2020","unstructured":"Wang X, Yamagishi J, Todisco M, Delgado H, Nautsch A, Evans N, Sahidullah M, Vestman V, Kinnunen T, Lee KA et al (2020) Asvspoof 2019: a large-scale public database of synthesized, converted and replayed speech. Comput Speech Lang 64:101114","journal-title":"Comput Speech Lang"},{"key":"10539_CR92","doi-asserted-by":"crossref","unstructured":"Witkowski M, Kacprzak S, Zelasko P, Kowalczyk K, Galka J (2017) Audio replay attack detection using high-frequency features. In Interspeech, pp. 27\u201331","DOI":"10.21437\/Interspeech.2017-776"},{"key":"10539_CR93","doi-asserted-by":"crossref","unstructured":"Wong E, Sridharan S (2001) Comparison of linear prediction cepstrum coefficients and mel-frequency cepstrum coefficients for language identification. In: Proceedings of 2001 international symposium on intelligent multimedia, video and speech processing. ISIMP 2001 (IEEE Cat. No. 01EX489), pp. 95\u201398. IEEE","DOI":"10.1109\/ISIMP.2001.925340"},{"key":"10539_CR94","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1016\/j.specom.2014.10.005","volume":"66","author":"Z Wu","year":"2015","unstructured":"Wu Z, Evans N, Kinnunen T, Yamagishi J, Alegre F, Li H (2015) Spoofing and counter measures for speaker verification: a survey. Speech Commun 66:130\u2013153","journal-title":"Speech Commun"},{"key":"10539_CR98","doi-asserted-by":"crossref","unstructured":"Wu Z, Khodabakhsh A, Demiroglu C, Yamagishi J, Saito D, Toda T, King S (2015) Sas: A speaker verification spoofing database containing diverse attacks. In: 2015 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 4440\u20134444. IEEE","DOI":"10.1109\/ICASSP.2015.7178810"},{"key":"10539_CR99","doi-asserted-by":"crossref","unstructured":"Wu Z, Kinnunen T, Evans N, Yamagishi J, Hanil\u00e7i C, Sahidullah M, Sizov A (2015) Asvspoof 2015: the first automatic speaker verification spoofing and counter measures challenge. In: Sixteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2015-462"},{"issue":"4","key":"10539_CR96","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1109\/JSTSP.2017.2671435","volume":"11","author":"Z Wu","year":"2017","unstructured":"Wu Z, Yamagishi J, Kinnunen T, Hanil\u00e7i C, Sahidullah M, Sizov A, Evans N, Todisco M, Delgado H (2017) Asvspoof: the automatic speaker verification spoofing and counter measures challenge. IEEE J Sel Top Signal Process 11(4):588\u2013604. https:\/\/doi.org\/10.1109\/JSTSP.2017.2671435","journal-title":"IEEE J Sel Top Signal Process"},{"issue":"4","key":"10539_CR97","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1109\/JSTSP.2017.2671435","volume":"11","author":"Z Wu","year":"2017","unstructured":"Wu Z, Yamagishi J, Kinnunen T, Hanil\u00e7i C, Sahidullah M, Sizov A, Evans N, Todisco M, Delgado H (2017) Asvspoof: the automatic speaker verification spoofing and counter measures challenge. IEEE J Sel Top Signal Process 11(4):588\u2013604","journal-title":"IEEE J Sel Top Signal Process"},{"issue":"11","key":"10539_CR95","doi-asserted-by":"publisher","first-page":"2884","DOI":"10.1109\/TIFS.2018.2833032","volume":"13","author":"X Wu","year":"2018","unstructured":"Wu X, He R, Sun Z, Tan T (2018) A light cnn for deep face representation with noisy labels. IEEE Trans Inf Forensics Secur 13(11):2884\u20132896","journal-title":"IEEE Trans Inf Forensics Secur"},{"key":"10539_CR100","doi-asserted-by":"publisher","unstructured":"Wu Z, Das RK, Yang J, Li H (2020) Light convolutional neural network with feature genuinization for detection of synthetic speech attacks. arXiv. https:\/\/doi.org\/10.48550\/ARXIV.2009.09637. arXiv:2009.09637","DOI":"10.48550\/ARXIV.2009.09637"},{"key":"10539_CR101","doi-asserted-by":"crossref","unstructured":"Wu H, Liu S, Meng H, Lee H-y (2020a) Defense against adversarial attacks on spoofing counter measures of ASV","DOI":"10.1109\/ICASSP40776.2020.9053643"},{"key":"10539_CR102","doi-asserted-by":"crossref","unstructured":"Wu H, Liu AT, Lee H-y (2020b) Defense for black-box attacks on anti-spoofing models by self-Supervised learning","DOI":"10.21437\/Interspeech.2020-2026"},{"key":"10539_CR103","doi-asserted-by":"crossref","unstructured":"Xie Y, Li Z, Shi C, Liu J, Chen Y, Yuan B (2021) Enabling fast and universal audio adversarial attack using generative model. In: Proceedings of the AAAI conference on artificial intelligence, vol. 35, pp. 14129\u201314137","DOI":"10.1609\/aaai.v35i16.17663"},{"key":"10539_CR104","doi-asserted-by":"publisher","unstructured":"Xue J, Fan C, Yi J, Wang C, Wen Z, Zhang D, Lv Z (2023) Learning from yourself: a self-distillation method for fake speech detection. In: ICASSP 2023 - 2023 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 1\u20135. https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10096837","DOI":"10.1109\/ICASSP49357.2023.10096837"},{"key":"10539_CR105","doi-asserted-by":"publisher","DOI":"10.1016\/j.dsp.2019.02.018","author":"J Yang","year":"2019","unstructured":"Yang J, Das RK (2019) Low frequency frame-wise normalization over constant-q transform for playback speech detection. Digit Signal Process. https:\/\/doi.org\/10.1016\/j.dsp.2019.02.018","journal-title":"Digit Signal Process"},{"key":"10539_CR106","doi-asserted-by":"publisher","DOI":"10.1016\/j.dsp.2019.102622","volume":"97","author":"J Yang","year":"2019","unstructured":"Yang J, Das R (2019) Long-term high frequency features for synthetic speech detection. Digit Signal Process 97:102622. https:\/\/doi.org\/10.1016\/j.dsp.2019.102622","journal-title":"Digit Signal Process"},{"issue":"12","key":"10539_CR107","doi-asserted-by":"publisher","first-page":"2373","DOI":"10.1109\/TASLP.2019.2946897","volume":"27","author":"J Yang","year":"2019","unstructured":"Yang J, Das RK, Zhou N (2019) Extraction of octave spectra information for spoofing attack detection. IEEE\/ACM Trans Audio Speech Lang Process 27(12):2373\u20132384. https:\/\/doi.org\/10.1109\/TASLP.2019.2946897","journal-title":"IEEE\/ACM Trans Audio Speech Lang Process"},{"key":"10539_CR108","doi-asserted-by":"publisher","first-page":"937","DOI":"10.1109\/LSP.2021.3076358","volume":"28","author":"Y Zhang","year":"2021","unstructured":"Zhang Y, Jiang F, Duan Z (2021) One-class learning towards synthetic voice spoofing detection. IEEE Signal Process Lett 28:937\u2013941. https:\/\/doi.org\/10.1109\/LSP.2021.3076358","journal-title":"IEEE Signal Processing Letters"},{"key":"10539_CR109","doi-asserted-by":"crossref","unstructured":"Zhang Y, Zhu G, Duan Z (2022) A probabilistic fusion framework for spoofing aware speaker verification. arXiv preprint arXiv:2202.05253","DOI":"10.21437\/Odyssey.2022-11"},{"key":"10539_CR110","doi-asserted-by":"crossref","unstructured":"Zhou X, Garcia-Romero D, Duraiswami R, Espy-Wilson C, Shamma S (2011) Linear versus mel frequency cepstral coefficients for speaker recognition. In: 2011 IEEE workshop on automatic speech recognition & understanding, pp. 559\u2013564. IEEE","DOI":"10.1109\/ASRU.2011.6163888"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-023-10539-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-023-10539-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-023-10539-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T03:15:20Z","timestamp":1729653320000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-023-10539-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,28]]},"references-count":111,"journal-issue":{"issue":"S1","published-print":{"date-parts":[[2023,10]]}},"alternative-id":["10539"],"URL":"https:\/\/doi.org\/10.1007\/s10462-023-10539-8","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-2557691\/v1","asserted-by":"object"}]},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,6,28]]},"assertion":[{"value":"13 June 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 June 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}