{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,10]],"date-time":"2025-11-10T15:04:58Z","timestamp":1762787098268,"version":"build-2065373602"},"reference-count":125,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T00:00:00Z","timestamp":1760313600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T00:00:00Z","timestamp":1760313600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s10772-025-10217-w","type":"journal-article","created":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T14:44:04Z","timestamp":1760366644000},"page":"871-901","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Review and analysis of audio spoof countermeasures: an attack perspective"],"prefix":"10.1007","volume":"28","author":[{"given":"Nidhi","family":"Chakravarty","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohit","family":"Dua","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,10,13]]},"reference":[{"key":"10217_CR1","doi-asserted-by":"crossref","unstructured":"Al-Karawi, K. A., Abdelwahab, M. M., & Alenizi, A. S. (2025). Comprehensive review of automatic speaker verification with spoofing detection techniques attacks. International Journal of Speech Technology, 1\u201324.","DOI":"10.1007\/s10772-025-10203-2"},{"key":"10217_CR2","doi-asserted-by":"crossref","unstructured":"Alali, A., & Theodorakopoulos, G. (2025). Partial fake speech attacks in the real world using deepfake audio. Journal of Cybersecurity and Privacy, 5(1), 6.","DOI":"10.3390\/jcp5010006"},{"key":"10217_CR3","doi-asserted-by":"crossref","unstructured":"Ali, M., Sabir, A., & Hassan, M. (2021). Fake audio detection using hierarchical representations learning and spectrogram features. In 2021 International conference on robotics and automation in industry (ICRAI) (pp. 1\u20136).","DOI":"10.1109\/ICRAI54018.2021.9651401"},{"key":"10217_CR4","doi-asserted-by":"crossref","unstructured":"Aljasem, M., et al. (2021). Secure automatic speaker verification (SASV) system through sm-ALTP features and asymmetric bagging. IEEE Transactions on Information Forensics and Security, 16, 3524\u20133537.","DOI":"10.1109\/TIFS.2021.3082303"},{"key":"10217_CR5","doi-asserted-by":"crossref","unstructured":"Almutairi, Z., & Elgibreen, H. (2022). A review of modern audio deepfake detection methods: Challenges and future directions. Algorithms, 15(5), 155.","DOI":"10.3390\/a15050155"},{"key":"10217_CR6","unstructured":"Altuncu, E., Franqueira, V. N. L., & Li, S. (2022). Deepfake: Definitions, performance metrics and standards, datasets and benchmarks, and a meta-review. ArXiv Prepr, arXiv2208(10913)."},{"key":"10217_CR7","doi-asserted-by":"crossref","unstructured":"Anjum, Z. K., & Swamy, R. K. (2017). Spoofing and countermeasures for speaker verification: A review. In 2017 international conference on wireless communications, signal processing and networking (WiSPNET) (pp. 467\u2013471).","DOI":"10.1109\/WiSPNET.2017.8299800"},{"key":"10217_CR8","unstructured":"Aravind, P. R., Nechiyil, U., & Paramparambath, N. (2020). Audio spoofing verification using deep convolutional neural networks by transfer learning. ArXiv Prepr, arXiv2008(3464)."},{"key":"10217_CR9","doi-asserted-by":"crossref","unstructured":"Arif, T., Javed, A., Alhameed, M., Jeribi, F., & Tahir, A. (2021). Voice spoofing countermeasure for logical access attacks detection. IEEE Access, 9, 162857\u2013162868.","DOI":"10.1109\/ACCESS.2021.3133134"},{"key":"10217_CR10","doi-asserted-by":"crossref","unstructured":"Ba, Z., et al. (2023). Transferring audio deepfake detection capability across languages. In Proceedings of the ACM Web Conference 2023 (pp. 2033\u20132044).","DOI":"10.1145\/3543507.3583222"},{"key":"10217_CR11","doi-asserted-by":"crossref","unstructured":"Baumann, R., Malik, K. M., Javed, A., Ball, A., Kujawa, B., & Malik, H. (2021). Voice spoofing detection corpus for single and multi-order audio replays. Computer Speech and Language, 65, 101132.","DOI":"10.1016\/j.csl.2020.101132"},{"key":"10217_CR12","doi-asserted-by":"crossref","unstructured":"Bharath, K. P., & Kumar, M. R. (2022). Replay spoof detection for speaker verification system using magnitude-phase-instantaneous frequency and energy features. Multimedia Tools and Applications, 81(27), 39343\u201339366.","DOI":"10.1007\/s11042-022-12380-7"},{"key":"10217_CR13","doi-asserted-by":"crossref","unstructured":"Cai, W., Wu, H., Cai, D., & Li, M. (2019). The DKU replay detection system for the ASVspoof 2019 challenge: On data augmentation, feature representation, classification, and fusion. arXiv Prepr. arXiv1907.02663.","DOI":"10.21437\/Interspeech.2019-1230"},{"key":"10217_CR14","doi-asserted-by":"crossref","unstructured":"Cai, Z., Wang, W., & Li, M. (2023). Waveform boundary detection for partially spoofed audio. In 2023 IEEE international conference on acoustics, speech and signal processing (ICASSP 2023) (pp. 1\u20135).","DOI":"10.1109\/ICASSP49357.2023.10094774"},{"key":"10217_CR15","doi-asserted-by":"crossref","unstructured":"Chadha, A., Abdullah, A., Angeline, L., & Sivanesan, S. (2021). A review on state-of-the-art automatic speaker verification system from spoofing and anti-spoofing perspective. Indian Journal of Science and Technology, 14(40), 3026\u20133050.","DOI":"10.17485\/IJST\/v14i40.1279"},{"key":"10217_CR16","doi-asserted-by":"crossref","unstructured":"Chaiwongyen, A., Songsriboonsit, N., Duangpummet, S., Karnjana, J., Kongprawechnon, W., & Unoki, M. (2022). Contribution of timbre and shimmer features to deepfake speech detection. In 2022 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC 2022) (pp. 97\u2013103).","DOI":"10.23919\/APSIPAASC55919.2022.9980281"},{"key":"10217_CR17","doi-asserted-by":"crossref","unstructured":"Chen, X., Zhang, Y., Zhu, G., & Duan, Z. (2021). UR channel-robust synthetic speech detection system for ASVspoof 2021. ArXiv Prepr, arXiv2107(12018).","DOI":"10.21437\/ASVSPOOF.2021-12"},{"key":"10217_CR18","doi-asserted-by":"crossref","unstructured":"Chen, Z., Xie, Z., Zhang, W., & Xu, X. (2017). ResNet and Model fusion for automatic spoofing detection. In Interspeech 2017.","DOI":"10.21437\/Interspeech.2017-1085"},{"key":"10217_CR19","doi-asserted-by":"crossref","unstructured":"Cheng, H., Li, K., Ye, L., & Wang, J. (2024). EnvFake: An initial environmental-fake audio dataset for scene-consistency detection. In  IEEE 14th international symposium on Chinese spoken language processing (ISCSLP 2024) (pp. 81\u201385).","DOI":"10.1109\/ISCSLP63861.2024.10799995"},{"key":"10217_CR20","doi-asserted-by":"crossref","unstructured":"Chintha, A., et al. (2020). Recurrent convolutional structures for audio spoof and video deepfake detection. IEEE Journal of Selected Topics in Signal Processing, 14(5), 1024\u20131037.","DOI":"10.1109\/JSTSP.2020.2999185"},{"key":"10217_CR21","doi-asserted-by":"crossref","unstructured":"Dawood, H., Saleem, S., Hassan, F., & Javed, A. (2022). A robust voice spoofing detection system using novel CLS-LBP features and LSTM. Journal of King Saud University Information Sciences","DOI":"10.1016\/j.jksuci.2022.02.024"},{"key":"10217_CR22","doi-asserted-by":"publisher","unstructured":"de Luis-Garc\u0131\u0301a, R., Alberola-L\u00f3pez, C., Aghzout, O., & Ruiz-Alzola, J. (2003). Biometric identification systems. Signal Processing, 83(12), 2539\u20132557. https:\/\/doi.org\/10.1016\/j.sigpro.2003.08.001","DOI":"10.1016\/j.sigpro.2003.08.001"},{"key":"10217_CR23","unstructured":"Delgado, H., et al. (2021). Asvspoof, 2021: Automatic speaker verification spoofing and countermeasures challenge evaluation plan. ArXiv Prepr, arXiv2109(535)."},{"key":"10217_CR24","doi-asserted-by":"crossref","unstructured":"Dixit, A., Kaur, N., & Kingra, S. (2023). Review of audio deepfake detection techniques: Issues and prospects. Expert Systems, e13322.","DOI":"10.1111\/exsy.13322"},{"key":"10217_CR25","doi-asserted-by":"crossref","unstructured":"Doan, T.-P., Nguyen-Vu, L., Jung, S., & Hong, K. (2023). BTS-E: Audio deepfake detection using breathing-talking-silence encoder. In 2023 IEEE international conference on acoustics, speech and signal processing (ICASSP 2023) (pp. 1\u20135).","DOI":"10.1109\/ICASSP49357.2023.10095927"},{"key":"10217_CR26","doi-asserted-by":"publisher","unstructured":"Dua, M., Jain, C., & Kumar, S. (2021, Feb). LSTM and CNN based ensemble approach for spoof detection task in automatic speaker verification systems.  Journal of Ambient Intelligence and Humanized Computing, 1\u201316. https:\/\/doi.org\/10.1007\/s12652-021-02960-0","DOI":"10.1007\/s12652-021-02960-0"},{"key":"10217_CR27","doi-asserted-by":"publisher","unstructured":"Dua, M., Sadhu, A., Jindal, A., & Mehta, R. (2022). A hybrid noise robust model for multireplay attack detection in automatic speaker verification systems. Biomedical Signal Processing and Control, 74, 103517. https:\/\/doi.org\/10.1016\/j.bspc.2022.103517","DOI":"10.1016\/j.bspc.2022.103517"},{"key":"10217_CR28","doi-asserted-by":"crossref","unstructured":"Fathan, A., Alam, J., & Kang, W. H. (2022). Mel-spectrogram image-based end-to-end audio Deepfake detection under channel-mismatched conditions. In 2022 IEEE international conference on multimedia and Expo (ICME) (pp. 1\u20136).","DOI":"10.1109\/ICME52920.2022.9859621"},{"key":"10217_CR29","doi-asserted-by":"crossref","unstructured":"Fitzgibbon, C., Sankar, A., & Roedig, U. (2024). Do synthetic voices have emotions? Exploring emotional cues for spoofed speech detection. In 2024 Cyber research conference-Ireland (Cyber-RCI) (pp. 1\u20138).","DOI":"10.1109\/Cyber-RCI60769.2024.10939933"},{"key":"10217_CR30","doi-asserted-by":"crossref","unstructured":"Gambhir, J. H., & Patil, V. V. (2021). A review on speech authentication and speaker verification methods. In 2021 Fourth international conference on microelectronics, signals & systems (ICMSS) (pp. 1\u20136).","DOI":"10.1109\/ICMSS53060.2021.9673603"},{"key":"10217_CR31","doi-asserted-by":"crossref","unstructured":"Gao, Y., Lian, J., Raj, B., & Singh, R. (2021). Detection and evaluation of human and machine generated speech in spoofing attacks on automatic speaker verification systems. In 2021 IEEE spoken language technology workshop (SLT) pp. 544\u2013551.","DOI":"10.1109\/SLT48900.2021.9383558"},{"key":"10217_CR32","doi-asserted-by":"crossref","unstructured":"Ge, W., Patino, J., Todisco, M., & Evans, N. (2021). Raw differentiable architecture search for speech deepfake and spoofing detection. ArXiv Prepr, arXiv2107(12212).","DOI":"10.21437\/ASVSPOOF.2021-4"},{"key":"10217_CR33","unstructured":"German, R., & Barber, K. S. Current biometric adoption and trends. Univ. Texas Austin. Retrieved from identity. utexas. edu\/assets\/uploads\/publications\/Current-Biometric-Adoption-and-Trends. pdf, 2017."},{"key":"10217_CR34","doi-asserted-by":"crossref","unstructured":"Gomez-Alanis, A., Peinado, A. M., Gonzalez, J. A., & Gomez, A. M. (2019a). A gated recurrent convolutional neural network for robust spoofing detection. IEEE\/ACM Transactions on Audio, Speech and Language Processing, 27(12), 1985\u20131999.","DOI":"10.1109\/TASLP.2019.2937413"},{"key":"10217_CR35","doi-asserted-by":"crossref","unstructured":"Gomez-Alanis, A., Peinado, A. M., Gonzalez, J. A., & Gomez, A. M. (2019b). A light convolutional GRU-RNN deep feature extractor for ASV spoofing detection. In Proceedings of Interspeech (Vol. 2019), (pp. 1068\u20131072).","DOI":"10.21437\/Interspeech.2019-2212"},{"key":"10217_CR36","doi-asserted-by":"crossref","unstructured":"Gong, Y., Yang, J., & Poellabauer, C. (2020). Detecting replay attacks using multi-channel audio: A neural network-based method. Signal Processing Letters","DOI":"10.1109\/LSP.2020.2996908"},{"key":"10217_CR37","doi-asserted-by":"crossref","unstructured":"Gunendradasan, T., Irtza, S., Ambikairajah, E., & Epps, J. (2019). Transmission line cochlear model based AM-FM features for replay attack detection. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019)","DOI":"10.1109\/ICASSP.2019.8682771"},{"key":"10217_CR38","doi-asserted-by":"crossref","unstructured":"Gunendradasan, T., Wickramasinghe, B., Le, P. N., Ambikairajah, E., & Epps, J. (2018). Detection of replay-spoofing attacks using frequency modulation features. Interspeech, 636\u2013640.","DOI":"10.21437\/Interspeech.2018-1473"},{"key":"10217_CR39","doi-asserted-by":"crossref","unstructured":"Halpern, B. M., Kelly, F., van Son, R., & Alexander, A. (2020). Residual networks for resisting noise: Analysis of an embeddings-based spoofing countermeasure In Odyssey: The speaker and language recognition workshop","DOI":"10.21437\/Odyssey.2020-46"},{"key":"10217_CR40","doi-asserted-by":"crossref","unstructured":"Hanifa, R. M., Isa, K., & Mohamad, S. (2021). A review on speaker recognition: Technology and challenges. Computers and Electrical Engineering, 90, 107005.","DOI":"10.1016\/j.compeleceng.2021.107005"},{"key":"10217_CR41","doi-asserted-by":"crossref","unstructured":"Hassan, F., & Javed, A. (2021). Voice spoofing countermeasure for synthetic speech detection. In 2021 International conference on artificial intelligence (ICAI) (pp. 209\u2013212).","DOI":"10.1109\/ICAI52203.2021.9445238"},{"key":"10217_CR42","doi-asserted-by":"crossref","unstructured":"Hemavathi, R., & Kumaraswamy, R. (2021). Voice conversion spoofing detection by exploring artifacts estimates (Vol. 80, pp. 23561\u201323580). Springer.","DOI":"10.1007\/s11042-020-10212-0"},{"key":"10217_CR43","doi-asserted-by":"crossref","unstructured":"Huang, L., Gan, Y., & Ye, H. (2019). Audio-replay attacks spoofing detection for automatic Speaker verification system. In 2019 IEEE international conference on artificial intelligence and computer applications (ICAICA) (pp. 392\u2013396).","DOI":"10.1109\/ICAICA.2019.8873465"},{"key":"10217_CR44","doi-asserted-by":"crossref","unstructured":"Huang, L., & Pun, C.-M. (2019). Audio replay spoof attack detection using segment-based hybrid feature and densenet-LSTM network. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019) (pp. 2567\u20132571).","DOI":"10.1109\/ICASSP.2019.8682573"},{"key":"10217_CR45","doi-asserted-by":"crossref","unstructured":"Huang, L., & Pun, C.-M. (2020). Audio replay spoof attack detection by joint segment-based linear filter bank feature extraction and attention-enhanced DenseNet-BiLSTM network. IEEE\/ACM Transactions on Audio, Speech and Lang uage Processing, 28, 1813\u20131825.","DOI":"10.1109\/TASLP.2020.2998870"},{"key":"10217_CR46","unstructured":"Huang, L., & Zhao, J. (2021). Audio replay spoofing attack detection using deep learning feature and long-short-term memory recurrent neural network. In AIIPCC 2021, The secondinternational conference on artificial intelligence, information processing and cloud computing (pp. 1\u20135)."},{"key":"10217_CR47","doi-asserted-by":"crossref","unstructured":"Ilyas, H., Javed, A., & Malik, K. M. (2023). AVFakeNet: A unified end-to-end dense swin transformer deep learning model for audio-visual deepfakes detection. Applied Soft Computing 136, 110124.","DOI":"10.1016\/j.asoc.2023.110124"},{"key":"10217_CR48","doi-asserted-by":"crossref","unstructured":"Irum, A., & Salman, A. (2019). Speaker verification using deep neural networks: A. International Journal of Machine Learning and Computing, 9(1).","DOI":"10.18178\/ijmlc.2019.9.1.760"},{"key":"10217_CR49","doi-asserted-by":"crossref","unstructured":"Javed, A., Malik, K. M., Irtaza, A., & Malik, H. (2021). Towards protecting cyber-physical and IoT systems from single-and multi-order voice spoofing attacks. Applied Acoustics, 183, 108283.","DOI":"10.1016\/j.apacoust.2021.108283"},{"key":"10217_CR50","doi-asserted-by":"crossref","unstructured":"Ji, Z., et al. (2017). Ensemble learning for countermeasure of audio replay spoofing attack in ASVspoof2017. In Interspeech 2017.","DOI":"10.21437\/Interspeech.2017-1246"},{"key":"10217_CR51","doi-asserted-by":"crossref","unstructured":"Joshi, S., & Dua, M. (2022). LSTM-GTCC based approach for audio spoof detection. In 2022 International conference on machine learning, big data, cloud and parallel computing (COM-IT-CON) (Vol. 1, pp. 656\u2013661).","DOI":"10.1109\/COM-IT-CON54601.2022.9850820"},{"key":"10217_CR52","doi-asserted-by":"crossref","unstructured":"Joshi, S., & Dua, M. (2023). Multi-order replay attack detection using enhanced feature extraction and deep learning classification. In Proceedings of international conference on recent trends in computing (ICRTC 2022 ) (pp. 739\u2013745).","DOI":"10.1007\/978-981-19-8825-7_63"},{"key":"10217_CR53","doi-asserted-by":"crossref","unstructured":"Jung, J., Heo, H.-S., Kim, J., Shim, H., & Yu, H.-J. (2019). Rawnet: Advanced end-to-end deep neural network using raw waveforms for text-independent speaker verification. arXiv Prepr. arXiv1904.08104.","DOI":"10.21437\/Interspeech.2019-1982"},{"key":"10217_CR54","doi-asserted-by":"crossref","unstructured":"Jung, J., Shim, H., Heo, H.-S., & Yu, H.-J. (2019). Replay attack detection with complementary high-resolution information using end-to-end DNN for the ASVspoof 2019 challenge. arXiv Prepr. arXiv1904.10134.","DOI":"10.21437\/Interspeech.2019-1991"},{"key":"10217_CR55","doi-asserted-by":"crossref","unstructured":"Kawa, P., Plata, M., Czuba, M., Szyma\u0144ski, P., & Syga, P. (2023). Improved DeepFake detection using whisper features. ArXiv Prepr, arXiv2306(1428).","DOI":"10.21437\/Interspeech.2023-1537"},{"key":"10217_CR56","doi-asserted-by":"crossref","unstructured":"Kawa, P., Plata, M., & Syga, P. (2022). Specrnet: Towards faster and more accessible audio deepfake detection. In 2022 IEEE international conference on trust, security and privacy in computing and communications (TrustCom) (pp. 792\u2013799).","DOI":"10.1109\/TrustCom56396.2022.00111"},{"key":"10217_CR57","doi-asserted-by":"crossref","unstructured":"Khan, A., Malik, K. M., Ryan, J., & Saravanan, M. (2023). Voice spoofing attacks and countermeasures: A systematic review, analysis, and experimental evaluation.Computer Security and Reliability.","DOI":"10.21203\/rs.3.rs-2557691\/v1"},{"key":"10217_CR58","doi-asserted-by":"crossref","unstructured":"Khanjani, Z., Watson, G., & Janeja, V. P. (2023). Audio deepfakes: A survey. Frontiers in Big Data, 5, 1001063.","DOI":"10.3389\/fdata.2022.1001063"},{"key":"10217_CR59","doi-asserted-by":"crossref","unstructured":"Kinnunen, T., et al. (2017). The ASVspoof 2017 challenge: Assessing the limits of replay spoofing attack detection. In Interspeech 2017","DOI":"10.21437\/Interspeech.2017-1111"},{"key":"10217_CR60","doi-asserted-by":"crossref","unstructured":"Kinnunen, T., et al. (2017). Reddots replayed: A new replay spoofing attack corpus for text-dependent speaker verification research. In 2017 IEEE international conference on acoustics, speech and signal processing (ICASSP 2017) (pp. 5395\u20135399).","DOI":"10.1109\/ICASSP.2017.7953187"},{"key":"10217_CR61","doi-asserted-by":"publisher","unstructured":"Kinnunen, T., & Li, H. (2010). An overview of text-independent speaker recognition: From features to supervectors. Speech Communication, 52(1), 12\u201340. https:\/\/doi.org\/10.1016\/j.specom.2009.08.009","DOI":"10.1016\/j.specom.2009.08.009"},{"key":"10217_CR62","doi-asserted-by":"crossref","unstructured":"Kwak, I.-Y., et al. (2023). Voice spoofing detection through residual network, Max Feature Map, and depthwise separable convolution. In IEEE Access.","DOI":"10.1109\/ACCESS.2023.3275790"},{"key":"10217_CR63","doi-asserted-by":"crossref","unstructured":"Lai, J., Abad, A., Richmond, K., Yamagishi, J., & Dehak, N. (2018). Attentive filtering networks for audio replay attack detection.","DOI":"10.1109\/ICASSP.2019.8682640"},{"key":"10217_CR64","doi-asserted-by":"crossref","unstructured":"Lavrentyeva, G., Novoselov, S., Volkova, M., Matveev, Y., & Marsico, M. D. (2019). Phonespoof: A new dataset for spoofing attack detection in telephone channel. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019) (pp. 2572\u20132576).","DOI":"10.1109\/ICASSP.2019.8682942"},{"key":"10217_CR65","doi-asserted-by":"crossref","unstructured":"Lei, Z., Yan, H., Liu, C., Ma, M., & Yang, Y. (2022). Two-path GMM-ResNet and GMM-SENet for ASV spoofing detection. In 2022 IEEEinternational conference on acoustics, speech and signal processing (ICASSP 2022) (pp. 6377\u20136381).","DOI":"10.1109\/ICASSP43922.2022.9746163"},{"key":"10217_CR66","doi-asserted-by":"crossref","unstructured":"Li, X., et al. (2021). Replay and synthetic speech detection with res2net architecture. In 2021 IEEE international conference on acoustics, speech and signal processing (ICASSP 2021) (pp. 6354\u20136358).","DOI":"10.1109\/ICASSP39728.2021.9413828"},{"key":"10217_CR67","doi-asserted-by":"crossref","unstructured":"Liu, M., Wang, L., Oo, Z., Dang, J., Li, D., & Nakagawa, S. (2018). Replay attacks detection using phase and magnitude features with various frequency resolutions. In 2018 11th international symposium on Chinese spoken language processing (ISCSLP) (pp. 329\u2013333).","DOI":"10.1109\/ISCSLP.2018.8706628"},{"key":"10217_CR68","doi-asserted-by":"crossref","unstructured":"Lorenzo-Trueba, J., et al. (2018). The voice conversion challenge 2018: Promoting development of parallel and nonparallel methods. ArXiv Prepr, arXiv1804(4262).","DOI":"10.21437\/Odyssey.2018-28"},{"key":"10217_CR69","doi-asserted-by":"crossref","unstructured":"Lu, J., Li, Z., Zhang, Y., Wang, W., & Zhang, P. (2022). Acoustic or pattern? Speech spoofing countermeasure based on image pre-training models. In Proceedings of the 1st international workshop on deepfake detection for audio multimedia (pp. 77\u201384).","DOI":"10.1145\/3552466.3556524"},{"key":"10217_CR70","doi-asserted-by":"crossref","unstructured":"Luo, A., Li, E., Liu, Y., Kang, X., & Wang, Z. J. (2021). A capsule network based approach for detection of audio spoofing attacks. In 2021 IEEE international conference on acoustics, speech and signal processing (ICASSP 2021) (pp. 6359\u20136363).","DOI":"10.1109\/ICASSP39728.2021.9414670"},{"key":"10217_CR71","doi-asserted-by":"crossref","unstructured":"Ma, Y., Ren, Z., & Xu, S. (2021). RW-Resnet: A novel speech anti-spoofing model using raw waveform. ArXiv Prepr, arXiv2108(5684).","DOI":"10.21437\/Interspeech.2021-438"},{"key":"10217_CR72","doi-asserted-by":"crossref","unstructured":"Malik, K. M., Malik, H., & Baumann, R. (2019). Towards vulnerability analysis of voice-driven interfaces and countermeasures for replay attacks. In 2019 IEEE conference onmultimedia information processing and retrieval (MIPR) (pp. 523\u2013528).","DOI":"10.1109\/MIPR.2019.00106"},{"key":"10217_CR73","doi-asserted-by":"publisher","unstructured":"Malik, K., Javed, A., Malik, H., & Irtaza, A. (2020). A light-weight replay detection framework for voice controlled IoT devices. IEEE Journal of Selected Topics in Signal Processing https:\/\/doi.org\/10.1109\/JSTSP.2020.2999828","DOI":"10.1109\/JSTSP.2020.2999828"},{"key":"10217_CR74","doi-asserted-by":"crossref","unstructured":"Meriem, F., Messaoud, B., & Bahia, Y. (2023). Texture analysis of edge mapped audio spectrogram for spoofing attack detection. Multimedia Tools and Applications, 1\u201323.","DOI":"10.1007\/s11042-023-15329-6"},{"key":"10217_CR75","doi-asserted-by":"publisher","unstructured":"Mittal, A., & Dua, M. (2021a, Aug). Automatic speaker verification systems and spoof detection techniques: Review and analysis. International Journal of Speech Technology. https:\/\/doi.org\/10.1007\/s10772-021-09876-2","DOI":"10.1007\/s10772-021-09876-2"},{"key":"10217_CR76","doi-asserted-by":"crossref","unstructured":"Mittal, A., & Dua, M. (2021b). Static-dynamic features and hybrid deep learning models based spoof detection system for ASV. Complex & Intelligent Systems , 1\u201314.","DOI":"10.1007\/s40747-021-00565-w"},{"key":"10217_CR77","doi-asserted-by":"crossref","unstructured":"Nagarsheth, P., Khoury, E., Patil, K., Garland, M. (2017). Replay attack detection using DNN for channel discrimination. In Interspeech 2017","DOI":"10.21437\/Interspeech.2017-1377"},{"key":"10217_CR78","doi-asserted-by":"crossref","unstructured":"Nasr, M. A., El-Shafai, W., Abdel-Salam, N., El-Rabaie, E.-S. M., El-Fishawy, A. S., & El-Samie, F. E. A. (2025). A comprehensive survey of audio forgery detection: Challenges and novel trends. Journal of Electrical Systems and Information Technology, 12(1), 1\u201342.","DOI":"10.1186\/s43067-025-00225-w"},{"key":"10217_CR79","doi-asserted-by":"publisher","unstructured":"Nautsch, A., et al. (2021). Asvspoof, 2019: Spoofing countermeasures for the detection of synthesized, converted and replayed speech. IEEE Transactions on Biometrics, Behavior, and Identity Science, 1. https:\/\/doi.org\/10.1109\/TBIOM.2021.3059479","DOI":"10.1109\/TBIOM.2021.3059479"},{"key":"10217_CR80","doi-asserted-by":"crossref","unstructured":"Patil, H. A., & Kamble, M. R. (2018). A survey on replay attack detection for automatic speaker verification (ASV) system. In 2018 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC) (pp. 1047\u20131053).","DOI":"10.23919\/APSIPA.2018.8659666"},{"key":"10217_CR81","doi-asserted-by":"crossref","unstructured":"Patil, U. G., & Shirbahadurkar, S. D. (2018). Performance analysis of SS based speech enhancement algorithms for ASR with non-stationary noisy database-NOIZEUS. In 2018 2nd international  conference on I-SMAC (IoT in social, mobile, analytics and cloud)(I-SMAC) (pp. 636\u2013641)","DOI":"10.1109\/I-SMAC.2018.8653675"},{"key":"10217_CR82","doi-asserted-by":"crossref","unstructured":"Paul, D., Pal, M., & Saha, G. (2015). Novel speech features for improved detection of spoofing attacks. In 2015 annual IEEE India conference (INDICON) (pp. 1\u20136).","DOI":"10.1109\/INDICON.2015.7443805"},{"key":"10217_CR83","doi-asserted-by":"crossref","unstructured":"Pianese, A., Cozzolino, D., Poggi, G., & Verdoliva, L. (2022). Deepfake audio detection by speaker verification. In 2022 IEEE international workshop on information forensics and security (WIFS) (pp. 1\u20136).","DOI":"10.1109\/WIFS55849.2022.9975428"},{"key":"10217_CR84","doi-asserted-by":"crossref","unstructured":"Poddar, A., Sahidullah, M., & Saha, G. (2018). Speaker verification with short utterances: A review of challenges, trends and opportunities. IET Biometrics, 7(2), 91\u2013101.","DOI":"10.1049\/iet-bmt.2017.0065"},{"key":"10217_CR85","doi-asserted-by":"crossref","unstructured":"Qadir, G., Zareen, S., Hassan, F., & Rahman, A. U. (2022). Voice spoofing countermeasure based on spectral features to detect synthetic attacks through LSTM. Interntional Journal of Innovative Science and Technology , 3(5), 153\u2013165.","DOI":"10.33411\/IJIST\/2021030512"},{"key":"10217_CR86","doi-asserted-by":"crossref","unstructured":"Qi, K., Huang, W., Wang, D., & Zhang, H. (2021). Audio replay spoof attack detection using a GMM-RFPNN Model as back-end Classifier. In 2021 2nd international conference on artificial intelligence and computer engineering (ICAICE) (pp. 425\u2013429).","DOI":"10.1109\/ICAICE54393.2021.00089"},{"key":"10217_CR87","doi-asserted-by":"crossref","unstructured":"Rahmeni, R., Aicha, A. B., & Ayed, Y. B. (2022). Voice spoofing detection based on acoustic and glottal flow features using conventional machine learning techniques. Multimedia Tools and Applications, 81(22), 31443\u201331467.","DOI":"10.1007\/s11042-022-12606-8"},{"key":"10217_CR88","doi-asserted-by":"crossref","unstructured":"Ranjan, R., Vatsa, M., & Singh, R. (2022). Statnet: Spectral and temporal features based multi-task network for audio spoofing detection. In 2022 IEEE international joint conference on biometrics (IJCB) (pp. 1\u20139).","DOI":"10.1109\/IJCB54206.2022.10007949"},{"key":"10217_CR89","doi-asserted-by":"publisher","unstructured":"Ray, R., et al. (2021). Feature genuinization based residual squeeze-and-excitation for audio anti-spoofing in sound AI. In 2021 12th international conference on computing communication and networking technologies (ICCCNT) (pp. 1\u20135). https:\/\/doi.org\/10.1109\/ICCCNT51525.2021.9580127","DOI":"10.1109\/ICCCNT51525.2021.9580127"},{"key":"10217_CR90","doi-asserted-by":"crossref","unstructured":"Reimao, R., & Tzerpos, V. (2019). FoR: A dataset for synthetic speech detection. In 2019 international conference on speech technology and human-computer dialogue (SpeD)","DOI":"10.1109\/SPED.2019.8906599"},{"key":"10217_CR91","doi-asserted-by":"crossref","unstructured":"Rostami, A. M., Homayounpour, M. M., & Nickabadi, A. (2023). Efficient attention branch network with combined loss function for automatic speaker verification spoof detection. Circuits, Systems, and Signal Processing, 1\u201319.","DOI":"10.1007\/s00034-023-02314-5"},{"key":"10217_CR92","doi-asserted-by":"crossref","unstructured":"Saranya, S. M., Padmanabhan, R., & Murthy, H. (2018). Replay attack detection in speaker verification using non-voiced segments and decision level feature switching. In 2018 international conference on signal processing and communications (SPCOM)","DOI":"10.1109\/SPCOM.2018.8724469"},{"key":"10217_CR93","doi-asserted-by":"crossref","unstructured":"Saranya, M. S., & Murthy, H. A. (2018). Decision-level feature switching as a paradigm for replay attack detection. Interspeech, 686\u2013690.","DOI":"10.21437\/Interspeech.2018-1494"},{"key":"10217_CR94","unstructured":"Shan, M., & Tsai, T. J. (2020). A cross-verification approach for protecting world leaders from fake and tampered audio. ArXiv Prepr, arXiv2010(12173)."},{"key":"10217_CR95","doi-asserted-by":"crossref","unstructured":"Shukla, S., Prakash, J., & Guntur, R. S. (2019). Replay attack detection with raw audio waves and deep learning framework. In 2019 International conference on data science and engineering (ICDSE) (pp. 66\u201370).","DOI":"10.1109\/ICDSE47409.2019.8971793"},{"key":"10217_CR96","doi-asserted-by":"crossref","unstructured":"Singh, M., & Pati, D. (2019). Usefulness of linear prediction residual for replay attack detection. AEU-International Journal of Electronics and Communication , 110, 152837.","DOI":"10.1016\/j.aeue.2019.152837"},{"key":"10217_CR97","unstructured":"Singh, N. (2014). A study on speech and speaker recognition technology and its challenges. In Proceedings of national conference on information security challenges (pp. 34\u201337). DIT, BBAU, Lucknow."},{"key":"10217_CR98","doi-asserted-by":"crossref","unstructured":"Singh, R., Singh, A. K., & Bhattacharjee, U. (2016). A review on text-independent Speaker verification techniques in realistic world. Oriental Journal of Computer Science and Technology 9(1), 36\u201340","DOI":"10.13005\/ojcst\/901.07"},{"key":"10217_CR99","unstructured":"Snyder, D., Chen, G., & Povey, D. (2015). Musan: A music, speech, and noise corpus. ArXiv Prepr, arXiv1510(8484)."},{"key":"10217_CR100","doi-asserted-by":"crossref","unstructured":"Suthokumar, G., Sethu, V., Wijenayake, C., & Ambikairajah, E. (2018). Modulation dynamic features for the detection of replay attacks. Interspeech, 691\u2013695.","DOI":"10.21437\/Interspeech.2018-1846"},{"key":"10217_CR101","doi-asserted-by":"crossref","unstructured":"Sz\u00f6ke, I., Sk\u00e1cel, M., Mo\u0161ner, L., Paliesek, J., & \u010cernock\u00fd, J. (2019). Building and evaluation of a real room impulse response dataset. IEEE Journal of Selected Topics in Signal Processing, 13(4), 863\u2013876.","DOI":"10.1109\/JSTSP.2019.2917582"},{"key":"10217_CR102","doi-asserted-by":"crossref","unstructured":"Tak, H., Jung, J., Patino, J., Kamble, M., Todisco, M., & Evans, N. (2021). End-to-end spectro-temporal graph attention networks for speaker verification anti-spoofing and speech deepfake detection. ArXiv Prepr, arXiv2107(12710).","DOI":"10.21437\/ASVSPOOF.2021-1"},{"key":"10217_CR103","doi-asserted-by":"crossref","unstructured":"Tak, H., Jung, J., Patino, J., Todisco, M., & Evans, N. (2021). Graph attention networks for anti-spoofing. ArXiv Prepr, arXiv2104(3654).","DOI":"10.21437\/Interspeech.2021-993"},{"key":"10217_CR104","doi-asserted-by":"crossref","unstructured":"Tapkir, P. A., Patil, A. T., Shah, N., & Patil, H. A. (2018). Novel spectral root cepstral features for replay spoof detection. In 2018 Asia-Pacific signal andinformation processing association annual summit and conference (APSIPA ASC) (pp. 1945\u20131950).","DOI":"10.23919\/APSIPA.2018.8659746"},{"key":"10217_CR105","doi-asserted-by":"crossref","unstructured":"Todisco, M., Delgado, H., & Evans, N. W. D. (2016). A new feature for automatic speaker verification anti-spoofing: Constant Q cepstral coefficients. Odyssey, 2016, 283\u2013290.","DOI":"10.21437\/Odyssey.2016-41"},{"key":"10217_CR106","doi-asserted-by":"crossref","unstructured":"Volkova, M., Andzhukaev, T., Lavrentyeva, G., Novoselov, S., & Kozlov, A. (2019). Light CNN architecture enhancement for different types spoofing attack detection. In Speech and computer: 21st international conference, (SPECOM 2019) (Vol. 21, pp. 520\u2013529), Istanbul, Turkey. August 20\u201325, 2019, Proceedings.","DOI":"10.1007\/978-3-030-26061-3_53"},{"key":"10217_CR107","doi-asserted-by":"crossref","unstructured":"Vs, K. V., & Naveed, S. (2024). A review of automatic speaker verification systems with feature extractions and spoofing attacks. In 2024 5th international conference on electronics and sustainable communication systems (ICESC) (pp. 1999\u20132005).","DOI":"10.1109\/ICESC60852.2024.10690005"},{"key":"10217_CR108","doi-asserted-by":"crossref","unstructured":"Wang, C., et al. (2023). TO-Rawnet: Improving RawNet with TCN and orthogonal regularization for fake audio detection. ArXiv Prepr, arXiv2305(13701).","DOI":"10.21437\/Interspeech.2023-1206"},{"key":"10217_CR109","doi-asserted-by":"crossref","unstructured":"Wang, R., et al. (2020). Deepsonar: Towards effective and robust detection of ai-synthesized fake voices. In Proceedings of the 28th ACM international conference on multimedia (pp. 1207\u20131216).","DOI":"10.1145\/3394171.3413716"},{"key":"10217_CR110","doi-asserted-by":"publisher","unstructured":"Wang, X., et al. (2020). Asvspoof, 2019: A large-scale public database of synthesized, converted and replayed speech. Computer Speech and Language, 64, 101114. https:\/\/doi.org\/10.1016\/j.csl.2020.101114","DOI":"10.1016\/j.csl.2020.101114"},{"key":"10217_CR111","unstructured":"Watson, G., Khanjani, Z., & Janeja, V. P. (2021). Audio deepfake perceptions in college going populations. ArXiv Prepr, arXiv2112(3351)."},{"key":"10217_CR112","doi-asserted-by":"crossref","unstructured":"Wickramasinghe, B., Irtza, S., Ambikairajah, E., & Epps, J. (2018). Frequency domain linear prediction features for replay spoofing attack detection. Interspeech, 661\u2013665.","DOI":"10.21437\/Interspeech.2018-1574"},{"key":"10217_CR113","doi-asserted-by":"crossref","unstructured":"Witkowski, M., Kacprzak, S., \u017belasko, P., Kowalczyk, K., & Ga\u0142ka, J. (2017). Audio replay attack detection using high-frequency features. In Interspeech 2017","DOI":"10.21437\/Interspeech.2017-776"},{"key":"10217_CR114","doi-asserted-by":"crossref","unstructured":"Wu, Z., et al. (2015). Asvspoof, 2015: The first automatic speaker verification spoofing and countermeasures challenge. In Interspeech 2015","DOI":"10.21437\/Interspeech.2015-462"},{"key":"10217_CR115","doi-asserted-by":"crossref","unstructured":"Wu, Z., Das, R. K., Yang, J., & Li, H. (2020). Light convolutional neural network with feature genuinization for detection of synthetic speech attacks. ArXiv Prepr, arXiv2009(9637).","DOI":"10.21437\/Interspeech.2020-1810"},{"key":"10217_CR116","doi-asserted-by":"crossref","unstructured":"Wu, Z., Evans, N., Kinnunen, T., Yamagishi, J., & Alegre, F., Li, H. (2015). Spoofing and countermeasures for speaker verification: A survey. Speech Communication, 66, 130\u2013153.","DOI":"10.1016\/j.specom.2014.10.005"},{"key":"10217_CR117","doi-asserted-by":"crossref","unstructured":"Xue, J., et al. (2022). Audio deepfake detection based on a combination of F0 information and real plus imaginary spectrogram features. In Proceedings of the 1st international workshop on deepfakedetection for audio multimedia (pp. 19\u201326).","DOI":"10.1145\/3552466.3556526"},{"key":"10217_CR118","doi-asserted-by":"crossref","unstructured":"Xue, J., & Zhou, H. (2023). Physiological-physical feature fusion for automatic voice spoofing detection. Frontiers in Computer Sci ences, 17(2), 172318.","DOI":"10.1007\/s11704-022-2121-6"},{"key":"10217_CR119","doi-asserted-by":"publisher","unstructured":"Yang, J., & Das, R. (2019). Low frequency frame-wise normalization over constant-Q transform for playback speech detection. Digital Signal Processing, 89. https:\/\/doi.org\/10.1016\/j.dsp.2019.02.018","DOI":"10.1016\/j.dsp.2019.02.018"},{"key":"10217_CR120","doi-asserted-by":"crossref","unstructured":"Yang, J., Das, R. K., & Zhou, N. (2019). Extraction of octave spectra information for spoofing attack detection. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 27(12), 2373\u20132384.","DOI":"10.1109\/TASLP.2019.2946897"},{"key":"10217_CR121","doi-asserted-by":"crossref","unstructured":"Yi, J., et al. (2021). Half-truth: A partially fake audio detection dataset. ArXiv Prepr, arXiv2104(3617).","DOI":"10.21437\/Interspeech.2021-930"},{"key":"10217_CR122","doi-asserted-by":"crossref","unstructured":"Yi, J., et al. (2024). Scenefake: An initial dataset and benchmarks for scene fake audio detection. Pattern Recognition, 152, 110468.","DOI":"10.1016\/j.patcog.2024.110468"},{"key":"10217_CR123","doi-asserted-by":"crossref","unstructured":"Zaidi, S. F. A., & Xu, L. (2022). Implementation of multiple feature selection algorithms for speech spoofing detection. Journal of Physics: Conference Series 2224(1), 12119.","DOI":"10.1088\/1742-6596\/2224\/1\/012119"},{"key":"10217_CR124","doi-asserted-by":"crossref","unstructured":"Zeinali, H., et al. (2019). Detecting spoofing attacks using vgg and sincnet: But-omilia submission to asvspoof 2019 challenge. arXiv Prepr. arXiv1907.12908.","DOI":"10.21437\/Interspeech.2019-2892"},{"key":"10217_CR125","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Jiang, F., & Duan, Z. (2021). One-class learning towards synthetic voice spoofing detection. IEEE Signal Processing Letters, 28, 937\u2013941.","DOI":"10.1109\/LSP.2021.3076358"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-025-10217-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-025-10217-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-025-10217-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,10]],"date-time":"2025-11-10T15:00:45Z","timestamp":1762786845000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-025-10217-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,13]]},"references-count":125,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["10217"],"URL":"https:\/\/doi.org\/10.1007\/s10772-025-10217-w","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2025,10,13]]},"assertion":[{"value":"11 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 August 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 October 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}