{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:14:16Z","timestamp":1777490056515,"version":"3.51.4"},"reference-count":67,"publisher":"Springer Science and Business Media LLC","issue":"31","license":[{"start":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T00:00:00Z","timestamp":1741824000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T00:00:00Z","timestamp":1741824000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-025-20694-5","type":"journal-article","created":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T06:19:26Z","timestamp":1741846766000},"page":"38927-38957","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Attention-based multi dimension fused-feature convolutional neural network framework for speaker recognition"],"prefix":"10.1007","volume":"84","author":[{"given":"V.","family":"Karthikeyan","sequence":"first","affiliation":[]},{"given":"S. Suja","family":"Priyadharsini","sequence":"additional","affiliation":[]},{"given":"K.","family":"Balamurugan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,3,13]]},"reference":[{"issue":"9","key":"20694_CR1","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1109\/5.628714","volume":"85","author":"JP Campbell","year":"1997","unstructured":"Campbell JP (1997) Speaker recognition: a tutorial. Proc IEEE 85(9):1437\u20131462","journal-title":"Proc IEEE"},{"issue":"6","key":"20694_CR2","doi-asserted-by":"publisher","first-page":"1182","DOI":"10.1109\/TASL.2009.2031505","volume":"18","author":"R Vogt","year":"2009","unstructured":"Vogt R, Sridharan S, Mason M (2009) Making confident speaker verification decisions with minimal speech. IEEE Trans Audio Speech Lang Process 18(6):1182\u20131192","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"20694_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2024.109408","volume":"118","author":"V Karthikeyan","year":"2024","unstructured":"Karthikeyan V, Priyadharsini SS (2024) Text-independent voiceprint recognition via compact embedding of dilated deep convolutional neural networks. Comput Electr Eng 118:109408","journal-title":"Comput Electr Eng"},{"issue":"9","key":"20694_CR4","doi-asserted-by":"publisher","first-page":"859","DOI":"10.1016\/S0167-8655(97)00073-1","volume":"18","author":"S Furui","year":"1997","unstructured":"Furui S (1997) Recent advances in speaker recognition. Pattern Recogn Lett 18(9):859\u2013872","journal-title":"Pattern Recogn Lett"},{"key":"20694_CR5","doi-asserted-by":"crossref","unstructured":"Reynolds DA (2002) An overview of automatic speaker recognition technology. In: Proceedings of the 2002 IEEE International Conference Acoust. Speech Signal Process, Orlando, FL, USA, 13\u201317 May 2002; vol 4, pp 4072\u20134075","DOI":"10.1109\/ICASSP.2002.5745552"},{"issue":"3","key":"20694_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s12046-021-01649-6","volume":"46","author":"V Karthikeyan","year":"2021","unstructured":"Karthikeyan V, SujaPriyadharsini S (2021) A strong hybrid AdaBoost classification algorithm for speaker recognition. S\u0101dhan\u0101 46(3):1\u201319. https:\/\/doi.org\/10.1007\/s12046-021-01649-6","journal-title":"S\u0101dhan\u0101"},{"key":"20694_CR7","doi-asserted-by":"crossref","unstructured":"Beigi H. (2012). Speaker recognition: advancements and challenges. New trends and developments in biometrics, pp 3\u201329","DOI":"10.5772\/52023"},{"issue":"1","key":"20694_CR8","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1109\/89.365379","volume":"3","author":"DA Reynolds","year":"1995","unstructured":"Reynolds DA, Rose RC (1995) Robust text-independent speaker identification using Gaussian mixture speaker models. IEEE Trans Speech Audio Process 3(1):72\u201383","journal-title":"IEEE Trans Speech Audio Process"},{"issue":"2","key":"20694_CR9","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1109\/MCAS.2011.941079","volume":"11","author":"R Togneri","year":"2011","unstructured":"Togneri R, Pullella D (2011) An overview of speaker identification: accuracy and robustness issues. IEEE Circuits Syst Mag 11(2):23\u201361","journal-title":"IEEE Circuits Syst Mag"},{"issue":"2","key":"20694_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10044-024-01278-9","volume":"27","author":"V Karthikeyan","year":"2024","unstructured":"Karthikeyan V, SujaPriyadharsini S (2024) A stacked convolutional neural network framework with multi-scale attention mechanism for text-independent voiceprint recognition. Pattern Anal Appl 27(2):1\u201315","journal-title":"Pattern Anal Appl"},{"key":"20694_CR11","unstructured":"Wang Y, Deng X, Pu S & Huang Z. (2017). Residual convolutional CTC networks for automatic speech recognition. arXiv preprint arXiv:1702.07793"},{"key":"20694_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2023.105020","volume":"85","author":"SA Almaghrabi","year":"2023","unstructured":"Almaghrabi SA, Clark SR, Baumert M (2023) Bio-acoustic features of depression: a review. Biomed Signal Process Control 85:105020","journal-title":"Biomed Signal Process Control"},{"issue":"10","key":"20694_CR13","doi-asserted-by":"publisher","first-page":"782","DOI":"10.1016\/j.specom.2008.04.010","volume":"50","author":"L Mary","year":"2008","unstructured":"Mary L, Yegnanarayana B (2008) Extraction and representation of prosodic features for language and speaker recognition. Speech Commun 50(10):782\u2013796","journal-title":"Speech Commun"},{"issue":"6","key":"20694_CR14","doi-asserted-by":"publisher","first-page":"74","DOI":"10.1109\/MSP.2015.2462851","volume":"32","author":"JH Hansen","year":"2015","unstructured":"Hansen JH, Hasan T (2015) Speaker recognition by machines and humans: a tutorial review. IEEE Signal Process Mag 32(6):74\u201399","journal-title":"IEEE Signal Process Mag"},{"key":"20694_CR15","doi-asserted-by":"publisher","first-page":"694","DOI":"10.1016\/j.inffus.2022.10.032","volume":"91","author":"Z Qin","year":"2023","unstructured":"Qin Z, Zhao P, Zhuang T, Deng F, Ding Y, Chen D (2023) A survey of identity recognition via data fusion and feature learning. Inf Fusion 91:694\u2013712","journal-title":"Inf Fusion"},{"key":"20694_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.107661","volume":"131","author":"K Radha","year":"2024","unstructured":"Radha K, Bansal M, Pachori RB (2024) Speech and speaker recognition using raw waveform modeling for adult and children\u2019s speech: a comprehensive review. Eng Appl Artif Intell 131:107661","journal-title":"Eng Appl Artif Intell"},{"issue":"4","key":"20694_CR17","first-page":"1893","volume":"14","author":"V Karthikeyan","year":"2024","unstructured":"Karthikeyan V, Raja E, Gurumoorthy K (2024) Denoising convolutional neural network with energy-based attention for image enhancement. J Appl Anal Comput 14(4):1893\u20131914","journal-title":"J Appl Anal Comput"},{"issue":"3","key":"20694_CR18","doi-asserted-by":"publisher","first-page":"300","DOI":"10.3311\/PPee.20971","volume":"67","author":"N Shome","year":"2023","unstructured":"Shome N, Sarkar A, Ghosh AK, Laskar RH, Kashyap R (2023) Speaker recognition through deep learning techniques: a comprehensive review and research challenges. Period Polytech Electr Eng Comput Sci 67(3):300\u2013336","journal-title":"Period Polytech Electr Eng Comput Sci"},{"key":"20694_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2023.102952","volume":"152","author":"SB Junior","year":"2023","unstructured":"Junior SB, Guido RC, Aguiar GJ, Santana EJ, Junior MLP, Patil HA (2023) Multiple voice disorders in the same individual: investigating handcrafted features, multi-label classification algorithms, and base-learners. Speech Commun 152:102952","journal-title":"Speech Commun"},{"issue":"2","key":"20694_CR20","first-page":"789","volume":"15","author":"ND AL-Shakarchy","year":"2023","unstructured":"AL-Shakarchy ND, Obayes HK, Abdullah ZN (2023) Person identification based on voice biometric using deep neural network. Int J Inf Technol 15(2):789\u2013795","journal-title":"Int J Inf Technol"},{"issue":"1","key":"20694_CR21","doi-asserted-by":"publisher","DOI":"10.1002\/ima.23022","volume":"34","author":"V Karthikeyan","year":"2024","unstructured":"Karthikeyan V, Kishore MN, Sajin S (2024) End-to-end light-weighted deep-learning model for abnormality classification in kidney CT images. Int J Imaging Syst Technol 34(1):e23022","journal-title":"Int J Imaging Syst Technol"},{"issue":"21","key":"20694_CR22","doi-asserted-by":"publisher","first-page":"33111","DOI":"10.1007\/s11042-023-14942-9","volume":"82","author":"R Chakroun","year":"2023","unstructured":"Chakroun R, Frikha M (2023) A deep learning approach for text-independent speaker recognition with short utterances. Multimed Tools Appl 82(21):33111\u201333133","journal-title":"Multimed Tools Appl"},{"issue":"4","key":"20694_CR23","doi-asserted-by":"publisher","first-page":"788","DOI":"10.1109\/TASL.2010.2064307","volume":"19","author":"N Dehak","year":"2011","unstructured":"Dehak N, Kenny PJ, Dehak R, Dumouchel P, Ouellet P (2011) Front-end factor analysis for speaker verification. IEEE Trans Audio Speech Lang Process 19(4):788\u2013798. https:\/\/doi.org\/10.1109\/TASL.2010.2064307","journal-title":"IEEE Trans Audio Speech Lang Process"},{"issue":"7","key":"20694_CR24","doi-asserted-by":"publisher","first-page":"3461","DOI":"10.3390\/s23073461","volume":"23","author":"G Costantini","year":"2023","unstructured":"Costantini G, Cesarini V, Brenna E (2023) High-level CNN and machine learning methods for speaker recognition. Sensors 23(7):3461","journal-title":"Sensors"},{"issue":"13","key":"20694_CR25","doi-asserted-by":"publisher","first-page":"5890","DOI":"10.3390\/s23135890","volume":"23","author":"A Moufidi","year":"2023","unstructured":"Moufidi A, Rousseau D, Rasti P (2023) Attention-based fusion of ultrashort voice utterances and depth videos for multimodal person identification. Sensors 23(13):5890","journal-title":"Sensors"},{"key":"20694_CR26","doi-asserted-by":"crossref","unstructured":"Li X, Chen X, Fu R, Hu X, Chen M, Niu K (2024) Learning deep embedding with acoustic and phoneme features for speaker recognition in FM broadcasting. IET Biometrics 2024","DOI":"10.1049\/2024\/6694481"},{"issue":"10","key":"20694_CR27","doi-asserted-by":"publisher","first-page":"1440","DOI":"10.1109\/LSP.2018.2860246","volume":"25","author":"M Chen","year":"2018","unstructured":"Chen M, He X, Yang J, Zhang H (2018) 3-D convolutional recurrent neural networks with attention model for speech emotion recognition. IEEE Signal Process Lett 25(10):1440\u20131444","journal-title":"IEEE Signal Process Lett"},{"issue":"6","key":"20694_CR28","doi-asserted-by":"publisher","first-page":"2817","DOI":"10.1007\/s11760-023-02500-7","volume":"17","author":"K Velayuthapandian","year":"2023","unstructured":"Velayuthapandian K, Subramoniam SP (2023) A focus module-based lightweight end-to-end CNN framework for voiceprint recognition. SIViP 17(6):2817\u20132825","journal-title":"SIViP"},{"key":"20694_CR29","unstructured":"Banerjee A, Dubey A, Menon A, Nanda S, Nandi GC (2018) Speaker recognition using deep belief networks. arXiv preprint arXiv:1805.08865"},{"issue":"1","key":"20694_CR30","doi-asserted-by":"publisher","first-page":"504","DOI":"10.3390\/make1010031","volume":"1","author":"P Dhakal","year":"2019","unstructured":"Dhakal P, Damacharla P, Javaid AY, Devabhaktuni V (2019) A near real-time automatic speaker recognition architecture for voice-based user interface. Mach Learn Knowl Extr 1(1):504\u2013520","journal-title":"Mach Learn Knowl Extr"},{"key":"20694_CR31","doi-asserted-by":"crossref","unstructured":"Lukic Y, Vogt C, D\u00fcrr O, Stadelmann T (2016) Speaker identification and clustering using convolutional neural networks. In: 2016 IEEE 26th international workshop on machine learning for signal processing (MLSP). IEEE, pp 1\u20136","DOI":"10.1109\/MLSP.2016.7738816"},{"key":"20694_CR32","doi-asserted-by":"crossref","unstructured":"Ravanelli M, Bengio Y (2018) Speaker recognition from raw waveform with sincnet. In: 2018 IEEE Spoken Language Technology Workshop (SLT). IEEE, pp 1021\u20131028","DOI":"10.1109\/SLT.2018.8639585"},{"key":"20694_CR33","unstructured":"Feng L (2004) Speaker recognition (Master's thesis, Technical University of Denmark, DTU, DK-2800 Kgs. Lyngby, Denmark"},{"key":"20694_CR34","unstructured":"Garofolo JS (1993) TIMIT acoustic phonetic continuous speech corpus. Linguistic Data Consortium"},{"key":"20694_CR35","unstructured":"NIST Multimodal Information Group (2008) NIST Speaker Recognition Evaluation Training Set Part 1 LDC2011S05; Linguistic Data Consortium: Philadelphia, PA, USA, 2011"},{"key":"20694_CR36","unstructured":"Evans Kiplagat. Speaker Recognition Dataset. https:\/\/www.kaggle.com\/datasets\/kongaevans\/speaker-recognition-dataset\/code?datasetId=470244"},{"key":"20694_CR37","doi-asserted-by":"crossref","unstructured":"Alrusaini O, Daqrouq K (2024) Text-independent speaker identification system using discrete wavelet transform with linear prediction coding. J Umm Al-Qura Univ Eng Archit 1\u20138","DOI":"10.1007\/s43995-024-00046-4"},{"key":"20694_CR38","unstructured":"Yunfei ZI, Xiong S (2024) Short utterance speaker recognition based on speech high frequency information compensation and dynamic feature enhancement methods. Archives of Acoustics"},{"key":"20694_CR39","doi-asserted-by":"crossref","unstructured":"Sell G, Garcia-Romero D (2014) Speaker diarization with PLDA i-vector scoring and unsupervised calibration. In: 2014 IEEE Spoken Language Technology Workshop (SLT). IEEE, pp 413\u2013417","DOI":"10.1109\/SLT.2014.7078610"},{"issue":"7","key":"20694_CR40","doi-asserted-by":"publisher","first-page":"3244","DOI":"10.1109\/TII.2018.2799928","volume":"14","author":"Z Liu","year":"2018","unstructured":"Liu Z, Wu Z, Li T, Li J, Shen C (2018) GMM and CNN hybrid method for short utterance speaker recognition. IEEE Trans Industr Inf 14(7):3244\u20133252","journal-title":"IEEE Trans Industr Inf"},{"issue":"2\u20133","key":"20694_CR41","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1016\/j.csl.2005.06.003","volume":"20","author":"WM Campbell","year":"2006","unstructured":"Campbell WM, Campbell JP, Reynolds DA, Singer E, Torres-Carrasquillo PA (2006) Support vector machines for speaker and language recognition. Comput Speech Lang 20(2\u20133):210\u2013229","journal-title":"Comput Speech Lang"},{"key":"20694_CR42","doi-asserted-by":"crossref","unstructured":"Chang J, Wang D (2017) Robust speaker recognition based on DNN\/i-vectors and speech separation. In: 2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, pp 5415\u20135419","DOI":"10.1109\/ICASSP.2017.7953191"},{"key":"20694_CR43","unstructured":"Banerjee A, Dubey A, Menon A, Nanda S, Nandi GC (2018) Speaker recognition using deep belief networks. arXiv preprint arXiv:1805.08865"},{"key":"20694_CR44","doi-asserted-by":"crossref","unstructured":"Karthikeyan V, Kumar PS, Karthikeyan P (2023) Automatic recognition of speaker labels using CNN-SVM scheme. In: International conference on innovative computing and communication. Springer Nature Singapore, Singapore, pp 513\u2013529","DOI":"10.1007\/978-981-99-3315-0_39"},{"issue":"8","key":"20694_CR45","doi-asserted-by":"publisher","first-page":"3603","DOI":"10.3390\/app11083603","volume":"11","author":"F Ye","year":"2021","unstructured":"Ye F, Yang J (2021) A deep neural network model for speaker identification. Appl Sci 11(8):3603","journal-title":"Appl Sci"},{"key":"20694_CR46","unstructured":"Li W (2021) Speaker identification from raw waveform with LineNet. arXiv preprint arXiv:2105.14826"},{"key":"20694_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2024.109100","volume":"115","author":"B Saritha","year":"2024","unstructured":"Saritha B, Laskar MA, Laskar RH, Choudhury M (2024) CACRN-Net: A 3D log Mel spectrogram based channel attention convolutional recurrent neural network for few-shot speaker identification. Comput Electr Eng 115:109100","journal-title":"Comput Electr Eng"},{"issue":"11","key":"20694_CR48","doi-asserted-by":"publisher","first-page":"6410","DOI":"10.3390\/app13116410","volume":"13","author":"P Safari","year":"2023","unstructured":"Safari P, India M, Hernando J (2023) Self-attention networks in speaker recognition. Appl Sci 13(11):6410","journal-title":"Appl Sci"},{"issue":"10","key":"20694_CR49","doi-asserted-by":"publisher","first-page":"1671","DOI":"10.1109\/LSP.2015.2420092","volume":"22","author":"F Richardson","year":"2015","unstructured":"Richardson F, Reynolds D, Dehak N (2015) Deep neural network approaches to speaker and language recognition. IEEE Signal Process Lett 22(10):1671\u20131675","journal-title":"IEEE Signal Process Lett"},{"key":"20694_CR50","doi-asserted-by":"crossref","unstructured":"Al-Dulaimi HW, Aldhahab A, Al Abboodi HM (2023) Speaker identification system employing multi-resolution analysis in conjunction with CNN. Int J Intell Eng Syst 16(5)","DOI":"10.22266\/ijies2023.1031.30"},{"key":"20694_CR51","doi-asserted-by":"crossref","unstructured":"Zhang A, Wang Q, Zhu Z, Paisley J, Wang C (2019) Fully supervised speaker diarization. In: ICASSP 2019\u20132019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, pp 6301\u20136305","DOI":"10.1109\/ICASSP.2019.8683892"},{"issue":"21","key":"20694_CR52","doi-asserted-by":"publisher","first-page":"10989","DOI":"10.3390\/app122110989","volume":"12","author":"Y Dong","year":"2022","unstructured":"Dong Y, Chen Z, Li Z, Gao F (2022) A multi-branch multi-scale deep learning image fusion algorithm based on DenseNet. Appl Sci 12(21):10989","journal-title":"Appl Sci"},{"key":"20694_CR53","doi-asserted-by":"crossref","unstructured":"Ma B, Wang X, Zhang H, Li F, Dan J (2019) CBAM-GAN: generative adversarial networks based on convolutional block attention module. In: Artificial Intelligence and Security: 5th International Conference, ICAIS 2019, New York, NY, USA, July 26\u201328, 2019, Proceedings, Part I 5. Springer International Publishing, pp 227\u2013236","DOI":"10.1007\/978-3-030-24274-9_20"},{"key":"20694_CR54","doi-asserted-by":"publisher","first-page":"2008","DOI":"10.1017\/CBO9780511841644","volume-title":"Introductory econometrics for finance","author":"C Brooks","year":"2008","unstructured":"Brooks C (2008) Introductory econometrics for finance, 2nd edn. Cambridge University Press, Cambridge, p 2008","edition":"2"},{"key":"20694_CR55","doi-asserted-by":"crossref","unstructured":"Lawson A, Vabishchevich P, Huggins M, Ardis P, Battles B, Stauffer A (2011) Survey and evaluation of acoustic features for speaker recognition. In: 2011 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp 5444\u20135447","DOI":"10.1109\/ICASSP.2011.5947590"},{"key":"20694_CR56","doi-asserted-by":"crossref","unstructured":"Chen YH, Lopez-Moreno I, Sainath TN, Visontai M, Alvarez R, Parada C (2015) Locally-connected and convolutional neural networks for small footprint speaker recognition. In: Sixteenth Annual Conference of the International Speech Communication Association","DOI":"10.21437\/Interspeech.2015-297"},{"key":"20694_CR57","unstructured":"Thanda Setty V (2018) Speaker recognition using deep neural networks with reduced complexity (Thesis). Texas State University, San Marcos, Texas"},{"key":"20694_CR58","doi-asserted-by":"crossref","unstructured":"Ghezaiel W, Brun L, L\u00e9zoray O (2021) Hybrid network for end-to-end text-independent speaker identification. In: 2020 25th International Conference on Pattern Recognition (ICPR). IEEE, pp 2352\u20132359","DOI":"10.1109\/ICPR48806.2021.9413293"},{"key":"20694_CR59","doi-asserted-by":"crossref","unstructured":"Nunes JAC, Mac\u00eado D, Zanchettin C (2020) Am-mobilenet1d: a portable model for speaker recognition. In: 2020 International Joint Conference on Neural Networks (IJCNN). IEEE, pp 1\u20138","DOI":"10.1109\/IJCNN48605.2020.9207519"},{"issue":"7","key":"20694_CR60","doi-asserted-by":"publisher","first-page":"2399","DOI":"10.3390\/s18072399","volume":"18","author":"C Sun","year":"2018","unstructured":"Sun C, Yang Y, Wen C, Xie K, Wen F (2018) Voiceprint identification for limited dataset using the deep migration hybrid model based on transfer learning. Sensors 18(7):2399","journal-title":"Sensors"},{"key":"20694_CR61","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2021\/8493795","volume":"2021","author":"M Xiao","year":"2021","unstructured":"Xiao M, Wu Y, Zuo G, Fan S, Yu H, Shaikh ZA, Wen Z (2021) Addressing overfitting problem in deep learning-based solutions for next generation data-driven networks. Wirel Commun Mob Comput 2021:1\u201310","journal-title":"Wirel Commun Mob Comput"},{"key":"20694_CR62","unstructured":"Cieri C, Graff D, Kimball O, Miller D, Walker K (2004) Fisher English training speech part 1 transcripts. Philadelphia: Linguistic Data Consortium. Univ. Pennsylvania, Philadelphia"},{"key":"20694_CR63","doi-asserted-by":"crossref","unstructured":"Tan B, Li Q, Foresta R (2010) An automatic non-native speaker recognition system. In: 2010 IEEE International Conference on Technologies for Homeland Security (HST). IEEE, pp 77\u201383","DOI":"10.1109\/THS.2010.5655088"},{"key":"20694_CR64","doi-asserted-by":"crossref","unstructured":"McClanahan R, De Leon P (2013) Towards a more efficient SVM supervector speaker verification system using gaussian reduction and a tree-structured hash (No. SAND2013-2166C). Sandia National Lab. (SNL-NM), Albuquerque","DOI":"10.21437\/Interspeech.2013-688"},{"key":"20694_CR65","doi-asserted-by":"crossref","unstructured":"Varun Prakash R, Karthikeyan V, Vishali S, Karthika M (2024) Multi-level LSTM framework with hybrid sonic features for human\u2013animal conflict evasion. The Visual Computer, 1\u201317","DOI":"10.1007\/s00371-024-03588-9"},{"key":"20694_CR66","doi-asserted-by":"crossref","unstructured":"Chowdhury A, Ross A (2017) Extracting sub-glottal and supra-glottal features from MFCC using convolutional neural networks for speaker identification in degraded audio signals. In: 2017 IEEE International Joint Conference on Biometrics (IJCB). IEEE, pp 608\u2013617","DOI":"10.1109\/BTAS.2017.8272748"},{"issue":"3","key":"20694_CR67","doi-asserted-by":"publisher","first-page":"764","DOI":"10.1016\/j.jksuci.2020.03.011","volume":"34","author":"MK Nammous","year":"2022","unstructured":"Nammous MK, Saeed K, Kobojek P (2022) Using a small amount of text-independent speech data for a BiLSTM large-scale speaker identification approach. J King Saud Univ-Comput Inf Sci 34(3):764\u2013770","journal-title":"J King Saud Univ-Comput Inf Sci"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20694-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-025-20694-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20694-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T09:43:49Z","timestamp":1758102229000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-025-20694-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,13]]},"references-count":67,"journal-issue":{"issue":"31","published-online":{"date-parts":[[2025,9]]}},"alternative-id":["20694"],"URL":"https:\/\/doi.org\/10.1007\/s11042-025-20694-5","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,13]]},"assertion":[{"value":"1 May 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 January 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 February 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 March 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not Applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}