{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T22:44:48Z","timestamp":1767998688911,"version":"3.49.0"},"reference-count":73,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T00:00:00Z","timestamp":1714176000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T00:00:00Z","timestamp":1714176000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1007\/s10044-024-01278-9","type":"journal-article","created":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T08:02:04Z","timestamp":1714204924000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["A stacked convolutional neural network framework with multi-scale attention mechanism for text-independent voiceprint recognition"],"prefix":"10.1007","volume":"27","author":[{"given":"V.","family":"Karthikeyan","sequence":"first","affiliation":[]},{"given":"S.","family":"Suja Priyadharsini","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,4,27]]},"reference":[{"issue":"6","key":"1278_CR1","doi-asserted-by":"publisher","first-page":"74","DOI":"10.1109\/MSP.2015.2462851","volume":"32","author":"JHL Hansen","year":"2015","unstructured":"Hansen JHL, Hasan T (2015) Speaker recognition by machines and humans: a tutorial review. IEEE Signal Process Mag 32(6):74\u201399","journal-title":"IEEE Signal Process Mag"},{"issue":"2","key":"1278_CR2","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1109\/TASSP.1987.1165110","volume":"35","author":"D Burton","year":"1987","unstructured":"Burton D (1987) Text-dependent speaker verification using vector quantization source coding. IEEE Trans Acoust 35(2):133\u2013143","journal-title":"IEEE Trans Acoust"},{"issue":"1","key":"1278_CR3","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1109\/89.365379","volume":"3","author":"DA Reynolds","year":"1995","unstructured":"Reynolds DA, Rose RC (1995) Robust text-independent speaker identification using gaussian mixture speaker models. IEEE Trans Speech Audio Process 3(1):72\u201383","journal-title":"IEEE Trans Speech Audio Process"},{"issue":"1\u20133","key":"1278_CR4","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1006\/dspr.1999.0361","volume":"10","author":"DA Reynolds","year":"2000","unstructured":"Reynolds DA, Quatieri TF, Dunn RB (2000) Speaker verification using adapted Gaussian mixture models. Digit Signal Process 10(1\u20133):19\u201341","journal-title":"Digit Signal Process"},{"key":"1278_CR5","doi-asserted-by":"crossref","unstructured":"Campbell WM, Sturim DE, Reynolds DA, Solomonoff A (2006) SVM based speaker verification using a GMM supervector kernel and NAP variability compensation. In: Proceedings.2006 IEEE international conference on acoustics, speech and signal processing, 2006. ICASSP 2006, 1. IEEE, pp I-I","DOI":"10.1109\/ICASSP.2006.1659966"},{"issue":"5","key":"1278_CR6","doi-asserted-by":"publisher","first-page":"308","DOI":"10.1109\/LSP.2006.870086","volume":"13","author":"WM Campbell","year":"2006","unstructured":"Campbell WM, Sturim DE, Reynolds DA (2006) Support vector machines using GMM supervectors for speaker verification. IEEE Signal Process Lett 13(5):308\u2013311","journal-title":"IEEE Signal Process Lett"},{"key":"1278_CR7","unstructured":"Dehak N (2009) Discriminative and generative approaches for long-and short-term speaker characteristics modeling: application to speaker verification (Doctoral dissertation, \u00c9cole de technologie sup\u00e9rieure)"},{"issue":"4","key":"1278_CR8","doi-asserted-by":"publisher","first-page":"788","DOI":"10.1109\/TASL.2010.2064307","volume":"19","author":"N Dehak","year":"2011","unstructured":"Dehak N, Kenny PJ, Dehak R, Dumouchel P, Ouellet P (2011) Front-end factor analysis for speaker verification. IEEE Trans Audio Speech Lang Process 19(4):788\u2013798","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"1278_CR9","doi-asserted-by":"crossref","unstructured":"Garcia-Romero D, Espy-Wilson CY (2011) Analysis of i-vector length normalization in speaker recognition systems. In: Twelfth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2011-53"},{"key":"1278_CR10","doi-asserted-by":"crossref","unstructured":"Cumani S, Plchot O, Laface P (2013) Probabilistic linear discriminant analysis of i-vector posterior distributions. In: 2013 IEEE international conference on acoustics, speech and signal processing. IEEE, pp 7644\u20137648","DOI":"10.1109\/ICASSP.2013.6639150"},{"issue":"6","key":"1278_CR11","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1080\/02564602.2017.1357507","volume":"35","author":"RK Das","year":"2018","unstructured":"Das RK, MahadevaPrasanna SR (2018) Speaker verification from short utterance perspective: a review. IETE Tech Rev 35(6):599\u2013617","journal-title":"IETE Tech Rev"},{"issue":"2","key":"1278_CR12","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1049\/iet-bmt.2017.0065","volume":"7","author":"A Poddar","year":"2017","unstructured":"Poddar A, Sahidullah M, Saha G (2017) Speaker verification with short utterances: a review of challenges, trends and opportunities. IET Biom 7(2):91\u2013101","journal-title":"IET Biom"},{"key":"1278_CR13","doi-asserted-by":"crossref","unstructured":"Sarkar AK, Matrouf D, Bousquet PM, Bonastre J-F (2012) Study of the effect of i-vector modeling on short and mismatch utterance duration for speaker verification. In: Thirteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2012-347"},{"key":"1278_CR14","doi-asserted-by":"crossref","unstructured":"Lei Y, Scheffer N, Ferrer L, McLaren M (2014) A novel scheme for speaker recognition using a phonetically-aware deep neural network. In: 2014 IEEE international conference on acoustics, speech and signal processing (ICASSP), IEEE, pp 1695\u20131699","DOI":"10.1109\/ICASSP.2014.6853887"},{"key":"1278_CR15","unstructured":"Gonzalez-Dominguez J (2014) Deep neural networks for small footprint text-dependent speaker verification. In: ICASSP, vol 14, pp 4052\u20134056"},{"key":"1278_CR16","doi-asserted-by":"crossref","unstructured":"Snyder D, Garcia-Romero D, Povey D, Khudanpur S (2017) Deep neural network embeddings for text-independent speaker verification. In: Interspeech, pp 999\u20131003","DOI":"10.21437\/Interspeech.2017-620"},{"key":"1278_CR17","unstructured":"Li C, Ma X, Jiang B, Li X, Zhang X, Liu X, Cao Y, Kannan A, Zhu Z (2017) Deep speaker: an end-to-end neural speaker embedding system. http:\/\/arxiv.org\/abs\/1705.02304"},{"key":"1278_CR18","doi-asserted-by":"crossref","unstructured":"Zhang C, Koishida K (2017) End-to-end text-independent speaker verification with triplet loss on short utterances. In: Proceedings of the Interspeech","DOI":"10.21437\/Interspeech.2017-1608"},{"key":"1278_CR19","doi-asserted-by":"crossref","unstructured":"Heigold G, Moreno I, Bengio S, Shazeer N (2016) End-to-end text-dependent speaker verification. In: 2016 IEEE international conference on acoustics, speech and signal processing (ICASSP), IEEE, pp 5115\u20135119","DOI":"10.1109\/ICASSP.2016.7472652"},{"key":"1278_CR20","doi-asserted-by":"crossref","unstructured":"Wan L, Wang Q, Papir A, Moreno IL (2018) Generalized end-to-end loss for speaker verification. In: 2018 IEEE international conference on acoustics, speech and signal processing (ICASSP), IEEE, pp 4879\u20134883","DOI":"10.1109\/ICASSP.2018.8462665"},{"key":"1278_CR21","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"1278_CR22","doi-asserted-by":"crossref","unstructured":"Szegedy C, Liu W, Jia Y, Sermanet P, Reed S, Anguelov D, Erhan D, Vanhoucke V, Rabinovich A (2015) Going deeper with convolutions. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1\u20139","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"1278_CR23","first-page":"5998","volume":"30","author":"A Vaswani","year":"2017","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inf Process Syst 30:5998\u20136008","journal-title":"Adv Neural Inf Process Syst"},{"key":"1278_CR24","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2017) Squeeze-and-excitation networks. http:\/\/arxiv.org\/abs\/1709.01507","DOI":"10.1109\/CVPR.2018.00745"},{"key":"1278_CR25","unstructured":"Zhang H, Goodfellow I, Metaxas D, Odena A (2018) Self-attention generative adversarial networks. http:\/\/arxiv.org\/abs\/1805.08318"},{"key":"1278_CR26","doi-asserted-by":"crossref","unstructured":"Zhang S-X, Chen Z, Zhao Y, Li J, Gong Y (2016) End-to-End attention based text-dependent speaker verification. In: Spoken language technology workshop (SLT), 2016 IEEE, IEEE, pp 171\u2013178","DOI":"10.1109\/SLT.2016.7846261"},{"key":"1278_CR27","doi-asserted-by":"crossref","unstructured":"Matejka P, et al (2016) Analysis of DNN approaches to speaker identification. In: IEEE ICASSP, pp 5100\u20135104","DOI":"10.1109\/ICASSP.2016.7472649"},{"issue":"10","key":"1278_CR28","doi-asserted-by":"publisher","first-page":"1671","DOI":"10.1109\/LSP.2015.2420092","volume":"22","author":"F Richardson","year":"2015","unstructured":"Richardson F, Reynolds D, Dehak N (2015) Deep neural network approaches to speaker and language recognition. IEEE Signal Process Lett 22(10):1671\u20131675","journal-title":"IEEE Signal Process Lett"},{"key":"1278_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13636-015-0056-7","volume":"2015","author":"Z Zhang","year":"2015","unstructured":"Zhang Z, Wang L, Kai A, Yamada T, Li W, Iwahashi M (2015) Deep neural network-based bottleneck feature and denoising autoencoder-based dereverberation for distant-talking speaker identification. EURASIP J Audio Speech Music Process 2015:1\u201313","journal-title":"EURASIP J Audio Speech Music Process"},{"key":"1278_CR30","doi-asserted-by":"crossref","unstructured":"Richardson FS, Melot JT, Brandstein MS, Reynolds DA (2016) Speaker recognition using real versus synthetic parallel data for DNN channel compensation. In: Proceedings of the INTERSPEECH, pp 1\u20136","DOI":"10.21437\/Interspeech.2016-544"},{"key":"1278_CR31","doi-asserted-by":"crossref","unstructured":"Snyder D, Garcia-Romero D, Sell G, Povey D, Khudanpur S (2018) X-vectors: robust DNN embeddings for speaker recognition. In: Proceedings of the IEEE ICASSP, pp 5329\u20135333","DOI":"10.1109\/ICASSP.2018.8461375"},{"issue":"3","key":"1278_CR32","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s12046-021-01649-6","volume":"46","author":"V Karthikeyan","year":"2021","unstructured":"Karthikeyan V, Suja-Priyadharsini S (2021) A strong hybrid AdaBoost classification algorithm for speaker recognition. S\u0101dhan\u0101. 46(3):1\u201319. https:\/\/doi.org\/10.1007\/s12046-021-01649-6","journal-title":"S\u0101dhan\u0101."},{"key":"1278_CR33","doi-asserted-by":"publisher","first-page":"1616","DOI":"10.1109\/TIFS.2019.2941773","volume":"15","author":"A Chowdhury","year":"2019","unstructured":"Chowdhury A, Ross A (2019) Fusing MFCC and LPC features using 1D triplet CNN for speaker recognition in severely degraded audio signals. IEEE Trans Inf Forensics Secur 15:1616\u20131629","journal-title":"IEEE Trans Inf Forensics Secur"},{"issue":"2","key":"1278_CR34","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1080\/0952813X.2022.2092560","volume":"36","author":"V Karthikeyan","year":"2022","unstructured":"Karthikeyan V, SujaPriyadharsini S (2022) Modified layer deep convolution neural network for text-independent speaker recognition. J Exp Theor Artif Intell 36(2):273\u2013285","journal-title":"J Exp Theor Artif Intell"},{"key":"1278_CR35","doi-asserted-by":"crossref","unstructured":"Qin X, Li N, Weng C, Su D, Li M (2022) Simple attention module based speaker verification with iterative noisy label detection. In: ICASSP 2022-2022 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 6722\u20136726. IEEE","DOI":"10.1109\/ICASSP43922.2022.9746294"},{"key":"1278_CR36","doi-asserted-by":"crossref","unstructured":"Zhu H, Lee KA, Li H (2021) Serialized multi-layer multi-head attention for neural speaker embedding. http:\/\/arxiv.org\/abs\/2107.06493","DOI":"10.21437\/Interspeech.2021-2210"},{"key":"1278_CR37","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1016\/j.neucom.2019.08.046","volume":"368","author":"T Bian","year":"2019","unstructured":"Bian T, Chen F, Xu L (2019) Self-attention based speaker recognition using Cluster-Range Loss. Neurocomputing 368:59\u201368","journal-title":"Neurocomputing"},{"issue":"4","key":"1278_CR38","doi-asserted-by":"publisher","first-page":"1233","DOI":"10.3390\/s20041233","volume":"20","author":"Y Yao","year":"2020","unstructured":"Yao Y, Zhang S, Yang S, Gui G (2020) Learning attention representation with a multi-scale CNN for gear fault diagnosis under different working conditions. Sensors 20(4):1233","journal-title":"Sensors"},{"key":"1278_CR39","doi-asserted-by":"crossref","unstructured":"Cai W, Chen J, Li M (2018) Exploring the encoding layer and loss function in end-to-end speaker and language recognition system. In: Proceedings of the Odyssey 2018: the speaker and language recognition workshop, Les Sables d\u2019Olonne, France, pp 74\u201381","DOI":"10.21437\/Odyssey.2018-11"},{"key":"1278_CR40","doi-asserted-by":"crossref","unstructured":"Okabe K, Koshinaka T, Shinoda K (2018) Attentive statistics pooling for deep speaker embedding. In: Proceedings of the 19th annual conference of the international speech communication association (Interspeech), Hyderabad, India, pp 2252\u20132256","DOI":"10.21437\/Interspeech.2018-993"},{"key":"1278_CR41","doi-asserted-by":"crossref","unstructured":"Arandjelovi\u0107 R, Gronat P, Torii A, Pajdla T, Sivic J (2016) NetVLAD: CNN architecture for weakly supervised place recognition. In: Proceedings of the 2016 IEEE conference on computer vision and pattern recognition (CVPR), Las Vegas, NV, USA, pp 5297\u20135307","DOI":"10.1109\/CVPR.2016.572"},{"key":"1278_CR42","doi-asserted-by":"crossref","unstructured":"Xie W, Nagrani A, Chung JS, Zisserman A (2019) Utterance-level aggregation for speaker recognition in the wild. In: Proceedings of the IEEE international conference on acoustics, speech and signal processing (ICASSP), Brighton, UK, pp 5791\u20135795","DOI":"10.1109\/ICASSP.2019.8683120"},{"issue":"6","key":"1278_CR43","doi-asserted-by":"publisher","first-page":"2147","DOI":"10.3390\/s22062147","volume":"22","author":"M Wang","year":"2022","unstructured":"Wang M, Feng D, Su T, Chen M (2022) Attention-based temporal-frequency aggregation for speaker verification. Sensors 22(6):2147","journal-title":"Sensors"},{"key":"1278_CR44","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/s10044-011-0243-9","volume":"15","author":"R San-Segundo","year":"2012","unstructured":"San-Segundo R et al (2012) Design, development and field evaluation of a Spanish into sign language translation system. Pattern Anal Appl 15:203\u2013224","journal-title":"Pattern Anal Appl"},{"key":"1278_CR45","doi-asserted-by":"publisher","unstructured":"Karthikeyan V, Suja Priyadharsini S (2023) A focus module-based lightweight end-to-end CNN framework for voiceprint recognition. SIViP (2023). https:\/\/doi.org\/10.1007\/s11760-023-02500-7","DOI":"10.1007\/s11760-023-02500-7"},{"issue":"3","key":"1278_CR46","doi-asserted-by":"publisher","first-page":"1033","DOI":"10.1111\/1556-4029.15006","volume":"46","author":"V Karthikeyan","year":"2022","unstructured":"Karthikeyan V, Suja PS (2022) Hybrid machine learning classification scheme for speaker identification. J Forensic Sci 46(3):1033\u20131048. https:\/\/doi.org\/10.1111\/1556-4029.15006","journal-title":"J Forensic Sci"},{"key":"1278_CR47","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511841644","volume-title":"Introductory econometrics for finance","author":"C Brooks","year":"2008","unstructured":"Brooks C (2008) Introductory econometrics for finance, 2nd edn. Cambridge University Press, Cambridge","edition":"2"},{"key":"1278_CR48","unstructured":"Feng L (2004) Speaker recognition (Master's thesis, Technical University of Denmark, DTU, DK-2800 Kgs. Lyngby, Denmark"},{"issue":"1","key":"1278_CR49","doi-asserted-by":"publisher","first-page":"504","DOI":"10.3390\/make1010031","volume":"1","author":"P Dhakal","year":"2019","unstructured":"Dhakal P, Damacharla P, Javaid AY, Devabhaktuni V (2019) A near real-time automatic speaker recognition architecture for voice-based user interface. Mach Learn Knowl Extr 1(1):504\u2013520","journal-title":"Mach Learn Knowl Extr"},{"key":"1278_CR50","unstructured":"Banerjee A, Dubey A, Menon A, Nanda S, Nandi GC (2018) Speaker recognition using deep belief networks. http:\/\/arxiv.org\/abs\/1805.08865"},{"key":"1278_CR51","unstructured":"Garofolo JS (1993) Timit acoustic phonetic continuous speech corpus. Linguistic Data Consortium"},{"key":"1278_CR52","unstructured":"Wildermoth BR, Paliwal KK (2003) GMM based speaker recognition on readily available databases. In: Microelectronic engineering research conference, Brisbane, Australia, vol 7, p 55"},{"key":"1278_CR53","doi-asserted-by":"crossref","unstructured":"Lukic Y., Vogt C., D\u00fcrr O., & Stadelmann T. 2016. Speaker identification and clustering using convolutional neural networks. In 2016 IEEE 26th international workshop on machine learning for signal processing (MLSP) (pp. 1\u20136). IEEE.","DOI":"10.1109\/MLSP.2016.7738816"},{"key":"1278_CR54","unstructured":"Thanda Setty V (2018) Speaker recognition using deep neural networks with reduced complexity (Thesis). Texas State University, San Marcos, Texas"},{"key":"1278_CR55","doi-asserted-by":"crossref","unstructured":"Ghezaiel W, Brun L, L\u00e9zoray O (2021) Hybrid network for end-to-end text-independent speaker identification. In: 2020 25th international conference on pattern recognition (ICPR), pp 2352\u20132359. IEEE","DOI":"10.1109\/ICPR48806.2021.9413293"},{"key":"1278_CR56","unstructured":"Li W (2021) Speaker identification from raw waveform with LineNet. http:\/\/arxiv.org\/abs\/2105.14826"},{"key":"1278_CR57","doi-asserted-by":"crossref","unstructured":"Nunes JAC, Mac\u00eado D, Zanchettin C (2020) AM-mobilenet1D: a portable model for speaker recognition. In: 2020 International joint conference on neural networks (IJCNN), pp 1\u20138. IEEE","DOI":"10.1109\/IJCNN48605.2020.9207519"},{"key":"1278_CR58","doi-asserted-by":"crossref","unstructured":"Ravanelli M, Bengio Y (2018) Speaker recognition from raw waveform with sincnet. In: 2018 IEEE spoken language technology workshop (SLT), pp 1021\u20131028. IEEE","DOI":"10.1109\/SLT.2018.8639585"},{"key":"1278_CR59","unstructured":"Nunes JAC, Mac\u00eado D, Zanchettin C (2019) Additive margin sincnet for speaker recognition. In: Proceedings of the 2019 IEEE international joint conference on neural networks (IJCNN), Budapest, Hungary, 14\u201319, pp 1\u20135"},{"issue":"21","key":"1278_CR60","doi-asserted-by":"publisher","first-page":"7522","DOI":"10.3390\/app10217522","volume":"10","author":"L Chowdhury","year":"2020","unstructured":"Chowdhury L, Zunair H, Mohammed N (2020) Robust deep speaker recognition: learning latent representation with joint angular margin loss. Appl Sci 10(21):7522","journal-title":"Appl Sci"},{"key":"1278_CR61","doi-asserted-by":"crossref","unstructured":"Prachi NN, Nahiyan FM, Habibullah M, Khan R (2022) Deep learning based speaker recognition system with CNN and LSTM techniques. In: 2022 interdisciplinary research in technology and management (IRTM), pp 1\u20136. IEEE","DOI":"10.1109\/IRTM54583.2022.9791766"},{"key":"1278_CR62","unstructured":"NIST Multimodal Information Group (2008) NIST Speaker Recognition Evaluation Training Set Part 1 LDC2011S05; Linguistic Data Consortium: Philadelphia, PA, USA, 2011"},{"key":"1278_CR63","doi-asserted-by":"crossref","unstructured":"Al-Kaltakchi MT, Woo WL, Dlay SS, Chambers JA (2017) Comparison of I-vector and GMM-UBM approaches to speaker identification with TIMIT and NIST 2008 databases in challenging environments. In: 2017 25th European signal processing conference (EUSIPCO), pp 533\u2013537. IEEE","DOI":"10.23919\/EUSIPCO.2017.8081264"},{"key":"1278_CR64","doi-asserted-by":"crossref","unstructured":"Chang J, Wang D (2017) Robust speaker recognition based on DNN\/i-vectors and speech separation. In: 2017 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 5415\u20135419. IEEE","DOI":"10.1109\/ICASSP.2017.7953191"},{"issue":"7","key":"1278_CR65","doi-asserted-by":"publisher","first-page":"2399","DOI":"10.3390\/s18072399","volume":"18","author":"C Sun","year":"2018","unstructured":"Sun C, Yang Y, Wen C, Xie K, Wen F (2018) Voiceprint identification for limited dataset using the deep migration hybrid model based on transfer learning. Sensors 18(7):2399","journal-title":"Sensors"},{"key":"1278_CR66","doi-asserted-by":"crossref","unstructured":"Wen Y, Zhou T, Singh R, Raj B (2018) A corrective learning approach for text-independent speaker verification. In: 2018 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 4894\u20134898. IEEE","DOI":"10.1109\/ICASSP.2018.8461340"},{"key":"1278_CR67","doi-asserted-by":"crossref","unstructured":"Ribas D, Vincent E (2019) An improved uncertainty propagation method for robust i-vector based speaker recognition. In: ICASSP 2019-2019 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 6331\u20136335. IEEE","DOI":"10.1109\/ICASSP.2019.8683132"},{"key":"1278_CR68","unstructured":"Cieri C, Miller D, Walker K (2004) Fisher English training speech parts 1 and 2. In: Philadelphia: linguistic data consortium. University of Pennsylvania, Philadelphia"},{"key":"1278_CR69","doi-asserted-by":"crossref","unstructured":"Tan B, Li Q, Foresta R (2010) An automatic non-native speaker recognition system. In: 2010 IEEE international conference on technologies for homeland security (HST), pp 77\u201383. IEEE","DOI":"10.1109\/THS.2010.5655088"},{"key":"1278_CR70","doi-asserted-by":"crossref","unstructured":"McClanahan R, De Leon P (2013) Towards a more efficient SVM supervector speaker verification system using Gaussian reduction and a tree-structured hash (No. SAND2013-2166C). Sandia National Lab. (SNL-NM), Albuquerque, NM (United States)","DOI":"10.21437\/Interspeech.2013-688"},{"key":"1278_CR71","doi-asserted-by":"crossref","unstructured":"Chowdhury A, Ross A (2017) Extracting sub-glottal and supra-glottal features from MFCC using convolutional neural networks for speaker identification in degraded audio signals. In: 2017 IEEE international joint conference on biometrics (IJCB), pp 608\u2013617. IEEE.","DOI":"10.1109\/BTAS.2017.8272748"},{"issue":"3","key":"1278_CR72","first-page":"764","volume":"34","author":"MK Nammous","year":"2022","unstructured":"Nammous MK, Saeed K, Kobojek P (2022) Using a small amount of text-independent speech data for a BiLSTM large-scale speaker identification approach. J King Saud Univ-Comput Inf Sci 34(3):764\u2013770","journal-title":"J King Saud Univ-Comput Inf Sci"},{"key":"1278_CR73","doi-asserted-by":"publisher","first-page":"109826","DOI":"10.1016\/j.asoc.2022.109826","volume":"131","author":"V Karthikeyan","year":"2022","unstructured":"Karthikeyan V, Suja PS (2022) Adaptive boosted random forest-support vector machine based classification scheme for speaker identification. Appl Soft Comput 131:109826","journal-title":"Appl Soft Comput"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-024-01278-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-024-01278-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-024-01278-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,17]],"date-time":"2024-11-17T05:12:04Z","timestamp":1731820324000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-024-01278-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,27]]},"references-count":73,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2024,6]]}},"alternative-id":["1278"],"URL":"https:\/\/doi.org\/10.1007\/s10044-024-01278-9","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,4,27]]},"assertion":[{"value":"11 July 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 April 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 April 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not Applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}],"article-number":"48"}}