{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:14:20Z","timestamp":1777490060167,"version":"3.51.4"},"reference-count":75,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T00:00:00Z","timestamp":1771286400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T00:00:00Z","timestamp":1771286400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Evolving Systems"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s12530-026-09797-y","type":"journal-article","created":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T11:02:50Z","timestamp":1771326170000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Multidimensional acoustic feature fusion with attention-guided light weighted CNN for improved speaker recognition"],"prefix":"10.1007","volume":"17","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2974-6554","authenticated-orcid":false,"given":"V.","family":"Karthikeyan","sequence":"first","affiliation":[]},{"given":"S. Suja","family":"Priyadharsini","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,17]]},"reference":[{"key":"9797_CR1","doi-asserted-by":"crossref","unstructured":"Al-Dujaili MJ, Ahily HJS, Fatlawi A (2023). Gender recognition of human based on speech characteristics by features fusion with K_NN and MLPNN classifications. In: AIP Conference Proceedings (Vol. 2977, No. 1, p. 020092). AIP Publishing LLC","DOI":"10.1063\/5.0181969"},{"key":"9797_CR2","doi-asserted-by":"publisher","first-page":"18940","DOI":"10.1109\/ACCESS.2019.2895688","volume":"7","author":"SU Amin","year":"2019","unstructured":"Amin SU, Alsulaiman M, Muhammad G, Bencherif MA, Hossain MS (2019) Multilevel weighted feature fusion using convolutional neural networks for EEG motor imagery classification. IEEE Access 7:18940\u201318950","journal-title":"IEEE Access"},{"key":"9797_CR3","unstructured":"Banerjee A, Dubey A, Menon A, Nanda S, Nandi GC (2018) Speaker recognition using deep belief networks. ArXiv Preprint arXiv :180508865"},{"issue":"2","key":"9797_CR4","doi-asserted-by":"publisher","first-page":"1913","DOI":"10.1007\/s11277-022-09640-y","volume":"125","author":"KB Bhangale","year":"2022","unstructured":"Bhangale KB, Kothandaraman M (2022) Survey of deep learning paradigms for speech processing. Wireless Pers Commun 125(2):1913\u20131949","journal-title":"Wireless Pers Commun"},{"key":"9797_CR5","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511841644","volume-title":"Introductory econometrics for finance","author":"C Brooks","year":"2008","unstructured":"Brooks C (2008) Introductory econometrics for finance, 2nd edn. Cambridge University Press, Cambridge, UK","edition":"2"},{"key":"9797_CR6","doi-asserted-by":"crossref","unstructured":"Byeon H, Sengar AS, Karthikeyan V, Sheeba PM (2025). Optimized improved CNN enabled automated classification of brain tumor. In: AIP conference proceedings (Vol. 3306, No. 1, p. 040005). AIP Publishing LLC","DOI":"10.1063\/5.0275941"},{"issue":"2\u20133","key":"9797_CR7","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1016\/j.csl.2005.06.003","volume":"20","author":"WM Campbell","year":"2006","unstructured":"Campbell WM, Campbell JP, Reynolds DA, Singer E, Torres-Carrasquillo PA (2006) Support vector machines for speaker and language recognition. Comput Speech Lang 20(2\u20133):210\u2013229","journal-title":"Comput Speech Lang"},{"issue":"4","key":"9797_CR8","first-page":"385","volume":"20","author":"V Chandrabanshi","year":"2024","unstructured":"Chandrabanshi V, Domnic S (2024) Hnet: a deep learning based hybrid network for speaker dependent visual speech recognition. Int J Hybrid Intell Syst 20(4):385\u2013401","journal-title":"Int J Hybrid Intell Syst"},{"key":"9797_CR9","doi-asserted-by":"crossref","unstructured":"Chang J, Wang D (2017) Robust speaker recognition based on DNN\/i-vectors and speech separation. In: 2017 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE\u00a0pp. 5415\u20135419","DOI":"10.1109\/ICASSP.2017.7953191"},{"issue":"10","key":"9797_CR10","doi-asserted-by":"publisher","first-page":"1440","DOI":"10.1109\/LSP.2018.2860246","volume":"25","author":"M Chen","year":"2018","unstructured":"Chen M, He X, Yang J, Zhang H (2018) 3-d convolutional recurrent neural networks with attention model for speech emotion recognition. IEEE Signal Process Lett 25(10):1440\u20131444","journal-title":"IEEE Signal Process Lett"},{"key":"9797_CR11","doi-asserted-by":"crossref","unstructured":"Chen YH, Lopez-Moreno I, Sainath TN, Visontai M, Alvarez R, Parada C (2015) Locally-connected and convolutional neural networks for small footprint speaker recognition. In: Sixteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2015-297"},{"key":"9797_CR12","doi-asserted-by":"crossref","unstructured":"Chung JS, Huh J, Mun S, Lee M, Heo HS, Choe S, Han I (2020). In defence of metric learning for speaker recognition. arXiv preprint arXiv:2003.11982.","DOI":"10.21437\/Interspeech.2020-1064"},{"key":"9797_CR13","doi-asserted-by":"crossref","unstructured":"Chung JS, Nagrani A, Zisserman A (2018). Voxceleb2: deep speaker recognition. arXiv preprint arXiv:1806.05622","DOI":"10.21437\/Interspeech.2018-1929"},{"issue":"1","key":"9797_CR14","doi-asserted-by":"publisher","first-page":"504","DOI":"10.3390\/make1010031","volume":"1","author":"P Dhakal","year":"2019","unstructured":"Dhakal P, Damacharla P, Javaid AY, Devabhaktuni V (2019) A near real-time automatic speaker recognition architecture for voice-based user interface. Mach Learn Knowl Extr 1(1):504\u2013520","journal-title":"Mach Learn Knowl Extr"},{"issue":"21","key":"9797_CR15","doi-asserted-by":"publisher","first-page":"10989","DOI":"10.3390\/app122110989","volume":"12","author":"Y Dong","year":"2022","unstructured":"Dong Y, Chen Z, Li Z, Gao F (2022) A multi-branch multi-scale deep learning image fusion algorithm based on densenet. Appl Sci 12(21):10989","journal-title":"Appl Sci"},{"key":"9797_CR16","doi-asserted-by":"crossref","unstructured":"Dong X, Song J (2022). Application of voiceprint recognition based on improved ECAPA-TDNN. In: 2022 4th international academic exchange conference on science and technology innovation (IAECST). IEEE\u00a0pp. 1196\u20131199","DOI":"10.1109\/IAECST57965.2022.10062023"},{"key":"9797_CR17","unstructured":"Evans Kiplagat (2020). Speaker recognition dataset,\u00a0https:\/\/www.kaggle.com\/datasets\/kongaevans\/speaker-recognition-dataset\/code? dataset Id\u2009=\u2009470244."},{"key":"9797_CR18","unstructured":"Feng L (2004). Speaker recognition (Master\u2019s thesis, Technical University of Denmark, DTU, DK-2800 Kgs. Lyngby, Denmark)"},{"issue":"9","key":"9797_CR19","doi-asserted-by":"publisher","first-page":"859","DOI":"10.1016\/S0167-8655(97)00073-1","volume":"18","author":"S Furui","year":"1997","unstructured":"Furui S (1997) Recent advances in speaker recognition. Pattern Recognit Lett 18(9):859\u2013872","journal-title":"Pattern Recognit Lett"},{"key":"9797_CR20","unstructured":"Garofolo JS (1993) TIMIT acoustic phonetic continuous speech corpus. Linguistic Data Consortium, 1993"},{"key":"9797_CR21","doi-asserted-by":"crossref","unstructured":"Ghezaiel W, Brun L, L\u00e9zoray O (2021) Hybrid network for end-to-end text-independent speaker identification. In: 2020 25th international conference on pattern recognition (ICPR). IEEE\u00a0pp. 2352\u20132359","DOI":"10.1109\/ICPR48806.2021.9413293"},{"key":"9797_CR22","doi-asserted-by":"crossref","unstructured":"Hajavi A, Etemad A (2019) A deep neural network for short-segment speaker recognition. arXiv preprint arXiv:1907.10420.","DOI":"10.21437\/Interspeech.2019-2240"},{"key":"9797_CR23","unstructured":"Jahangir R (2021) Speaker identification through feature fusion based deep learning (Doctoral dissertation, University of Malaya (Malaysia))"},{"key":"9797_CR24","doi-asserted-by":"publisher","first-page":"32187","DOI":"10.1109\/ACCESS.2020.2973541","volume":"8","author":"R Jahangir","year":"2020","unstructured":"Jahangir R, Teh YW, Memon NA, Mujtaba G, Zareei M, Ishtiaq U, Akhtar MZ, Ali I (2020) Text-independent speaker identification through feature fusion and deep neural network. IEEE Access 8:32187\u201332202","journal-title":"IEEE Access"},{"issue":"4","key":"9797_CR25","doi-asserted-by":"publisher","first-page":"1564","DOI":"10.1109\/TCDS.2021.3123979","volume":"14","author":"P Jiang","year":"2021","unstructured":"Jiang P, Xu X, Tao H, Zhao L, Zou C (2021) Convolutional-recurrent neural networks with multiple attention mechanisms for speech emotion recognition. IEEE Trans Cogn Dev Syst 14(4):1564\u20131573","journal-title":"IEEE Trans Cogn Dev Syst"},{"issue":"4","key":"9797_CR26","doi-asserted-by":"publisher","first-page":"2407","DOI":"10.1007\/s11277-024-11607-0","volume":"138","author":"PR Kanna","year":"2024","unstructured":"Kanna PR, Santhi P (2024) An enhanced hybrid intrusion detection using mapreduce-optimized black widow convolutional LSTM neural networks. Wireless Pers Commun 138(4):2407\u20132445","journal-title":"Wireless Pers Commun"},{"key":"9797_CR27","unstructured":"Karthikeyan V (2022) Text independent speaker recognition using hybrid ensemble and adaptive boosting techniques"},{"key":"9797_CR28","doi-asserted-by":"crossref","unstructured":"Karthikeyan V, Kumar PS, Karthikeyan P (2023). Automatic recognition of speaker labels using CNN-SVM scheme. In: International conference on innovative computing and communication. Springer Nature Singapore,\u00a0Singapore, pp. 513\u2013529","DOI":"10.1007\/978-981-99-3315-0_39"},{"key":"9797_CR29","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-024-03785-6","author":"V Karthikeyan","year":"2025","unstructured":"Karthikeyan V, Praveen S, Nandan SS (2025a) Lightweight deep hybrid CNN with attention mechanism for enhanced underwater image restoration. Vis Comput. https:\/\/doi.org\/10.1007\/s00371-024-03785-6","journal-title":"Vis Comput"},{"key":"9797_CR30","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-025-20694-5","author":"V Karthikeyan","year":"2025","unstructured":"Karthikeyan V, Priyadharsini SS, Balamurugan K (2025b) Attention-based multi dimension fused-feature convolutional neural network framework for speaker recognition. Multimedia Tools Appl. https:\/\/doi.org\/10.1007\/s11042-025-20694-5","journal-title":"Multimedia Tools Appl"},{"key":"9797_CR31","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2025.110984","volume":"197","author":"V Karthikeyan","year":"2025","unstructured":"Karthikeyan V, Saranya P, Natchiyar M (2025c) A lightweight ECA-based DCNN approach for speech command recognition. Comput Biol Med 197:110984","journal-title":"Comput Biol Med"},{"issue":"4","key":"9797_CR32","first-page":"1893","volume":"14","author":"V Karthikeyan","year":"2024","unstructured":"Karthikeyan V, Raja E, Gurumoorthy K (2024) Denoising convolutional neural network with energy-based attention for image enhancement. J Appl Anal Comput 14(4):1893\u20131914","journal-title":"J Appl Anal Comput"},{"key":"9797_CR33","doi-asserted-by":"crossref","unstructured":"Kathikeyan V, Balamurugan K (2024) Underwater multiple access communication using spread spectrum scheme. National Academy Science Letters, pp 1\u20135","DOI":"10.1007\/s40009-024-01589-9"},{"issue":"31","key":"9797_CR34","doi-asserted-by":"publisher","first-page":"75557","DOI":"10.1007\/s11042-024-18316-7","volume":"83","author":"WA Khan","year":"2024","unstructured":"Khan WA, ul Qudous H, Farhan AA (2024) Speech emotion recognition using feature fusion: a hybrid approach to deep learning. Multimedia Tools Appl 83(31):75557\u201375584","journal-title":"Multimedia Tools Appl"},{"issue":"1","key":"9797_CR35","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1109\/TCSS.2022.3228649","volume":"11","author":"Y Khurana","year":"2022","unstructured":"Khurana Y, Gupta S, Sathyaraj R, Raja SP (2022) Robinnet: a multimodal speech emotion recognition system with speaker recognition for social interactions. IEEE Trans Comput Social Syst 11(1):478\u2013487","journal-title":"IEEE Trans Comput Social Syst"},{"key":"9797_CR36","doi-asserted-by":"crossref","unstructured":"Lawson A, Vabishchevich P, Huggins M, Ardis P, Battles B, Stauffer A (2011) Survey and evaluation of acoustic features for speaker recognition. In: 2011 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp. 5444\u20135447","DOI":"10.1109\/ICASSP.2011.5947590"},{"issue":"1","key":"9797_CR37","doi-asserted-by":"publisher","DOI":"10.1186\/s13636-025-00396-4","volume":"2025","author":"P Li","year":"2025","unstructured":"Li P, Hoi LM, Wang Y, Yang X, Im SK (2025) Enhancing speaker recognition with CRET model: a fusion of CONV2D, RESNET and ECAPA-TDNN. EURASIP J Audio Speech Music Process 2025(1):9","journal-title":"EURASIP J Audio Speech Music Process"},{"key":"9797_CR38","unstructured":"Li W (2021) Speaker identification from raw waveform with LineNet. arXiv preprint arXiv:2105.14826"},{"issue":"10","key":"9797_CR39","doi-asserted-by":"publisher","first-page":"1440","DOI":"10.3390\/e25101440","volume":"25","author":"H Lian","year":"2023","unstructured":"Lian H, Lu C, Li S, Zhao Y, Tang C, Zong Y (2023) A survey of deep learning-based multimodal emotion recognition: speech, text, and face. Entropy 25(10):1440","journal-title":"Entropy"},{"issue":"16","key":"9797_CR40","doi-asserted-by":"publisher","first-page":"3149","DOI":"10.3390\/electronics13163149","volume":"13","author":"L Liao","year":"2024","unstructured":"Liao L, Wu S, Song C, Fu J (2024) PH-CBAM: a parallel hybrid CBAM network with multi-feature extraction for facial expression recognition. Electronics 13(16):3149","journal-title":"Electronics"},{"key":"9797_CR41","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2023.103010","volume":"156","author":"M Liu","year":"2024","unstructured":"Liu M, Raj ANJ, Rajangam V, Ma K, Zhuang Z, Zhuang S (2024) Multiscale-multichannel feature extraction and classification through one-dimensional convolutional neural network for speech emotion recognition. Speech Commun 156:103010","journal-title":"Speech Commun"},{"issue":"7","key":"9797_CR42","doi-asserted-by":"publisher","first-page":"3244","DOI":"10.1109\/TII.2018.2799928","volume":"14","author":"Z Liu","year":"2018","unstructured":"Liu Z, Wu Z, Li T, Li J, Shen C (2018) GMM and CNN hybrid method for short utterance speaker recognition. IEEE Trans Ind Inform 14(7):3244\u20133252","journal-title":"IEEE Trans Ind Inform"},{"key":"9797_CR43","doi-asserted-by":"crossref","unstructured":"Lukic Y, Vogt C, D\u00fcrr O, Stadelmann T (2016) Speaker identification and clustering using convolutional neural networks. In: 2016 IEEE 26th international workshop on machine learning for signal processing (MLSP). IEEE,\u00a0pp. 1\u20136","DOI":"10.1109\/MLSP.2016.7738816"},{"key":"9797_CR44","doi-asserted-by":"crossref","unstructured":"Ma B, Wang X, Zhang H, Li F, Dan J (2019). CBAM-GAN: generative adversarial networks based on convolutional block attention module. In: Artificial intelligence and security: 5th international conference, ICAIS 2019, New York, NY, USA, July 26\u201328, 2019, proceedings, part I 5. Springer International Publishing, pp. 227\u2013236","DOI":"10.1007\/978-3-030-24274-9_20"},{"key":"9797_CR45","doi-asserted-by":"crossref","unstructured":"Nagrani A, Chung JS, Zisserman A (2017) Voxceleb: a large-scale speaker identification dataset. arXiv preprint arXiv:1706.08612.","DOI":"10.21437\/Interspeech.2017-950"},{"key":"9797_CR46","unstructured":"NIST Multimodal Information Group (2008) NIST speaker recognition evaluation training set Part 1 LDC2011S05; Linguistic Data Consortium: Philadelphia, PA, USA, 2011"},{"key":"9797_CR47","doi-asserted-by":"crossref","unstructured":"Nunes JA, C, Mac\u00eado D, Zanchettin C (2020) Am-mobilenet1d: A portable model for speaker recognition. In: 2020 international joint conference on neural networks (IJCNN). IEEE\u00a0pp. 1\u20138","DOI":"10.1109\/IJCNN48605.2020.9207519"},{"key":"9797_CR48","volume":"108","author":"J Pan","year":"2022","unstructured":"Pan J, Cui W, An X, Huang X, Zhang H, Zhang S, Zhang R, Li X, Cheng W, Hu Y (2022) MapsNet: Multi-level feature constraint and fusion network for change detection. Int J Appl Earth Obs Geoinf 108:102676","journal-title":"Int J Appl Earth Obs Geoinf"},{"key":"9797_CR49","doi-asserted-by":"crossref","unstructured":"Pandiaraja P, Karthik K, Rajesh Kanna P, PC SM, Muthumanickam K. (2024). Assessing Secure cloud information sharing through authentication and encoded indexing. In: 2024 8th international conference on I-SMAC (IoT in Social, Mobile, Analytics and Cloud)(I-SMAC). IEEE,\u00a0pp. 1030\u20131037","DOI":"10.1109\/I-SMAC61858.2024.10714840"},{"issue":"1","key":"9797_CR50","first-page":"1261","volume":"29","author":"V Passricha","year":"2019","unstructured":"Passricha V, Aggarwal RK (2019) A hybrid of deep CNN and bidirectional LSTM for automatic speech recognition. J Intell Syst 29(1):1261\u20131274","journal-title":"J Intell Syst"},{"key":"9797_CR51","doi-asserted-by":"crossref","unstructured":"Peddinti V, Povey D, Khudanpur S (2015). A time delay neural network architecture for efficient modeling of long temporal contexts. In: Interspeech (Vol. 2015)\u00a0pp. 3214\u20133218","DOI":"10.21437\/Interspeech.2015-647"},{"key":"9797_CR52","doi-asserted-by":"crossref","unstructured":"Ravanelli M, Bengio Y (2018) Speaker recognition from raw waveform with SINCNET. In: 2018 IEEE spoken language technology workshop (SLT). IEEE, pp 1021\u20131028","DOI":"10.1109\/SLT.2018.8639585"},{"key":"9797_CR53","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.107661","volume":"131","author":"K Radha","year":"2024","unstructured":"Radha K, Bansal M, Pachori RB (2024) Speech and speaker recognition using raw waveform modeling for adult and children\u2019s speech: a comprehensive review. Eng Appl Artif Intell 131:107661","journal-title":"Eng Appl Artif Intell"},{"issue":"11","key":"9797_CR54","doi-asserted-by":"publisher","first-page":"6410","DOI":"10.3390\/app13116410","volume":"13","author":"P Safari","year":"2023","unstructured":"Safari P, India M, Hernando J (2023) Self-attention networks in speaker recognition. Appl Sci 13(11):6410","journal-title":"Appl Sci"},{"key":"9797_CR55","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2024.109100","volume":"115","author":"B Saritha","year":"2024","unstructured":"Saritha B, Laskar MA, Laskar RH, Choudhury M (2024) CACRN-Net: a 3D log mel spectrogram based channel attention convolutional recurrent neural network for few-shot speaker identification. Comput Electr Eng 115:109100","journal-title":"Comput Electr Eng"},{"key":"9797_CR56","doi-asserted-by":"publisher","first-page":"413","DOI":"10.1109\/SLT.2014.7078610","volume-title":"2014 IEEE spoken language technology workshop (SLT)","author":"G Sell","year":"2014","unstructured":"Sell G, Garcia-Romero D (2014) Speaker diarization with PLDA i-vector scoring and unsupervised calibration. 2014 IEEE spoken language technology workshop (SLT). IEEE, pp 413\u2013417"},{"key":"9797_CR57","doi-asserted-by":"crossref","unstructured":"Snyder D, Garcia-Romero D, Sell G, McCree A, Povey D, Khudanpur S (2019). Speaker recognition for multi-speaker conversations using x-vectors. In: ICASSP 2019\u20132019 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE,\u00a0pp. 5796\u20135800","DOI":"10.1109\/ICASSP.2019.8683760"},{"key":"9797_CR58","doi-asserted-by":"publisher","first-page":"128149","DOI":"10.1016\/j.eswa.2025.128149","volume":"286","author":"K Somasundaram","year":"2025","unstructured":"Somasundaram K, Kanna PR (2025) Scalable hierarchical balanced clustering-based routing with multipath authentication for secured data transmission in large-scale multicast group communications. Expert Syst Appl 286:128149","journal-title":"Expert Syst Appl"},{"issue":"7","key":"9797_CR59","doi-asserted-by":"publisher","DOI":"10.3390\/s18072399","volume":"18","author":"C Sun","year":"2018","unstructured":"Sun C, Yang Y, Wen C, Xie K, Wen F (2018) Voiceprint identification for limited dataset using the deep migration hybrid model based on transfer learning. Sensors 18(7):2399","journal-title":"Sensors"},{"key":"9797_CR60","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2025.103242","author":"X Tang","year":"2025","unstructured":"Tang X, Huang J, Lin Y, Dang T, Cheng J (2025) Speech emotion recognition via CNN-transformer and multidimensional attention mechanism. Speech Commun. https:\/\/doi.org\/10.1016\/j.specom.2025.103242","journal-title":"Speech Commun"},{"key":"9797_CR61","unstructured":"Thanda Setty V (2018) Speaker recognition using deep neural networks with reduced complexity (Thesis). Texas State University, San Marcos, Texas"},{"key":"9797_CR62","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-024-03588-9","author":"R Varun Prakash","year":"2024","unstructured":"Varun Prakash R, Karthikeyan V, Vishali S, Karthika M (2024) Multi-level LSTM framework with hybrid sonic features for human\u2013animal conflict evasion. Vis Comput. https:\/\/doi.org\/10.1007\/s00371-024-03588-9","journal-title":"Vis Comput"},{"key":"9797_CR63","first-page":"1","volume-title":"Computational intelligence and modelling techniques for disease detection in mammogram images","author":"K Velayuthapandian","year":"2024","unstructured":"Velayuthapandian K, Karuppiah G, Vadivel SRS, Joseph DRV (2024a) Mammogram data analysis: trends, challenges, and future directions. Computational intelligence and modelling techniques for disease detection in mammogram images. Academic Press, pp 1\u201338"},{"issue":"1","key":"9797_CR64","doi-asserted-by":"publisher","DOI":"10.1007\/s44291-024-00034-x","volume":"1","author":"K Velayuthapandian","year":"2024","unstructured":"Velayuthapandian K, Murugan N, Paramasivan S (2024b) End-to-end CNN conceptual model for a biometric authentication mechanism for ATM machines. Discover Electronics 1(1):26","journal-title":"Discover Electronics"},{"issue":"3","key":"9797_CR65","first-page":"2145","volume":"18","author":"K Velayuthapandian","year":"2024","unstructured":"Velayuthapandian K, Veyilraj M, Jayakumaraj MA (2024c) An intelligent parking allocation framework for digital society 5.0. Intell Decis Technol 18(3):2145\u20132159","journal-title":"Intell Decis Technol"},{"key":"9797_CR66","unstructured":"Wang Y, Deng X, Pu S, Huang Z (2017) Residual convolutional CTC networks for automatic speech recognition. arXiv preprint arXiv:1702.07793."},{"key":"9797_CR67","doi-asserted-by":"crossref","unstructured":"Wu H, Soraghan J, Lowit A, Di Caterina G (2018). A deep learning method for pathological voice detection using convolutional deep belief networks. In Interspeech 2018","DOI":"10.21437\/Interspeech.2018-1351"},{"key":"9797_CR68","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2021\/8493795","volume":"2021","author":"M Xiao","year":"2021","unstructured":"Xiao M, Wu Y, Zuo G, Fan S, Yu H, Shaikh ZA, Wen Z (2021) Addressing overfitting problem in deep learning-based solutions for next generation data-driven networks. Wirel Commun Mob Comput 2021:1\u201310","journal-title":"Wirel Commun Mob Comput"},{"key":"9797_CR69","doi-asserted-by":"crossref","unstructured":"Xie W, Nagrani A, Chung JS, Zisserman A (2019). Utterance-level aggregation for speaker recognition in the wild. In: ICASSP 2019\u20132019 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp. 5791\u20135795","DOI":"10.1109\/ICASSP.2019.8683120"},{"key":"9797_CR70","doi-asserted-by":"publisher","first-page":"394","DOI":"10.1016\/j.neucom.2020.06.045","volume":"410","author":"J Xu","year":"2020","unstructured":"Xu J, Wang X, Feng B, Liu W (2020) Deep multi-metric learning for text-independent speaker verification. Neurocomputing 410:394\u2013400","journal-title":"Neurocomputing"},{"issue":"4","key":"9797_CR71","doi-asserted-by":"publisher","first-page":"1323","DOI":"10.1007\/s11045-022-00845-9","volume":"33","author":"B Yalamanchili","year":"2022","unstructured":"Yalamanchili B, Samayamantula SK, Anne KR (2022) Neural network-based blended ensemble learning for speech emotion recognition. Multidimens Syst Signal Process 33(4):1323\u20131348","journal-title":"Multidimens Syst Signal Process"},{"issue":"8","key":"9797_CR72","doi-asserted-by":"publisher","first-page":"3603","DOI":"10.3390\/app11083603","volume":"11","author":"F Ye","year":"2021","unstructured":"Ye F, Yang J (2021) A deep neural network model for speaker identification. Appl Sci 11(8):3603","journal-title":"Appl Sci"},{"key":"9797_CR73","doi-asserted-by":"crossref","unstructured":"Yu YQ, Li WJ (2020). Densely connected time delay neural network for speaker verification. In: Interspeech\u00a0pp. 921\u2013925","DOI":"10.21437\/Interspeech.2020-1275"},{"key":"9797_CR74","doi-asserted-by":"crossref","unstructured":"Zhang H, Zou Y, Wang H (2021). Contrastive self-supervised learning for text-independent speaker verification. In: ICASSP 2021\u20132021 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp. 6713\u20136717","DOI":"10.1109\/ICASSP39728.2021.9413351"},{"key":"9797_CR75","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1109\/SLT48900.2021.9383531","volume-title":"2021 IEEE spoken language technology workshop (SLT)","author":"T Zhou","year":"2021","unstructured":"Zhou T, Zhao Y, Wu J (2021) Resnext and res2net structures for speaker verification. 2021 IEEE spoken language technology workshop (SLT). IEEE, pp 301\u2013307"}],"container-title":["Evolving Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12530-026-09797-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s12530-026-09797-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12530-026-09797-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T11:02:59Z","timestamp":1771326179000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s12530-026-09797-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,17]]},"references-count":75,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["9797"],"URL":"https:\/\/doi.org\/10.1007\/s12530-026-09797-y","relation":{},"ISSN":["1868-6478","1868-6486"],"issn-type":[{"value":"1868-6478","type":"print"},{"value":"1868-6486","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,17]]},"assertion":[{"value":"4 February 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not Applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}],"article-number":"27"}}