{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T20:48:15Z","timestamp":1770497295865,"version":"3.49.0"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2024,2,5]],"date-time":"2024-02-05T00:00:00Z","timestamp":1707091200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,2,5]],"date-time":"2024-02-05T00:00:00Z","timestamp":1707091200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2024,5]]},"DOI":"10.1007\/s00034-024-02598-1","type":"journal-article","created":{"date-parts":[[2024,2,5]],"date-time":"2024-02-05T13:02:21Z","timestamp":1707138141000},"page":"3139-3159","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Role of Data Augmentation and Effective Conservation of High-Frequency Contents in the Context Children\u2019s Speaker Verification System"],"prefix":"10.1007","volume":"43","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5415-8864","authenticated-orcid":false,"given":"Shahid","family":"Aziz","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"S.","family":"Shahnawazuddin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,2,5]]},"reference":[{"key":"2598_CR1","doi-asserted-by":"crossref","unstructured":"S. Aziz, S. Shahnawazuddin, Effective preservation of higher-frequency contents in the context of short utterance based children\u2019s speaker verification system. Appl. Acoust. 209, 109,420 (2023)","DOI":"10.1016\/j.apacoust.2023.109420"},{"key":"2598_CR2","doi-asserted-by":"crossref","unstructured":"K. Badillo-Urquiola, D. Smriti, B. McNally, E. Golub, E. Bonsignore, P.J. Wisniewski, Stranger danger! social media app features co-designed with children to keep them safe online. in Proceedings of the 18th ACM International Conference on Interaction Design and Children, pp. 394\u2013406 (2019)","DOI":"10.1145\/3311927.3323133"},{"key":"2598_CR3","doi-asserted-by":"crossref","unstructured":"A. Batliner, M. Blomberg, S. D\u2019Arcy, D. Elenius, D. Giuliani, M. Gerosa, C. Hacker, M. Russell, M. Wong, The PF_STAR children\u2019s speech corpus. in Proceedings of INTERSPEECH, pp. 2761\u20132764 (2005)","DOI":"10.21437\/Interspeech.2005-705"},{"issue":"12","key":"2598_CR4","doi-asserted-by":"publisher","first-page":"1293","DOI":"10.3390\/app7121293","volume":"7","author":"EP Damsk\u00e4gg","year":"2017","unstructured":"E.P. Damsk\u00e4gg, V. V\u00e4lim\u00e4ki, Audio time stretching using fuzzy classification of spectral bins. Appl. Sci. 7(12), 1293 (2017)","journal-title":"Appl. Sci."},{"key":"2598_CR5","doi-asserted-by":"crossref","unstructured":"S. D\u2019Arcy, M. Russell, A comparison of human and computer recognition accuracy for children\u2019s speech. in Ninth European Conference on Speech Communication and Technology (2005)","DOI":"10.21437\/Interspeech.2005-697"},{"issue":"4","key":"2598_CR6","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1109\/TASSP.1980.1163420","volume":"28","author":"S Davis","year":"1980","unstructured":"S. Davis, P. Mermelstein, Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences. IEEE Trans. Acoust. Speech Signal Process. 28(4), 357\u2013366 (1980). https:\/\/doi.org\/10.1109\/TASSP.1980.1163420","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"2598_CR7","unstructured":"M. Eskenazi, J. Mostow, D. Graff, The CMU Kids Corpus LDC97S63. https:\/\/catalog.ldc.upenn.edu\/LDC97S63 (1997)"},{"key":"2598_CR8","doi-asserted-by":"crossref","unstructured":"M. Gerosa, D. Giuliani, S. Narayanan, A. Potamianos, A review of ASR technologies for children\u2019s speech. in Proceedings of Workshop on Child, Computer and Interaction, pp. 7:1\u20137:8 (2009)","DOI":"10.1145\/1640377.1640384"},{"key":"2598_CR9","doi-asserted-by":"crossref","unstructured":"R.M. Hanifa, K. Isa, S. Mohamad, A review on speaker recognition: technology and challenges. Comput. Electr. Eng. 90, 107005 (2021)","DOI":"10.1016\/j.compeleceng.2021.107005"},{"key":"2598_CR10","doi-asserted-by":"crossref","unstructured":"A. Kanagasundaram, R. Vogt, D. Dean, S. Sridharan, Plda based speaker recognition on short utterances. in Proceedings of The Speaker and Language Recognition Workshop: Odyssey 2012, pp. 28\u201333. International Speech Communication Association (2012)","DOI":"10.21437\/Interspeech.2011-58"},{"key":"2598_CR11","doi-asserted-by":"crossref","unstructured":"T. Kaneko, H. Kameoka, Parallel-data-free voice conversion using cycle-consistent adversarial networks. arXiv preprint arXiv:1711.11293 (2017)","DOI":"10.23919\/EUSIPCO.2018.8553236"},{"key":"2598_CR12","doi-asserted-by":"crossref","unstructured":"H.K. Kathania, S.R. Kadiri, P. Alku, M. Kurimo, Study of formant modification for children asr. in ICASSP 2020\u20132020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 7429\u20137433 (2020)","DOI":"10.1109\/ICASSP40776.2020.9053334"},{"issue":"10","key":"2598_CR13","doi-asserted-by":"publisher","first-page":"4667","DOI":"10.1007\/s00034-019-01072-7","volume":"38","author":"HK Kathania","year":"2019","unstructured":"H.K. Kathania, S. Shahnawazuddin, W. Ahmad, N. Adiga, Role of linear, mel and inverse-mel filterbanks in automatic recognition of speech from high-pitched speakers. Circuits Syst. Signal Process. 38(10), 4667\u20134682 (2019)","journal-title":"Circuits Syst. Signal Process."},{"issue":"4","key":"2598_CR14","doi-asserted-by":"publisher","first-page":"2205","DOI":"10.1007\/s00034-021-01885-5","volume":"41","author":"V Kumar","year":"2022","unstructured":"V. Kumar, A. Kumar, S. Shahnawazuddin, Creating robust children\u2019s asr system in zero-resource condition through out-of-domain data augmentation. Circuits Syst. Signal Process. 41(4), 2205\u20132220 (2022)","journal-title":"Circuits Syst. Signal Process."},{"issue":"3","key":"2598_CR15","doi-asserted-by":"publisher","first-page":"1455","DOI":"10.1121\/1.426686","volume":"105","author":"S Lee","year":"1999","unstructured":"S. Lee, A. Potamianos, S.S. Narayanan, Acoustics of children\u2019s speech: developmental changes of temporal and spectral parameters. J. Acoust. Soc. Am. 105(3), 1455\u20131468 (1999)","journal-title":"J. Acoust. Soc. Am."},{"key":"2598_CR16","unstructured":"M. Observations, Multivariate observations, gaf seber, ed (1984)"},{"key":"2598_CR17","doi-asserted-by":"crossref","unstructured":"V. Peddinti, D. Povey, S. Khudanpur, A time delay neural network architecture for efficient modeling of long temporal contexts. in Proceedings of INTERSPEECH (2015)","DOI":"10.21437\/Interspeech.2015-647"},{"issue":"2","key":"2598_CR18","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1049\/iet-bmt.2017.0065","volume":"7","author":"A Poddar","year":"2018","unstructured":"A. Poddar, M. Sahidullah, G. Saha, Speaker verification with short utterances: a review of challenges, trends and opportunities. IET Biometrics 7(2), 91\u2013101 (2018)","journal-title":"IET Biometrics"},{"key":"2598_CR19","doi-asserted-by":"publisher","unstructured":"A. Poddar, M. Sahidullah, G. Saha, Quality measures for speaker verification with short utterances. Digital Signal Process. 88, 66\u201379 (2019) https:\/\/doi.org\/10.1016\/j.dsp.2019.01.023","DOI":"10.1016\/j.dsp.2019.01.023"},{"key":"2598_CR20","unstructured":"D. Povey, A. Ghoshal, G. Boulianne, L. Burget, O. Glembek, N. Goel, M. Hannemann, P. Motlicek, Y. Qian, P. Schwarz, J. Silovsky, G. Stemmer, K. Vesely, The Kaldi Speech recognition toolkit. in Proceedings of ASRU (2011)"},{"key":"2598_CR21","unstructured":"D. Povey, X. Zhang, S. Khudanpur, Parallel training of deep neural networks with natural gradient and parameter averaging. in Proceedings of ICLR (2015)"},{"key":"2598_CR22","doi-asserted-by":"crossref","unstructured":"S.R.M. Prasanna, D. Govind, K.S. Rao, B. Yegnanarayana, Fast prosody modification using instants of significant excitation. In Proceedings of International Conference on Speech Prosody (2010)","DOI":"10.21437\/SpeechProsody.2010-126"},{"key":"2598_CR23","doi-asserted-by":"crossref","unstructured":"T. Robinson, J. Fransen, D. Pye, J. Foote, S. Renals, WSJCAM0: a British English speech corpus for large vocabulary continuous speech recognition. in ICASSP 1995\u20131995 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 81\u201384 (1995)","DOI":"10.1109\/ICASSP.1995.479278"},{"key":"2598_CR24","doi-asserted-by":"crossref","unstructured":"M. Russell, S. D\u2019Arcy, Challenges for computer recognition of children\u2019s speech. in Proceedings of Speech and Language Technologies in Education (SLaTE) (2007)","DOI":"10.21437\/SLaTE.2007-26"},{"issue":"12","key":"2598_CR25","doi-asserted-by":"publisher","first-page":"1044","DOI":"10.1109\/LSP.2007.906213","volume":"14","author":"M Russell","year":"2007","unstructured":"M. Russell, S. D\u2019Arcy, L. Qun, The effects of bandwidth reduction on human and computer recognition of children\u2019s speech. IEEE Signal Process. Lett. 14(12), 1044\u20131046 (2007)","journal-title":"IEEE Signal Process. Lett."},{"key":"2598_CR26","doi-asserted-by":"crossref","unstructured":"S. Safavi, M. Russell, P. Jancovic, Automatic speaker, age-group and gender identification from children\u2019s speech. Comput. Speech Language, 50 (2018)","DOI":"10.1016\/j.csl.2018.01.001"},{"key":"2598_CR27","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1016\/j.patrec.2019.12.019","volume":"131","author":"S Shahnawazuddin","year":"2020","unstructured":"S. Shahnawazuddin, N. Adiga, H.K. Kathania, B.T. Sai, Creating speaker independent asr system through prosody modification based data augmentation. Pattern Recognit. Lett. 131, 213\u2013218 (2020). https:\/\/doi.org\/10.1016\/j.patrec.2019.12.019","journal-title":"Pattern Recognit. Lett."},{"key":"2598_CR28","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1016\/j.dsp.2019.06.015","volume":"93","author":"S Shahnawazuddin","year":"2019","unstructured":"S. Shahnawazuddin, N. Adiga, B.T. Sai, W. Ahmad, H.K. Kathania, Developing speaker independent asr system using limited data through prosody modification based on fuzzy classification of spectral bins. Digital Signal Process. 93, 34\u201342 (2019)","journal-title":"Digital Signal Process."},{"key":"2598_CR29","doi-asserted-by":"crossref","unstructured":"S. Shahnawazuddin, W. Ahmad, N. Adiga, A. Kumar, In-domain and out-of-domain data augmentation to improve children\u2019s speaker verification system in limited data scenario. in ICASSP 2020\u20132020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 7554\u20137558 (2020)","DOI":"10.1109\/ICASSP40776.2020.9053891"},{"key":"2598_CR30","doi-asserted-by":"crossref","unstructured":"S. Shahnawazuddin, W. Ahmad, N. Adiga, A. Kumar, Children\u2019s speaker verification in low and zero resource conditions. Digital Signal Process. 116, 103115 (2021)","DOI":"10.1016\/j.dsp.2021.103115"},{"key":"2598_CR31","unstructured":"K. Shobaki, J.P. Hosom, R. Cole, Cslu: Kids\u2019 Speech Version 1.1. Linguistic Data Consortium (2007)"},{"key":"2598_CR32","doi-asserted-by":"crossref","unstructured":"S. Snyder, D. Garcia-Romero, D. Povey, S. Khudanpur, Deep neural network embeddings for text-independent speaker verification. in Proceedings of INTERSPEECH, pp. 999\u20131003 (2017)","DOI":"10.21437\/Interspeech.2017-620"},{"key":"2598_CR33","doi-asserted-by":"crossref","unstructured":"D. Snyder, D. Garcia-Romero, G. Sell, D. Povey, S. Khudanpur, X-vectors: robust DNN embeddings for speaker recognition. in ICASSP 2018\u20132018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5329\u20135333 (2018)","DOI":"10.1109\/ICASSP.2018.8461375"},{"key":"2598_CR34","doi-asserted-by":"crossref","unstructured":"M. Tsujikawa, T. Nishikawa, T. Matsui, I-vector-based speaker identification with extremely short utterances for both training and testing. in 2017 IEEE 6th Global Conference on Consumer Electronics (GCCE), pp. 1\u20134. IEEE (2017)","DOI":"10.1109\/GCCE.2017.8229389"},{"key":"2598_CR35","doi-asserted-by":"crossref","unstructured":"G. Yeung, A. Alwan, On the difficulties of automatic speech recognition for kindergarten-aged children. Interspeech 2018 (2018)","DOI":"10.21437\/Interspeech.2018-2297"}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-024-02598-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-024-02598-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-024-02598-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,10]],"date-time":"2024-11-10T04:46:11Z","timestamp":1731213971000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-024-02598-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,5]]},"references-count":35,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2024,5]]}},"alternative-id":["2598"],"URL":"https:\/\/doi.org\/10.1007\/s00034-024-02598-1","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"value":"0278-081X","type":"print"},{"value":"1531-5878","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,2,5]]},"assertion":[{"value":"1 June 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 December 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 December 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 February 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Funding information is not applicable\/No funding was received.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Funding"}},{"value":"The work presented in the uploaded manuscript is an original one and the manuscript is not currently under consideration for publication elsewhere.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics Approval"}},{"value":"It is hereby confirmed that the manuscript has been read and approved for submission by all the named authors. It is therefore requested, to consider the submitted manuscript for publication in the esteemed journal.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for Publication"}}]}}