{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,27]],"date-time":"2025-07-27T07:52:59Z","timestamp":1753602779918,"version":"3.37.3"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2023,11,5]],"date-time":"2023-11-05T00:00:00Z","timestamp":1699142400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,11,5]],"date-time":"2023-11-05T00:00:00Z","timestamp":1699142400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2024,3]]},"DOI":"10.1007\/s00034-023-02535-8","type":"journal-article","created":{"date-parts":[[2023,11,5]],"date-time":"2023-11-05T20:01:23Z","timestamp":1699214483000},"page":"1715-1740","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Short-Utterance-Based Children\u2019s Speaker Verification in Low-Resource Conditions"],"prefix":"10.1007","volume":"43","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5415-8864","authenticated-orcid":false,"given":"Shahid","family":"Aziz","sequence":"first","affiliation":[]},{"family":"Ankita","sequence":"additional","affiliation":[]},{"given":"S.","family":"Shahnawazuddin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,11,5]]},"reference":[{"key":"2535_CR1","doi-asserted-by":"crossref","unstructured":"M. Athineos, D. Ellis: Frequency-domain linear prediction for temporal features. In: 2003 IEEE Workshop on Automatic Speech Recognition and Understanding (IEEE Cat. No.03EX721), pp. 261\u2013266 (2003)","DOI":"10.1109\/ASRU.2003.1318451"},{"key":"2535_CR2","doi-asserted-by":"crossref","unstructured":"A. Batliner, M. Blomberg , S. D\u2019Arcy, D. Elenius, D. Giuliani, M. Gerosa, C. Hacker, M. Russell, M. Wong: The PF_STAR children\u2019s speech corpus. In: Proc. INTERSPEECH, pp. 2761\u20132764 (2005)","DOI":"10.21437\/Interspeech.2005-705"},{"issue":"4","key":"2535_CR3","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1109\/TASSP.1980.1163420","volume":"28","author":"S Davis","year":"1980","unstructured":"S. Davis, P. Mermelstein, Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences. IEEE Trans. Acoustic, Speech Signal Processing 28(4), 357\u2013366 (1980). https:\/\/doi.org\/10.1109\/TASSP.1980.1163420","journal-title":"IEEE Trans. Acoustic, Speech Signal Processing"},{"key":"2535_CR4","unstructured":"M. Eskenazi, J. Mostow, D. Graff: The CMU Kids Corpus LDC97S63. https:\/\/catalog.ldc.upenn.edu\/LDC97S63 (1997)"},{"key":"2535_CR5","doi-asserted-by":"crossref","unstructured":"S. Fernando, V. Sethu, E. Ambikairajah: Sub-band envelope features using frequency domain linear prediction for short duration language identification. In: INTERSPEECH, pp. 1818\u20131822 (2018)","DOI":"10.21437\/Interspeech.2018-1805"},{"key":"2535_CR6","doi-asserted-by":"crossref","unstructured":"S. Ganapathy, P. Rajan, H. Hermansky: Multi-layer perceptron based speech activity detection for speaker verification. In: 2011 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), pp. 321\u2013324. IEEE (2011)","DOI":"10.1109\/ASPAA.2011.6082323"},{"key":"2535_CR7","doi-asserted-by":"crossref","unstructured":"M. Islam: Frequency domain linear prediction-based robust text-dependent speaker identification. In: 2016 international conference on innovations in science, engineering and technology (ICISET), pp. 1\u20134. IEEE (2016)","DOI":"10.1109\/ICISET.2016.7856508"},{"key":"2535_CR8","doi-asserted-by":"crossref","unstructured":"T. Kaneko, H. Kameoka: Parallel-data-free voice conversion using cycle-consistent adversarial networks. arXiv preprint arXiv:1711.11293 (2017)","DOI":"10.23919\/EUSIPCO.2018.8553236"},{"key":"2535_CR9","doi-asserted-by":"crossref","unstructured":"H.K. Kathania, S.R. Kadiri, P. Alku, M. Kurimo: Study of formant modification for children asr. In: ICASSP 2020-2020 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 7429\u20137433. IEEE (2020)","DOI":"10.1109\/ICASSP40776.2020.9053334"},{"key":"2535_CR10","doi-asserted-by":"publisher","DOI":"10.1016\/j.apacoust.2021.108553","volume":"188","author":"R Kethireddy","year":"2022","unstructured":"R. Kethireddy, S.R. Kadiri, S.V. Gangashetty, Exploration of temporal dynamics of frequency domain linear prediction cepstral coefficients for dialect classification. Appl. Acoustics 188, 108553 (2022)","journal-title":"Appl. Acoustics"},{"issue":"4","key":"2535_CR11","doi-asserted-by":"publisher","first-page":"2205","DOI":"10.1007\/s00034-021-01885-5","volume":"41","author":"V Kumar","year":"2022","unstructured":"V. Kumar, A. Kumar, S. Shahnawazuddin, Creating robust children\u2019s asr system in zero-resource condition through out-of-domain data augmentation. Circuits Syst. Signal Process. 41(4), 2205\u20132220 (2022)","journal-title":"Circuits Syst. Signal Process."},{"issue":"3","key":"2535_CR12","doi-asserted-by":"publisher","first-page":"1455","DOI":"10.1121\/1.426686","volume":"105","author":"S Lee","year":"1999","unstructured":"S. Lee, A. Potamianos, S. Narayanan, Acoustics of children\u2019s speech: Developmental changes of temporal and spectral parameters. J. Acoust. Soc. Am. 105(3), 1455\u20131468 (1999)","journal-title":"J. Acoust. Soc. Am."},{"issue":"5","key":"2535_CR13","doi-asserted-by":"publisher","first-page":"946","DOI":"10.1109\/TASLP.2014.2311322","volume":"22","author":"G Mantena","year":"2014","unstructured":"G. Mantena, S. Achanta, K. Prahallad, Query-by-example spoken term detection using frequency domain linear prediction and non-segmental dynamic time warping. IEEE\/ACM Trans. Audio, Speech, nd Language Process. 22(5), 946\u2013955 (2014)","journal-title":"IEEE\/ACM Trans. Audio, Speech, nd Language Process."},{"issue":"2","key":"2535_CR14","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1049\/iet-bmt.2017.0065","volume":"7","author":"A Poddar","year":"2018","unstructured":"A. Poddar, M. Sahidullah, G. Saha, Speaker verification with short utterances: a review of challenges, trends and opportunities. IET Biometrics 7(2), 91\u2013101 (2018)","journal-title":"IET Biometrics"},{"key":"2535_CR15","unstructured":"Povey, D., Ghoshal, A., Boulianne, G., Burget, L., Glembek, O., Goel, N., Hannemann, M., Motlicek, P., Qian, Y., Schwarz, P., Silovsky, J., Stemmer, G., Vesely, K.: The Kaldi Speech recognition toolkit. In: Proc. ASRU (2011)"},{"key":"2535_CR16","unstructured":"Povey, D., Zhang, X., Khudanpur, S.: Parallel training of dnns with natural gradient and parameter averaging. arXiv preprint arXiv:1410.7455 (2014)"},{"key":"2535_CR17","doi-asserted-by":"crossref","unstructured":"Prasanna, S.R.M., Govind, D., Rao, K.S., Yegnanarayana, B.: Fast prosody modification using instants of significant excitation. In: Proc. Int. Conf. on Speech Prosody (2010)","DOI":"10.21437\/SpeechProsody.2010-126"},{"key":"2535_CR18","unstructured":"Quateier, T.F.: Discrete time processing of speech signals- principles and practice (1997)"},{"key":"2535_CR19","doi-asserted-by":"publisher","unstructured":"Robinson, T., Fransen, J., Pye, D., Foote, J., Renals, S.: WSJCAM0: A British English speech corpus for large vocabulary continuous speech recognition. In: Proc. ICASSP, vol.\u00a01, pp. 81\u201384 (1995). https:\/\/doi.org\/10.1109\/ICASSP.1995.479278","DOI":"10.1109\/ICASSP.1995.479278"},{"key":"2535_CR20","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1016\/j.csl.2018.01.001","volume":"50","author":"S Safavi","year":"2018","unstructured":"S. Safavi, M. Russell, P. Jan\u010dovi\u010d, Automatic speaker, age-group and gender identification from children\u2019s speech. Comput. Speech & Language 50, 141\u2013156 (2018)","journal-title":"Comput. Speech & Language"},{"key":"2535_CR21","doi-asserted-by":"crossref","unstructured":"Sahidullah, M., Kinnunen, T., Hanil\u00e7i, C.: A comparison of features for synthetic speech detection (2015)","DOI":"10.21437\/Interspeech.2015-472"},{"key":"2535_CR22","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1016\/j.patrec.2019.12.019","volume":"131","author":"S Shahnawazuddin","year":"2020","unstructured":"S. Shahnawazuddin, N. Adiga, H.K. Kathania, B.T. Sai, Creating speaker independent asr system through prosody modification based data augmentation. Pattern Recognition Lett. 131, 213\u2013218 (2020)","journal-title":"Pattern Recognition Lett."},{"key":"2535_CR23","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1016\/j.patrec.2019.12.019","volume":"131","author":"S Shahnawazuddin","year":"2020","unstructured":"S. Shahnawazuddin, N. Adiga, H.K. Kathania, B.T. Sai, Creating speaker independent asr system through prosody modification based data augmentation. Pattern Recogn. Lett. 131, 213\u2013218 (2020). https:\/\/doi.org\/10.1016\/j.patrec.2019.12.019","journal-title":"Pattern Recogn. Lett."},{"key":"2535_CR24","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1016\/j.dsp.2019.06.015","volume":"93","author":"S Shahnawazuddin","year":"2019","unstructured":"S. Shahnawazuddin, N. Adiga, B.T. Sai, W. Ahmad, H.K. Kathania, Developing speaker independent asr system using limited data through prosody modification based on fuzzy classification of spectral bins. Digital Signal Processing 93, 34\u201342 (2019)","journal-title":"Digital Signal Processing"},{"key":"2535_CR25","doi-asserted-by":"publisher","unstructured":"Shahnawazuddin, S., Ahmad, W., Adiga, N., Kumar, A.: In-domain and out-of-domain data augmentation to improve children\u2019s speaker verification system in limited data scenario. In: Proc. ICASSP, pp. 7554\u20137558 (2020). https:\/\/doi.org\/10.1109\/ICASSP40776.2020.9053891","DOI":"10.1109\/ICASSP40776.2020.9053891"},{"key":"2535_CR26","doi-asserted-by":"publisher","DOI":"10.1016\/j.dsp.2021.103115","volume":"116","author":"S Shahnawazuddin","year":"2021","unstructured":"S. Shahnawazuddin, W. Ahmad, N. Adiga, A. Kumar, Children\u2019s speaker verification in low and zero resource conditions. Digital Signal Processing 116, 103115 (2021)","journal-title":"Digital Signal Processing"},{"key":"2535_CR27","unstructured":"K. Shobaki, J.P. Hosom, R. Cole: Cslu: Kids\u2019 speech version 1.1. Linguistic Data Consortium (2007)"},{"key":"2535_CR28","doi-asserted-by":"crossref","unstructured":"D. Snyder, D. Garcia-Romero, G. Sell, D. Povey, S. Khudanpur: X-vectors: Robust dnn embeddings for speaker recognition. In: 2018 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 5329\u20135333. IEEE (2018)","DOI":"10.1109\/ICASSP.2018.8461375"},{"issue":"3","key":"2535_CR29","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1121\/1.1915893","volume":"8","author":"SS Stevens","year":"1937","unstructured":"S.S. Stevens, J. Volkmann, E.B. Newman, A scale for the measurement of the psychological magnitude pitch. J. Acoustical Soc. Am. 8(3), 185\u2013190 (1937)","journal-title":"J. Acoustical Soc. Am."},{"issue":"2","key":"2535_CR30","doi-asserted-by":"publisher","first-page":"576","DOI":"10.1016\/j.jfranklin.2015.12.007","volume":"353","author":"V Stojanovic","year":"2016","unstructured":"V. Stojanovic, N. Nedic, Robust identification of oe model with constrained output using optimal input design. J. Franklin Inst. 353(2), 576\u2013593 (2016)","journal-title":"J. Franklin Inst."},{"key":"2535_CR31","doi-asserted-by":"publisher","first-page":"681","DOI":"10.1109\/LSP.2008.2002708","volume":"15","author":"S Thomas","year":"2008","unstructured":"S. Thomas, S. Ganapathy, H. Hermansky, Recognition of reverberant speech using frequency domain linear prediction. IEEE Signal Process. Lett. 15, 681\u2013684 (2008)","journal-title":"IEEE Signal Process. Lett."},{"key":"2535_CR32","doi-asserted-by":"crossref","unstructured":"Wickramasinghe, B., Irtza, S., Ambikairajah, E., Epps, J.: Frequency domain linear prediction features for replay spoofing attack detection. In: Interspeech, pp. 661\u2013665 (2018)","DOI":"10.21437\/Interspeech.2018-1574"},{"key":"2535_CR33","doi-asserted-by":"crossref","unstructured":"Yeung, G., Alwan, A.: On the difficulties of automatic speech recognition for kindergarten-aged children. Interspeech 2018 (2018)","DOI":"10.21437\/Interspeech.2018-2297"},{"issue":"2","key":"2535_CR34","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1002\/acs.3529","volume":"37","author":"Z Zhang","year":"2023","unstructured":"Z. Zhang, X. Song, X. Sun, V. Stojanovic, Hybrid-driven-based fuzzy secure filtering for nonlinear parabolic partial differential equation systems with cyber attacks. Int. J. Adapt. Control Signal Process. 37(2), 380\u2013398 (2023)","journal-title":"Int. J. Adapt. Control Signal Process."}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-023-02535-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-023-02535-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-023-02535-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T11:55:56Z","timestamp":1730462156000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-023-02535-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,5]]},"references-count":34,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,3]]}},"alternative-id":["2535"],"URL":"https:\/\/doi.org\/10.1007\/s00034-023-02535-8","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"type":"print","value":"0278-081X"},{"type":"electronic","value":"1531-5878"}],"subject":[],"published":{"date-parts":[[2023,11,5]]},"assertion":[{"value":"22 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 October 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 October 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 November 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"The work presented in the uploaded manuscript is an original one, and the manuscript is not currently under consideration for publication elsewhere.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}},{"value":"It is hereby confirmed that the manuscript has been read and approved for submission by all the named authors. It is therefore requested to consider the submitted manuscript for publication in the esteemed journal.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for Publication"}}]}}