{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T14:03:08Z","timestamp":1762351388429},"reference-count":95,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,2,29]],"date-time":"2024-02-29T00:00:00Z","timestamp":1709164800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,2,29]],"date-time":"2024-02-29T00:00:00Z","timestamp":1709164800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2024,3]]},"DOI":"10.1007\/s10772-024-10085-w","type":"journal-article","created":{"date-parts":[[2024,2,29]],"date-time":"2024-02-29T15:02:17Z","timestamp":1709218937000},"page":"101-119","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Stockwell-Transform based feature representation for detection and assessment of voice disorders"],"prefix":"10.1007","volume":"27","author":[{"given":"Purva","family":"Barche","sequence":"first","affiliation":[]},{"given":"Krishna","family":"Gurugubelli","sequence":"additional","affiliation":[]},{"given":"Anil Kumar","family":"Vuppala","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,2,29]]},"reference":[{"key":"10085_CR1","doi-asserted-by":"crossref","unstructured":"Adiga, N., Vikram, C., Pullela, K., & Prasanna, S. M. (2017). Zero frequency filter based analysis of voice disorders. In Proceeding of INTERSPEECH (pp. 1824\u20131828).","DOI":"10.21437\/Interspeech.2017-589"},{"issue":"3","key":"10085_CR2","doi-asserted-by":"publisher","first-page":"596","DOI":"10.1109\/TASLP.2013.2294585","volume":"22","author":"M Airaksinen","year":"2013","unstructured":"Airaksinen, M., Raitio, T., Story, B., & Alku, P. (2013). Quasi closed phase glottal inverse filtering analysis with weighted linear prediction. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 22(3), 596\u2013607.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"10085_CR3","doi-asserted-by":"crossref","unstructured":"Al-Nasheri, A., Ali, Z., Muhammad, G., & Alsulaiman, M. (2015). An investigation of MDVP parameters for voice pathology detection on three different databases. In Sixteenth annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2015-611"},{"issue":"4","key":"10085_CR4","doi-asserted-by":"publisher","first-page":"705","DOI":"10.1109\/TASLP.2015.2404035","volume":"23","author":"G Aneeja","year":"2015","unstructured":"Aneeja, G., & Yegnanarayana, B. (2015). Single frequency filtering approach for discriminating speech and nonspeech. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 23(4), 705\u2013717.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"issue":"2","key":"10085_CR5","doi-asserted-by":"publisher","first-page":"60","DOI":"10.3109\/14015439.2010.528788","volume":"36","author":"JD Arias-Londo\u00f1o","year":"2011","unstructured":"Arias-Londo\u00f1o, J. D., Godino-Llorente, J. I., Markaki, M., & Stylianou, Y. (2011). On combining information from modulation spectra and mel-frequency cepstral coefficients for automatic detection of pathological voices. Logopedics Phoniatrics Vocology, 36(2), 60\u201369.","journal-title":"Logopedics Phoniatrics Vocology"},{"key":"10085_CR6","volume-title":"Clinical voice disorders","author":"A Aronson","year":"1990","unstructured":"Aronson, A. (1990). Clinical voice disorders (3rd ed.). Thieme.","edition":"3"},{"issue":"1","key":"10085_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1687-6180-2012-49","volume":"2012","author":"S Assous","year":"2012","unstructured":"Assous, S., & Boashash, B. (2012). Evaluation of the modified S-transform for time-frequency synchrony analysis and source localisation. EURASIP Journal on Advances in Signal Processing, 2012(1), 1\u201318.","journal-title":"EURASIP Journal on Advances in Signal Processing"},{"issue":"1A","key":"10085_CR8","first-page":"65","volume":"47","author":"BS Atal","year":"1970","unstructured":"Atal, B. S. (1970). Speech analysis and synthesis by linear prediction of the speech wave. The Journal of the Acoustical Society of America, 47(1A), 65\u201365.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"9","key":"10085_CR9","doi-asserted-by":"publisher","first-page":"2093","DOI":"10.1002\/lary.26465","volume":"127","author":"KE Bainbridge","year":"2017","unstructured":"Bainbridge, K. E., Roy, N., Losonczy, K. G., Hoffman, H. J., & Cohen, S. M. (2017). Voice disorders and associated risk markers among young adults in the United States. The Laryngoscope, 127(9), 2093\u20132099.","journal-title":"The Laryngoscope"},{"issue":"3","key":"10085_CR10","doi-asserted-by":"publisher","first-page":"326","DOI":"10.1016\/j.jvoice.2009.12.010","volume":"25","author":"RK Balasubramanium","year":"2011","unstructured":"Balasubramanium, R. K., Bhat, J. S., Fahim III, S., & Raju III, R. (2011). Cepstral analysis of voice in unilateral adductor vocal fold palsy. Journal of voice, 25(3), 326\u2013329.","journal-title":"Journal of voice"},{"key":"10085_CR11","doi-asserted-by":"crossref","unstructured":"Barche, P., Gurugubelli, K., Vuppala, A. K. (2020) Towards automatic assessment of voice disorders: A clinical approach. In Proceedings of INTERSPEECH (pp. 2537\u20132541)","DOI":"10.21437\/Interspeech.2020-2160"},{"key":"10085_CR12","unstructured":"Barche, P., Gurugubelli, K., & Vuppala, A. K. (2021). Comparative study of filter banks to improve the performance of voice disorder assessment systems using LTAS features. In APSIPA ASC (pp. 737\u2013742). IEEE."},{"issue":"6","key":"10085_CR13","doi-asserted-by":"publisher","first-page":"782","DOI":"10.1016\/j.specom.2013.02.007","volume":"55","author":"Y Bayya","year":"2013","unstructured":"Bayya, Y., & Gowda, D. N. (2013). Spectro-temporal analysis of speech signals using zero-time windowing and group delay function. Speech Communication, 55(6), 782\u2013795.","journal-title":"Speech Communication"},{"issue":"4","key":"10085_CR14","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1049\/ecej:19940401","volume":"6","author":"PM Bentley","year":"1994","unstructured":"Bentley, P. M., & McDonnell, J. (1994). Wavelet transforms: An introduction. Electronics & Communication Engineering Journal, 6(4), 175\u2013186.","journal-title":"Electronics & Communication Engineering Journal"},{"key":"10085_CR15","doi-asserted-by":"crossref","unstructured":"Berisha, V., Krantsevich, C., Stegmann, G., Hahn, S., & Liss, J. (2022). Are reported accuracies in the clinical speech machine learning literature overoptimistic? In Proceedings of INTERSPEECH (pp. 2453\u20132457).","DOI":"10.21437\/Interspeech.2022-691"},{"issue":"3","key":"10085_CR16","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1049\/iet-spr.2019.0042","volume":"14","author":"C Beuter","year":"2020","unstructured":"Beuter, C., & Oleskovicz, M. (2020). S-transform: From main concepts to some power quality applications. IET Signal Processing, 14(3), 115\u2013123.","journal-title":"IET Signal Processing"},{"issue":"1","key":"10085_CR17","doi-asserted-by":"publisher","first-page":"126","DOI":"10.1044\/jshr.3901.126","volume":"39","author":"S Bielamowicz","year":"1996","unstructured":"Bielamowicz, S., Kreiman, J., Gerratt, B. R., Dauer, M. S., & Berke, G. S. (1996). Comparison of voice analysis systems for perturbation measurement. Journal of Speech, Language, and Hearing Research, 39(1), 126\u2013134.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"key":"10085_CR18","doi-asserted-by":"publisher","first-page":"932-e1","DOI":"10.1016\/j.jvoice.2020.03.009","volume":"35","author":"L Chen","year":"2021","unstructured":"Chen, L., Wang, C., Chen, J., Xiang, Z., & Hu, X. (2021). Voice disorder identification by using Hilbert-Huang transform (HHT) and K nearest neighbor (KNN). Journal of Voice, 35, 932-e1.","journal-title":"Journal of Voice"},{"key":"10085_CR19","first-page":"015","volume":"2","author":"P Claros","year":"2019","unstructured":"Claros, P., Karlikowska, A., Claros-Pujol, A., Claros, A., & Pujol, C. (2019). Psychogenic voice disorders literature review personal experiences with opera singers and case report of psychogenic dysphonia in opera singer. International Journal of Depression and Anxiety, 2, 015.","journal-title":"International Journal of Depression and Anxiety"},{"issue":"3","key":"10085_CR20","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1016\/0141-5425(92)90063-Q","volume":"14","author":"J Crowe","year":"1992","unstructured":"Crowe, J., Gibson, N., Woolfson, M., & Somekh, M. G. (1992). Wavelet transform as a potential tool for ECG analysis and compression. Journal of Biomedical Engineering, 14(3), 268\u2013272.","journal-title":"Journal of Biomedical Engineering"},{"issue":"4","key":"10085_CR21","first-page":"245","volume":"62","author":"I Djurovic","year":"2008","unstructured":"Djurovic, I., Sejdic, E., & Jiang, J. (2008). Frequency-based window width optimization for S-transform. AEU-International Journal of Electronics and Communications, 62(4), 245\u2013250.","journal-title":"AEU-International Journal of Electronics and Communications"},{"key":"10085_CR22","doi-asserted-by":"crossref","unstructured":"Drugman, T., Dubuisson, T., & Dutoit, T. (2009). On the mutual information between source and filter contributions for voice pathology detection. In Proceedings of INTERSPEECH 2009 (pp. 1463\u20131466).","DOI":"10.21437\/Interspeech.2009-447"},{"key":"10085_CR23","doi-asserted-by":"crossref","unstructured":"Dubey, A. K., Prasanna, S. M., & Dandapat, S. (2019). Hypernasality severity detection using constant-Q cepstral coefficients. In Proceedings of INTERSPEECH (pp. 4554\u20134558)","DOI":"10.21437\/Interspeech.2019-2151"},{"key":"10085_CR24","doi-asserted-by":"crossref","unstructured":"Ezzine, K., & Frikha, M. (2018). Investigation of glottal flow parameters for voice pathology detection on SVD and MEEI databases. In ATSIP (pp. 1\u20136). IEEE.","DOI":"10.1109\/ATSIP.2018.8364517"},{"key":"10085_CR25","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1016\/j.bspc.2014.07.001","volume":"14","author":"R Fraile","year":"2014","unstructured":"Fraile, R., & Godino-Llorente, J. I. (2014). Cepstral peak prominence: A comprehensive analysis. Biomedical Signal Processing and Control, 14, 42\u201354.","journal-title":"Biomedical Signal Processing and Control"},{"key":"10085_CR26","doi-asserted-by":"crossref","unstructured":"Frohlich, M., Michaelis, D., & Strube, H. W. (1998). Acoustic breathiness measures in the description of pathologic voices. In Proceedings of ICASSP (Vol. 2, pp. 937\u2013940). IEEE.","DOI":"10.1109\/ICASSP.1998.675420"},{"issue":"3","key":"10085_CR27","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1109\/TNSRE.2020.2966290","volume":"28","author":"M Geng","year":"2020","unstructured":"Geng, M., Zhou, W., Liu, G., Li, C., & Zhang, Y. (2020). Epileptic seizure detection based on stockwell transform and bidirectional long short-term memory. IEEE Transactions on Neural Systems and Rehabilitation Engineering, 28(3), 573\u2013580.","journal-title":"IEEE Transactions on Neural Systems and Rehabilitation Engineering"},{"issue":"39","key":"10085_CR28","doi-asserted-by":"publisher","first-page":"28499","DOI":"10.1007\/s11042-020-09424-1","volume":"79","author":"G Gidaye","year":"2020","unstructured":"Gidaye, G., Nirmal, J., Ezzine, K., & Frikha, M. (2020). Wavelet sub-band features for voice disorder detection and classification. Multimedia Tools and Applications, 79(39), 28499\u201328523.","journal-title":"Multimedia Tools and Applications"},{"key":"10085_CR29","doi-asserted-by":"crossref","unstructured":"Godino-Llorente, J. I., Aguilera-Navarro, S., & Gomez-Vilda, P. (2000). LPC, LPCC and MFCC parameterisation applied to the detection of voice impairments. In Sixth international conference on spoken language processing (pp. 965\u2013968).","DOI":"10.21437\/ICSLP.2000-695"},{"issue":"4","key":"10085_CR30","doi-asserted-by":"publisher","first-page":"465","DOI":"10.1007\/s00405-007-0467-x","volume":"265","author":"JI Godino-Llorente","year":"2008","unstructured":"Godino-Llorente, J. I., Osma-Ruiz, V., S\u00e1enz-Lech\u00f3n, N., Cobeta-Marco, I., Gonz\u00e1lez-Herranz, R., & Ram\u00edrez-Calvo, C. (2008). Acoustic analysis of voice using WPCVox: A comparative study with multi dimensional voice program. European Archives of Oto-Rhino-Laryngology, 265(4), 465\u2013476.","journal-title":"European Archives of Oto-Rhino-Laryngology"},{"key":"10085_CR31","unstructured":"Gupta, V. (2018). Voice disorder detection using long short term memory (LSTM) model. ArXiv:1812.01779"},{"key":"10085_CR32","doi-asserted-by":"crossref","unstructured":"Gurugubelli, K., Vuppala, A. K. (2019). Perceptually enhanced single frequency filtering for dysarthric speech detection and intelligibility assessment. In Proceedings of ICASSP (pp. 6410\u20136414). IEEE.","DOI":"10.1109\/ICASSP.2019.8683314"},{"key":"10085_CR33","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1016\/j.dsp.2016.09.001","volume":"60","author":"M Hamidia","year":"2017","unstructured":"Hamidia, M., & Amrouche, A. (2017). A new robust double-talk detector based on the Stockwell transform for acoustic echo cancellation. Digital Signal Processing, 60, 99\u2013112.","journal-title":"Digital Signal Processing"},{"issue":"4","key":"10085_CR34","doi-asserted-by":"publisher","first-page":"324","DOI":"10.1177\/000348940311200406","volume":"112","author":"YD Heman-Ackah","year":"2003","unstructured":"Heman-Ackah, Y. D., Michael, D. D., Baroody, M. M., Ostrowski, R., Hillenbrand, J., Heuer, R. J., Horman, M., & Sataloff, R. T. (2003). Cepstral peak prominence: A more reliable measure of dysphonia. Annals of Otology, Rhinology & Laryngology, 112(4), 324\u2013333.","journal-title":"Annals of Otology, Rhinology & Laryngology"},{"key":"10085_CR35","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1016\/S0892-1997(02)00067-X","volume":"16","author":"YD Heman-Ackah","year":"2002","unstructured":"Heman-Ackah, Y. D., Michael, D. D., & Goding, G. S., Jr. (2002). The relationship between cepstral peak prominence and selected parameters of dysphonia. Journal of Voice, 16, 20\u201327.","journal-title":"Journal of Voice"},{"issue":"4","key":"10085_CR36","doi-asserted-by":"publisher","first-page":"1738","DOI":"10.1121\/1.399423","volume":"87","author":"H Hermansky","year":"1990","unstructured":"Hermansky, H. (1990). Perceptual linear predictive (PLP) analysis of speech. The Journal of the Acoustical Society of America, 87(4), 1738\u20131752.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"2","key":"10085_CR37","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1044\/jshr.3902.311","volume":"39","author":"J Hillenbrand","year":"1996","unstructured":"Hillenbrand, J., & Houde, R. A. (1996). Acoustic correlates of breathy vocal quality: Dysphonic voices and continuous speech. Journal of Speech, Language, and Hearing Research, 39(2), 311\u2013321.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"key":"10085_CR38","doi-asserted-by":"crossref","unstructured":"Huckvale, M., Buciuleac, C. (2021). Automated detection of voice disorder in the Saarbr\u00fccken voice database: Effects of pathology subset and audio materials. In Proceedings of INTERSPEECH (pp. 4850\u20134854).","DOI":"10.21437\/Interspeech.2021-1507"},{"key":"10085_CR39","doi-asserted-by":"crossref","unstructured":"Javanmardi, F., Kadiri, S. R., Kodali, M., Alku, P., et\u00a0al. (2022). Comparing 1-dimensional and 2-dimensional spectral feature representations in voice pathology detection using machine learning and deep learning classifiers. In Proceedings of INTERSPEECH (pp. 2173\u20132177).","DOI":"10.21437\/Interspeech.2022-10420"},{"key":"10085_CR40","doi-asserted-by":"crossref","unstructured":"Javid, M. H., Gurugubelli, K., & Vuppala, A. K. (2020). Single frequency filter bank based long-term average spectra for hypernasality detection and assessment in cleft lip and palate speech. In Proceedings of ICASSP (pp. 6754\u20136758). IEEE.","DOI":"10.1109\/ICASSP40776.2020.9054684"},{"key":"10085_CR41","doi-asserted-by":"crossref","unstructured":"Jo, C.-W., & Kim, D.-H. (1998) Analysis of disordered speech signal using wavelet transform. In Fifth international conference on spoken language processing.","DOI":"10.21437\/ICSLP.1998-783"},{"key":"10085_CR42","doi-asserted-by":"crossref","unstructured":"Kadiri, S. R., & Yegnanarayana, B. (2018). Breathy to tense voice discrimination using zero-time windowing cepstral coefficients (ZTWCCs). In Proceedings of INTERSPEECH (pp. 232\u2013236).","DOI":"10.21437\/Interspeech.2018-2498"},{"issue":"2","key":"10085_CR44","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1109\/JSTSP.2019.2957988","volume":"14","author":"SR Kadiri","year":"2020","unstructured":"Kadiri, S. R., & Alku, P. (2020). Analysis and detection of pathological voice using glottal source features. IEEE Journal of Selected Topics in Signal Processing, 14(2), 367\u2013379.","journal-title":"IEEE Journal of Selected Topics in Signal Processing"},{"key":"10085_CR43","doi-asserted-by":"crossref","unstructured":"Kadiri, S. R., Yegnanarayana, B. (2018). Analysis and detection of phonation modes in singing voice using excitation source features and single frequency filtering cepstral coefficients (SFFCC). In Proceedings of INTERSPEECH (pp. 441\u2013445).","DOI":"10.21437\/Interspeech.2018-2502"},{"key":"10085_CR45","doi-asserted-by":"publisher","first-page":"811","DOI":"10.1007\/s11517-013-1051-8","volume":"51","author":"M Kaleem","year":"2013","unstructured":"Kaleem, M., Ghoraani, B., Guergachi, A., & Krishnan, S. (2013). Pathological speech signal analysis and classification using empirical mode decomposition. Medical & Biological Engineering & Computing, 51, 811\u2013821.","journal-title":"Medical & Biological Engineering & Computing"},{"issue":"6","key":"10085_CR46","doi-asserted-by":"publisher","first-page":"1170","DOI":"10.1109\/TASL.2013.2245653","volume":"21","author":"J Kane","year":"2013","unstructured":"Kane, J., & Gobl, C. (2013). Wavelet maxima dispersion for breathy to tense voice discrimination. IEEE Transactions on Audio, Speech, and Language Processing, 21(6), 1170\u20131179.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"5","key":"10085_CR47","doi-asserted-by":"publisher","first-page":"2218","DOI":"10.1121\/1.399189","volume":"87","author":"F Klingholtz","year":"1990","unstructured":"Klingholtz, F. (1990). Acoustic recognition of voice disorders: A comparative study of running speech versus sustained vowels. The Journal of the Acoustical Society of America, 87(5), 2218\u20132224.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"2","key":"10085_CR48","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1044\/jshr.2802.169","volume":"28","author":"F Klingholz","year":"1985","unstructured":"Klingholz, F., & Martin, F. (1985). Quantitative spectral evaluation of shimmer and jitter. Journal of Speech, Language, and Hearing Research, 28(2), 169\u2013174.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"key":"10085_CR49","doi-asserted-by":"publisher","first-page":"549","DOI":"10.1016\/j.jvoice.2015.06.010","volume":"30","author":"M Kohler","year":"2016","unstructured":"Kohler, M., Vellasco, M. M., Cataldo, E., et al. (2016). Analysis and classification of voice pathologies using glottal signal parameters. Journal of Voice, 30, 549\u2013556.","journal-title":"Journal of Voice"},{"issue":"4","key":"10085_CR50","first-page":"248","volume":"54","author":"O Koichi","year":"2011","unstructured":"Koichi, O. (2011). Diagnosis of voice disorders. JMAJ, 54(4), 248\u2013253.","journal-title":"JMAJ"},{"issue":"2","key":"10085_CR51","doi-asserted-by":"publisher","first-page":"254","DOI":"10.1044\/jshr.3602.254","volume":"36","author":"GD Krom","year":"1993","unstructured":"Krom, G. D. (1993). A cepstrum-based technique for determining a harmonics-to-noise ratio in speech signals. Journal of Speech, Language, and Hearing Research, 36(2), 254\u2013266.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"key":"10085_CR52","doi-asserted-by":"publisher","first-page":"651","DOI":"10.1016\/j.jvoice.2009.07.008","volume":"24","author":"BR Kumar","year":"2010","unstructured":"Kumar, B. R., Bhat, J. S., & Prasad, N. (2010). Cepstral analysis of voice in persons with vocal nodules. Journal of Voice, 24, 651\u2013653.","journal-title":"Journal of Voice"},{"issue":"2","key":"10085_CR53","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1016\/S0892-1997(05)80125-0","volume":"6","author":"J Laver","year":"1992","unstructured":"Laver, J., Hiller, S., & Beck, J. M. (1992). Acoustic waveform perturbations and voice disorders. Journal of Voice, 6(2), 115\u2013126.","journal-title":"Journal of Voice"},{"key":"10085_CR54","doi-asserted-by":"crossref","unstructured":"Lee, J.-W., Kim, S., Kang, H.-G. (2014). Detecting pathological speech using contour modeling of harmonic-to-noise ratio. In Proceedings of ICASSP (pp. 5969\u20135973). IEEE","DOI":"10.1109\/ICASSP.2014.6854749"},{"issue":"8","key":"10085_CR55","doi-asserted-by":"publisher","first-page":"1876","DOI":"10.1016\/j.sigpro.2011.02.010","volume":"91","author":"W Lin","year":"2011","unstructured":"Lin, W., & Xiaofeng, M. (2011). An adaptive generalized S-transform for instantaneous frequency estimation. Signal Processing, 91(8), 1876\u20131886.","journal-title":"Signal Processing"},{"key":"10085_CR56","doi-asserted-by":"crossref","unstructured":"Livanos, G., Ranganathan, N., & Jiang, J. (2000). Heart sound analysis using the S transform. In Computers in cardiology 2000 (Vol. 27, pp. 587\u2013590). IEEE.","DOI":"10.1109\/CIC.2000.898590"},{"issue":"1","key":"10085_CR57","doi-asserted-by":"publisher","first-page":"119-e1","DOI":"10.1016\/j.jvoice.2016.02.021","volume":"31","author":"LW Lopes","year":"2017","unstructured":"Lopes, L. W., da Silva, J. D., Sim\u00f5es, L. B., da Silva Evangelista, D., Silva, P. O. C., Almeida, A. A., & de Lima-Silva, M. F. B. (2017). Relationship between acoustic measurements and self-evaluation in patients with voice disorders. Journal of Voice, 31(1), 119-e1.","journal-title":"Journal of Voice"},{"issue":"3","key":"10085_CR58","doi-asserted-by":"publisher","first-page":"793","DOI":"10.1523\/JNEUROSCI.2758-10.2011","volume":"31","author":"CL Ludlow","year":"2011","unstructured":"Ludlow, C. L. (2011). Spasmodic dysphonia: A laryngeal control disorder specific to speech. Journal of Neuroscience, 31(3), 793\u2013797.","journal-title":"Journal of Neuroscience"},{"issue":"4","key":"10085_CR59","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1109\/PROC.1975.9792","volume":"63","author":"J Makhoul","year":"1975","unstructured":"Makhoul, J. (1975). Linear prediction: A tutorial review. Proceedings of the IEEE, 63(4), 561\u2013580.","journal-title":"Proceedings of the IEEE"},{"key":"10085_CR60","doi-asserted-by":"crossref","unstructured":"Markaki, M., & Stylianou, Y. (2009). Normalized modulation spectral features for cross-database voice pathology detection. In Tenth annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2009-280"},{"issue":"4","key":"10085_CR61","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1159\/000227999","volume":"61","author":"Y Maryn","year":"2009","unstructured":"Maryn, Y., Corthals, P., De Bodt, M., Van Cauwenberge, P., & Deliyski, D. (2009). Perturbation measures of voice: A comparative study between multi-dimensional voice program and praat. Folia Phoniatrica et Logopaedica, 61(4), 217\u2013226.","journal-title":"Folia Phoniatrica et Logopaedica"},{"issue":"11","key":"10085_CR62","doi-asserted-by":"publisher","first-page":"3723","DOI":"10.3390\/app10113723","volume":"10","author":"MA Mohammed","year":"2020","unstructured":"Mohammed, M. A., Abdulkareem, K. H., Mostafa, S. A., Khanapi Abd Ghani, M., Maashi, M. S., Garcia-Zapirain, B., Oleagordia, I., Alhakami, H., & Al-Dhief, F. T. (2020). Voice pathology detection and classification using convolutional neural network model. Applied Sciences, 10(11), 3723.","journal-title":"Applied Sciences"},{"key":"10085_CR63","doi-asserted-by":"publisher","first-page":"226","DOI":"10.1016\/j.dsp.2015.07.003","volume":"46","author":"A Moukadem","year":"2015","unstructured":"Moukadem, A., Bouguila, Z., Abdeslam, D. O., & Dieterlen, A. (2015). A new optimized Stockwell transform applied on synthetic and real non-stationary signals. Digital Signal Processing, 46, 226\u2013238.","journal-title":"Digital Signal Processing"},{"issue":"3","key":"10085_CR64","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1016\/j.bspc.2012.11.008","volume":"8","author":"A Moukadem","year":"2013","unstructured":"Moukadem, A., Dieterlen, A., Hueber, N., & Brandt, C. (2013). A robust heart sounds segmentation module based on S-transform. Biomedical Signal Processing and Control, 8(3), 273\u2013281.","journal-title":"Biomedical Signal Processing and Control"},{"issue":"8","key":"10085_CR65","doi-asserted-by":"publisher","first-page":"1602","DOI":"10.1109\/TASL.2008.2004526","volume":"16","author":"KSR Murty","year":"2008","unstructured":"Murty, K. S. R., & Yegnanarayana, B. (2008). Epoch extraction from speech signals. IEEE Transactions on Audio, Speech, and Language Processing, 16(8), 1602\u20131613.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10085_CR66","doi-asserted-by":"publisher","first-page":"67745","DOI":"10.1109\/ACCESS.2020.2986171","volume":"8","author":"N Narendra","year":"2020","unstructured":"Narendra, N., & Alku, P. (2020). Glottal source information for pathological voice detection. IEEE Access, 8, 67745\u201367755.","journal-title":"IEEE Access"},{"issue":"2","key":"10085_CR67","doi-asserted-by":"publisher","first-page":"469","DOI":"10.1044\/jslhr.4302.469","volume":"43","author":"V Parsa","year":"2000","unstructured":"Parsa, V., & Jamieson, D. G. (2000). Identification of pathological voices using glottal noise measures. Journal of Speech, Language, and Hearing Research, 43(2), 469\u2013485.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"issue":"11","key":"10085_CR68","doi-asserted-by":"publisher","first-page":"2583","DOI":"10.1109\/TBME.2009.2026735","volume":"56","author":"CR Pinnegar","year":"2009","unstructured":"Pinnegar, C. R., Khosravani, H., & Federico, P. (2009). Time-frequency phase analysis of ictal EEG recordings with the S-transform. IEEE Transactions on Biomedical Engineering, 56(11), 2583\u20132593.","journal-title":"IEEE Transactions on Biomedical Engineering"},{"key":"10085_CR69","doi-asserted-by":"crossref","unstructured":"Poh, K.-K., & Marziliano, P. (2007). Analysis of neonatal EEG signals using stockwell transform. In 2007 29th annual international conference of the IEEE engineering in medicine and biology society (pp. 594\u2013597). IEEE.","DOI":"10.1109\/IEMBS.2007.4352360"},{"issue":"1","key":"10085_CR70","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1121\/1.419726","volume":"102","author":"Y Qi","year":"1997","unstructured":"Qi, Y., & Hillman, R. E. (1997). Temporal and spectral estimations of harmonics-to-noise ratio in human voice signals. The Journal of the Acoustical Society of America, 102(1), 537\u2013543.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"4","key":"10085_CR71","doi-asserted-by":"publisher","first-page":"2532","DOI":"10.1121\/1.426860","volume":"105","author":"Y Qi","year":"1999","unstructured":"Qi, Y., Hillman, R. E., & Milstein, C. (1999). The estimation of signal-to-noise ratio in continuous speech for disordered voices. The Journal of the Acoustical Society of America, 105(4), 2532\u20132535.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10085_CR72","doi-asserted-by":"publisher","first-page":"113597","DOI":"10.1016\/j.jelechem.2019.113597","volume":"855","author":"O Ramos-Negr\u00f3n","year":"2019","unstructured":"Ramos-Negr\u00f3n, O., Escobar-Jim\u00e9nez, R., Arellano-P\u00e9rez, J., Uruchurtu-Chavar\u00edn, J., G\u00f3mez-Aguilar, J., & Lucio-Garc\u00eda, M. (2019). Electrochemical noise analysis to identify the corrosion type using the Stockwell Transform and the Shannon energy: Part II. Journal of Electroanalytical Chemistry, 855, 113597.","journal-title":"Journal of Electroanalytical Chemistry"},{"key":"10085_CR73","doi-asserted-by":"publisher","first-page":"135953","DOI":"10.1109\/ACCESS.2021.3117665","volume":"9","author":"MK Reddy","year":"2021","unstructured":"Reddy, M. K., & Alku, P. (2021). A comparison of cepstral features in the detection of pathological voices by varying the input and filterbank of the cepstrum computation. IEEE Access, 9, 135953\u2013135963.","journal-title":"IEEE Access"},{"issue":"4","key":"10085_CR74","doi-asserted-by":"publisher","first-page":"979","DOI":"10.1007\/s10772-019-09644-3","volume":"22","author":"A Revathi","year":"2019","unstructured":"Revathi, A., & Sasikaladevi, N. (2019). Hearing impaired speech recognition: Stockwell features and models. International Journal of Speech Technology, 22(4), 979\u2013991.","journal-title":"International Journal of Speech Technology"},{"issue":"5","key":"10085_CR75","doi-asserted-by":"publisher","first-page":"672","DOI":"10.1016\/j.jvoice.2012.02.002","volume":"26","author":"V Reynolds","year":"2012","unstructured":"Reynolds, V., Buckland, A., Bailey, J., Lipscombe, J., Nathan, E., Vijayasekaran, S., Kelly, R., Maryn, Y., & French, N. (2012). Objective assessment of pediatric voice disorders with the acoustic voice quality index. Journal of Voice, 26(5), 672\u201316727.","journal-title":"Journal of Voice"},{"key":"10085_CR76","doi-asserted-by":"publisher","first-page":"114667","DOI":"10.1016\/j.jelechem.2020.114667","volume":"878","author":"C Rocabruno-Vald\u00e9s","year":"2020","unstructured":"Rocabruno-Vald\u00e9s, C., Escobar-Jim\u00e9nez, R., D\u00edaz-Blanco, Y., G\u00f3mez-Aguilar, J., Astorga-Zaragoza, C., & Uruchurtu-Chavarin, J. (2020). Corrosion evaluation of aluminum 6061\u2013t6 exposed to sugarcane bioethanol-gasoline blends using the Stockwell Transform. Journal of Electroanalytical Chemistry, 878, 114667.","journal-title":"Journal of Electroanalytical Chemistry"},{"issue":"2","key":"10085_CR77","doi-asserted-by":"publisher","first-page":"168","DOI":"10.1166\/jmihi.2014.1253","volume":"4","author":"JC Saldanha","year":"2014","unstructured":"Saldanha, J. C., Ananthakrishna, T., & Pinto, R. (2014). Vocal fold pathology assessment using mel-frequency cepstral coefficients and linear predictive cepstral coefficients features. Journal of Medical Imaging and Health Informatics, 4(2), 168\u2013173.","journal-title":"Journal of Medical Imaging and Health Informatics"},{"key":"10085_CR78","doi-asserted-by":"crossref","unstructured":"Sanyal, A., Baral, A., & Lahiri, A. (2012). Application of S-transform for removing baseline drift from ECG. In 2012 2nd national conference on computational intelligence and signal processing (CISP) (pp. 153\u2013157). IEEE.","DOI":"10.1109\/NCCISP.2012.6189697"},{"key":"10085_CR79","doi-asserted-by":"crossref","unstructured":"Saoud, S., Bousselmi, S., Naser, M. B., & Cherif, A. (2016). New speech enhancement based on discrete orthonormal Stockwell Transform. International Journal of Advanced Computer Science and Applications, 7(10).","DOI":"10.14569\/IJACSA.2016.071026"},{"issue":"10","key":"10085_CR80","doi-asserted-by":"publisher","first-page":"1128","DOI":"10.1001\/archotol.132.10.1128","volume":"132","author":"E Seifert","year":"2006","unstructured":"Seifert, E., & Kollbrunner, J. (2006). An update in thinking about nonorganic voice disorders. Archives of Otolaryngology-Head & Neck Surgery, 132(10), 1128\u20131132.","journal-title":"Archives of Otolaryngology-Head & Neck Surgery"},{"key":"10085_CR81","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2008\/672941","volume":"2008","author":"E Sejdic","year":"2007","unstructured":"Sejdic, E., Djurovic, I., & Jiang, J. (2007). A window width optimized S-transform. EURASIP Journal on Advances in Signal Processing, 2008, 1\u201313.","journal-title":"EURASIP Journal on Advances in Signal Processing"},{"key":"10085_CR82","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1109\/LSP.2008.917014","volume":"15","author":"E Sejdic","year":"2008","unstructured":"Sejdic, E., Stankovic, L., Dakovic, M., & Jiang, J. (2008). Instantaneous frequency estimation using the S-transform. IEEE Signal Processing Letters, 15, 309\u2013312.","journal-title":"IEEE Signal Processing Letters"},{"key":"10085_CR83","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2009\/567875","volume":"2009","author":"DG Silva","year":"2009","unstructured":"Silva, D. G., Oliveira, L. C., & Andrea, M. (2009). Jitter estimation algorithms for detection of pathological voices. EURASIP Journal on Advances in Signal Processing, 2009, 1\u20139.","journal-title":"EURASIP Journal on Advances in Signal Processing"},{"key":"10085_CR84","doi-asserted-by":"publisher","first-page":"371","DOI":"10.1016\/j.dsp.2006.04.006","volume":"17","author":"RG Stockwell","year":"2007","unstructured":"Stockwell, R. G. (2007). A basis for efficient representation of the S-transform. Digital Signal Processing, 17, 371\u2013393.","journal-title":"Digital Signal Processing"},{"issue":"4","key":"10085_CR85","doi-asserted-by":"publisher","first-page":"998","DOI":"10.1109\/78.492555","volume":"44","author":"RG Stockwell","year":"1996","unstructured":"Stockwell, R. G., Mansinha, L., & Lowe, R. (1996). Localization of the complex spectrum: The S-transform. IEEE Transactions on Signal Processing, 44(4), 998\u20131001.","journal-title":"IEEE Transactions on Signal Processing"},{"key":"10085_CR86","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2021\/6635964","volume":"2021","author":"SA Syed","year":"2021","unstructured":"Syed, S. A., Rashid, M., Hussain, S., & Zahid, H. (2021). Comparative analysis of CNN and RNN for voice pathology detection. BioMed Research International, 2021, 1\u20138.","journal-title":"BioMed Research International"},{"key":"10085_CR87","doi-asserted-by":"publisher","first-page":"1112","DOI":"10.1016\/j.protcy.2013.12.124","volume":"9","author":"JP Teixeira","year":"2013","unstructured":"Teixeira, J. P., Oliveira, C., & Lopes, C. (2013). Vocal acoustic analysis-jitter, shimmer and HNR parameters. Procedia Technology, 9, 1112\u20131122.","journal-title":"Procedia Technology"},{"issue":"3","key":"10085_CR88","doi-asserted-by":"publisher","first-page":"421","DOI":"10.1109\/TBME.2004.842962","volume":"52","author":"K Umapathy","year":"2005","unstructured":"Umapathy, K., Krishnan, S., Parsa, V., & Jamieson, D. G. (2005). Discrimination of pathological voices using a time-frequency approach. IEEE Transactions on Biomedical Engineering, 52(3), 421\u2013430.","journal-title":"IEEE Transactions on Biomedical Engineering"},{"issue":"7","key":"10085_CR89","doi-asserted-by":"publisher","first-page":"2771","DOI":"10.1109\/TSP.2008.917029","volume":"56","author":"S Ventosa","year":"2008","unstructured":"Ventosa, S., Simon, C., Schimmel, M., Da\u00f1obeitia, J. J., & M\u00e0nuel, A. (2008). The S-transform from a wavelet point of view. IEEE Transactions on Signal Processing, 56(7), 2771\u20132780.","journal-title":"IEEE Transactions on Signal Processing"},{"issue":"5","key":"10085_CR90","doi-asserted-by":"publisher","first-page":"3896","DOI":"10.1121\/1.4967517","volume":"140","author":"HK Vydana","year":"2016","unstructured":"Vydana, H. K., & Vuppala, A. K. (2016). Detection of fricatives using S-transform. The Journal of the Acoustical Society of America, 140(5), 3896\u20133907.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10085_CR91","doi-asserted-by":"crossref","unstructured":"Waldekar, S., & Saha, G. (2018). Wavelet transform based mel-scaled features for acoustic scene classification. In INTERSPEECH (Vol. 2018, pp. 3323\u20133327).","DOI":"10.21437\/Interspeech.2018-2083"},{"key":"10085_CR92","doi-asserted-by":"publisher","first-page":"1525","DOI":"10.1044\/1092-4388(2011\/10-0209)","volume":"54","author":"CR Watts","year":"2011","unstructured":"Watts, C. R., & Awan, S. N. (2011). Use of spectral\/cepstral analyses for differentiating normal from hypofunctional voices in sustained vowel and continuous speech contexts. Journal of Speech, Language, and Hearing Research, 54, 1525\u20131537.","journal-title":"Journal of Speech, Language, and Hearing Research"},{"key":"10085_CR93","unstructured":"Woldert-Jokisz, B. (2007). Saarbruecken voice database."},{"key":"10085_CR94","doi-asserted-by":"crossref","unstructured":"Wu, H., Soraghan, J., Lowit, A., & Di\u00a0Caterina, G. (2018). A deep learning method for pathological voice detection using convolutional deep belief networks. In Proceedings of INTERSPEECH (pp. 446\u2013450)","DOI":"10.21437\/Interspeech.2018-1351"},{"key":"10085_CR95","doi-asserted-by":"crossref","unstructured":"Zhu, M., Jiang, Z., Zhang, X., Qi, Y. (2014). A S-transform based spectrum enhancement method for complex noise environment. In 2014 international conference on audio, language and image processing (pp. 382\u2013385). IEEE.","DOI":"10.1109\/ICALIP.2014.7009820"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-024-10085-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-024-10085-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-024-10085-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T15:12:46Z","timestamp":1715613166000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-024-10085-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,29]]},"references-count":95,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2024,3]]}},"alternative-id":["10085"],"URL":"https:\/\/doi.org\/10.1007\/s10772-024-10085-w","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"value":"1381-2416","type":"print"},{"value":"1572-8110","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,2,29]]},"assertion":[{"value":"25 December 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 January 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 February 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}