{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T18:10:56Z","timestamp":1764785456487},"reference-count":80,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1007\/s10772-024-10137-1","type":"journal-article","created":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T07:03:22Z","timestamp":1725433402000},"page":"831-845","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Epoch extraction in real-world scenario"],"prefix":"10.1007","volume":"27","author":[{"given":"Purva","family":"Barche","sequence":"first","affiliation":[]},{"given":"Krishna","family":"Gurugubelli","sequence":"additional","affiliation":[]},{"given":"Anil Kumar","family":"Vuppala","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,9,4]]},"reference":[{"key":"10137_CR1","doi-asserted-by":"crossref","unstructured":"Adiga, N., Vikram, C., Pullela, K., & Prasanna, S. M. (2017). Zero frequency filter based analysis of voice disorders. In Interspeech (pp. 1824\u20131828).","DOI":"10.21437\/Interspeech.2017-589"},{"key":"10137_CR2","doi-asserted-by":"crossref","unstructured":"Ananthapadmanabha, T., & Yegnanarayana, B. (1978). Epoch extraction from linear prediction residual. In IEEE international conference on acoustics, speech, and signal processing (ICASSP\u201978) (Vol. 3, pp. 8\u201311). IEEE.","DOI":"10.1109\/ICASSP.1978.1170401"},{"issue":"4","key":"10137_CR3","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1109\/TASSP.1979.1163267","volume":"27","author":"T Ananthapadmanabha","year":"1979","unstructured":"Ananthapadmanabha, T., & Yegnanarayana, B. (1979). Epoch extraction from linear prediction residual for identification of closed glottis interval. IEEE Transactions on Acoustics, Speech, and Signal Processing, 27(4), 309\u2013319.","journal-title":"IEEE Transactions on Acoustics, Speech, and Signal Processing"},{"key":"10137_CR4","doi-asserted-by":"crossref","unstructured":"Aneeja, G., Kadiri, S. R., & Yegnanarayana, B. (2018). Detection of glottal closure instants in degraded speech using single frequency filtering analysis. In Interspeech (pp. 2300\u20132304).","DOI":"10.21437\/Interspeech.2018-1018"},{"key":"10137_CR5","doi-asserted-by":"crossref","unstructured":"Ardaillon, L., & Roebel, A. (2020). Gci detection from raw speech using a fully-convolutional network. In 2020 IEEE international conference on acoustics, speech and signal processing (ICASSP 2020) (pp. 6739\u20136743). IEEE.","DOI":"10.1109\/ICASSP40776.2020.9053089"},{"key":"10137_CR6","unstructured":"Aronson, A. E. (1985). Clinical voice disorders. An interdisciplinary approach. Thieme."},{"key":"10137_CR7","doi-asserted-by":"crossref","unstructured":"Bapineedu, G., Avinash, B., Gangashetty, S. V., & Yegnanarayana, B. (2009). Analysis of Lombard speech using excitation source information. In Interspeech (pp. 1091\u20131094).","DOI":"10.21437\/Interspeech.2009-34"},{"key":"10137_CR8","doi-asserted-by":"crossref","unstructured":"Barche, P., Gurugubelli, K., & Vuppala, A. K. (2020). Towards automatic assessment of voice disorders: A clinical approach. In Interspeech (pp. 2537\u20132541).","DOI":"10.21437\/Interspeech.2020-2160"},{"key":"10137_CR9","doi-asserted-by":"crossref","unstructured":"Barche, P., Gurugubelli, K., & Vuppala, A. K. (2021). Comparative study of different epoch extraction methods for speech associated with voice disorders. In 2021 IEEE international conference on acoustics, speech and signal processing (ICASSP 2021) (pp. 6923\u20136927). IEEE.","DOI":"10.1109\/ICASSP39728.2021.9413518"},{"key":"10137_CR10","doi-asserted-by":"crossref","unstructured":"Burkhardt, F., Paeschke, A., Rolfes, M., Sendlmeier, W. F., & Weiss, B. (2005). A database of german emotional speech. In Interspeech (Vol. 5, pp. 1517\u20131520).","DOI":"10.21437\/Interspeech.2005-446"},{"key":"10137_CR11","doi-asserted-by":"crossref","unstructured":"Chien, Y.-R., Borsk\u1ef3, M., & Gunason, J. (2019). F0 variability measures based on glottal closure instants. In Interspeech (pp. 1986\u20131989).","DOI":"10.21437\/Interspeech.2019-1326"},{"key":"10137_CR12","doi-asserted-by":"crossref","unstructured":"Dasgupta, H., Pandey, P. C., & Nataraj, K. (2018). Detection of glottal excitation epochs in speech signal using Hilbert envelope. In Interspeech (pp. 2132\u20132136).","DOI":"10.21437\/Interspeech.2018-2014"},{"issue":"2","key":"10137_CR13","doi-asserted-by":"publisher","first-page":"461","DOI":"10.1109\/JSTSP.2019.2951458","volume":"14","author":"H Dasgupta","year":"2019","unstructured":"Dasgupta, H., Pandey, P. C., & Nataraj, K. (2019). Epoch detection using hilbert envelope for glottal excitation enhancement and maximum-sum subarray for epoch marking. IEEE Journal of Selected Topics in Signal Processing, 14(2), 461\u2013471.","journal-title":"IEEE Journal of Selected Topics in Signal Processing"},{"issue":"7","key":"10137_CR14","doi-asserted-by":"publisher","first-page":"2309","DOI":"10.1007\/s00034-014-9957-4","volume":"34","author":"K Deepak","year":"2015","unstructured":"Deepak, K., & Prasanna, S. (2015). Epoch extraction using zero band filtering from speech signal. Circuits, Systems, and Signal Processing, 34(7), 2309\u20132333.","journal-title":"Circuits, Systems, and Signal Processing"},{"key":"10137_CR15","unstructured":"Drugman, T., & Dutoit, T. (2019). Glottal closure and opening instant detection from speech signals. arXiv preprint. arXiv:2001.00841"},{"issue":"5","key":"10137_CR16","doi-asserted-by":"publisher","first-page":"1117","DOI":"10.1016\/j.csl.2014.03.003","volume":"28","author":"T Drugman","year":"2014","unstructured":"Drugman, T., Alku, P., Alwan, A., & Yegnanarayana, B. (2014). Glottal source processing: From analysis to applications. Computer Speech & Language, 28(5), 1117\u20131138.","journal-title":"Computer Speech & Language"},{"key":"10137_CR17","doi-asserted-by":"crossref","unstructured":"Dubagunta, S. P., Vlasenko, B., & Doss, M. M. (2019). Learning voice source related information for depression detection. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019) (pp. 6525\u20136529). IEEE.","DOI":"10.1109\/ICASSP.2019.8683498"},{"issue":"6","key":"10137_CR18","doi-asserted-by":"publisher","first-page":"4211","DOI":"10.1121\/1.5134433","volume":"146","author":"AK Dubey","year":"2019","unstructured":"Dubey, A. K., Prasanna, S. M., & Dandapat, S. (2019). Detection and assessment of hypernasality in repaired cleft palate speech using vocal tract and residual features. The Journal of the Acoustical Society of America, 146(6), 4211\u20134223.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10137_CR19","doi-asserted-by":"crossref","unstructured":"Gangamohan, P., & Gangashetty, S. V. (2019). Epoch extraction from speech signals using temporal and spectral cues by exploiting harmonic structure of impulse-like excitations. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019) (pp. 6505\u20136509). IEEE.","DOI":"10.1109\/ICASSP.2019.8682976"},{"key":"10137_CR20","doi-asserted-by":"crossref","unstructured":"Gangamohan, P., & Yegnanarayana, B. (2017). A robust and alternative approach to zero frequency filtering method for epoch extraction. In Interspeech (pp. 2297\u20132300).","DOI":"10.21437\/Interspeech.2017-1172"},{"key":"10137_CR21","doi-asserted-by":"crossref","unstructured":"Gangamohan, P., Kadiri, S. R., & Yegnanarayana, B. (2013). Analysis of emotional speech at subsegmental level. In Interspeech (Vol. 2013, pp. 1916\u20131920).","DOI":"10.21437\/Interspeech.2013-20"},{"key":"10137_CR22","doi-asserted-by":"crossref","unstructured":"Govind, D., & Prasanna, S. (2012). Epoch extraction from emotional speech. In 2012 International conference on signal processing and communications (SPCOM), (pp. 1\u20135). IEEE.","DOI":"10.1109\/SPCOM.2012.6289995"},{"key":"10137_CR23","doi-asserted-by":"crossref","unstructured":"Govind, D., Prasanna, S. M., & Yegnanarayana, B. (2011). Neutral to target emotion conversion using source and suprasegmental information. In Twelfth annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2011-743"},{"key":"10137_CR24","doi-asserted-by":"crossref","unstructured":"Goyal, M., Srivastava, V., &  Prathosh, A. P. (2018). Detection of glottal closure instants from raw speech using convolutional neural networks. arXiv preprint. arXiv:1804.10147","DOI":"10.21437\/Interspeech.2019-2587"},{"issue":"4","key":"10137_CR25","doi-asserted-by":"publisher","first-page":"2050","DOI":"10.1007\/s00034-020-01551-2","volume":"40","author":"K Gurugubelli","year":"2021","unstructured":"Gurugubelli, K., Javid, M. H., Alluri, K. R., & Vuppala, A. K. (2021). Toward improving the performance of epoch extraction from telephonic speech. Circuits, Systems, and Signal Processing, 40(4), 2050\u20132064.","journal-title":"Circuits, Systems, and Signal Processing"},{"issue":"9","key":"10137_CR26","doi-asserted-by":"publisher","first-page":"1310","DOI":"10.1109\/LSP.2019.2929442","volume":"26","author":"K Gurugubelli","year":"2019","unstructured":"Gurugubelli, K., & Vuppala, A. K. (2019). Stable implementation of zero frequency filtering of speech signals for efficient epoch extraction. IEEE Signal Processing Letters, 26(9), 1310\u20131314.","journal-title":"IEEE Signal Processing Letters"},{"key":"10137_CR27","doi-asserted-by":"crossref","unstructured":"Hamon, C., Mouline, E., & Charpentier, F. (1989). A diphone synthesis system based on time-domain prosodic modifications of speech. In International conference on acoustics, speech, and signal processing (pp. 238\u2013241). IEEE.","DOI":"10.1109\/ICASSP.1989.266409"},{"key":"10137_CR28","doi-asserted-by":"crossref","unstructured":"Jelil, S., Das, R. K., Prasanna, S. M., & Sinha, R. (2017). Spoof detection using source, instantaneous frequency and cepstral features. In Interspeech (pp. 22\u201326).","DOI":"10.21437\/Interspeech.2017-930"},{"key":"10137_CR29","doi-asserted-by":"crossref","unstructured":"Kadiri, S. R. (2019). A quantitative comparison of epoch extraction algorithms for telephone speech. In 2019 IEEE international conference on acoustics, speech and signal processing (ICASSP 2019) (pp. 6500\u20136504). IEEE.","DOI":"10.1109\/ICASSP.2019.8683558"},{"key":"10137_CR30","doi-asserted-by":"crossref","unstructured":"Kadiri, S.R., Alku, P., & Yegnanarayana, B. (2020). Comparison of glottal closure instants detection algorithms for emotional speech. In 2020 IEEE international conference on acoustics, speech and signal processing (ICASSP 2020), (pp. 7379\u20137383). IEEE.","DOI":"10.1109\/ICASSP40776.2020.9054737"},{"key":"10137_CR31","doi-asserted-by":"crossref","unstructured":"Kadiri, S. R., Gangamohan, P., Gangashetty, S. V., & Yegnanarayana, B. (2015). Analysis of excitation source features of speech for emotion recognition. In Sixteenth annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2015-329"},{"issue":"2","key":"10137_CR32","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1109\/JSTSP.2019.2957988","volume":"14","author":"SR Kadiri","year":"2019","unstructured":"Kadiri, S. R., & Alku, P. (2019). Analysis and detection of pathological voice using glottal source features. IEEE Journal of Selected Topics in Signal Processing, 14(2), 367\u2013379.","journal-title":"IEEE Journal of Selected Topics in Signal Processing"},{"issue":"9","key":"10137_CR33","doi-asserted-by":"publisher","first-page":"4459","DOI":"10.1007\/s00034-020-01377-y","volume":"39","author":"SR Kadiri","year":"2020","unstructured":"Kadiri, S. R., Gangamohan, P., Gangashetty, S. V., Alku, P., & Yegnanarayana, B. (2020). Excitation features of speech for emotion recognition using neutral speech as reference. Circuits, Systems, and Signal Processing, 39(9), 4459\u20134481.","journal-title":"Circuits, Systems, and Signal Processing"},{"key":"10137_CR34","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1016\/j.specom.2016.11.005","volume":"86","author":"SR Kadiri","year":"2017","unstructured":"Kadiri, S. R., & Yegnanarayana, B. (2017). Epoch extraction from emotional speech using single frequency filtering approach. Speech Communication, 86, 52\u201363.","journal-title":"Speech Communication"},{"issue":"8","key":"10137_CR35","doi-asserted-by":"publisher","first-page":"1107","DOI":"10.1109\/LSP.2019.2921229","volume":"26","author":"YM Keerthana","year":"2019","unstructured":"Keerthana, Y. M., Reddy, M. K., & Rao, K. S. (2019). Cwt-based approach for epoch extraction from telephone quality speech. IEEE Signal Processing Letters, 26(8), 1107\u20131111.","journal-title":"IEEE Signal Processing Letters"},{"key":"10137_CR36","unstructured":"Kominek, J., & Black, A. W. (2004). The CMU arctic speech databases. In Fifth ISCA workshop on speech synthesis."},{"issue":"4","key":"10137_CR37","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1007\/s10772-012-9150-8","volume":"15","author":"SG Koolagudi","year":"2012","unstructured":"Koolagudi, S. G., & Krothapalli, S. R. (2012). Emotion recognition from speech using sub-syllabic and pitch synchronous spectral features. International Journal of Speech Technology, 15(4), 495\u2013511.","journal-title":"International Journal of Speech Technology"},{"key":"10137_CR38","doi-asserted-by":"crossref","unstructured":"Kumar, K. S., Mallidi, S. H. R., Murty, K. S. R., & Yegnanarayana, B. (2009). Analysis of laugh signals for detecting in continuous speech. In Interspeech (pp. 1591\u20131594).","DOI":"10.21437\/Interspeech.2009-473"},{"issue":"2","key":"10137_CR39","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1016\/S0892-1997(05)80125-0","volume":"6","author":"J Laver","year":"1992","unstructured":"Laver, J., Hiller, S., & Beck, J. M. (1992). Acoustic waveform perturbations and voice disorders. Journal of Voice, 6(2), 115\u2013126.","journal-title":"Journal of Voice"},{"key":"10137_CR40","doi-asserted-by":"crossref","unstructured":"Li, Y., Tao, J., Liu, B., Erickson, D., & Akagi, M. (2020). Comparison of glottal source parameter values in emotional vowels. In Interspeech 2020.","DOI":"10.21437\/Interspeech.2020-1536"},{"issue":"4","key":"10137_CR41","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1109\/PROC.1975.9792","volume":"63","author":"J Makhoul","year":"1975","unstructured":"Makhoul, J. (1975). Linear prediction: A tutorial review. Proceedings of the IEEE, 63(4), 561\u2013580.","journal-title":"Proceedings of the IEEE"},{"key":"10137_CR42","unstructured":"Mandal, T., Rao, K. S., & Gurumath Reddy, M. (2018). Glottal closure instants detection from pathological acoustic speech signal using deep learning. arXiv preprint. arXiv:1811.09956"},{"key":"10137_CR44","doi-asserted-by":"crossref","unstructured":"Matou\u0161ek, J., & Tihelka, D. (2017). Classification-based detection of glottal closure instants from speech signals. In Interspeech (pp. 3053\u20133057), Stockholm, Sweden.","DOI":"10.21437\/Interspeech.2017-213"},{"key":"10137_CR43","doi-asserted-by":"crossref","unstructured":"Matousek, J., & Tihelka, D. (2018) Glottal closure instant detection from speech signal using voting classifier and recursive feature elimination. In Interspeech (pp. 2112\u20132116).","DOI":"10.21437\/Interspeech.2018-1147"},{"key":"10137_CR45","doi-asserted-by":"crossref","unstructured":"Matousek, J., & Tihelka, D. (2021). A comparison of convolutional neural networks for glottal closure instant detection from raw speech. In 2021 IEEE international conference on acoustics, speech and signal processing (ICASSP 2021) (pp. 6938\u20136942). IEEE.","DOI":"10.1109\/ICASSP39728.2021.9413675"},{"issue":"1","key":"10137_CR46","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1109\/LSP.2005.860538","volume":"13","author":"KSR Murty","year":"2005","unstructured":"Murty, K. S. R., & Yegnanarayana, B. (2005). Combining evidence from residual phase and mfcc features for speaker recognition. IEEE Signal Processing Letters, 13(1), 52\u201355.","journal-title":"IEEE signal processing letters"},{"issue":"8","key":"10137_CR47","doi-asserted-by":"publisher","first-page":"1602","DOI":"10.1109\/TASL.2008.2004526","volume":"16","author":"KSR Murty","year":"2008","unstructured":"Murty, K. S. R., & Yegnanarayana, B. (2008). Epoch extraction from speech signals. IEEE Transactions on Audio, Speech, and Language Processing, 16(8), 1602\u20131613.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR48","doi-asserted-by":"crossref","unstructured":"Narendra, N., Airaksinen, M., & Alku, P. (2017) Glottal source estimation from coded telephone speech using a deep neural network. In Interspeech (pp. 3931\u20133935).","DOI":"10.21437\/Interspeech.2017-882"},{"key":"10137_CR49","doi-asserted-by":"crossref","unstructured":"Narendra, N., & Alku, P. (2018). Dysarthric speech classification using glottal features computed from non-words, words and sentences. In Interspeech (pp. 3403\u20133407).","DOI":"10.21437\/Interspeech.2018-1059"},{"key":"10137_CR50","doi-asserted-by":"crossref","unstructured":"Narendra, N., & Rao, K. S. (2015). Automatic detection of creaky voice using epoch parameters. In Sixteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2015-508"},{"key":"10137_CR51","doi-asserted-by":"publisher","first-page":"1925","DOI":"10.1109\/TASLP.2021.3078364","volume":"29","author":"N Narendra","year":"2021","unstructured":"Narendra, N., Schuller, B., & Alku, P. (2021). The detection of Parkinson\u2019s disease from speech using voice source information. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 29, 1925\u20131936.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"issue":"1","key":"10137_CR52","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1109\/TASL.2006.876878","volume":"15","author":"PA Naylor","year":"2006","unstructured":"Naylor, P. A., Kounoudes, A., Gudnason, J., & Brookes, M. (2006). Estimation of glottal closure instants in voiced speech using the dypsa algorithm. IEEE Transactions on Audio, Speech, and Language Processing, 15(1), 34\u201343.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR53","unstructured":"Paeschke, A., Kienast, M., & Sendlmeier, W. F. (1999). F0-contours in emotional speech. In Proceedings of the 14th international congress of phonetic sciences (Vol. 2, pp. 929\u2013932)."},{"issue":"12","key":"10137_CR54","doi-asserted-by":"publisher","first-page":"2471","DOI":"10.1109\/TASL.2013.2273717","volume":"21","author":"A Prathosh","year":"2013","unstructured":"Prathosh, A., Ananthapadmanabha, T., & Ramakrishnan, A. (2013). Epoch extraction based on integrated linear prediction residual using plosion index. IEEE Transactions on Audio, Speech, and Language Processing, 21(12), 2471\u20132480.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR55","doi-asserted-by":"crossref","unstructured":"Raju, V. V., Vydana, H. K., Gangashetty, S. V., & Vuppala, A. K. (2017). Importance of non-uniform prosody modification for speech recognition in emotion conditions. In 2017 Asia-Pacific signal and information processing association annual summit and conference (APSIPA ASC) (pp. 573\u2013576). IEEE.","DOI":"10.1109\/APSIPA.2017.8282109"},{"key":"10137_CR56","doi-asserted-by":"crossref","unstructured":"Rao, K. S., & Yegnanarayana, B. (2006). Voice conversion by prosody and vocal tract modification. In 9th international conference on information technology (ICIT\u201906) (pp. 111\u2013116). IEEE.","DOI":"10.1109\/ICIT.2006.92"},{"issue":"4","key":"10137_CR57","doi-asserted-by":"publisher","first-page":"413","DOI":"10.1007\/s10772-013-9193-5","volume":"16","author":"KS Rao","year":"2013","unstructured":"Rao, K. S., Maity, S., & Reddy, V. R. (2013). Pitch synchronous and glottal closure based speech analysis for language recognition. International Journal of Speech Technology, 16(4), 413\u2013430.","journal-title":"International Journal of Speech Technology"},{"issue":"10","key":"10137_CR58","doi-asserted-by":"publisher","first-page":"762","DOI":"10.1109\/LSP.2007.896454","volume":"14","author":"KS Rao","year":"2007","unstructured":"Rao, K. S., Prasanna, S. M., & Yegnanarayana, B. (2007). Determination of instants of significant excitation in speech using hilbert envelope and group delay function. IEEE Signal Processing Letters, 14(10), 762\u2013765.","journal-title":"IEEE Signal Processing Letters"},{"issue":"3","key":"10137_CR59","doi-asserted-by":"publisher","first-page":"972","DOI":"10.1109\/TSA.2005.858051","volume":"14","author":"KS Rao","year":"2006","unstructured":"Rao, K. S., & Yegnanarayana, B. (2006). Prosody modification using instants of significant excitation. IEEE Transactions on Audio, Speech, and Language Processing, 14(3), 972\u2013980.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR60","doi-asserted-by":"crossref","unstructured":"Reddy, G., Rao, K. S., & Das, P. P. (2020). Glottal closure instants detection from egg signal by classification approach. In  Interspeech (pp. 4891\u20134895).","DOI":"10.21437\/Interspeech.2020-1189"},{"issue":"10","key":"10137_CR61","doi-asserted-by":"publisher","first-page":"1128","DOI":"10.1001\/archotol.132.10.1128","volume":"132","author":"E Seifert","year":"2006","unstructured":"Seifert, E., & Kollbrunner, J. (2006). An update in thinking about nonorganic voice disorders. Archives of Otolaryngology-Head & Neck Surgery, 132(10), 1128\u20131132.","journal-title":"Archives of Otolaryngology-Head & Neck Surgery"},{"issue":"7","key":"10137_CR62","doi-asserted-by":"publisher","first-page":"1853","DOI":"10.1109\/TASL.2010.2101595","volume":"19","author":"G Seshadri","year":"2010","unstructured":"Seshadri, G., & Yegnanarayana, B. (2010). Performance of an event-based instantaneous fundamental frequency estimator for distant speech signals. IEEE Transactions on Audio, Speech, and Language Processing, 19(7), 1853\u20131864.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR63","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2009\/567875","volume":"2009","author":"DG Silva","year":"2009","unstructured":"Silva, D. G., Oliveira, L. C., & Andrea, M. (2009). Jitter estimation algorithms for detection of pathological voices. EURASIP Journal on Advances in Signal Processing, 2009, 1\u20139.","journal-title":"EURASIP Journal on advances in signal processing"},{"key":"10137_CR64","doi-asserted-by":"crossref","unstructured":"Simantiraki, O., Charonyktakis, P., Pampouchidou, A., Tsiknakis, M., & Cooke, M. (2017). Glottal source features for automatic speech-based depression assessment. In Interspeech (pp. 2700\u20132704).","DOI":"10.21437\/Interspeech.2017-1251"},{"issue":"5","key":"10137_CR65","doi-asserted-by":"publisher","first-page":"325","DOI":"10.1109\/89.466662","volume":"3","author":"R Smits","year":"1995","unstructured":"Smits, R., & Yegnanarayana, B. (1995). Determination of instants of significant excitation in speech using group delay function. IEEE Transactions on Speech and Audio Processing, 3(5), 325\u2013333.","journal-title":"IEEE Transactions on Speech and Audio Processing"},{"issue":"9","key":"10137_CR66","doi-asserted-by":"publisher","first-page":"2613","DOI":"10.1109\/TASL.2012.2207114","volume":"20","author":"KS Srinivas","year":"2012","unstructured":"Srinivas, K. S., & Prahallad, K. (2012). An FIR implementation of zero frequency filtering of speech signals. IEEE Transactions on Audio, Speech, and Language Processing, 20(9), 2613\u20132617.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"4","key":"10137_CR67","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1109\/TASL.2006.876113","volume":"14","author":"J Tao","year":"2006","unstructured":"Tao, J., Kang, Y., & Li, A. (2006). Prosody conversion from neutral speech to emotional speech. IEEE Transactions on Audio, Speech, and Language Processing, 14(4), 1145\u20131154.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"5","key":"10137_CR68","doi-asserted-by":"publisher","first-page":"3072","DOI":"10.1121\/1.4798664","volume":"133","author":"S.A Thati","year":"2013","unstructured":"Thati, S. A., Kumar, K., S., & Yegnanarayana, B. (2013). Synthesis of laughter by modifying excitation characteristics. The Journal of the Acoustical Society of America, 133(5), 3072\u20133082.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"1","key":"10137_CR69","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/TASL.2011.2157684","volume":"20","author":"MR Thomas","year":"2011","unstructured":"Thomas, M. R., Gudnason, J., & Naylor, P. A. (2011). Estimation of glottal closing and opening instants in voiced speech using the yaga algorithm. IEEE Transactions on Audio, Speech, and Language Processing, 20(1), 82\u201391.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR70","doi-asserted-by":"crossref","unstructured":"Vijayan, K., & Murty, K. S. R. (2014). Epoch extraction from allpass residual of speech signals. In 2014 IEEE international conference on acoustics, speech and signal processing (ICASSP) (pp. 1493\u20131497). IEEE.","DOI":"10.1109\/ICASSP.2014.6853846"},{"key":"10137_CR71","doi-asserted-by":"crossref","unstructured":"Vikram, R., Girish, K. V., Harshavardhan, S., Ramakrishnan, A., & Ananthapadmanabha, T. (2014). Subband analysis of linear prediction residual for the estimation of glottal closure instants. In 2014 IEEE international conference on acoustics, speech and signal processing (ICASSP) (pp. 945\u2013949). IEEE.","DOI":"10.1109\/ICASSP.2014.6853736"},{"issue":"3","key":"10137_CR72","doi-asserted-by":"publisher","first-page":"624","DOI":"10.1109\/TASLP.2017.2651391","volume":"25","author":"C Vikram","year":"2017","unstructured":"Vikram, C., & Prasanna, S. M. (2017). Epoch extraction from telephone quality speech using single pole filter. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 25(3), 624\u2013636.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"10137_CR73","doi-asserted-by":"crossref","unstructured":"Vydana, H. K., Raju, V. V., Gangashetty, S. V., & Vuppala, A. K. (2015). Significance of emotionally significant regions of speech for emotive to neutral conversion. In International conference on mining intelligence and knowledge exploration (pp. 287\u2013296). Springer.","DOI":"10.1007\/978-3-319-26832-3_28"},{"key":"10137_CR74","unstructured":"Woldert-Jokisz, B. (2007). Saarbruecken voice database."},{"key":"10137_CR75","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1016\/j.specom.2017.12.002","volume":"96","author":"J Yadav","year":"2018","unstructured":"Yadav, J., Fahad, M. S., & Rao, K. S. (2018). Epoch detection from emotional speech signal using zero time windowing. Speech Communication, 96, 142\u2013149.","journal-title":"Speech Communication"},{"key":"10137_CR76","doi-asserted-by":"crossref","unstructured":"Yang, S., Wu, Z., Shen, B., & Meng, H. (2018). Detection of glottal closure instants from speech signals: A convolutional neural network based method. In Interspeech (pp. 317\u2013321).","DOI":"10.21437\/Interspeech.2018-1281"},{"issue":"5","key":"10137_CR77","doi-asserted-by":"publisher","first-page":"651","DOI":"10.1007\/s12046-011-0046-0","volume":"36","author":"B Yegnanarayana","year":"2011","unstructured":"Yegnanarayana, B., & Gangashetty, S. V. (2011). Epoch-based analysis of speech signals. Sadhana, 36(5), 651\u2013697.","journal-title":"Sadhana"},{"issue":"3","key":"10137_CR78","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1109\/89.841209","volume":"8","author":"B Yegnanarayana","year":"2000","unstructured":"Yegnanarayana, B., & Murthy, P. S. (2000). Enhancement of reverberant speech using LP residual signal. IEEE Transactions on Speech and Audio Processing, 8(3), 267\u2013281.","journal-title":"IEEE Transactions on Speech and Audio Processing"},{"issue":"4","key":"10137_CR79","doi-asserted-by":"publisher","first-page":"614","DOI":"10.1109\/TASL.2008.2012194","volume":"17","author":"B Yegnanarayana","year":"2009","unstructured":"Yegnanarayana, B., & Murty, K. S. R. (2009). Event-based instantaneous fundamental frequency estimation from speech signals. IEEE Transactions on Audio, Speech, and Language Processing, 17(4), 614\u2013624.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"4","key":"10137_CR80","doi-asserted-by":"publisher","first-page":"313","DOI":"10.1109\/89.701359","volume":"6","author":"B Yegnanarayana","year":"1998","unstructured":"Yegnanarayana, B., & Veldhuis, R. N. (1998). Extraction of vocal-tract system characteristics from speech signals. IEEE Transactions on Speech and Audio Processing, 6(4), 313\u2013327.","journal-title":"IEEE Transactions on Speech and Audio Processing"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-024-10137-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-024-10137-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-024-10137-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,12]],"date-time":"2024-09-12T12:16:20Z","timestamp":1726143380000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-024-10137-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9]]},"references-count":80,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,9]]}},"alternative-id":["10137"],"URL":"https:\/\/doi.org\/10.1007\/s10772-024-10137-1","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2024,9]]},"assertion":[{"value":"26 February 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 August 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 September 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}