{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:28:56Z","timestamp":1740122936790,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2021,1,16]],"date-time":"2021-01-16T00:00:00Z","timestamp":1610755200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,16]],"date-time":"2021-01-16T00:00:00Z","timestamp":1610755200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2021,4]]},"DOI":"10.1007\/s11042-020-10394-7","type":"journal-article","created":{"date-parts":[[2021,1,16]],"date-time":"2021-01-16T02:02:20Z","timestamp":1610762540000},"page":"13615-13637","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Robust vowel region detection method for multimode speech"],"prefix":"10.1007","volume":"80","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4198-7430","authenticated-orcid":false,"given":"Kumud","family":"Tripathi","sequence":"first","affiliation":[]},{"given":"K. Sreenivasa","family":"Rao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,1,16]]},"reference":[{"key":"10394_CR1","doi-asserted-by":"crossref","unstructured":"Burget L, Schwarz P, Agarwal M, Akyazi P, Feng K, Ghoshal A, Glembek O, Goel N, Karafi\u00e1t M, Povey D, et al. (2010) Multilingual acoustic modeling for speech recognition based on subspace Gaussian mixture models. In: International conference on acoustics speech and signal processing (ICASSP), pp 4334\u20134337. IEEE","DOI":"10.1109\/ICASSP.2010.5495646"},{"issue":"4","key":"10394_CR2","doi-asserted-by":"publisher","first-page":"1016","DOI":"10.1121\/1.393842","volume":"80","author":"S Furui","year":"1986","unstructured":"Furui S (1986) On the role of spectral transition for speech perception. The Journal of the Acoustical Society of America 80(4):1016\u20131025","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10394_CR3","unstructured":"Garofalo JS, Lamel LF, Fisher WM, Fiscus JG, Pallett DS, Dahlgren NL (1993) The DARPA TIMIT acoustic-phonetic continuous speech corpus cdrom. Linguistic Data Consortium. pp. 207\u2013212"},{"key":"10394_CR4","volume-title":"Neural networks: a comprehensive foundation","author":"S Haykin","year":"1994","unstructured":"Haykin S (1994) Neural networks: a comprehensive foundation. Prentice Hall PTR, Upper Saddle River"},{"issue":"8","key":"10394_CR5","doi-asserted-by":"publisher","first-page":"1107","DOI":"10.1109\/LSP.2019.2921229","volume":"26","author":"YM Keerthana","year":"2019","unstructured":"Keerthana YM, Reddy MK, Rao KS (2019) Cwt-based approach for epoch extraction from telephone quality speech. IEEE Signal Processing Letters 26(8):1107\u20131111","journal-title":"IEEE Signal Processing Letters"},{"issue":"6","key":"10394_CR6","doi-asserted-by":"publisher","first-page":"2315","DOI":"10.1007\/s00034-016-0409-1","volume":"36","author":"A Kumar","year":"2017","unstructured":"Kumar A, Shahnawazuddin S, Pradhan G (2017) Improvements in the detection of vowel onset and offset points in a speech sequence. Circuits, systems, and signal processing 36(6):2315\u20132340","journal-title":"Circuits, systems, and signal processing"},{"key":"10394_CR7","doi-asserted-by":"crossref","unstructured":"Kumar A, Shahnawazuddin S, Pradhan G (2017) Non-local estimation of speech signal for vowel onset point detection in varied environments.. In: INTERSPEECH, pp 429\u2013433","DOI":"10.21437\/Interspeech.2017-624"},{"key":"10394_CR8","unstructured":"Kumar SBSunil, Rao KS, Pati D (2013) Phonetic and prosodically rich transcribed speech corpus in Indian languages: Bengali and Odia. In: Proceedings of international conference on oriental COCOSDA held jointly with conference on asian spoken language research and evaluation (O-COCOSDA\/CASLRE), Gurgaon, India, pp 1\u20135"},{"key":"10394_CR9","doi-asserted-by":"crossref","unstructured":"Mallat S (1999) Wavelet tour of signal processing. New York, NY, USA: Academic","DOI":"10.1016\/B978-012466606-1\/50008-8"},{"key":"10394_CR10","doi-asserted-by":"crossref","unstructured":"Manjunath KE, Rao KS (2014) Automatic phonetic transcription for read, extempore and conversation speech for an Indian language: Bengali. In: Twentieth national conference on communications (NCC), pp 1\u20136. IEEE","DOI":"10.1109\/NCC.2014.6811347"},{"issue":"2","key":"10394_CR11","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/s10772-014-9266-0","volume":"18","author":"KE Manjunath","year":"2015","unstructured":"Manjunath KE, Rao KS (2015) Source and system features for phone recognition. International Journal of Speech Technology 18(2):257\u2013270","journal-title":"International Journal of Speech Technology"},{"key":"10394_CR12","doi-asserted-by":"crossref","unstructured":"Manjunath KE, Rao KS, Jayagopi DB (2017) Development of multilingual phone recognition system for Indian languages. In: International conference on signal processing, informatics, communication and energy systems (SPICES), pp 1\u20136. IEEE","DOI":"10.1109\/SPICES.2017.8091271"},{"key":"10394_CR13","doi-asserted-by":"crossref","unstructured":"Mittal VK, Vuppala AK (2016) Changes in shout features in automatically detected vowel regions. In: 2016 International conference on signal processing and communications (SPCOM), pp 1\u20135. IEEE","DOI":"10.1109\/SPCOM.2016.7746601"},{"issue":"8","key":"10394_CR14","doi-asserted-by":"publisher","first-page":"1602","DOI":"10.1109\/TASL.2008.2004526","volume":"16","author":"KSR Murty","year":"2008","unstructured":"Murty K SR, Yegnanarayana B (2008) Epoch extraction from speech signals. IEEE Transactions on Audio, Speech, and Language Processing 16(8):1602\u20131613","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10394_CR15","doi-asserted-by":"crossref","unstructured":"Pradeep R, Rao KS (2016) Deep neural networks for Kannada phoneme recognition. In: Ninth international conference on contemporary computing (IC3), pp 1\u20136. IEEE","DOI":"10.1109\/IC3.2016.7880202"},{"issue":"4","key":"10394_CR16","doi-asserted-by":"publisher","first-page":"854","DOI":"10.1109\/TASL.2013.2238529","volume":"21","author":"G Pradhan","year":"2013","unstructured":"Pradhan G, Prasanna SRMahadeva (2013) Speaker verification by vowel and nonvowel like segmentation. IEEE Transactions on Audio, Speech, and Language Processing 21(4):854\u2013867","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"8","key":"10394_CR17","doi-asserted-by":"publisher","first-page":"2552","DOI":"10.1109\/TASL.2011.2155061","volume":"19","author":"SRM Prasanna","year":"2011","unstructured":"Prasanna SRM, Pradhan G (2011) Significance of vowel-like regions for speaker verification under degraded conditions. IEEE transactions on audio, speech, and language processing 19(8):2552\u20132565","journal-title":"IEEE transactions on audio, speech, and language processing"},{"issue":"4","key":"10394_CR18","doi-asserted-by":"publisher","first-page":"556","DOI":"10.1109\/TASL.2008.2010884","volume":"17","author":"SRM Prasanna","year":"2009","unstructured":"Prasanna SRM, Reddy BVS, Krishnamoorthy P (2009) Vowel onset point detection using source, spectral peaks, and modulation spectrum energies. IEEE Transactions on audio, speech, and language processing 17(4):556\u2013565","journal-title":"IEEE Transactions on audio, speech, and language processing"},{"key":"10394_CR19","doi-asserted-by":"crossref","unstructured":"Ramdinmawii E, Mohanta A, Mittal VK (2017) Emotion recognition from speech signal. In: TENCON, pp 1562\u20131567. IEEE","DOI":"10.1109\/TENCON.2017.8228105"},{"issue":"8","key":"10394_CR20","doi-asserted-by":"publisher","first-page":"1133","DOI":"10.1109\/LSP.2017.2712646","volume":"24","author":"MK Reddy","year":"2017","unstructured":"Reddy MK, Rao KS (2017) Robust pitch extraction method for the hmm-based speech synthesis system. IEEE signal processing letters 24(8):1133\u20131137","journal-title":"IEEE signal processing letters"},{"key":"10394_CR21","doi-asserted-by":"crossref","unstructured":"Scanzio S, Laface P, Fissore L, Gemello R, Mana F (2008) On the use of a multilingual neural network front-end. In: Ninth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2008-672"},{"key":"10394_CR22","doi-asserted-by":"crossref","unstructured":"Suni AS, Simko J, Vainio MT, et al. (2016) Boundary detection using continuous wavelet analysis. Proceedings of Speech prosody 2016","DOI":"10.21437\/SpeechProsody.2016-55"},{"issue":"4","key":"10394_CR23","doi-asserted-by":"publisher","first-page":"4753","DOI":"10.1007\/s11042-017-5044-8","volume":"77","author":"R Thirumuru","year":"2018","unstructured":"Thirumuru R, Gangashetty SV, Vuppala AK (2018) Improved vowel region detection from a continuous speech using post processing of vowel onset points and vowel end-points. Multimedia Tools and Applications 77(4):4753\u20134767","journal-title":"Multimedia Tools and Applications"},{"issue":"3","key":"10394_CR24","doi-asserted-by":"publisher","first-page":"489","DOI":"10.1007\/s10772-017-9483-4","volume":"21","author":"K Tripathi","year":"2017","unstructured":"Tripathi K, Rao KS (2017) Improvement of phone recognition accuracy using speech mode classification. International Journal of Speech Technology 21(3):489\u2013500. https:\/\/doi.org\/10.1007\/s10772-017-9483-4","journal-title":"International Journal of Speech Technology"},{"key":"10394_CR25","doi-asserted-by":"crossref","unstructured":"Tripathi K, Rao KS (2019) Speech mode classification for indian languages using vocal tract and excitation source features. In: 22nd Conference of the oriental COCOSDA","DOI":"10.1109\/NCC48643.2020.9056073"},{"key":"10394_CR26","unstructured":"Tripathi K, Sreenivasa Rao K (2019) VOP Detection for Read and Conversation Speech using CWT Coefficients and Phone Boundaries"},{"issue":"9","key":"10394_CR27","doi-asserted-by":"publisher","first-page":"781","DOI":"10.1002\/acs.2357","volume":"27","author":"AK Vuppala","year":"2013","unstructured":"Vuppala AK, Rao KS (2013) Speaker identification under background noise using features extracted from steady vowel regions. International Journal of Adaptive Control and Signal Processing 27(9):781\u2013792","journal-title":"International Journal of Adaptive Control and Signal Processing"},{"issue":"8","key":"10394_CR28","doi-asserted-by":"publisher","first-page":"697","DOI":"10.1016\/j.aeue.2011.12.013","volume":"66","author":"AK Vuppala","year":"2012","unstructured":"Vuppala AK, Rao KS, Chakrabarti S (2012) Improved vowel onset point detection using epoch intervals. AEU-International Journal of Electronics and Communications 66(8):697\u2013700","journal-title":"AEU-International Journal of Electronics and Communications"},{"issue":"6","key":"10394_CR29","doi-asserted-by":"publisher","first-page":"1894","DOI":"10.1109\/TASL.2012.2191284","volume":"20","author":"AK Vuppala","year":"2012","unstructured":"Vuppala AK, Yadav J, Chakrabarti S, Rao KS (2012) Vowel onset point detection for low bit rate coded speech. IEEE Transactions on Audio, Speech, and Language Processing 20(6):1894\u20131903","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"4","key":"10394_CR30","doi-asserted-by":"publisher","first-page":"299","DOI":"10.1109\/LSP.2013.2245647","volume":"20","author":"J Yadav","year":"2013","unstructured":"Yadav J, Rao KS (2013) Detection of vowel offset point from speech signal. IEEE signal processing letters 20(4):299\u2013302","journal-title":"IEEE signal processing letters"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-10394-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-020-10394-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-10394-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,11]],"date-time":"2022-12-11T22:05:54Z","timestamp":1670796354000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-020-10394-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,16]]},"references-count":30,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2021,4]]}},"alternative-id":["10394"],"URL":"https:\/\/doi.org\/10.1007\/s11042-020-10394-7","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2021,1,16]]},"assertion":[{"value":"20 November 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 October 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 December 2020","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 January 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}