{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T16:28:29Z","timestamp":1774369709239,"version":"3.50.1"},"reference-count":179,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2019,10,11]],"date-time":"2019-10-11T00:00:00Z","timestamp":1570752000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2019,10,11]],"date-time":"2019-10-11T00:00:00Z","timestamp":1570752000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2020,6]]},"DOI":"10.1007\/s10462-019-09775-8","type":"journal-article","created":{"date-parts":[[2019,10,11]],"date-time":"2019-10-11T15:05:07Z","timestamp":1570806307000},"page":"3673-3704","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":43,"title":["ASRoIL: a comprehensive survey for automatic speech recognition of Indian languages"],"prefix":"10.1007","volume":"53","author":[{"given":"Amitoj","family":"Singh","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Virender","family":"Kadyan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Munish","family":"Kumar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nancy","family":"Bassan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,10,11]]},"reference":[{"key":"9775_CR1","doi-asserted-by":"crossref","unstructured":"Aggarwal RK and Dave M (2010) Fitness evaluation of Gaussian mixtures in Hindi speech recognition system. In: Proceedings of first international conference on integrated intelligent computing (ICIIC), pp 177\u2013183","DOI":"10.1109\/ICIIC.2010.13"},{"key":"9775_CR2","unstructured":"Aggarwal RK, Dave M (2011) Application of genetically optimized neural networks for Hindi speech recognition system. In: Proceedings of the world congress on information and communication technologies (WICT), pp 512\u2013517"},{"issue":"2","key":"9775_CR3","doi-asserted-by":"crossref","first-page":"191","DOI":"10.1007\/s10772-012-9133-9","volume":"15","author":"RK Aggarwal","year":"2012","unstructured":"Aggarwal RK, Dave M (2012) Filter bank optimization for robust ASR using GA and PSO. Int J Speech Technol 15(2):191\u2013201","journal-title":"Int J Speech Technol"},{"issue":"3","key":"9775_CR4","doi-asserted-by":"crossref","first-page":"1457","DOI":"10.1007\/s11235-011-9623-0","volume":"52","author":"RK Aggarwal","year":"2013","unstructured":"Aggarwal RK, Dave M (2013) Performance evaluation of sequentially combined heterogeneous feature streams for Hindi speech recognition system. Telecommun Syst 52(3):1457\u20131466","journal-title":"Telecommun Syst"},{"key":"9775_CR6","doi-asserted-by":"crossref","unstructured":"Ahamed B, Israt F, Chowdhury SMR, Huda MN (2013) Effect of speaker variation on the performance of Bangla ASR. In: Proceedings of the 2nd international conference on informatics, electronics and vision, pp 1\u20135","DOI":"10.1109\/ICIEV.2013.6572578"},{"key":"9775_CR7","unstructured":"Ali H, Ahmad N, Yahya KM, Farooq O (2012) A medium vocabulary Urdu isolated words balanced corpus for automatic speech recognition. In: Proceedings of the international conference on electronics computer technology, pp 473\u2013476"},{"key":"9775_CR8","unstructured":"Ali H, Ahmad N, Zhou X, Ali M, Manjotho AA (2013) Linear discriminant analysis based approach for automatic speech recognition of Urdu isolated words. In: Proceedings of the international multi topic conference, pp 24\u201334"},{"issue":"1","key":"9775_CR9","first-page":"47","volume":"18","author":"PJ Antony","year":"2013","unstructured":"Antony PJ (2013) Machine translation approaches and survey for Indian Languages. Int J Comput Linguist Chin Lang Process 18(1):47\u201378","journal-title":"Int J Comput Linguist Chin Lang Process"},{"key":"9775_CR10","doi-asserted-by":"crossref","unstructured":"Anukriti, Tiwari S, Chatterjee T, Bhattacharya M (2013) Speaker independent speech recognition implementation with adaptive language models. In: Proceedings of international symposium on computational and business intelligence, pp 7\u201310","DOI":"10.1109\/ISCBI.2013.9"},{"key":"9775_CR11","unstructured":"Anumanchipalli G, Chitturi R, Joshi S, Kumar R, Singh SP, Sitaram RNV, Kishore SP (2005) Development of Indian language speech databases for large vocabulary speech recognition systems. In: Proceedings of international conference on speech and computer (SPECOM), pp 1\u20134"},{"key":"9775_CR12","doi-asserted-by":"crossref","first-page":"48","DOI":"10.1109\/MCI.2009.932255","volume":"4","author":"MA Anusuya","year":"2009","unstructured":"Anusuya MA, Katti SK (2009) Comments on the paper by Perlovsky entitled integrating language and cognition. IEEE Comput Intell Mag 4:48\u201349","journal-title":"IEEE Comput Intell Mag"},{"issue":"3","key":"9775_CR200","first-page":"181","volume":"6","author":"MA Anusuya","year":"2010","unstructured":"Anusuya MA, Katti SK (2010) Speech recognition by machine: a review. Int J Comput Sci Inf Secur 6(3):181\u2013205","journal-title":"Int J Comput Sci Inf Secur"},{"key":"9775_CR13","doi-asserted-by":"crossref","unstructured":"Arora A, Kadyan V, Singh A (2019) Effect of tonal features on various dialectal variations of Punjabi language. In: Proceedings of the conference on advances in signal processing and communication, pp 467\u2013475","DOI":"10.1007\/978-981-13-2553-3_45"},{"key":"9775_CR14","doi-asserted-by":"crossref","unstructured":"Asfak-Ur-Rahman M, Kotwal MRA, Hassan F, Ahmmed S, Huda MN (2012) Gender effect cannonicalization for Bangla ASR. In: Proceedings of the 15th international conference on computer and information technology (ICCIT), pp 179\u2013184","DOI":"10.1109\/ICCITechn.2012.6509701"},{"key":"9775_CR15","doi-asserted-by":"crossref","unstructured":"Bansal S, Dev A (2013) Emotional Hindi speech database. In: Proceedings of the International Conference on Oriental COCOSDA held jointly with Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20134","DOI":"10.1109\/ICSDA.2013.6709867"},{"key":"9775_CR16","doi-asserted-by":"crossref","unstructured":"Bansal S, Sharan S, Agrawal SS (2015) Corpus design and development of an annotated speech database for Punjabi. In: Proceedings of the international conference on oriental COCOSDA held jointly with Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 32\u201337","DOI":"10.1109\/ICSDA.2015.7357860"},{"key":"9775_CR17","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1016\/j.specom.2013.07.008","volume":"56","author":"L Besacier","year":"2014","unstructured":"Besacier L, Barnard E, Karpov A, Schultz T (2014) Automatic speech recognition for under-resourced languages: a survey. Speech Commun 56:85\u2013100","journal-title":"Speech Commun"},{"issue":"4","key":"9775_CR18","doi-asserted-by":"crossref","first-page":"673","DOI":"10.1007\/s10772-015-9311-7","volume":"18","author":"SS Bharali","year":"2015","unstructured":"Bharali SS, Kalita SK (2015) A comparative study of different features for isolated spoken word recognition using HMM with reference to Assamese language. Int J Speech Technol 18(4):673\u2013684","journal-title":"Int J Speech Technol"},{"issue":"2","key":"9775_CR19","doi-asserted-by":"crossref","first-page":"251","DOI":"10.1007\/s10772-018-9501-1","volume":"21","author":"SS Bharali","year":"2018","unstructured":"Bharali SS, Kalita SK (2018) Speech recognition with reference to Assamese language using novel fusion technique. Int J Speech Technol 21(2):251\u2013263","journal-title":"Int J Speech Technol"},{"issue":"6","key":"9775_CR20","first-page":"114","volume":"1","author":"U Bhattacharjee","year":"2013","unstructured":"Bhattacharjee U (2013a) Recognition of the tonal words of Bodo language. Int J Recent Technol Eng 1(6):114\u2013118","journal-title":"Int J Recent Technol Eng"},{"issue":"1","key":"9775_CR21","doi-asserted-by":"crossref","first-page":"1","DOI":"10.15623\/ijret.2013.0201001","volume":"2","author":"U Bhattacharjee","year":"2013","unstructured":"Bhattacharjee U (2013b) A comparative study Of LPCC and MFCC features for the recognition of Assamese phonemes. Int J Eng Res Technol 2(1):1\u20136","journal-title":"Int J Eng Res Technol"},{"key":"9775_CR22","doi-asserted-by":"crossref","first-page":"895","DOI":"10.1016\/j.procs.2017.12.114","volume":"125","author":"T Bhowmik","year":"2018","unstructured":"Bhowmik T, Chowdhury A, Mandal SKD (2018) Deep neural network based place and manner of articulation detection and classification for Bengali continuous speech. Procedia Comput Sci 125:895\u2013901","journal-title":"Procedia Comput Sci"},{"issue":"5","key":"9775_CR23","doi-asserted-by":"crossref","first-page":"92","DOI":"10.5923\/j.ajsp.20120205.02","volume":"2","author":"K Bhuvanagirir","year":"2012","unstructured":"Bhuvanagirir K, Kopparapu SK (2012) Mixed language speech recognition without explicit identification of language. Am J Signal Process 2(5):92\u201397","journal-title":"Am J Signal Process"},{"issue":"4","key":"9775_CR24","doi-asserted-by":"crossref","first-page":"1111","DOI":"10.1016\/j.compeleceng.2014.01.008","volume":"40","author":"A Biswas","year":"2014","unstructured":"Biswas A, Sahu PK, Chandra M (2014) Admissible wavelet packet features based on human inner ear frequency response for Hindi consonant recognition. Comput Electr Eng 40(4):1111\u20131122","journal-title":"Comput Electr Eng"},{"key":"9775_CR25","doi-asserted-by":"crossref","first-page":"12","DOI":"10.1016\/j.compeleceng.2014.12.017","volume":"42","author":"A Biswas","year":"2015","unstructured":"Biswas A, Sahu PK, Bhowmick A, Chandra M (2015) Hindi phoneme classification using Wiener filtered wavelet packet decomposed periodic and aperiodic acoustic feature. Comput Electr Eng 42:12\u201322","journal-title":"Comput Electr Eng"},{"issue":"1\u20134","key":"9775_CR26","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1016\/S0925-2312(00)00305-2","volume":"34","author":"BB Chaudhuri","year":"2000","unstructured":"Chaudhuri BB, Bhattacharya U (2000) Efficient training and improved performance of multilayer perceptron in pattern classification. Neurocomputing 34(1\u20134):11\u201327","journal-title":"Neurocomputing"},{"key":"9775_CR27","doi-asserted-by":"crossref","unstructured":"Chellapriyadharshini M, Toffy A, Srinivasa RKM, Ramasubramanian V (2018) Semi-supervised and active-learning scenarios: efficient acoustic model refinement for a low resource Indian language. In: Computer and languages, pp 1041\u20131045","DOI":"10.21437\/Interspeech.2018-2486"},{"key":"9775_CR28","unstructured":"Chhayani NH, Patil HA (2013) Development of corpora for person recognition using humming, singing and speech. In: Proceedings of the international conference on oriental COCOSDA held jointly with Asian spoken language research and evaluation, pp 1\u20136"},{"key":"9775_CR29","unstructured":"CDAC Corpus (2015) http:\/\/cdac.in\/index.aspx?=mc-i\/fspeech-corpora . Accessed 22 Feb 2018"},{"key":"9775_CR30","first-page":"35","volume":"23","author":"RV Darekar","year":"2018","unstructured":"Darekar RV, Dhande AP (2018) Emotion recognition from Marathi speech database using adaptive artificial neural network. Biol Inspired Cognit Archit 23:35\u201342","journal-title":"Biol Inspired Cognit Archit"},{"key":"9775_CR31","unstructured":"Das B, Mandal S, Mitra P (2011) Bengali speech corpus for continuous automatic speech recognition system. In: Proceedings of the international conference on speech database and assessments, pp 51\u201355"},{"key":"9775_CR32","doi-asserted-by":"crossref","unstructured":"Dey A, Zhang W, Fung P (2014) Acoustic modeling for Hindi speech recognition in low-resource settings. In: International conference on audio, language and image processing (ICALIP), pp 891\u2013894","DOI":"10.1109\/ICALIP.2014.7009923"},{"key":"9775_CR33","unstructured":"Dey A, Lalhminghlui W, Sarmah P, Samudravijaya K, Prasanna SM, Sinha R, Nirmala SR (2018) Mizo phone recognition system. In: Interspeech, pp 1\u20135"},{"key":"9775_CR34","unstructured":"Dileep AD, Sekhar CC (2013) HMM based pyramid match kernel for classification of sequential patterns of speech using support vector machines. In: Proceedings of the IEEE international conference on acoustics, speech and signal processing, pp 3562\u20133566"},{"issue":"4","key":"9775_CR35","first-page":"359","volume":"9","author":"M Dua","year":"2012","unstructured":"Dua M, Aggarwal RK, Kadyan V, Dua S (2012a) Punjabi automatic speech recognition using HTK. Int J Comput Sci Issues (IJCSI) 9(4):359","journal-title":"Int J Comput Sci Issues (IJCSI)"},{"key":"9775_CR36","doi-asserted-by":"crossref","unstructured":"Dua M, Aggarwal RK, Kadyan V, Dua S (2012b) Punjabi speech to text system for connected words. In: Proceedings of the fourth international conference on advances in recent technologies in communication and computing (ARTCom2012), pp 206\u2013209","DOI":"10.1049\/cp.2012.2528"},{"key":"9775_CR37","unstructured":"Dua M, Kumar A, Chaudhary T (2015) Implementation and performance evaluation of speaker adaptive continuous Hindi ASR using tri-phone based acoustic modelling. In: Proceedings of 2015 international conference on future computational technologies, pp 68\u201373"},{"key":"9775_CR38","doi-asserted-by":"crossref","unstructured":"Dua M, Aggarwal RK, Biswas M (2017) Discriminative training using heterogeneous feature vector for Hindi automatic speech recognition system. In: Proceedings of international conference on computer and applications (ICCA), pp 158\u2013162","DOI":"10.1109\/COMAPP.2017.8079777"},{"key":"9775_CR39","first-page":"1","volume":"10","author":"M Dua","year":"2018","unstructured":"Dua M, Aggarwal RK, Biswas M (2018a) GFCC based discriminatively trained noise robust continuous ASR system for Hindi language. J Ambient Intell Humaniz Comput 10:1\u201314","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"9775_CR40","doi-asserted-by":"publisher","DOI":"10.1515\/jisys-2017-0618","author":"M Dua","year":"2018","unstructured":"Dua M, Aggarwal RK, Biswas M (2018b) Discriminative training using noise robust integrated features and refined HMM modeling. J Intell Syst. https:\/\/doi.org\/10.1515\/jisys-2017-0618","journal-title":"J Intell Syst"},{"key":"9775_CR41","doi-asserted-by":"publisher","DOI":"10.1515\/jisys-2017-0618","author":"M Dua","year":"2018","unstructured":"Dua M, Aggarwal RK, Biswas M (2018c) Discriminative training using noise robust integrated features and refined HMM modeling. J Intell Syst. https:\/\/doi.org\/10.1515\/jisys-2017-0618","journal-title":"J Intell Syst"},{"key":"9775_CR42","doi-asserted-by":"publisher","DOI":"10.1515\/jisys-2017-0618","author":"M Dua","year":"2018","unstructured":"Dua M, Aggarwal RK, Biswas M (2018d) Discriminative training using noise robust integrated features and refined HMM modeling. J Intell Syst. https:\/\/doi.org\/10.1515\/jisys-2017-0618","journal-title":"J Intell Syst"},{"key":"9775_CR45","doi-asserted-by":"crossref","unstructured":"Dutta K, Sarma KK (2012) Multiple feature extraction for RNN-based Assamese speech recognition for speech to text conversion application. In: Proceedings of the international conference on communications, devices and intelligent systems (CODIS), pp 600\u2013603","DOI":"10.1109\/CODIS.2012.6422274"},{"key":"9775_CR46","unstructured":"EMILLE Corpora (2015) http:\/\/catalog.elra.info\/search-result.php?keywords=W0037&language=en . Accessed on 05 Jan 2018"},{"issue":"6","key":"9775_CR47","doi-asserted-by":"crossref","first-page":"847","DOI":"10.1142\/S0219691310003845","volume":"8","author":"O Farooq","year":"2010","unstructured":"Farooq O, Datta S, Shrotriya MC (2010) Wavelet sub-band based temporal features for robust Hindi phoneme recognition. Int J Wavelets Multi Resolut Inf Process 8(6):847\u2013859","journal-title":"Int J Wavelets Multi Resolut Inf Process"},{"key":"9775_CR48","doi-asserted-by":"crossref","unstructured":"Fathima N, Patel T, Mahima C, Iyengar A (2018) TDNN-based multilingual speech recognition system for low resource Indian languages. In: Proceedings of the Inter-speech, pp 3197\u20133201","DOI":"10.21437\/Interspeech.2018-2117"},{"key":"9775_CR49","doi-asserted-by":"crossref","unstructured":"Gaikwad S, Gawali B, Mehrotra S (2013) Creation of Marathi speech corpus for automatic speech recognition. In: Proceedings of the international conference on oriental COCOSDA held jointly with Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20135","DOI":"10.1109\/ICSDA.2013.6709893"},{"key":"9775_CR50","unstructured":"Ganesh AA, Ravichandran C (2013) Grapheme Gaussian model and prosodic syllable based Tamil speech recognition system. In: Proceedings of the international conference on signal processing and communication (ICSC), pp 401\u2013406"},{"issue":"8","key":"9775_CR51","first-page":"42","volume":"41","author":"W Ghai","year":"2012","unstructured":"Ghai W, Singh N (2012) Literature review on automatic speech recognition. Int J Comput Appl 41(8):42\u201350","journal-title":"Int J Comput Appl"},{"key":"9775_CR52","unstructured":"Godambe T, Samudravijaya K (2011) Speech data acquisition for voice based agricultural information retrieval. In: Proceedings of the all India DLA conference, Punjabi University, Patiala, pp 1\u20138"},{"key":"9775_CR53","doi-asserted-by":"crossref","unstructured":"Gr\u00e9zl F, Karafiat M, Janda M (2011) Study of probabilistic and bottle-neck features in multilingual environment. In: IEEE workshop on automatic speech recognition and understanding (ASRU), pp 359\u2013364","DOI":"10.1109\/ASRU.2011.6163958"},{"issue":"3","key":"9775_CR54","first-page":"1664","volume":"4","author":"T Gulzar","year":"2014","unstructured":"Gulzar T, Singh A, Rajoriya DK, Farooq N (2014) A systematic analysis of automatic speech recognition: an overview. Int J Curr Eng Technol 4(3):1664\u20131675","journal-title":"Int J Curr Eng Technol"},{"key":"9775_CR55","doi-asserted-by":"crossref","unstructured":"Gunasekaran S, Revathy K (2008) Fractal dimension analysis of audio signals for Indian musical instrument recognition. In: Proceedings of the international conference on audio, language and image processing, pp 257\u2013261","DOI":"10.1109\/ICALIP.2008.4590238"},{"key":"9775_CR56","unstructured":"Hasnat M, Mowla J, Khan M (2007) Isolated and continuous bangla speech recognition: implementation, performance and application perspective. In: Proceedings of international symposium on natural language processing (SNLP), pp 1\u20136"},{"key":"9775_CR57","doi-asserted-by":"crossref","unstructured":"Hassan F, Kotwal MRA, Huda MN (2011) Bangla ASR design by suppressing gender factor with gender-independent and gender-based HMM classifiers. In: Proceedings of the world Congress on information and communication technologies (WICT), pp 1276\u20131281","DOI":"10.1109\/WICT.2011.6141432"},{"key":"9775_CR58","doi-asserted-by":"crossref","unstructured":"Hegde RM, Murthy HA, Gadde VRR (2004) Continuous speech recognition using joint features derived from the modified group delay function and MFCC. In: Proceedings of 8th international conference on spoken language processing, pp 1\u20134","DOI":"10.21437\/Interspeech.2004-333"},{"key":"9775_CR59","doi-asserted-by":"crossref","unstructured":"Hegde S, Achary KK, Shetty S (2012) Isolated word recognition for Kannada language using support vector machine. In: Wireless networks and computational intelligence, pp 262\u2013269","DOI":"10.1007\/978-3-642-31686-9_31"},{"issue":"1","key":"9775_CR60","first-page":"1707","volume":"5","author":"G Hemakumar","year":"2014","unstructured":"Hemakumar G, Punitha P (2014) Automatic Segmentation of Kannada speech signal into syllables and sub-words: noised and noiseless signals. Int J Sci Eng Res 5(1):1707\u20131711","journal-title":"Int J Sci Eng Res"},{"key":"9775_CR61","unstructured":"Interspeech (2018) Low resource speech recognition challenge for Indian Languages. https:\/\/www.microsoft.com\/en-us\/research\/event\/interspeech-2018-special-session-low-resource-speech-recognition-challenge-indian-languages\/ . Accessed 22 Feb 2018"},{"key":"9775_CR62","doi-asserted-by":"crossref","unstructured":"Jain A, Prakash N, Agrawal SS (2011) Evaluation of MFCC for emotion identification in Hindi speech. In: Proceedings of the 3rd international conference on communication software and networks (ICCSN), pp 189\u2013193","DOI":"10.1109\/ICCSN.2011.6014878"},{"key":"9775_CR63","unstructured":"Jayanna HS (2009) Limited data speaker recognition. Ph.D. thesis, Indian Institute of Technology Guwahati"},{"issue":"3","key":"9775_CR64","doi-asserted-by":"crossref","first-page":"544","DOI":"10.1016\/j.dsp.2011.11.008","volume":"22","author":"S Jothilakshmi","year":"2012","unstructured":"Jothilakshmi S, Ramalingam V, Palanivel S (2012) A hierarchical language identification system for Indian languages. Digit Signal Process 22(3):544\u2013553","journal-title":"Digit Signal Process"},{"issue":"4","key":"9775_CR65","doi-asserted-by":"crossref","first-page":"761","DOI":"10.1007\/s10772-017-9446-9","volume":"20","author":"V Kadyan","year":"2017","unstructured":"Kadyan V, Mantri A, Aggarwal RK (2017) A heterogeneous speech feature vectors generation approach with hybrid hmm classifiers. Int J Speech Technol 20(4):761\u2013769","journal-title":"Int J Speech Technol"},{"issue":"1","key":"9775_CR66","doi-asserted-by":"crossref","first-page":"111","DOI":"10.1007\/s10772-018-09577-3","volume":"22","author":"V Kadyan","year":"2018","unstructured":"Kadyan V, Mantri A, Aggarwal RK, Singh A (2018) A comparative study of deep neural network based Punjabi\u2014ASR system. Int J Speech Technol 22(1):111\u2013119","journal-title":"Int J Speech Technol"},{"issue":"3","key":"9775_CR67","first-page":"171","volume":"6","author":"N Kalyani","year":"2010","unstructured":"Kalyani N, Sunitha KVN (2010) Syllable analysis to build a dictation system in Telugu language. Int J Comput Sci Inf Secur (IJCSIS) 6(3):171\u2013176","journal-title":"Int J Comput Sci Inf Secur (IJCSIS)"},{"key":"9775_CR68","doi-asserted-by":"crossref","unstructured":"Kamble VV, Gaikwad BP, Rana DM (2014) Spontaneous emotion recognition for Marathi spoken words. In: Proceedings of international conference on communications and signal processing (ICCSP), pp 1984\u20131990","DOI":"10.1109\/ICCSP.2014.6950191"},{"key":"9775_CR69","doi-asserted-by":"crossref","unstructured":"Kandali AB, Routray A, Basu TK (2008) Emotion recognition from Assamese speeches using MFCC features and GMM classifier. In: Proceedings of the IEEE region 10 conference, pp 1\u20135","DOI":"10.1109\/TENCON.2008.4766487"},{"key":"9775_CR70","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s10772-009-9046-4","volume":"12","author":"AB Kandali","year":"2009","unstructured":"Kandali AB, Routray A, Basu TK (2009) Vocal emotion recognition in five native languages of Assam using new wavelet features. Int J Speech Technol 12:1\u201313","journal-title":"Int J Speech Technol"},{"key":"9775_CR71","doi-asserted-by":"crossref","unstructured":"Kannadaguli P, Bhat V (2018) A comparison of Bayesian and HMM based approaches in machine learning for emotion detection in native Kannada speaker. In: Proceedings of the IEEMA Engineer infinite conference (eTechNxT), pp 1\u20136","DOI":"10.1109\/ETECHNXT.2018.8385377"},{"key":"9775_CR72","doi-asserted-by":"crossref","unstructured":"Kaur A, Singh A (2016a) Power-normalized cepstral coefficients (PNCC) for Punjabi automatic speech recognition using phone based modelling in HTK. In: Proceedings of the 2nd international conference on applied and theoretical computing and communication technology (iCATccT), Bangalore, India, pp 372\u2013375","DOI":"10.1109\/ICATCCT.2016.7912026"},{"key":"9775_CR73","doi-asserted-by":"crossref","unstructured":"Kaur A, Singh A (2016b) Optimizing feature extraction techniques constituting phone based modelling on connected words for Punjabi automatic speech recognition. In: Proceedings of the 2nd international conference on advances in computing, communications and informatics (ICACCI), Jaipur, India, pp 2104\u20132108","DOI":"10.1109\/ICACCI.2016.7732362"},{"issue":"1","key":"9775_CR74","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1007\/s10772-010-9085-x","volume":"14","author":"SG Koolagudi","year":"2011","unstructured":"Koolagudi SG, Krothapalli RS (2011) Two stage emotion recognition based on speaking rate. Int J Speech Technol 14(1):35\u201348","journal-title":"Int J Speech Technol"},{"key":"9775_CR75","doi-asserted-by":"crossref","unstructured":"Koolagudi SG, Reddy R, Yadav J, Rao KS (2011) IITKGP-SEHSC: Hindi speech corpus for emotion analysis. In: Proceedings of the international conference on devices and communications (ICDeCom), pp 1\u20135","DOI":"10.1109\/ICDECOM.2011.5738540"},{"key":"9775_CR76","doi-asserted-by":"crossref","first-page":"3391","DOI":"10.1016\/j.proeng.2012.06.392","volume":"38","author":"SG Koolagudi","year":"2012","unstructured":"Koolagudi SG, Rastogi D, Rao KS (2012) Identification of language using mel-frequency cepstral coefficients (MFCC). Procedia Eng 38:3391\u20133398","journal-title":"Procedia Eng"},{"key":"9775_CR77","doi-asserted-by":"crossref","unstructured":"Kotwal MRA, Halim T, Almaji MMH, Hossain I, Huda MN (2012) Extraction of local features for tri-phone based Bangla ASR. In: Proceedings of the ninth international conference on information technology: new generations (ITNG), pp 668\u2013673","DOI":"10.1109\/ITNG.2012.135"},{"issue":"2","key":"9775_CR78","doi-asserted-by":"crossref","first-page":"297","DOI":"10.1007\/s10772-017-9408-2","volume":"20","author":"Y Kumar","year":"2017","unstructured":"Kumar Y, Singh N (2017) An automatic speech recognition system for spontaneous Punjabi speech corpus. Int J Speech Technol 20(2):297\u2013303","journal-title":"Int J Speech Technol"},{"issue":"5\u20136","key":"9775_CR79","doi-asserted-by":"crossref","first-page":"703","DOI":"10.1147\/rd.485.0703","volume":"48","author":"M Kumar","year":"2004","unstructured":"Kumar M, Rajput N, Verma A (2004) A large-vocabulary continuous speech recognition system for Hindi. IBM J Res Dev 48(5\u20136):703\u2013715","journal-title":"IBM J Res Dev"},{"key":"9775_CR204","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1504\/IJCSYSE.2012.044740","volume":"1","author":"K Kumar","year":"2012","unstructured":"Kumar K, Aggarwal R, Jain A (2012) A Hindi speech recognition system for connected words using HTK. Int J Comput Syst Eng 1:25\u201332","journal-title":"Int J Comput Syst Eng"},{"key":"9775_CR80","unstructured":"Kumar SBS, Rao KS, Pati D (2013a) Phonetic and prosodically rich transcribed speech corpus in Indian languages: Bengali and Odia. In: Proceedings of international conference oriental COCOSDA held jointly with 2013 conference on Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20135"},{"key":"9775_CR81","unstructured":"Kumar SSB, Rao KS, Pati D (2013b) Phonetic and prosodically rich transcribed speech corpus in Indian languages: Bengali and Odia. In: Proceedings of the international conference oriental COCOSDA held jointly with 2013 conference on Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20135"},{"key":"9775_CR82","doi-asserted-by":"crossref","unstructured":"Kumar A, Dua M, Choudhary A (2014a) Implementation and performance evaluation of continuous Hindi speech recognition. In: Proceedings of international conference on electronics and communication systems (ICECS), pp 1\u20135","DOI":"10.1109\/ECS.2014.6892777"},{"key":"9775_CR201","doi-asserted-by":"crossref","unstructured":"Kumar A, Dua M, Choudhary T (2014b) Continuous Hindi speech recognition using monophone based acoustic modeling. In: Proceedings of the international conference on advances in computer engineering & applications. pp 1\u20135","DOI":"10.1109\/SCEECS.2014.6804519"},{"key":"9775_CR83","doi-asserted-by":"crossref","first-page":"231","DOI":"10.1016\/j.procs.2015.06.027","volume":"54","author":"VR Kumar","year":"2015","unstructured":"Kumar VR, Vydana HK, Vuppala AK (2015) Significance of GMM-UBM based modelling for Indian language identification. Procedia Comput Sci 54:231\u2013236","journal-title":"Procedia Comput Sci"},{"key":"9775_CR84","doi-asserted-by":"crossref","unstructured":"Kumari P, Deiv DS, Bhattacharya M (2014) Automatic speech recognition of accented Hindi data. In: Proceedings of the international conference on computation of power, energy, information and communication (ICCPEIC), pp 68\u201376","DOI":"10.1109\/ICCPEIC.2014.6915342"},{"issue":"4","key":"9775_CR85","first-page":"80","volume":"4","author":"C Kurian","year":"2014","unstructured":"Kurian C (2014) A review on technological development of automatic speech recognition. Int J Soft Comput Eng 4(4):80\u201386","journal-title":"Int J Soft Comput Eng"},{"key":"9775_CR86","doi-asserted-by":"crossref","unstructured":"Kurian C, Balakrishnan K (2009) Speech recognition of Malayalam numbers. In: Proceedings of the world Congress on nature and biologically inspired computing, pp 1475\u20131479","DOI":"10.1109\/NABIC.2009.5393692"},{"key":"9775_CR87","unstructured":"Lakshmi A, Murthy HA (2008) A new approach to continuous speech recognition in Indian languages. In: Proceedings of the national conference on communication, pp 1\u20135"},{"issue":"2","key":"9775_CR88","doi-asserted-by":"crossref","first-page":"221","DOI":"10.1007\/s12046-009-0006-0","volume":"34","author":"SG Lakshmi","year":"2009","unstructured":"Lakshmi SG, Lakshmi A, Murthy HA, Nagarajan T (2009) Automatic transcription of continuous speech into syllable-like units for Indian languages. Sadhana 34(2):221\u2013233","journal-title":"Sadhana"},{"key":"9775_CR89","doi-asserted-by":"crossref","unstructured":"Lata S, Arora S (2013) Laryngeal tonal characteristics of Punjabi\u2014an experimental study. In: Proceedings of the international conference on human computer interactions (ICHCI), pp 1\u20136","DOI":"10.1109\/ICHCI-IEEE.2013.6887793"},{"key":"9775_CR90","doi-asserted-by":"crossref","unstructured":"Maity S, Vuppala AK, Rao KS, Nandi D (2012) IITKGP-MLILSC speech database for language identification. In: Proceedings of the national conference on communication, pp 1\u20135","DOI":"10.1109\/NCC.2012.6176831"},{"key":"9775_CR91","doi-asserted-by":"crossref","unstructured":"Malde KD, Vachhani BB, Madhavi MC, Chhayani NH, Patil HA (2013) Development of speech corpora in Gujarati and Marathi for phonetic transcription. In: Proceedings of the international conference on oriental COCOSDA held jointly with Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20136","DOI":"10.1109\/ICSDA.2013.6709865"},{"key":"9775_CR92","doi-asserted-by":"crossref","unstructured":"Malhotra K, Khosla A (2008) Automatic identification of gender and accent in spoken Hindi utterances with regional Indian accents. In: Proceedings of the spoken language technology workshop, pp 309\u2013312","DOI":"10.1109\/SLT.2008.4777902"},{"key":"9775_CR93","doi-asserted-by":"crossref","unstructured":"Malhotra K, Khosla A (2013) Impact of regional Indian accents on spoken Hindi. In: Proceedings of the international conference on oriental COCOSDA held jointly with 2013 conference on Asian spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20134","DOI":"10.1109\/ICSDA.2013.6709876"},{"key":"9775_CR94","doi-asserted-by":"crossref","unstructured":"Mandal S, Das B, Mitra P (2010) Shruti-II: a vernacular speech recognition system in Bengali and an application for visually impaired community. In: Proceedings of the students\u2019 technology symposium (TechSym), pp 229\u2013233","DOI":"10.1109\/TECHSYM.2010.5469156"},{"key":"9775_CR95","doi-asserted-by":"crossref","unstructured":"Mandal P, Jain S, Ojha G, Shukla A (2015) Development of Hindi speech recognition system of agricultural commodities using deep neural network. In: Proceedings of sixteenth annual conference of the international speech communication association, pp 1241\u20131245","DOI":"10.21437\/Interspeech.2015-312"},{"key":"9775_CR96","unstructured":"Manjunath KE, Rao KS (2014) Automatic phonetic transcription for read, extempore and conversation speech for an Indian language: Bengali. In: Proceedings of the twentieth national conference on communications (NCC), pp 1\u20136"},{"issue":"2","key":"9775_CR97","doi-asserted-by":"crossref","first-page":"704","DOI":"10.1007\/s00034-017-0568-8","volume":"37","author":"KE Manjunath","year":"2018","unstructured":"Manjunath KE, Rao KS (2018) Improvement of phone recognition accuracy using articulatory features. Circuits Syst Signal Process 37(2):704\u2013728","journal-title":"Circuits Syst Signal Process"},{"key":"9775_CR98","unstructured":"Mantena GV, Rajendran S, Gangashetty SV, Yegnanarayana B, Prahallad K (2011) Development of a spoken dialogue system for accessing agricultural information in Telugu. In: Proceedings of the 9th international conference on natural language processing, pp 1\u20136"},{"key":"9775_CR99","doi-asserted-by":"crossref","unstructured":"Mehta K, Anand RS (2010) Robust front-end and back-end processing for feature extraction for Hindi speech recognition. In: Proceedings of the IEEE international conference on computational intelligence and computing research (ICCIC), pp 1\u20134","DOI":"10.1109\/ICCIC.2010.5705781"},{"issue":"6","key":"9775_CR100","doi-asserted-by":"crossref","first-page":"1390","DOI":"10.1007\/s11771-016-3191-0","volume":"23","author":"T Mittal","year":"2016","unstructured":"Mittal T, Sharma RK (2016) Integrated search technique for parameter determination of SVM for speech recognition. J Cent South Univ 23(6):1390\u20131398","journal-title":"J Cent South Univ"},{"key":"9775_CR101","doi-asserted-by":"crossref","unstructured":"Mittal T, Barthwal A, Koolagudi SG (2013) Age approximation from speech using Gaussian mixture models. In: Proceedings of 2nd international conference on advanced computing, networking and security (ADCONS), pp 74\u201378","DOI":"10.1109\/ADCONS.2013.43"},{"key":"9775_CR102","doi-asserted-by":"crossref","first-page":"676","DOI":"10.1016\/j.procs.2016.07.261","volume":"93","author":"FK Mohamed","year":"2016","unstructured":"Mohamed FK, Lajish VL (2016) Nonlinear speech analysis and modeling for Malayalam vowel recognition. Procedia Comput Sci 93:676\u2013682","journal-title":"Procedia Comput Sci"},{"key":"9775_CR103","doi-asserted-by":"crossref","first-page":"616","DOI":"10.1016\/j.proeng.2012.01.906","volume":"30","author":"A Mohamed","year":"2012","unstructured":"Mohamed A, Nair KR (2012) HMM\/ANN hybrid model for continuous Malayalam speech recognition. Procedia Eng 30:616\u2013622","journal-title":"Procedia Eng"},{"key":"9775_CR104","doi-asserted-by":"crossref","unstructured":"Mohan A, Rose R (2013) Cross-lingual context sharing and parameter-tying for multi-lingual speech recognition. In: Proceedings of the IEEE workshop on automatic speech recognition and understanding (ASRU), pp 126\u2013131","DOI":"10.1109\/ASRU.2013.6707717"},{"key":"9775_CR105","doi-asserted-by":"crossref","unstructured":"Mohan A, Umesh S, Rose R (2012) Subspace based for Indian languages. In: 11th International conference on information science, signal processing and their applications (ISSPA), pp 35\u201339","DOI":"10.1109\/ISSPA.2012.6310575"},{"key":"9775_CR106","doi-asserted-by":"crossref","first-page":"167","DOI":"10.1016\/j.specom.2013.07.005","volume":"56","author":"A Mohan","year":"2014","unstructured":"Mohan A, Rose R, Ghalehjegh SH, Umesh S (2014) Acoustic modelling for speech recognition in Indian languages in an agricultural commodities task domain. Speech Commun 56:167\u2013180","journal-title":"Speech Commun"},{"key":"9775_CR107","doi-asserted-by":"crossref","unstructured":"Muralikrishna H, Ananthakrishna T (2013) HMM based isolated Kannada digit recognition system using MFCC. In: Proceedings of the international conference on advances in computing, communications and informatics (ICACCI), pp 730\u2013733","DOI":"10.1109\/ICACCI.2013.6637264"},{"key":"9775_CR108","doi-asserted-by":"crossref","unstructured":"Musfir M, Krishnan KR, Murthy HA (2014) Analysis of fricatives, stop consonants and nasals in the automatic segmentation of speech using the group delay algorithm. In: Proceedings of twentieth national conference on communications (NCC), pp 1\u20136","DOI":"10.1109\/NCC.2014.6811364"},{"issue":"2","key":"9775_CR109","doi-asserted-by":"crossref","first-page":"307","DOI":"10.1016\/j.csl.2009.05.001","volume":"24","author":"NU Nair","year":"2010","unstructured":"Nair NU, Sreenivas TV (2010) Joint evaluation of multiple speech patterns for speech recognition and training. Comput Speech Lang 24(2):307\u2013340","journal-title":"Comput Speech Lang"},{"key":"9775_CR110","unstructured":"Pal M, Roy R, Khan S, Bepari MS, Basu J (2018) PannoMulloKathan: voice enabled mobile app for agricultural commodity price dissemination in Bengali language. In: Interspeech, pp 1491\u20131492"},{"key":"9775_CR111","doi-asserted-by":"crossref","unstructured":"Pandey L, Nathwani K (2018) LSTM based attentive fusion of spectral and prosodic information for keyword spotting in Hindi language. In: Interspeech, pp 112\u2013116","DOI":"10.21437\/Interspeech.2018-1016"},{"key":"9775_CR112","doi-asserted-by":"crossref","unstructured":"Pandey D, Mondal T, Agrawal SS, Bangalore S (2013) Development and suitability of Indian languages speech database for building watson based ASR system. In: Proceedings of the international conference on oriental COCOSDA held jointly with Asian Spoken language research and evaluation (O-COCOSDA\/CASLRE), pp 1\u20136","DOI":"10.1109\/ICSDA.2013.6709861"},{"key":"9775_CR113","doi-asserted-by":"crossref","unstructured":"Pandey A, Srivastava BML, Gangashetty SV (2017) Adapting monolingual resources for code-mixed hindi-english speech recognition. In: Proceedings of international conference on Asian language processing (IALP), pp 218\u2013221","DOI":"10.1109\/IALP.2017.8300583"},{"key":"9775_CR114","doi-asserted-by":"crossref","unstructured":"Parameswarappa S, Narayana VN (2011) Target word sense disambiguation system for Kannada language. In: Proceedings of the 3rd international conference on advances in recent technologies in communication and computing, pp 269\u2013273","DOI":"10.1049\/ic.2011.0097"},{"key":"9775_CR115","unstructured":"Patel TB, Patil HA (2016) Effectiveness of fundamental frequency (F 0) and strength of excitation (SoE) for spoofed speech detection. In: Proceedings of the IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 5105\u20135109"},{"key":"9775_CR116","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2133","author":"T Patel","year":"2018","unstructured":"Patel T, Krishna DN, Fathima N, Shah N, Mahima C, Kumar D, Iyengar A (2018) Development of large vocabulary speech recognition system with keyword search for Manipuri. Proc Inter speech. https:\/\/doi.org\/10.21437\/Interspeech.2018-2133","journal-title":"Proc Inter speech"},{"key":"9775_CR117","doi-asserted-by":"crossref","unstructured":"Patil PP, Pardeshi SA (2014a) Marathi connected word speech recognition system. In: Proceedings of the first international conference on networks and soft computing (ICNSC), pp 314\u2013318","DOI":"10.1109\/CNSC.2014.6906687"},{"key":"9775_CR118","doi-asserted-by":"crossref","unstructured":"Patil PP, Pardeshi SA (2014b) Devnagari phoneme recognition system. In: Proceedings of the fourth international conference on advances in computing and communications (ICACC), pp 5\u20138","DOI":"10.1109\/ICACC.2014.92"},{"key":"9775_CR119","doi-asserted-by":"crossref","first-page":"202","DOI":"10.1016\/j.wocn.2015.11.001","volume":"54","author":"VV Patil","year":"2016","unstructured":"Patil VV, Rao P (2016) Detection of phonemic aspiration for spoken Hindi pronunciation evaluation. J Phon 54:202\u2013221","journal-title":"J Phon"},{"key":"9775_CR120","doi-asserted-by":"crossref","unstructured":"Paul AK, Das D, Kamal M (2009) Bangla speech recognition system using LPC and ANN. In: Proceedings of the 7th international conference on advances in pattern recognition, pp 171\u2013174","DOI":"10.1109\/ICAPR.2009.80"},{"key":"9775_CR121","doi-asserted-by":"crossref","unstructured":"Plauche M, Nallasamy U, Pal J, Wooters C, Ramachandran D (2006) Speech recognition for illiterate access to information and technology. In: Proceedings of the international conference on information and communication technologies and development, pp 83\u201392","DOI":"10.1109\/ICTD.2006.301842"},{"issue":"8","key":"9775_CR122","doi-asserted-by":"crossref","first-page":"2552","DOI":"10.1109\/TASL.2011.2155061","volume":"19","author":"SRM Prasanna","year":"2011","unstructured":"Prasanna SRM, Pradhan G (2011) Significance of vowel-like regions for speaker verification under degraded conditions. IEEE Trans Audio Speech Lang Process 19(8):2552\u20132565","journal-title":"IEEE Trans Audio Speech Lang Process"},{"issue":"5","key":"9775_CR123","first-page":"2623","volume":"2","author":"P Pravin","year":"2013","unstructured":"Pravin P, Jethva H (2013) Neural network based Gujarati language speech recognition. Int J Comput Sci Manag Res 2(5):2623\u20132627","journal-title":"Int J Comput Sci Manag Res"},{"key":"9775_CR124","doi-asserted-by":"crossref","unstructured":"Pulugundla B, Baskar MK, Kesiraju S, Egorova E, Karafiat M, Burget L, Cernock J (2018) BUT system for low resource Indian language ASR. In: Interspeech, pp 3182\u20133186","DOI":"10.21437\/Interspeech.2018-1302"},{"key":"9775_CR127","doi-asserted-by":"crossref","first-page":"1097","DOI":"10.1016\/j.proeng.2012.01.968","volume":"30","author":"V Radha","year":"2012","unstructured":"Radha V (2012) Speaker independent isolated speech recognition system for Tamil language using HMM. Procedia Eng 30:1097\u20131102","journal-title":"Procedia Eng"},{"key":"9775_CR128","doi-asserted-by":"crossref","unstructured":"Rahul L, Nandakishor S, Singh LJ, Dutta SK (2013) Design of Manipuri keywords spotting system using HMM. In: Proceedings of the fourth national conference on computer vision, pattern recognition, image processing and graphics (NCVPRIPG), pp 1\u20133","DOI":"10.1109\/NCVPRIPG.2013.6776249"},{"key":"9775_CR129","unstructured":"Raji SA, Sarin SA, Firoz SA, Babu AP (2010) Key-word based query recognition in a speech corpus by using artificial neural networks. In: Proceedings of 2nd international conference on computational intelligence, communication systems and networks, pp 33\u201336"},{"key":"9775_CR130","doi-asserted-by":"crossref","unstructured":"Rajput N, Subramaniam LV, Verma A (2000) Adapting phonetic decision trees between languages for continuous speech recognition. In: Proceedings of the sixth international conference on spoken language processing, pp 1\u20133","DOI":"10.21437\/ICSLP.2000-667"},{"key":"9775_CR131","unstructured":"Ram CS, Ponnusamy R (2014) An effective automatic speech emotion recognition for Tamil language using support vector machine. In: Proceedings of the international conference on issues and challenges in intelligent computing techniques (ICICT), pp 19\u201323"},{"issue":"3","key":"9775_CR132","doi-asserted-by":"crossref","first-page":"737","DOI":"10.1109\/TSA.2005.858071","volume":"14","author":"S Ramamohan","year":"2006","unstructured":"Ramamohan S, Dandapat S (2006) Sinusoidal model-based analysis and classification of stressed speech. IEEE Trans Audio Speech Lang Process 14(3):737\u2013746","journal-title":"IEEE Trans Audio Speech Lang Process"},{"issue":"6","key":"9775_CR133","doi-asserted-by":"crossref","first-page":"747","DOI":"10.1007\/s12046-012-0109-x","volume":"37","author":"NU Rani","year":"2012","unstructured":"Rani NU, Girija PN (2012) Error analysis to improve the speech recognition accuracy on Telugu language. Sadhana 37(6):747\u2013761","journal-title":"Sadhana"},{"key":"9775_CR134","doi-asserted-by":"crossref","unstructured":"Ranjan S (2010) A discrete wavelet transform based approach to Hindi speech recognition. In: Proceedings of the international conference on signal acquisition and processing, pp 345\u2013348","DOI":"10.1109\/ICSAP.2010.21"},{"key":"9775_CR135","doi-asserted-by":"crossref","unstructured":"Ranjan R, Singh SK, Shukla A, Tiwari R (2010) Text-dependent multilingual speaker identification for indian languages using artificial neural network. In: Proceedings of 3rd international conference on emerging trends in engineering and technology (ICETET), pp 632\u2013635","DOI":"10.1109\/ICETET.2010.23"},{"key":"9775_CR136","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1007\/s10772-010-9086-9","volume":"14","author":"KS Rao","year":"2011","unstructured":"Rao KS (2011) Application of prosody models for developing speech systems in Indian languages. Int J Speech Technol 14:19\u201333","journal-title":"Int J Speech Technol"},{"key":"9775_CR137","doi-asserted-by":"crossref","unstructured":"Renjith S, Manju KG (2017) Speech based emotion recognition in Tamil and Telugu using LPCC and hurst parameters\u2014a comparitive study using KNN and ANN classifiers. In: Proceedings of international conference on in circuit, power and computing technologies (ICCPCT), pp 1\u20136","DOI":"10.1109\/ICCPCT.2017.8074220"},{"key":"9775_CR138","doi-asserted-by":"crossref","unstructured":"Rojathai S, Venkatesulu M (2014) Noise robust Tamil speech word recognition system by means of PAC features with ANFIS. In: Proceedings of the IEEE\/ACIS 13th international conference on computer and information science (ICIS), pp 435\u2013440","DOI":"10.1109\/ICIS.2014.6912173"},{"key":"9775_CR139","unstructured":"Saad MK, Ashour W (2010) OSAC: open source Arabic corpora. In: Proceedings of the 6th international conference on electrical and computer systems, pp 1\u20136"},{"key":"9775_CR140","doi-asserted-by":"crossref","unstructured":"Sadanandam M, Prasad VK, Janaki V, Nagesh A (2012) Text independent language recognition system using DHMM with new features. In: Proceedings of the IEEE 11th international conference on signal processing (ICSP), pp 511\u2013514","DOI":"10.1109\/ICoSP.2012.6491537"},{"issue":"2","key":"9775_CR141","first-page":"132","volume":"4","author":"P Saini","year":"2013","unstructured":"Saini P, Kaur P (2013) Automatic speech recognition: a review. Int J Eng Trends Technol 4(2):132\u2013136","journal-title":"Int J Eng Trends Technol"},{"key":"9775_CR142","doi-asserted-by":"crossref","unstructured":"Samudravijaya K (2006) Development of multi-lingual spoken corpora of Indian languages. In: Proceedings of the Chinese spoken language processing symposium, pp 792\u2013801","DOI":"10.1007\/11939993_79"},{"key":"9775_CR143","unstructured":"Samudravijaya K (2014) HMMs as generative models of speech, workshop on Text-to-Speech (TTS) synthesis. http:\/\/www.iitg.ac.in\/samudravijaya\/tutorialSlides\/hmm4hts_samudravijaya140615.pdf . Accessed 20 Jan 2018"},{"key":"9775_CR144","unstructured":"Samudravijaya K, Gogate MR (2006) Marathi speech database. In: Proceedings of the international symposium on speech technology and processing systems and oriental COCOSDA, pp 21\u201324"},{"issue":"4","key":"9775_CR145","doi-asserted-by":"crossref","first-page":"313","DOI":"10.1007\/BF02745745","volume":"23","author":"K Samudravijaya","year":"1998","unstructured":"Samudravijaya K, Ahuja R, Bondale N, Jose T, Krishnan S, Poddar P, Raveendran R (1998) A feature-based hierarchical speech recognition system for Hindi. Sadhana 23(4):313\u2013340","journal-title":"Sadhana"},{"key":"9775_CR146","unstructured":"Samudravijaya K, Rao PVS, Agrawal SS (2002) Hindi speech database. In: Proceedings of the international conference on spoken language processing, pp 456\u2013464"},{"key":"9775_CR147","doi-asserted-by":"crossref","unstructured":"Sangwan A, Mehrabani M, Hansen JH (2010) Automatic language analysis and identification based on speech production knowledge. In: Proceedings of the IEEE international conference on acoustics speech and signal processing (ICASSP), pp 5006\u20135009","DOI":"10.1109\/ICASSP.2010.5495066"},{"issue":"3","key":"9775_CR148","first-page":"214","volume":"4","author":"S Saraswathi","year":"2007","unstructured":"Saraswathi S, Geetha T (2007) Morpheme based language model for Tamil speech recognition system. Int Arab J Inf Technol 4(3):214\u2013219","journal-title":"Int Arab J Inf Technol"},{"key":"9775_CR149","unstructured":"Sarfraz H, Hussain S, Bokhari R, Raza AA, UllahI, Sarfraz Z, Parveen R (2010) Speech corpus development for a speaker independent spontaneous Urdu speech recognition system. In: Proceedings of the O-COCOSDA, pp 1\u20136"},{"issue":"3","key":"9775_CR150","doi-asserted-by":"crossref","first-page":"305","DOI":"10.1080\/02564602.2017.1293570","volume":"35","author":"BD Sarma","year":"2018","unstructured":"Sarma BD, Prasanna SRM (2018) Acoustic\u2013phonetic analysis for speech recognition: a review. IETE Tech Rev 35(3):305\u2013327","journal-title":"IETE Tech Rev"},{"key":"9775_CR151","doi-asserted-by":"crossref","unstructured":"Sarma M, Dutta K, Sarma KK (2010) Speech corpus of Assamese numerals extracted using an adaptive pre-emphasis filter for speech recognition. In: Proceedings of the international conference on computer and communication technology (ICCCT), pp 461\u2013466","DOI":"10.1109\/ICCCT.2010.5640485"},{"key":"9775_CR152","unstructured":"Sarma BD, Sarma M, Sarma M, Prasanna SRM (2013) Development of Assamese phonetic engine: some issues. In: Proceedings of the annual IEEE India conference (INDICON), pp 1\u20136"},{"key":"9775_CR153","doi-asserted-by":"crossref","unstructured":"Sarma BD, Sarmah P, Lalhminghlui W, Prasanna SM (2015) Detection of Mizo tones. In: Proceedings of sixteenth annual conference of the international speech communication association, pp 934\u2013937","DOI":"10.21437\/Interspeech.2015-15"},{"issue":"7","key":"9775_CR154","doi-asserted-by":"crossref","first-page":"472","DOI":"10.1109\/TSA.2002.804298","volume":"10","author":"CC Sekhar","year":"2002","unstructured":"Sekhar CC, Yegnanarayana B (2002) A constraint satisfaction model for recognition of stop consonant-vowel (SCV) utterances. IEEE Trans Speech Audio Process 10(7):472\u2013480","journal-title":"IEEE Trans Speech Audio Process"},{"issue":"7","key":"9775_CR155","doi-asserted-by":"crossref","first-page":"1853","DOI":"10.1109\/TASL.2010.2101595","volume":"19","author":"G Seshadri","year":"2011","unstructured":"Seshadri G, Yegnanarayana B (2011) Performance of an event-based instantaneous fundamental frequency estimator for distant speech signals. IEEE Trans Audio Speech Lang Process 19(7):1853\u20131864","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"9775_CR156","unstructured":"Shah F (2009) Automatic emotion recognition from speech using artificial neural networks with gender-dependent databases. In: Proceedings of the international conference on advances in computing, control, and telecommunication technologies, pp 162\u2013164"},{"key":"9775_CR157","unstructured":"Shruti (2015) Bengali continuous ASR Speech Corpus 2015. http:\/\/cse.iitkgp.ac.in\/pabitra\/shruti-corpus.html . Accessed 20 Jan 2018"},{"issue":"3","key":"9775_CR158","first-page":"222","volume":"2","author":"B Singh","year":"2011","unstructured":"Singh B, Singh P (2011) Voice based user machine interface for Punjabi using Hidden Markov model. Int J Comput Sci Technol 2(3):222\u2013224","journal-title":"Int J Comput Sci Technol"},{"key":"9775_CR159","doi-asserted-by":"crossref","unstructured":"Singhvi A, Gupta P, Sanyal S (2008) Hierarchical phoneme classifier for Hindi speech. In: Proceedings of the 9th international conference on signal processing, pp 571\u2013574","DOI":"10.1109\/ICOSP.2008.4697197"},{"key":"9775_CR160","doi-asserted-by":"crossref","unstructured":"Sinha S, Agrawal SS and Olsen J (2011) Development of Hindi mobile communication text and speech corpus. In: Proceedings of O-COCODSA, pp 30\u201335","DOI":"10.1109\/ICSDA.2011.6085975"},{"key":"9775_CR161","doi-asserted-by":"crossref","unstructured":"Sinha S, Agrawal SS, Jain A (2013) Continuous density hidden markov model for context dependent Hindi speech recognition. In: Proceedings of the international conference on advances in computing, communications and informatics (ICACCI), pp 1953\u20131958","DOI":"10.1109\/ICACCI.2013.6637481"},{"key":"9775_CR162","doi-asserted-by":"crossref","unstructured":"Sreenu G, Girija PN, Prasad MN, Nagamani M (2004) A human machine speaker dependent speech interactive system. In: Proceedings of the IEEE INDICON, pp 349\u2013351","DOI":"10.1109\/INDICO.2004.1497769"},{"key":"9775_CR163","doi-asserted-by":"crossref","unstructured":"Sriranjani R, Karthick BM, Umesh S (2014) Experiments on front-end techniques and segmentation model for robust Indian Language speech recognizer. In: Proceedings of the twentieth national conference on communications (NCC), pp 1\u20136","DOI":"10.1109\/NCC.2014.6811284"},{"key":"9775_CR164","doi-asserted-by":"crossref","unstructured":"Sukumar AR, Shah AF, Anto PB (2010) Isolated question words recognition from speech queries by using artificial neural networks. In: Proceedings of international conference on computing communication and networking technologies, pp 1\u20134","DOI":"10.1109\/ICCCNT.2010.5591733"},{"issue":"6","key":"9775_CR165","first-page":"33","volume":"2","author":"KRK Sunil","year":"2012","unstructured":"Sunil KRK, Lajish VL (2012) Vowel phoneme recognition based on average energy information in the zerocrossing intervals and its distribution using ANN. Int J Inf Sci Tech 2(6):33\u201342","journal-title":"Int J Inf Sci Tech"},{"issue":"1","key":"9775_CR166","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1007\/s10772-018-9491-z","volume":"21","author":"M Swain","year":"2018","unstructured":"Swain M, Routray A, Kabisatpathy P (2018) Databases, features and classifiers for speech emotion recognition: a review. Int J Speech Technol 21(1):93\u2013120","journal-title":"Int J Speech Technol"},{"key":"9775_CR167","doi-asserted-by":"crossref","unstructured":"Taheri A, Tarihi MR, Ali HV (2006) Fuzzy hidden markov models and fuzzy NN models in speaker recognition. In: Proceedings of the 1st IEEE conference on industrial electronics and applications, pp 1\u20135","DOI":"10.1109\/ICIEA.2006.257377"},{"key":"9775_CR168","first-page":"177","volume":"11","author":"EA Thakur","year":"2011","unstructured":"Thakur EA, Singla N, Patil VV (2011) Design of Hindi key word recognition system for home automation system using MFCC and DTW. Int J Adv Eng Sci Technol 11:177\u2013182","journal-title":"Int J Adv Eng Sci Technol"},{"issue":"3","key":"9775_CR169","first-page":"1","volume":"4","author":"A Thakur","year":"2013","unstructured":"Thakur A, Kumar R, Kumar N (2013) Automatic speech recognition system for Hindi utterances with regional Indian accents: a review. Int J Electron Commun Technol 4(3):1\u20136","journal-title":"Int J Electron Commun Technol"},{"issue":"4","key":"9775_CR170","doi-asserted-by":"crossref","first-page":"817","DOI":"10.1007\/s10772-016-9374-0","volume":"19","author":"A Thalengala","year":"2016","unstructured":"Thalengala A, Shama K (2016) Study of sub-word acoustical models for Kannada isolated word recognition system. Int J Speech Technol 19(4):817\u2013826","journal-title":"Int J Speech Technol"},{"issue":"3","key":"9775_CR171","first-page":"76","volume":"4","author":"R Thangarajan","year":"2008","unstructured":"Thangarajan R, Natarajan AM, Selvam M (2008) Word and triphone based approaches in continuous speech recognition for Tamil language. WSEAS Trans Signal Process 4(3):76\u201386","journal-title":"WSEAS Trans Signal Process"},{"key":"9775_CR172","unstructured":"Thasleema TM, Narayanan NK (2012) Wavelet transform based consonant\u2013vowel (CV) classification using support vector machines. In: Proceedings of the international conference on neural information processing, pp 250\u2013257"},{"key":"9775_CR173","doi-asserted-by":"crossref","unstructured":"Thasleema TM, Kabeer V, Narayanan NK (2007) Malayalam vowel recognition based on linear predictive coding parameters and k-NN algorithm. In: Proceedings of international conference on computational intelligence and multimedia applications (ICCIMA 2007), pp 361\u2013365","DOI":"10.1109\/ICCIMA.2007.372"},{"key":"9775_CR203","doi-asserted-by":"crossref","unstructured":"Udhyakumar N, Swaminathan R, Ramakrishnan SK (2004) Multilingual speech recognition for information retrieval in Indian context. In: Proceedings from the student research workshop, HLT\/NAACL, Boston, MA. pp 1\u20136","DOI":"10.3115\/1614038.1614039"},{"key":"9775_CR174","doi-asserted-by":"crossref","unstructured":"Undha AG, Patil HA, Madhavi MC (2014) Exploiting speech source information for vowel landmark detection for low resource language. In: Proceedings of 9th international symposium on chinese spoken language processing, pp 546\u2013550","DOI":"10.1109\/ISCSLP.2014.6936660"},{"key":"9775_CR175","unstructured":"Upadhyay RK, Riyal MK (2010) Garhwali speech database. In: Proceedings of O-COCOSDA, pp 1\u20133"},{"issue":"1","key":"9775_CR176","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1007\/s11036-018-1052-9","volume":"24","author":"V Vegesna","year":"2018","unstructured":"Vegesna V, Gurugubelli K, Vuppala A (2018) Application of emotion recognition and modification for emotional Telugu speech recognition. Mob Netw Appl 24(1):193\u2013201","journal-title":"Mob Netw Appl"},{"key":"9775_CR177","doi-asserted-by":"crossref","unstructured":"Venkateswarlu RLK, Teja RR, Kumari RV (2012) Developing efficient speech recognition system for Telugu letter recognition. In: Proceedings of international conference on computing, communication and applications, pp 1\u20136","DOI":"10.1109\/ICCCA.2012.6179184"},{"key":"9775_CR178","doi-asserted-by":"crossref","unstructured":"Vydana HK, Vikash P, Vamsi T, Kumar KP, Vuppala AK (2015) Detection of emotionally significant regions of speech for emotion recognition. In: Proceedings of the annual IEEEIndia conference (INDICON), pp 1\u20136","DOI":"10.1109\/INDICON.2015.7443415"},{"issue":"5","key":"9775_CR179","doi-asserted-by":"crossref","first-page":"651","DOI":"10.1007\/s12046-011-0046-0","volume":"36","author":"B Yegnanarayana","year":"2011","unstructured":"Yegnanarayana B, Gangashetty SV (2011) Epoch-based analysis of speech signals. Sadhana 36(5):651\u2013697","journal-title":"Sadhana"},{"issue":"4","key":"9775_CR180","doi-asserted-by":"crossref","first-page":"575","DOI":"10.1109\/TSA.2005.848892","volume":"13","author":"B Yegnanarayana","year":"2005","unstructured":"Yegnanarayana B, Prasanna SRM, Gupta CS (2005) Combining evidence from source, supra segmental and spectral features for a fixed-text speaker verification system. IEEE Trans Speech Audio Process 13(4):575\u2013582","journal-title":"IEEE Trans Speech Audio Process"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-019-09775-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10462-019-09775-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-019-09775-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,10,1]],"date-time":"2022-10-01T13:53:26Z","timestamp":1664632406000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10462-019-09775-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10,11]]},"references-count":179,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2020,6]]}},"alternative-id":["9775"],"URL":"https:\/\/doi.org\/10.1007\/s10462-019-09775-8","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,10,11]]},"assertion":[{"value":"11 October 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}