{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T08:42:51Z","timestamp":1774946571809,"version":"3.50.1"},"reference-count":83,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2021,2,13]],"date-time":"2021-02-13T00:00:00Z","timestamp":1613174400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,2,13]],"date-time":"2021-02-13T00:00:00Z","timestamp":1613174400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100008628","name":"Ministry of Electronics and Information technology","doi-asserted-by":"publisher","award":["Yet to be awarded"],"award-info":[{"award-number":["Yet to be awarded"]}],"id":[{"id":"10.13039\/501100008628","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Wireless Pers Commun"],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1007\/s11277-021-08181-0","type":"journal-article","created":{"date-parts":[[2021,2,14]],"date-time":"2021-02-14T13:43:26Z","timestamp":1613310206000},"page":"3303-3333","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":28,"title":["Feature Extraction Techniques with Analysis of Confusing Words for Speech Recognition in the Hindi Language"],"prefix":"10.1007","volume":"118","author":[{"given":"Shobha","family":"Bhatt","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anurag","family":"Jain","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Amita","family":"Dev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,2,13]]},"reference":[{"issue":"4","key":"8181_CR1","doi-asserted-by":"publisher","first-page":"239","DOI":"10.4103\/0377-2063.44216","volume":"54","author":"P Bansal","year":"2008","unstructured":"Bansal, P., Dev, A., & Jain, S. B. (2008). Optimum HMM combined with vector quantization for hindi speech recognition. IETE Journal of Research, 54(4), 239\u2013243. https:\/\/doi.org\/10.4103\/0377-2063.44216.","journal-title":"IETE Journal of Research"},{"key":"8181_CR2","doi-asserted-by":"publisher","unstructured":"Rabiner, L. R. (1997). Applications of speech recognition in the area of telecommunications. In IEEE workshop on automatic speech recognition and understanding proceedings (pp. 501\u2013510). IEEE. https:\/\/doi.org\/10.1109\/asru.1997.659129","DOI":"10.1109\/asru.1997.659129"},{"issue":"6","key":"8181_CR3","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1109\/MSP.2012.2197156","volume":"29","author":"G Saon","year":"2012","unstructured":"Saon, G., & Chien, J. T. (2012). Large-vocabulary continuous speech recognition systems: A look at some recent advances. IEEE Signal Processing Magazine, 29(6), 18\u201333. https:\/\/doi.org\/10.1109\/MSP.2012.2197156.","journal-title":"IEEE Signal Processing Magazine"},{"issue":"6","key":"8181_CR4","doi-asserted-by":"publisher","first-page":"62","DOI":"10.15520\/ajcsit.v4i6.3","volume":"4","author":"PK Kurzekar","year":"2014","unstructured":"Kurzekar, P.K, Deshmukh, R. R., Waghmare, V. B., & Shrishrimal, P. P. (2014). Continuous speech recognition system: A review. Asian Journal of Computer Science and Information Technology, 4(6), 62\u201366. https:\/\/doi.org\/10.15520\/ajcsit.v4i6.3","journal-title":"Asian Journal of Computer Science and Information Technology"},{"issue":"4","key":"8181_CR5","doi-asserted-by":"publisher","first-page":"501","DOI":"10.1109\/PROC.1976.10158","volume":"64","author":"DR Reddy","year":"1976","unstructured":"Reddy, D. R. (1976). Speech recognition by machine: A review. Proceedings of the IEEE, 64(4), 501\u2013531. https:\/\/doi.org\/10.1109\/PROC.1976.10158.","journal-title":"Proceedings of the IEEE"},{"key":"8181_CR6","unstructured":"Anusuya, M. A., & Katti, S. K. (2009). Speech recognition by machine, A review. International Journal of Computer Science and Information Security, Vol. 6(3), 181\u2013205. Retrieved from http:\/\/arxiv.org\/abs\/1001.2267"},{"key":"8181_CR7","doi-asserted-by":"crossref","unstructured":"Samudravijaya, K. (2003). Durational characteristics of Hindi stop consonants. In EUROSPEECH 2003 - 8th European Conference on Speech Communication and Technology, 81\u201384.","DOI":"10.21437\/Eurospeech.2003-56"},{"key":"8181_CR8","unstructured":"Tifr, S. K. (2011). Introduction to Automatic Speech Recognition \u201cAutomatic Speech Recognition using Sphinx and HTK\u201d A hands-on Workshop. Retrieved from http:\/\/www.au-kbc.org\/speechhttp:\/\/speech.tifr.res.in"},{"key":"8181_CR9","doi-asserted-by":"publisher","unstructured":"Mich\u00e1lek, J., & Van\u011bk, J. (2018). A survey of recent DNN architectures on the TIMIT phone recognition task. Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), 11107 LNAI, 436\u2013444. https:\/\/doi.org\/10.1007\/978-3-030-00794-2_47","DOI":"10.1007\/978-3-030-00794-2_47"},{"issue":"2","key":"8181_CR10","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1007\/s10772-012-9131-y","volume":"15","author":"RK Aggarwal","year":"2012","unstructured":"Aggarwal, R. K., & Dave, M. (2012). Integration of multiple acoustic and language models for improved Hindi speech recognition system. International Journal of Speech Technology, 15(2), 165\u2013180. https:\/\/doi.org\/10.1007\/s10772-012-9131-y.","journal-title":"International Journal of Speech Technology"},{"issue":"10","key":"8181_CR11","doi-asserted-by":"publisher","first-page":"1401","DOI":"10.1109\/TASSP.1987.1165057","volume":"35","author":"MA Bush","year":"1987","unstructured":"Bush, M. A., & Kopec, G. E. (1987). Network-based connected digit recognition. IEEE Transactions on Acoustics, Speech, and Signal Processing, 35(10), 1401\u20131413. https:\/\/doi.org\/10.1109\/TASSP.1987.1165057.","journal-title":"IEEE Transactions on Acoustics, Speech, and Signal Processing"},{"key":"8181_CR12","doi-asserted-by":"publisher","unstructured":"Tripathy, S., Baranwal, N., & Nandi, G. C. (2013). A MFCC based Hindi speech recognition technique using HTK Toolkit. 2013 IEEE 2nd International Conference on Image Information Processing, IEEE ICIIP 2013, 539\u2013544. https:\/\/doi.org\/10.1109\/ICIIP.2013.6707650","DOI":"10.1109\/ICIIP.2013.6707650"},{"key":"8181_CR13","doi-asserted-by":"publisher","first-page":"1324","DOI":"10.4028\/www.scientific.net\/AMR.542-543.1324","volume":"542\u2013543","author":"Z He","year":"2012","unstructured":"He, Z., & Liu, Z. (2012). Chinese connected word speech recognition based on derivative dynamic time warping. Advanced Materials Research, 542\u2013543, 1324\u20131329. https:\/\/doi.org\/10.4028\/www.scientific.net\/AMR.542-543.1324.","journal-title":"Advanced Materials Research"},{"key":"8181_CR14","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1007\/bfb0054006","volume-title":"Hybrid HMM\/ANN systems for speech recognition: Overview and new research directions","author":"H Bourlard","year":"1998","unstructured":"Bourlard, H., & Morgan, N. (1998). Hybrid HMM\/ANN systems for speech recognition: Overview and new research directions. Berlin: Springer. https:\/\/doi.org\/10.1007\/bfb0054006 pp. 389\u2013417"},{"issue":"November","key":"8181_CR15","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1109\/MSP.2012.2210952","volume":"XX","author":"K Livescu","year":"2012","unstructured":"Livescu, K., Fosler-lussier, E., & Metze, F. (2012). Subword modeling for automatic speech recognition. IEEE Signal Processing Magazine. XX(November), 44\u201357.","journal-title":"IEEE Signal Processing Magazine"},{"issue":"5","key":"8181_CR16","first-page":"617","volume":"10","author":"C Vimala","year":"2015","unstructured":"Vimala, C., & Radha, V. (2015). Isolated speech recognition system for Tamil language using statistical pattern matching and machine learning techniques. Journal of Engineering Science and Technology, 10(5), 617\u2013632.","journal-title":"Journal of Engineering Science and Technology"},{"issue":"9","key":"8181_CR17","doi-asserted-by":"publisher","first-page":"1215","DOI":"10.1109\/5.237532","volume":"81","author":"JW Picone","year":"1993","unstructured":"Picone, J. W. (1993). Signal modeling techniques in speech recognition. Proceedings of the IEEE, 81(9), 1215\u20131247. https:\/\/doi.org\/10.1109\/5.237532.","journal-title":"Proceedings of the IEEE"},{"key":"8181_CR18","unstructured":"Scharenborg, O., Bouwman, G., & Boves, L. (2000). Connected digit recognition with class specific word models. Retrieved from http:\/\/hdl.handle.net\/2066\/75043"},{"issue":"SUPPL. 1","key":"8181_CR19","doi-asserted-by":"publisher","first-page":"1983","DOI":"10.3906\/elk-1112-84","volume":"21","author":"CY Fook","year":"2013","unstructured":"Fook, C. Y., Muthusamy, H., Chee, L. S., Yaacob, S. B., & Adom, A. H. B. (2013). Comparison of speech parameterization techniques for the classification of speech disfluencies. Turkish Journal of Electrical Engineering and Computer Sciences, 21(SUPPL. 1), 1983\u20131994. https:\/\/doi.org\/10.3906\/elk-1112-84.","journal-title":"Turkish Journal of Electrical Engineering and Computer Sciences"},{"key":"8181_CR20","unstructured":"C. Nieuwoudta and E.C. Bothab. (1999). Connected digit recognition in Afrikaans using hidden Markov models. The South African Computer Journal. Retrieved from http:\/\/uir.unisa.ac.za\/handle\/10500\/24317"},{"key":"8181_CR21","unstructured":"Raj, B., & Singh, R. (2014). Design and implementation of speech recognition systems. Retrieved from http:\/\/asr.cs.cmu.edu\/spring2014\/"},{"key":"8181_CR22","doi-asserted-by":"publisher","unstructured":"Bourlard, H., Kamp, Y., & Wellekens, C. J. (1985). SPEAKER DEPENDENT CONNECTED SPEECH RECOGNITION VIA PHONEMIC MARKOV MODELS. In ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings (pp. 1213\u20131216). IEEE. https:\/\/doi.org\/10.1109\/icassp.1985.1168285","DOI":"10.1109\/icassp.1985.1168285"},{"key":"8181_CR23","unstructured":"Davel, M., & Martirosian, O. (2009). Pronunciation dictionary development in resource-scarce environments. Retrieved from http:\/\/www.meraka.org.za\/lwazi."},{"key":"8181_CR24","unstructured":"Bhatt, S., Dev, A., & Jain, A. (2018). Hidden Markov model based speech recognition-a review. In International Conference on \"Computing for Sustainable Global Development India Com IEEE Conference (pp. 3367\u20133372)."},{"key":"8181_CR25","unstructured":"Alghamdi, Mansour & Alotaibi, Y. (2010). HMM automatic speech recognition system of arabic alphadigits. Arabian Journal for Science and Engineering, 35(2), 139\u2013155. Retrieved from https:\/\/www.researchgate.net\/publication\/228703879_HMM_automatic_speech_recognition_system_of_arabic_alphadigits"},{"key":"8181_CR26","doi-asserted-by":"publisher","unstructured":"Tailor, J. H., & Shah, D. B. (2018). HMM-based lightweight speech recognition system for gujarati language. In Lecture Notes in Networks and Systems (Vol. 10, pp. 451\u2013461). Springer. https:\/\/doi.org\/10.1007\/978-981-10-3920-1_46","DOI":"10.1007\/978-981-10-3920-1_46"},{"key":"8181_CR27","doi-asserted-by":"publisher","unstructured":"Renals, S., McKelvie, D., & McInnes, F. (1991). A comparative study of continuous speech recognition using neural networks and hidden Markov models. In ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing (Vol. 1, pp. 369\u2013372). IEEE. https:\/\/doi.org\/10.1109\/icassp.1991.150353","DOI":"10.1109\/icassp.1991.150353"},{"key":"8181_CR28","unstructured":"Saini, P., Kaur, P., & Dua, M. (2013). Hindi automatic speech recognition using HTK. International Journal of Engineering Trends and Technology (IJETT), 4(6), 2223\u20132229. Retrieved from http:\/\/www.ijettjournal.org"},{"issue":"6","key":"8181_CR29","doi-asserted-by":"publisher","first-page":"2301","DOI":"10.1007\/s12652-018-0828-x","volume":"10","author":"M Dua","year":"2019","unstructured":"Dua, M., Aggarwal, R. K., & Biswas, M. (2019). GFCC based discriminatively trained noise robust continuous ASR system for Hindi language. Journal of Ambient Intelligence and Humanized Computing, 10(6), 2301\u20132314. https:\/\/doi.org\/10.1007\/s12652-018-0828-x.","journal-title":"Journal of Ambient Intelligence and Humanized Computing"},{"key":"8181_CR30","unstructured":"Chaudhary, A., Chauhan, M. R., & Gupta, M. G. (2013). Automatic speech recognition system for isolated and connected words of hindi language by using hidden markov model toolkit (HTK). In Proceedings of international conference on emerging trends in engineering and technology, organized by association of computer electronics and electrical engineers (ACEEE) (pp. 847\u2013853)."},{"key":"8181_CR31","doi-asserted-by":"publisher","unstructured":"Da\u011fitan, U., & Yalabik, N. (1990). Connected word recognition using neural networks. In Neurocomputing (pp. 297\u2013300). Springer, Berlin. https:\/\/doi.org\/10.1007\/978-3-642-76153-9_34","DOI":"10.1007\/978-3-642-76153-9_34"},{"issue":"1","key":"8181_CR32","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1504\/ijcsyse.2012.044740","volume":"1","author":"K Kumar","year":"2012","unstructured":"Kumar, K., Aggarwal, R. K., & Jain, A. (2012). A Hindi speech recognition system for connected words using HTK. International Journal of Computational Systems Engineering, 1(1), 25. https:\/\/doi.org\/10.1504\/ijcsyse.2012.044740.","journal-title":"International Journal of Computational Systems Engineering"},{"key":"8181_CR33","doi-asserted-by":"publisher","unstructured":"Kaur, A., & Singh, A. (2016). Optimizing feature extraction techniques constituting phone based modelling on connected words for Punjabi automatic speech recognition. In 2016 International Conference on Advances in Computing, Communications and Informatics, ICACCI 2016 (pp. 2104\u20132108). Institute of Electrical and Electronics Engineers Inc. https:\/\/doi.org\/10.1109\/ICACCI.2016.7732362","DOI":"10.1109\/ICACCI.2016.7732362"},{"key":"8181_CR34","doi-asserted-by":"publisher","unstructured":"Levinson, S. E. (1982). Speaker independent connected word recognition. In NATO Advanced Study Institutes Series, Series C: Mathematical and Physical Sciences (Vol. 88, pp. 179\u2013190). D. Reidel Publ Co. https:\/\/doi.org\/10.1007\/978-94-009-7879-9_10","DOI":"10.1007\/978-94-009-7879-9_10"},{"key":"8181_CR35","doi-asserted-by":"publisher","unstructured":"Patil, P. P., & Pardeshi, S. A. (2014). Marathi connected word speech recognition system. In 1st international conference on networks and soft computing, ICNSC 2014 - proceedings (pp. 314\u2013318). Institute of Electrical and Electronics Engineers Inc. https:\/\/doi.org\/10.1109\/CNSC.2014.6906687","DOI":"10.1109\/CNSC.2014.6906687"},{"key":"8181_CR36","doi-asserted-by":"publisher","unstructured":"Haeb-Umbach, R., Geller, D., & Ney, H. (1993). Improvements in connected digit recognition using linear discriminant analysis and mixture densities. In Proceedings - ICASSP, IEEE international conference on acoustics, speech and signal processing (Vol. 2). Publ by IEEE. https:\/\/doi.org\/10.1109\/icassp.1993.319279","DOI":"10.1109\/icassp.1993.319279"},{"key":"8181_CR37","doi-asserted-by":"publisher","unstructured":"Skinner, T. E., Kloker, D. R., & Medress, M. F. (1976). A speech recognition system for connected word sequences. In ICASSP, IEEE international conference on acoustics, speech and signal processing - proceedings (Vol. 1976-April, pp. 434\u2013437). Institute of Electrical and Electronics Engineers Inc. https:\/\/doi.org\/10.1109\/ICASSP.1976.1170052","DOI":"10.1109\/ICASSP.1976.1170052"},{"issue":"9","key":"8181_CR38","doi-asserted-by":"publisher","first-page":"1981","DOI":"10.1002\/j.1538-7305.1984.tb00085.x","volume":"63","author":"LR Rabiner","year":"1984","unstructured":"Rabiner, L. R. (1984). On the application of energy contours to the recognition of connected word sequences. AT&T Bell Laboratories Technical Journal, 63(9), 1981\u20131995. https:\/\/doi.org\/10.1002\/j.1538-7305.1984.tb00085.x.","journal-title":"AT&T Bell Laboratories Technical Journal"},{"key":"8181_CR39","unstructured":"Krishnan, M., Neophytou, C. P., & Prescott, G. (1994). Wavelet transform speech recognition using vector quantization, dynamic time warping and artificial neural networks. Signal Processing; (3): 4\u20136."},{"key":"8181_CR40","doi-asserted-by":"crossref","unstructured":"Alasadi, A. A., Ambedkar Marathwada, B., H Adhyani, T. H., Deshmukh, R. R., Alahmadi, A. H., & Saleh Alshebami, A. (2020). Efficient Feature Extraction Algorithms to Develop an Arabic Speech Recognition System. Engineering Technology & Applied Science Research, 10(2), 5547\u20135553. Retrieved from www.etasr.com","DOI":"10.48084\/etasr.3465"},{"issue":"6","key":"8181_CR41","doi-asserted-by":"publisher","first-page":"1333","DOI":"10.1080\/02522667.2020.1809091","volume":"41","author":"S Bhatt","year":"2020","unstructured":"Bhatt, S., Jain, A., & Dev, A. (2020). Syllable based Hindi speech recognition. Journal of Information and Optimization Sciences, 41(6), 1333\u20131351. https:\/\/doi.org\/10.1080\/02522667.2020.1809091.","journal-title":"Journal of Information and Optimization Sciences"},{"key":"8181_CR42","doi-asserted-by":"publisher","DOI":"10.1007\/s10772-020-09717-8","author":"J Guglani","year":"2020","unstructured":"Guglani, J., & Mishra, A. N. (2020). DNN based continuous speech recognition system of Punjabi language on Kaldi toolkit. International Journal of Speech Technology. https:\/\/doi.org\/10.1007\/s10772-020-09717-8.","journal-title":"International Journal of Speech Technology"},{"issue":"1","key":"8181_CR43","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1007\/s10772-019-09593-x","volume":"22","author":"P Mittal","year":"2019","unstructured":"Mittal, P., & Singh, N. (2019). Development and analysis of Punjabi ASR system for mobile phones under different acoustic models. International Journal of Speech Technology, 22(1), 219\u2013230. https:\/\/doi.org\/10.1007\/s10772-019-09593-x.","journal-title":"International Journal of Speech Technology"},{"issue":"2","key":"8181_CR44","doi-asserted-by":"publisher","first-page":"329","DOI":"10.1121\/1.1910582","volume":"42","author":"DR Reddy","year":"1967","unstructured":"Reddy, D. R. (1967). Computer recognition of connected speech. The Journal of the Acoustical Society of America, 42(2), 329\u2013347. https:\/\/doi.org\/10.1121\/1.1910582.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"4","key":"8181_CR45","doi-asserted-by":"publisher","first-page":"1738","DOI":"10.1121\/1.399423","volume":"87","author":"H Hermansky","year":"1990","unstructured":"Hermansky, H. (1990). Perceptual linear predictive (PLP) analysis of speech. Journal of the Acoustical Society of America, 87(4), 1738\u20131752. https:\/\/doi.org\/10.1121\/1.399423.","journal-title":"Journal of the Acoustical Society of America"},{"key":"8181_CR46","unstructured":"Bhatt, S., Jain, A., & Dev, A. (2017). Continuous Speech Recognition Technologies-A Review. In 46th National Symposium on Acoustics (NSA-2017) (pp. 2\u20136)."},{"key":"8181_CR47","doi-asserted-by":"publisher","DOI":"10.2174\/2213275912666191001215916","author":"S Bhatt","year":"2020","unstructured":"Bhatt, S., Dev, A., & Jain, A. (2020). Effects of the dynamic and energy based feature extraction on hindi speech recognition. Recent Advances in Computer Science and Communications, 13. https:\/\/doi.org\/10.2174\/2213275912666191001215916.","journal-title":"Recent Advances in Computer Science and Communications"},{"issue":"1","key":"8181_CR48","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1515\/jisys-2018-0417","volume":"30","author":"A Kumar","year":"2020","unstructured":"Kumar, A., & Aggarwal, R. K. (2020). Discriminatively trained continuous Hindi speech recognition using integrated acoustic features and recurrent neural network language modeling. Journal of Intelligent Systems, 30(1), 165\u2013179. https:\/\/doi.org\/10.1515\/jisys-2018-0417.","journal-title":"Journal of Intelligent Systems"},{"key":"8181_CR49","doi-asserted-by":"publisher","unstructured":"Dhawan, K., Sreeram, G., Priyadarshi, K., & Sinha, R. (2020). Investigating target set reduction for end-to-end speech recognition of Hindi-english code-switching data. In 26th national conference on communications, NCC 2020. Institute of Electrical and Electronics Engineers Inc. https:\/\/doi.org\/10.1109\/NCC48643.2020.9056083","DOI":"10.1109\/NCC48643.2020.9056083"},{"key":"8181_CR50","doi-asserted-by":"publisher","DOI":"10.1007\/s10772-020-09757-0","author":"A Kumar","year":"2020","unstructured":"Kumar, A., & Aggarwal, R. K. (2020). Hindi speech recognition using time delay neural network acoustic modeling with i-vector adaptation. International Journal of Speech Technology, 1\u201312,. https:\/\/doi.org\/10.1007\/s10772-020-09757-0.","journal-title":"International Journal of Speech Technology"},{"key":"8181_CR51","unstructured":"Chourasia, V., Samudravijaya, K., & Chandwani, M. (2005). Phonetically rich hindi sentence corpus for creation of speech database. Proc. O-Cocosda (pp. 132\u2013137)."},{"key":"8181_CR52","doi-asserted-by":"publisher","unstructured":"Tripathy, S., Baranwal, N., & Nandi, G. C. (2013). A MFCC based Hindi speech recognition technique using HTK Toolkit. 2013 IEEE 2nd international conference on image information processing, IEEE ICIIP 2013, (December) (pp. 539\u2013544). https:\/\/doi.org\/10.1109\/ICIIP.2013.6707650","DOI":"10.1109\/ICIIP.2013.6707650"},{"issue":"10","key":"8181_CR53","doi-asserted-by":"publisher","first-page":"4213","DOI":"10.1007\/s12652-020-01703-x","volume":"11","author":"S Bhatt","year":"2020","unstructured":"Bhatt, S., Dev, A., & Jain, A. (2020). Confusion analysis in phoneme based speech recognition in Hindi. Journal of Ambient Intelligence and Humanized Computing, 11(10), 4213\u20134238. https:\/\/doi.org\/10.1007\/s12652-020-01703-x.","journal-title":"Journal of Ambient Intelligence and Humanized Computing"},{"issue":"2","key":"8181_CR54","doi-asserted-by":"publisher","first-page":"675","DOI":"10.1007\/s12652-019-01325-y","volume":"11","author":"V Passricha","year":"2020","unstructured":"Passricha, V., & Aggarwal, R. K. (2020). A comparative analysis of pooling strategies for convolutional neural network based Hindi ASR. Journal of Ambient Intelligence and Humanized Computing, 11(2), 675\u2013691. https:\/\/doi.org\/10.1007\/s12652-019-01325-y.","journal-title":"Journal of Ambient Intelligence and Humanized Computing"},{"key":"8181_CR55","unstructured":"Bansal, S., & Dev, A. (2015). Emotional Hindi speech: Feature extraction and classification - IEEE Conference Publication. In In 2015 2nd International Conference on Computing for Sustainable Global Development (INDIACom) . IEEE. (pp. 1865\u20131868). Retrieved from https:\/\/ieeexplore.ieee.org\/document\/7100568?denied"},{"key":"8181_CR56","doi-asserted-by":"publisher","unstructured":"Durvasula, K., & Luo, Q. (2012). Voicing, aspiration, and vowel duration in Hindi. Proceedings of Meetings on Acoustics, 18(1). https:\/\/doi.org\/10.1121\/1.4895027","DOI":"10.1121\/1.4895027"},{"key":"8181_CR57","unstructured":"Pruthi, T., Saksena, S., & Das, P. K. (2000). Swaranjali: Isolated word recognition for Hindi language using VQ and HMM. In International Conference on Multimedia Processing and Systems (ICMPS) (pp. 13\u201315)."},{"key":"8181_CR58","doi-asserted-by":"crossref","unstructured":"Yamuna Kachru. (2006). Hindi. John Benjamins Publishing. Retrieved from https:\/\/books.google.co.in\/books\/about\/Hindi.html?id=ooH5VfLTQEQC&redir_esc=y","DOI":"10.1075\/loall.12"},{"key":"8181_CR59","doi-asserted-by":"publisher","unstructured":"Lude\u00f1a-Choez, J., & Gallardo-Antol\u00edn, A. (2013). NMF-based spectral analysis for acoustic event classification tasks. Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), 7911 LNAI(June), 9\u201316. https:\/\/doi.org\/10.1007\/978-3-642-38847-7","DOI":"10.1007\/978-3-642-38847-7"},{"key":"8181_CR60","unstructured":"Jurafsky, D., & Martin, J. H. (2007). Speech recognition: advanced topics. Speech and Language Processing: An Introduction to Natural Language Processing, Computational Linguistics, and Speech Recognition (pp. 1\u201334)."},{"issue":"8","key":"8181_CR61","doi-asserted-by":"publisher","first-page":"1731","DOI":"10.1080\/02522667.2019.1703266","volume":"40","author":"A Patil","year":"2019","unstructured":"Patil, A., More, P., & Sasikumar, M. (2019). Incorporating finer acoustic phonetic features in lexicon for Hindi language speech recognition. Journal of Information and Optimization Sciences, 40(8), 1731\u20131739. https:\/\/doi.org\/10.1080\/02522667.2019.1703266.","journal-title":"Journal of Information and Optimization Sciences"},{"issue":"2","key":"8181_CR62","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1007\/s11704-018-8030-z","volume":"14","author":"W Ying","year":"2020","unstructured":"Ying, W., Zhang, L., & Deng, H. (2020). Sichuan dialect speech recognition with deep LSTM network. Frontiers of Computer Science, 14(2), 378\u2013387. https:\/\/doi.org\/10.1007\/s11704-018-8030-z.","journal-title":"Frontiers of Computer Science"},{"key":"8181_CR63","doi-asserted-by":"crossref","unstructured":"Chen, S. F., & Goodman, J. (1996). An empirical study of smoothing techniques for language modeling. In Proceedings of the 34th Annual Meeting of the ACL (pp. 1\u201310).","DOI":"10.3115\/981863.981904"},{"key":"8181_CR64","doi-asserted-by":"crossref","unstructured":"Sundermeyer, M., Schl\u00fcter, R., & Ney, H. (2012). LSTM neural networks for language modeling. In INTERSPEECH (pp. 194\u2013197).","DOI":"10.21437\/Interspeech.2012-65"},{"key":"8181_CR65","unstructured":"Salvi, G. (1999). Developing acoustic models for automatic speech recognition in Swedish. European Student Journal of Language and Speech, (June 1999), 1\u201316."},{"issue":"3","key":"8181_CR66","doi-asserted-by":"publisher","first-page":"314","DOI":"10.1504\/ijmc.2020.107097","volume":"18","author":"OZ Mamyrbayev","year":"2020","unstructured":"Mamyrbayev, O. Z., Alimhan, K., Amirgaliyev, B., Zhumazhanov, B., Mussayeva, D., & Gusmanova, F. (2020). Multimodal systems for speech recognition. International Journal of Mobile Communications, 18(3), 314\u2013326. https:\/\/doi.org\/10.1504\/ijmc.2020.107097.","journal-title":"International Journal of Mobile Communications"},{"key":"8181_CR67","doi-asserted-by":"publisher","unstructured":"Deshwal, D., Sangwan, P., & Kumar, D. (2019). Feature extraction methods in language identification: A survey. wireless personal communications. Springer US. https:\/\/doi.org\/10.1007\/s11277-019-06373-3","DOI":"10.1007\/s11277-019-06373-3"},{"key":"8181_CR68","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1980.1163420","author":"SB Davis","year":"1980","unstructured":"Davis, S. B., & Mermelstein, P. (1980). Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences. IEEE Transactions on Acoustics, Speech, and Signal Processing. https:\/\/doi.org\/10.1109\/TASSP.1980.1163420.","journal-title":"IEEE Transactions on Acoustics, Speech, and Signal Processing."},{"key":"8181_CR69","doi-asserted-by":"publisher","unstructured":"Anusuya, M. A., & Katti, S. K. (2011). Front end analysis of speech recognition: A review. International Journal of Speech Technology. https:\/\/doi.org\/10.1007\/s10772-010-9088-7","DOI":"10.1007\/s10772-010-9088-7"},{"key":"8181_CR70","doi-asserted-by":"publisher","unstructured":"Kao, Y. H., & Netsch, L. (1997). Inter-digit HMM connected digit recognition using the macrophone corpus. In ICASSP, IEEE international conference on acoustics, speech and signal processing - proceedings (Vol. 3, pp. 1739\u20131742). IEEE. https:\/\/doi.org\/10.1109\/icassp.1997.598860","DOI":"10.1109\/icassp.1997.598860"},{"key":"8181_CR71","unstructured":"University of Cambridge. (1989). HTK speech recognition toolkit. Retrieved January 26, 2016, from http:\/\/htk.eng.cam.ac.uk\/"},{"issue":"4","key":"8181_CR72","doi-asserted-by":"publisher","first-page":"318","DOI":"10.4103\/0377-2063.86274","volume":"57","author":"A Jain","year":"2011","unstructured":"Jain, A., Agrawal, S. S., & Prakash, N. (2011). Transformation of emotion based on acoustic features of intonation patterns for Hindi speech and their perception. IETE Journal of Research, 57(4), 318\u2013324. https:\/\/doi.org\/10.4103\/0377-2063.86274.","journal-title":"IETE Journal of Research"},{"key":"8181_CR73","unstructured":"TMH KTH\u202f:: WaveSurfer. (n.d.). Retrieved January 20, 2017, from http:\/\/www.speech.kth.se\/wavesurfer\/"},{"key":"8181_CR74","unstructured":"Chootrakool, Patcharika & Wuttiwiwatchai, Chai & Kosawat, K. (2009). A large pronunciation dictionary for Thai speech processing. In 6th Biennial Conf. Asian assoc. for lexicography (ASIALEX)At: Bangkok, Thailand (pp. 1\u20139). Retrieved from https:\/\/www.researchgate.net\/publication\/316682538_A_Large_Pronunciation_Dictionary_for_Thai_Speech_Processing"},{"key":"8181_CR75","doi-asserted-by":"crossref","unstructured":"K. Samudravijaya, P. Rao, S. A. (2000). Hindi speech database. In ICSLP (pp. 1\u20134). Retrieved from https:\/\/www.isca-speech.org\/archive\/icslp_2000\/i00_4456.html","DOI":"10.21437\/ICSLP.2000-847"},{"issue":"2","key":"8181_CR76","first-page":"157","volume":"35","author":"G Droua-Hamdani","year":"2010","unstructured":"Droua-Hamdani, G., Selouani, S.-A., & Boudraa, M. (2010). Algerian Arabic speech database (ALGASD): Corpus design and automatic speech recognition application. Arabian Journal for Science and Engineering, 35(2), 157\u2013166.","journal-title":"Arabian Journal for Science and Engineering"},{"key":"8181_CR77","doi-asserted-by":"publisher","unstructured":"Agarwal, A., Jain, A., Prakash, N., & Agrawal, S. S. (2010). Word Based emotion conversion in Hindi Language. IN Proceedings - 2010 3rd IEEE International Conference on Computer Science and Information Technology, ICCSIT 2010, 9, 419\u2013423. https:\/\/doi.org\/10.1109\/ICCSIT.2010.5565148","DOI":"10.1109\/ICCSIT.2010.5565148"},{"key":"8181_CR78","unstructured":"Bhatt, S., Jain, A., & Dev, A. (2017). Hindi speech recognition\u202f: Issues and Challenges. In International conference on computing for sustainable global development India Com 2017 IEEE conference (pp. 2719\u20132723)."},{"key":"8181_CR79","unstructured":"Cambridgr, U. (n.d.). HTK speech recognition toolkit. Retrieved November 6, 2019, from http:\/\/htk.eng.cam.ac.uk\/"},{"key":"8181_CR80","doi-asserted-by":"publisher","unstructured":"Al-Qatab, B. A. Q., & Ainon, R. N. (2010). Arabic speech recognition using Hidden Markov Model Toolkit(HTK). In Proceedings 2010 international symposium on information technology - engineering technology, ITSim\u201910 (Vol. 2, pp. 557\u2013562). https:\/\/doi.org\/10.1109\/ITSIM.2010.5561391","DOI":"10.1109\/ITSIM.2010.5561391"},{"issue":"03","key":"8181_CR81","doi-asserted-by":"publisher","first-page":"20","DOI":"10.9790\/9622-0703022024","volume":"07","author":"V K\u00ebpuska","year":"2017","unstructured":"K\u00ebpuska, V. (2017). Comparing speech recognition systems (Microsoft API, Google API And CMU Sphinx). International Journal of Engineering Research and Applications, 07(03), 20\u201324. https:\/\/doi.org\/10.9790\/9622-0703022024.","journal-title":"International Journal of Engineering Research and Applications"},{"key":"8181_CR82","doi-asserted-by":"crossref","unstructured":"Bhatt, S., Dev, A., & Jain, A. (2018). Hindi speech vowel recognition using hidden Markov model. In The 6th Intl. Workshop on spoken language technologies for under-resourced languages , (Vol. 1, pp. 196\u2013199).","DOI":"10.21437\/SLTU.2018-41"},{"issue":"3","key":"8181_CR83","doi-asserted-by":"publisher","first-page":"1718","DOI":"10.1121\/1.402451","volume":"91","author":"Y Qi","year":"1992","unstructured":"Qi, Y., & Fox, R. A. (1992). Analysis of Nasal consonants using perceptual linear prediction. Journal of the Acoustical Society of America, 91(3), 1718\u20131726. https:\/\/doi.org\/10.1121\/1.402451.","journal-title":"Journal of the Acoustical Society of America"}],"container-title":["Wireless Personal Communications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-021-08181-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11277-021-08181-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-021-08181-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,17]],"date-time":"2022-12-17T09:34:35Z","timestamp":1671269675000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11277-021-08181-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,2,13]]},"references-count":83,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2021,6]]}},"alternative-id":["8181"],"URL":"https:\/\/doi.org\/10.1007\/s11277-021-08181-0","relation":{},"ISSN":["0929-6212","1572-834X"],"issn-type":[{"value":"0929-6212","type":"print"},{"value":"1572-834X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,2,13]]},"assertion":[{"value":"28 January 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 February 2021","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"The authors declare that there is no conflict of interest in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest"}},{"value":"NA.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code Availability"}}]}}