{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T12:20:54Z","timestamp":1772022054510,"version":"3.50.1"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2022,3,5]],"date-time":"2022-03-05T00:00:00Z","timestamp":1646438400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,3,5]],"date-time":"2022-03-05T00:00:00Z","timestamp":1646438400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2022,5]]},"DOI":"10.1007\/s11042-022-12723-4","type":"journal-article","created":{"date-parts":[[2022,3,5]],"date-time":"2022-03-05T12:02:52Z","timestamp":1646481772000},"page":"17169-17184","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Acoustic model with hybrid Deep Bidirectional Single Gated Unit (DBSGU) for low resource speech recognition"],"prefix":"10.1007","volume":"81","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4978-542X","authenticated-orcid":false,"given":"S.","family":"Girirajan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"A.","family":"Pandian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,3,5]]},"reference":[{"issue":"2","key":"12723_CR1","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1007\/s10032-015-0242-2","volume":"18","author":"GA Abandah","year":"2015","unstructured":"Abandah GA, Graves A, Al-Shagoor B, Arabiyat A, Al-Taee M (2015) Automatic diacritization of Arabic text using recurrent neural networks. Int J Doc Anal Recognit (IJDAR) 18(2):183\u2013197","journal-title":"Int J Doc Anal Recognit (IJDAR)"},{"key":"12723_CR2","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1016\/j.procs.2018.10.359","volume":"143","author":"PP Barman","year":"2018","unstructured":"Barman PP, Boruah A (2018) A RNN based approach for next word prediction in Assamese phonetic transcription. Procedia Comput Sci 143:117\u2013123 (ISSN 1877 \u2013 0509)","journal-title":"Procedia Comput Sci"},{"key":"12723_CR3","unstructured":"Chavandan RS, Sable GS (2013) An overview of speech recognition using HMM. Int J Comput Sci Mob Comput 2(6):233\u2013238"},{"key":"12723_CR4","unstructured":"Chung J, Gulcehre C, Cho K, Bengio Y (2014) Empirical evaluation of gated recurrent neural networks on sequence modeling. arXiv arXiv:1412.3555"},{"key":"12723_CR5","doi-asserted-by":"crossref","unstructured":"Cheng G, Povey D, Huang L, Xu J, Khudanpur S, Yan Y (2018) Output-gate projected gated recurrent unit for speech recognition. Interspeech, pp 1793\u20131797","DOI":"10.21437\/Interspeech.2018-1403"},{"issue":"5\u20136","key":"12723_CR6","doi-asserted-by":"publisher","first-page":"602","DOI":"10.1016\/j.neunet.2005.06.042","volume":"18","author":"A Graves","year":"2005","unstructured":"Graves A, Schmidhuber J (2005) Framewise phoneme classification with bidirectional LSTM and other neural network architectures. Neural Netw 18(5\u20136):602\u2013610","journal-title":"Neural Netw"},{"key":"12723_CR7","doi-asserted-by":"crossref","unstructured":"Graves A, Mohamed A, Hinton G (2013) Speech recognitionwith deep recurrent neural networks. In: Proc ICASSP 2013, Vancouver, Canada","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"12723_CR8","unstructured":"Greff K, Srivastava RK, Koutnk J, Steunebrink BR, Schmidhuber J (2015) LSTM: A search space odyssey. arXiv: 1503.04069"},{"key":"12723_CR9","unstructured":"He F, Chu SH, Kjartansson O, Rivera C, Katanova A, Gutkin A, Demirsahin I, Johny C, Jansche M, Sain S et al (2020) Open-source Multi-speaker Speech Corpora for Building Gujarati, Kannada, Malayalam, Marathi, Tamil and Telugu Speech Synthesis Systems. In: Proceedings of the 12th LREC Conference, Marseille, France, 11\u201316"},{"key":"12723_CR10","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, J\u00fcrgen S (1997) Long short-term memory. Neural Comput 9:1735\u201380. https:\/\/doi.org\/10.1162\/neco.1997.9.8.1735","journal-title":"Neural Comput"},{"key":"12723_CR11","unstructured":"Jozefowicz R, Zaremba W, Sutskever I (2015) An empirical exploration of recurrent network architectures. In Proceedings of the 32nd International Conference on Machine Learning, Lille, France, vol 37, pp 2342\u20132350"},{"key":"12723_CR12","doi-asserted-by":"crossref","unstructured":"Kim J, Kim J, Thu HLT, Kim H (2016) Long short term memory recurrent neural network classifier for intrusion detection. International Conference on Platform Technology and Service (PlatCon), Jeju, pp 1\u20135","DOI":"10.1109\/PlatCon.2016.7456805"},{"key":"12723_CR13","unstructured":"Kingma DP, Ba J (2014) Adam: A method for stochastic optimization, CoRR, vol abs\/1412.6980"},{"key":"12723_CR14","doi-asserted-by":"publisher","first-page":"676","DOI":"10.1016\/j.procs.2017.12.087","volume":"125","author":"J Kumar","year":"2018","unstructured":"Kumar J, Goomer R, Singh AK (2018) Long Short Term Memory Recurrent Neural Network (LSTM-RNN) based workload forecasting model for cloud datacenters. Procedia Comput Sci 125:676\u2013682 (ISSN 1877 \u2013 0509)","journal-title":"Procedia Comput Sci"},{"key":"12723_CR15","doi-asserted-by":"crossref","unstructured":"Kumar S, Hussain L, Banarjee S, Reza M (2018) Energy load forecasting using deep learning approach-LSTM and GRU in spark cluster. Fifth International Conference on Emerging Applications of Information Technology (EAIT), Kolkata, pp 1\u20134","DOI":"10.1109\/EAIT.2018.8470406"},{"key":"12723_CR16","doi-asserted-by":"crossref","unstructured":"Li X, Xianyu H, Tian J, Chen W, Meng F, Xu M et al (2016) A deep bidirectional long short-term memory based multi-scale approach for music dynamic emotion prediction. In: IEEE International Conference in Acoustics, Speech and Signal Processing (ICASSP); Shanghai, China, p 544\u2013548","DOI":"10.1109\/ICASSP.2016.7471734"},{"key":"12723_CR17","unstructured":"Panayotov V, Chen G, Povey D, Khudanpur S. Librispeech: an ASR corpus based on public domain audio books. In: International Conference on Acoustics, Speech, and Signal Processing (ICASSP), Brisbane, Australia, pp 5206\u20135210"},{"key":"12723_CR18","volume-title":"Machine Learning, Optimization, and Big Data. MOD 2016","author":"M Panzner","year":"2016","unstructured":"Panzner M, Cimiano P (2016) Comparing hidden Markov models and long short term memory neural networks for learning action representations. In: Pardalos P, Conca P, Giuffrida G, Nicosia G (eds) Machine Learning, Optimization, and Big Data. MOD 2016, vol 10122. Springer, Cham"},{"key":"12723_CR19","unstructured":"Povey D, Ghoshal A, Boulianne G, Goel N, Hannemann M, Qian Y, Schwarz P, Stemmer G (2011) The kaldi speech recognitiontoolkit. In: Workshop on Automatic Speech Recognition and Understanding (ASRU), Hawaii, US, pp 1\u20134"},{"issue":"2","key":"12723_CR20","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1109\/TETCI.2017.2762739","volume":"2","author":"M Ravanelli","year":"2018","unstructured":"Ravanelli M, Brakel P, Omologo M, Bengio Y (2018) Light gated recurrent units for speech recognition. IEEE Trans Emerg Top Comput Intell 2(2):92\u2013102","journal-title":"IEEE Trans Emerg Top Comput Intell"},{"issue":"11","key":"12723_CR21","doi-asserted-by":"publisher","first-page":"2673","DOI":"10.1109\/78.650093","volume":"45","author":"M Schuster","year":"1997","unstructured":"Schuster M, Paliwal KK (1997) Bidirectional recurrent neural networks. Signal Process IEEE Trans 45(11):2673\u20132681","journal-title":"Signal Process IEEE Trans"},{"key":"12723_CR22","doi-asserted-by":"crossref","unstructured":"Stolcke A (2002) SRILM-An extensible language modeling toolkit. In: International Conference on Spoken Language Processing (ICSLP), Denver, Colorado, pp 901\u2013904","DOI":"10.21437\/ICSLP.2002-303"},{"key":"12723_CR23","doi-asserted-by":"crossref","unstructured":"Thireou T, Reczko M (2007) Bidirectional Long Short-Term Memory Networks for Predicting the Subcellular Localization of Eukaryotic Proteins. IEEE\/ACM Trans Comput Biol Bioinform 4(3):441\u2013446","DOI":"10.1109\/tcbb.2007.1015"},{"key":"12723_CR24","doi-asserted-by":"crossref","unstructured":"Zhang Y, Chen G, Yu D, Yao K, Khudanpur S, Glass JR (2016) Highway long short-term memory RNNS for distant speech recognition. In: Proc. of ICASSP 2016, pp 5755\u20135759","DOI":"10.1109\/ICASSP.2016.7472780"},{"key":"12723_CR25","doi-asserted-by":"crossref","unstructured":"Zhou G-B, Wu J, Zhang C-L, Zhou Z-H (2016) Minimal gated unit for recurrent neural networks. Int J Automat Comput 13(3):226\u2013234","DOI":"10.1007\/s11633-016-1006-2"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-12723-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-12723-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-12723-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,28]],"date-time":"2023-01-28T12:43:33Z","timestamp":1674909813000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-12723-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,3,5]]},"references-count":25,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2022,5]]}},"alternative-id":["12723"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-12723-4","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,3,5]]},"assertion":[{"value":"26 December 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 August 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 February 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 March 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}