{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,6]],"date-time":"2026-04-06T10:23:08Z","timestamp":1775470988090,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2024,4,2]],"date-time":"2024-04-02T00:00:00Z","timestamp":1712016000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,4,2]],"date-time":"2024-04-02T00:00:00Z","timestamp":1712016000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-19004-2","type":"journal-article","created":{"date-parts":[[2024,4,2]],"date-time":"2024-04-02T05:02:12Z","timestamp":1712034132000},"page":"5205-5237","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Speech based emotion recognition by using a faster region-based convolutional neural network"],"prefix":"10.1007","volume":"84","author":[{"given":"Chappidi","family":"Suneetha","sequence":"first","affiliation":[]},{"given":"Raju","family":"Anitha","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,4,2]]},"reference":[{"issue":"20","key":"19004_CR1","doi-asserted-by":"crossref","first-page":"29581","DOI":"10.1007\/s11042-019-7367-0","volume":"78","author":"S AlZu\u2019bi","year":"2019","unstructured":"AlZu\u2019bi S, Hawashin B, Mujahed M, Jararweh Y, Gupta BB (2019) An efficient employment of internet of multimedia things in smart and future agriculture. Multimed Tools Appl 78(20):29581\u201329605","journal-title":"Multimed Tools Appl"},{"issue":"11","key":"19004_CR2","doi-asserted-by":"crossref","first-page":"3760","DOI":"10.3390\/s21113760","volume":"21","author":"SA Alanazi","year":"2021","unstructured":"Alanazi SA, Alruwaili M, Ahmad F, Alaerjan A, Alshammari N (2021) Estimation of organizational competitiveness by a hybrid of one-dimensional convolutional neural networks and self-organizing maps using physiological signals for emotional analysis of employees. Sensors 21(11):3760","journal-title":"Sensors"},{"issue":"3","key":"19004_CR3","doi-asserted-by":"crossref","first-page":"592","DOI":"10.3390\/s20030592","volume":"20","author":"A Dzedzickis","year":"2020","unstructured":"Dzedzickis A, Kaklauskas A, Bucinskas V (2020) Human emotion recognition: Review of sensors and methods. Sensors 20(3):592","journal-title":"Sensors"},{"key":"19004_CR4","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1016\/j.inffus.2018.10.009","volume":"51","author":"MM Hassan","year":"2019","unstructured":"Hassan MM, Alam MGR, Uddin MZ, Huda S, Almogren A, Fortino G (2019) Human emotion recognition using deep belief network architecture. Information Fusion 51:10\u201318","journal-title":"Information Fusion"},{"key":"19004_CR5","volume":"84","author":"X Wang","year":"2020","unstructured":"Wang X, Chen X, Cao C (2020) Human emotion recognition by optimally fusing facial expression and speech feature. Signal Processing: Image Communication 84:115831","journal-title":"Signal Processing: Image Communication"},{"key":"19004_CR6","doi-asserted-by":"crossref","first-page":"117327","DOI":"10.1109\/ACCESS.2019.2936124","volume":"7","author":"RA Khalil","year":"2019","unstructured":"Khalil RA, Jones E, Babar MI, Jan T, Zafar MH, Alhussain T (2019) Speech emotion recognition using deep learning techniques: A review. IEEE Access 7:117327\u2013117345","journal-title":"IEEE Access"},{"issue":"3","key":"19004_CR7","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1007\/s12559-021-09865-2","volume":"13","author":"KA Ara\u00f1o","year":"2021","unstructured":"Ara\u00f1o KA, Gloor P, Orsenigo C, Vercellis C (2021) When old meets new: emotion recognition from speech signals. Cogn Comput 13(3):771\u2013783","journal-title":"Cogn Comput"},{"key":"19004_CR8","doi-asserted-by":"crossref","first-page":"312","DOI":"10.1016\/j.bspc.2018.08.035","volume":"47","author":"J Zhao","year":"2019","unstructured":"Zhao J, Mao X, Chen L (2019) Speech emotion recognition using deep 1D & 2D CNN LSTM networks. Biomed Signal Process Control 47:312\u2013323","journal-title":"Biomed Signal Process Control"},{"issue":"3","key":"19004_CR9","first-page":"111","volume":"4","author":"DKA Senthil","year":"2023","unstructured":"Senthil DKA, Srinivasan B (2023) Spoken Keyword Spotting System Design Using Various Wavelet Transformation Techniques with BPNN Classifier. Int J Comput Eng Res Trends 4(3):111\u2013118","journal-title":"Int J Comput Eng Res Trends"},{"key":"19004_CR10","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1016\/j.inffus.2018.09.008","volume":"49","author":"MS Hossain","year":"2019","unstructured":"Hossain MS, Muhammad G (2019) Emotion recognition using deep learning approach from audio\u2013visual emotional big data. Inf Fus 49:69\u201378","journal-title":"Inf Fus"},{"key":"19004_CR11","doi-asserted-by":"crossref","DOI":"10.3389\/frobt.2020.532279","volume":"7","author":"M Spezialetti","year":"2020","unstructured":"Spezialetti M, Placidi G, Rossi S (2020) Emotion recognition for human-robot interaction: Recent advances and future perspectives. Front Robot AI 7:532279","journal-title":"Front Robot AI"},{"key":"19004_CR12","doi-asserted-by":"crossref","unstructured":"Chowdary MK, Nguyen TN, Hemanth DJ (2021) Deep learning-based facial emotion recognition for human\u2013computer interaction applications.\u00a0Neural Comput Appl 1\u201318","DOI":"10.1007\/s00521-021-06012-8"},{"key":"19004_CR13","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1016\/j.specom.2019.12.001","volume":"116","author":"MB Ak\u00e7ay","year":"2020","unstructured":"Ak\u00e7ay MB, O\u011fuz K (2020) Speech emotion recognition: Emotional models, databases, features, preprocessing methods, supporting modalities, and classifiers. Speech Commun 116:56\u201376","journal-title":"Speech Commun"},{"issue":"7","key":"19004_CR14","doi-asserted-by":"crossref","first-page":"R231","DOI":"10.1016\/j.cub.2019.02.034","volume":"29","author":"N Kriegeskorte","year":"2019","unstructured":"Kriegeskorte N, Golan T (2019) Neural network models and deep learning. Curr Biol 29(7):R231\u2013R236","journal-title":"Curr Biol"},{"key":"19004_CR15","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.specom.2019.04.004","volume":"110","author":"X Li","year":"2019","unstructured":"Li X, Akagi M (2019) Improving multilingual speech emotion recognition by combining acoustic features in a three-layer model. Speech Commun 110:1\u201312","journal-title":"Speech Commun"},{"issue":"8","key":"19004_CR16","doi-asserted-by":"crossref","first-page":"3187","DOI":"10.1007\/s12652-019-01485-x","volume":"11","author":"MG Salido Ortega","year":"2020","unstructured":"Salido Ortega MG, Rodr\u00edguez LF, Gutierrez-Garcia JO (2020) Towards emotion recognition from contextual information using machine learning. J Ambient Intell Humaniz Comput 11(8):3187\u20133207","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"19004_CR17","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2020.101894","volume":"59","author":"D Issa","year":"2020","unstructured":"Issa D, Demirci MF, Yazici A (2020) Speech emotion recognition with deep convolutional neural networks. Biomed Signal Process Control 59:101894\u00a0 https:\/\/www.sciencedirect.com\/science\/article\/abs\/pii\/S1746809420300501","journal-title":"Biomed Signal Process Control"},{"key":"19004_CR18","volume":"173","author":"D Li","year":"2021","unstructured":"Li D, Liu J, Yang Z, Sun L, Wang Z (2021) Speech emotion recognition using recurrent neural networks with directional self-attention. Expert Syst Appl 173:114683","journal-title":"Expert Syst Appl"},{"issue":"1","key":"19004_CR19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/s13636-021-00208-5","volume":"2021","author":"D Tang","year":"2021","unstructured":"Tang D, Kuppens P, Geurts L, van Waterschoot T (2021) End-to-end speech emotion recognition using a novel context-stacking dilated convolution neural network. EURASIP J Audio, Speech, Music Process 2021(1):1\u201316","journal-title":"EURASIP J Audio, Speech, Music Process"},{"key":"19004_CR20","doi-asserted-by":"crossref","unstructured":"Chen JIZ, Yeh LT (2023) Apply an optimized NN model to low-dimensional format speech recognition and exploring the performance with restricted factors. Measurement and Control 56(1\u20132):3\u201317","DOI":"10.1177\/00202940221109778"},{"key":"19004_CR21","doi-asserted-by":"crossref","unstructured":"Burkhardt F, Paeschke A, Rolfes, M et al (2005, September) A database of German emotional speech. In: Interspeech, 5(1517\u20131520)","DOI":"10.21437\/Interspeech.2005-446"},{"key":"19004_CR22","unstructured":"Jovicic ST, Kasic Z, Dordevic M, Rajkovic M (2004, September) Serbian emotional speech database: design, processing and evaluation. In: Proceedings of the 9th International Conference Speech and Computer (pp 77\u201381)"},{"key":"19004_CR23","doi-asserted-by":"crossref","first-page":"125830","DOI":"10.1109\/ACCESS.2021.3111659","volume":"9","author":"S Kanwal","year":"2021","unstructured":"Kanwal S, Asghar S (2021) Speech emotion recognition using clustering based GA-optimized feature set. IEEE Access 9:125830\u2013125842","journal-title":"IEEE Access"},{"key":"19004_CR24","doi-asserted-by":"crossref","unstructured":"Efat MIA, Hossain MS, Aditya S, Setu JH, Imtiaz-Ud-Din KM (2022) Identifying optimised speaker identification model using hybrid GRU-CNN feature extraction technique.\u00a0Int J Comput Vis Robot\u00a012(6):662\u2013685","DOI":"10.1504\/IJCVR.2022.126508"},{"issue":"2","key":"19004_CR25","first-page":"319","volume":"56","author":"J Huang","year":"2019","unstructured":"Huang J, Shi Y, Gao Y (2019) Multi-scale faster-RCNN algorithm for small object detection. J Comput Res Dev 56(2):319\u2013327","journal-title":"J Comput Res Dev"},{"issue":"10","key":"19004_CR26","doi-asserted-by":"crossref","first-page":"250","DOI":"10.3390\/fi13100250","volume":"13","author":"LA Corujo","year":"2021","unstructured":"Corujo LA, Kieson E, Schloesser T, Gloor PA (2021) Emotion recognition in horses with convolutional neural networks. Future Internet 13(10):250","journal-title":"Future Internet"},{"issue":"1","key":"19004_CR27","doi-asserted-by":"crossref","first-page":"74","DOI":"10.20965\/jaciii.2022.p0074","volume":"26","author":"A Nakano","year":"2022","unstructured":"Nakano A, Nagamune K (2022) A Development of Robotic Scrub Nurse System-Detection for Surgical Instruments Using Faster Region-Based Convolutional Neural Network\u2013. J Adv Comput Intell Intell Inf 26(1):74\u201382","journal-title":"J Adv Comput Intell Intell Inf"},{"key":"19004_CR28","doi-asserted-by":"crossref","DOI":"10.1016\/j.compeleceng.2021.107280","volume":"93","author":"S Nayak","year":"2021","unstructured":"Nayak S, Nagesh B, Routray A, Sarma M (2021) A Human-Computer Interaction framework for emotion recognition through time-series thermal video sequences. Comput Electr Eng 93:107280","journal-title":"Comput Electr Eng"},{"key":"19004_CR29","unstructured":"Ms B (2022) Transfer learning-based object detection by using faster region based convolution neural networks. International Journal of Innovative Research in Computer and Communication Engineering"},{"key":"19004_CR30","doi-asserted-by":"crossref","DOI":"10.1016\/j.coastaleng.2021.103859","volume":"166","author":"A de Silva","year":"2021","unstructured":"de Silva A, Mori I, Dusek G, Davis J, Pang A (2021) Automated rip current detection with region based convolutional neural networks. Coast Eng 166:103859","journal-title":"Coast Eng"},{"issue":"2","key":"19004_CR31","doi-asserted-by":"crossref","first-page":"317","DOI":"10.3390\/diagnostics12020317","volume":"12","author":"YS Lee","year":"2022","unstructured":"Lee YS, Park WH (2022) Diagnosis of depressive disorder model on facial expression based on fast R-CNN. Diagnostics 12(2):317","journal-title":"Diagnostics"},{"key":"19004_CR32","doi-asserted-by":"crossref","unstructured":"Ahmed K, Mohammadi FG, Matus M, Shenavarmasouleh F, Pereira LM, Zisis I, Amini MH (2021) Towards real-time house detection in aerial images using faster region-based convolutional neural network","DOI":"10.2139\/ssrn.3994191"},{"issue":"11","key":"19004_CR33","doi-asserted-by":"crossref","first-page":"215","DOI":"10.17762\/turcomat.v12i11.5863","volume":"12","author":"M Seshaiah","year":"2021","unstructured":"Seshaiah M (2021) Comparative Analysis of Various Face Detection and Tracking and Recognition Mechanisms using Machine and Deep Learning Methods. Turkish J Comput Math Educ (TURCOMAT) 12(11):215\u2013223","journal-title":"Turkish J Comput Math Educ (TURCOMAT)"},{"issue":"6","key":"19004_CR34","doi-asserted-by":"crossref","first-page":"428","DOI":"10.1049\/cvi2.12028","volume":"15","author":"MS Iqbal","year":"2021","unstructured":"Iqbal MS, Ali H, Tran SN, Iqbal T (2021) Coconut trees detection and segmentation in aerial imagery using mask region-based convolution neural network. IET Comput Vision 15(6):428\u2013439","journal-title":"IET Comput Vision"},{"issue":"3","key":"19004_CR35","doi-asserted-by":"crossref","first-page":"1371","DOI":"10.2298\/CSIS220322037L","volume":"19","author":"P Li","year":"2022","unstructured":"Li P, Zhao L (2022) A novel art gesture recognition model based on two channel region-based convolution neural network for explainable human-computer interaction understanding. Comput Sci Inf Syst 19(3):1371\u20131388","journal-title":"Comput Sci Inf Syst"},{"issue":"7","key":"19004_CR36","doi-asserted-by":"crossref","DOI":"10.1088\/1361-6560\/ac5d74","volume":"67","author":"T Peng","year":"2022","unstructured":"Peng T, Wang C, Zhang Y, Wang J (2022) H-SegNet: hybrid segmentation network for lung segmentation in chest radiographs using mask region-based convolutional neural network and adaptive closed polyline searching method. Phys Med Biol 67(7):075006","journal-title":"Phys Med Biol"},{"issue":"1","key":"19004_CR37","doi-asserted-by":"crossref","first-page":"6991","DOI":"10.1038\/s41598-022-11173-0","volume":"12","author":"T Debnath","year":"2022","unstructured":"Debnath T, Reza MM, Rahman A, Beheshti A, Band SS, Alinejad-Rokny H (2022) Four-layer ConvNet to facial emotion recognition with minimal epochs and the significance of data diversity. Sci Rep 12(1):6991","journal-title":"Sci Rep"},{"issue":"3","key":"19004_CR38","doi-asserted-by":"crossref","first-page":"9","DOI":"10.24018\/ejece.2021.5.3.321","volume":"5","author":"HI Muhammad","year":"2021","unstructured":"Muhammad HI, Musa KI, Abdulrahman ML, Abubakar A, Umar K, Ishola A (2021) Enhancing detection performance of face recognition algorithm using PCA-faster R-CNN. Eur J Electric Eng Comput Sci 5(3):9\u201316","journal-title":"Eur J Electric Eng Comput Sci"},{"key":"19004_CR39","volume":"215","author":"H Ge","year":"2022","unstructured":"Ge H, Zhu Z, Dai Y, Wang B, Wu X (2022) Facial expression recognition based on deep learning. Comput Methods Programs Biomed 215:106621","journal-title":"Comput Methods Programs Biomed"},{"key":"19004_CR40","doi-asserted-by":"publisher","unstructured":"Saurav, S, Gidde, P, Saini, R, Singh, S (2022) Dual integrated convolutional neural network for real-time facial expression recognition in the wild.\u00a0The Visual Computer, 1\u201314. https:\/\/doi.org\/10.1007\/s00371-021-02069-7","DOI":"10.1007\/s00371-021-02069-7"},{"issue":"11","key":"19004_CR41","doi-asserted-by":"crossref","first-page":"1289","DOI":"10.3390\/electronics10111289","volume":"10","author":"N Rathour","year":"2021","unstructured":"Rathour N, Alshamrani SS, Singh R, Gehlot A, Rashid M, Akram SV, AlGhamdi AS (2021) IoMT based facial emotion recognition system using deep convolution neural networks. Electronics 10(11):1289","journal-title":"Electronics"},{"issue":"21","key":"19004_CR42","doi-asserted-by":"crossref","first-page":"4438","DOI":"10.3390\/rs13214438","volume":"13","author":"JA Aird","year":"2021","unstructured":"Aird JA, Quon EW, Barthelmie RJ, Debnath M, Doubrawa P, Pryor SC (2021) Region-based convolutional neural network for wind turbine wake characterization in complex terrain. Remote Sensing 13(21):4438","journal-title":"Remote Sensing"},{"issue":"4","key":"19004_CR43","doi-asserted-by":"crossref","first-page":"409","DOI":"10.30630\/joiv.5.4.735","volume":"5","author":"LR Yee","year":"2021","unstructured":"Yee LR, Kamaludin H, Safar NZM, Wahid N, Abdullah N, Meidelfi D (2021) Intelligence Eye for Blinds and Visually Impaired by Using Region-Based Convolutional Neural Network (R-CNN). JOIV: Int J Inf Visual 5(4):409\u2013414","journal-title":"JOIV: Int J Inf Visual"},{"key":"19004_CR44","volume":"130","author":"R Ali","year":"2021","unstructured":"Ali R, Kang D, Suh G, Cha YJ (2021) Real-time multiple damage mapping using autonomous UAV and deep faster region-based neural networks for GPS-denied structures. Autom Constr 130:103831","journal-title":"Autom Constr"},{"issue":"1","key":"19004_CR45","doi-asserted-by":"crossref","first-page":"1564","DOI":"10.1177\/03611981221105066","volume":"2677","author":"LNH Truong","year":"2023","unstructured":"Truong LNH, Clay E, Mora OE, Cheng W, Singh M, Jia X (2023) Rotated Mask Region-Based Convolutional Neural Network Detection for Parking Space Management System. Transp Res Rec 2677(1):1564\u20131581","journal-title":"Transp Res Rec"},{"issue":"11","key":"19004_CR46","doi-asserted-by":"crossref","first-page":"15549","DOI":"10.3390\/s131115549","volume":"13","author":"F Alonso-Martin","year":"2013","unstructured":"Alonso-Martin F, Malfaz M, Sequeira J, Gorostiza JF, Salichs MA (2013) A multimodal emotion detection system during human\u2013robot interaction. Sensors 13(11):15549\u201315581","journal-title":"Sensors"},{"key":"19004_CR47","first-page":"20230","volume":"34","author":"J He","year":"2021","unstructured":"He J, Erfani S, Ma X, Bailey J, Chi Y, Hua XS (2021) A family of power intersection over union losses for bounding box regression. Adv Neural Inf Process Syst 34:20230\u201320242","journal-title":"Adv Neural Inf Process Syst"},{"issue":"18","key":"19004_CR48","doi-asserted-by":"crossref","first-page":"5212","DOI":"10.3390\/s20185212","volume":"20","author":"T Anvarjon","year":"2020","unstructured":"Anvarjon T, Mustaqeem, Kwon S (2020) Deep-net: A lightweight CNN-based speech emotion recognition system using deep frequency features. Sensors 20(18):5212","journal-title":"Sensors"},{"key":"19004_CR49","doi-asserted-by":"crossref","unstructured":"Likitha MS, Gupta SRR, Hasitha K, Raju AU (2017, March) Speech based human emotion recognition using MFCC. In: 2017 international conference on wireless communications, signal processing and networking (WiSPNET). IEEE, pp 2257\u20132260","DOI":"10.1109\/WiSPNET.2017.8300161"},{"key":"19004_CR50","unstructured":"Tripathi S, Kumar A, Ramesh A, Singh C, Yenigalla P (2019) Deep learning based emotion recognition system using speech features and transcriptions. arXiv preprint arXiv:1906.05681. https:\/\/ieeexplore.ieee.org\/document\/9966603"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-19004-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-19004-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-19004-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,23]],"date-time":"2025-03-23T00:19:43Z","timestamp":1742689183000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-19004-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,2]]},"references-count":50,"journal-issue":{"issue":"8","published-online":{"date-parts":[[2025,3]]}},"alternative-id":["19004"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-19004-2","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,4,2]]},"assertion":[{"value":"1 May 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 October 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 November 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 April 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that we have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}