{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T03:05:08Z","timestamp":1777431908760,"version":"3.51.4"},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,10]]},"DOI":"10.1109\/iros.2018.8593571","type":"proceedings-article","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T02:33:30Z","timestamp":1548297210000},"page":"854-860","source":"Crossref","is-referenced-by-count":52,"title":["On the Robustness of Speech Emotion Recognition for Human-Robot Interaction with Deep Neural Networks"],"prefix":"10.1109","author":[{"given":"Egor","family":"Lakomkin","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohammad Ali","family":"Zamani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cornelius","family":"Weber","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sven","family":"Magg","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stefan","family":"Wermter","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2655045"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/MFI.2012.6343022"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2017.02.013"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-448"},{"key":"ref12","article-title":"High-level Feature Representation using Recurrent Neural Network for Speech Emotion Recognition","author":"lee","year":"2015","journal-title":"InterSpeech"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472669"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"1098","DOI":"10.21437\/Interspeech.2017-1637","article-title":"Progressive Neural Networks for Transfer Learning in Emotion Recognition","author":"gideon","year":"2017","journal-title":"InterSpeech"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-868"},{"key":"ref16","first-page":"423","article-title":"Reusing Neural Speech Representations for Auditory Emotion Recognition","volume":"1","author":"lakomkin","year":"2017","journal-title":"Proceedings of the Eighth International Joint Conference on Natural Language Processing"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"1263","DOI":"10.21437\/Interspeech.2017-917","article-title":"Attentive Convolutional Neural Network based Speech Emotion Recognition: A Study on the Impact of Input Features, Signal Length, and Acted Speech","author":"neumann","year":"2017","journal-title":"InterSpeech"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/2750858.2804262"},{"key":"ref19","volume":"abs 1712 7108","author":"zhou","year":"2017","journal-title":"Improved Regularization Techniques for End-to-End Speech Recognition"},{"key":"ref28","article-title":"Adam: A Method for Stochastic Optimization","author":"kingma","year":"2014","journal-title":"International Conference on Learning Representations"},{"key":"ref4","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"The Journal of Machine Learning Research"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1181"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989324"},{"key":"ref6","article-title":"Recurrent Batch Normalization","author":"cooijmans","year":"2017","journal-title":"International Conference on Learning Representations"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-008-9076-6"},{"key":"ref5","first-page":"448","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref8","first-page":"1195","article-title":"Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results","volume":"30","author":"tarvainen","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref7","first-page":"5285","article-title":"Layer Normalization","volume":"30","author":"ba","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref2","first-page":"1097","article-title":"ImageNet Classification with Deep Convolutional Neural Networks","volume":"25","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178934"},{"key":"ref1","first-page":"173","article-title":"Deep Speech 2: End-to-End Speech Recognition in English and Mandarin","volume":"48","author":"amodei","year":"2016","journal-title":"The 33rd International Conference on Machine Learning"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2015.2457417"},{"key":"ref22","volume":"abs 1412 5567","author":"hannun","year":"2014","journal-title":"Deep speech Scaling up end-to-end speech recognition"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/2502081.2502224"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-1081"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICDSP.2009.5201259"},{"key":"ref26","article-title":"Neural Machine Translation by Jointly Learning to align and translate","author":"bahdanau","year":"2015","journal-title":"I nternational Conference on Learning Representations"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/2993148.2993165"}],"event":{"name":"2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","location":"Madrid","start":{"date-parts":[[2018,10,1]]},"end":{"date-parts":[[2018,10,5]]}},"container-title":["2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8574473\/8593358\/08593571.pdf?arnumber=8593571","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T05:47:25Z","timestamp":1598248045000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8593571\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/iros.2018.8593571","relation":{},"subject":[],"published":{"date-parts":[[2018,10]]}}}