{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,7]],"date-time":"2026-05-07T15:40:03Z","timestamp":1778168403781,"version":"3.51.4"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,3]]},"DOI":"10.1109\/icassp.2017.7953138","type":"proceedings-article","created":{"date-parts":[[2017,6,20]],"date-time":"2017-06-20T21:35:36Z","timestamp":1497994536000},"page":"5150-5154","source":"Crossref","is-referenced-by-count":73,"title":["Learning utterance-level representations for speech emotion and age\/gender recognition using deep neural networks"],"prefix":"10.1109","author":[{"given":"Zhong-Qiu","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ivan","family":"Tashev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","article-title":"Hidden Markov Model-based Speech Emotion Recognition","author":"schuller","year":"2003","journal-title":"Proc IEEE InternationalConference Acoustics Speech and Signal Processing"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2016.7727636"},{"key":"ref12","article-title":"High-level Feature Representation using Recurrent Neural Network for Speech Emotion Recognition","author":"lee","year":"2015","journal-title":"Proceedings of Interspeech"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/97.736233"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/PACRIM.2009.5291253"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2005.12.126"},{"key":"ref16","author":"bishop","year":"2006","journal-title":"Pattern Recognition and Machine Learning"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2013.58"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-008-9076-6"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2009.5349350"},{"key":"ref3","article-title":"Bag of Tricks for Efficient Text Classification","author":"joulin","year":"2016"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472669"},{"key":"ref5","first-page":"2196","article-title":"Discriminatively Trained Recurrent Neural Network for Continuous Dimensional Emotion Recognition from Audio","author":"weninger","year":"2016","journal-title":"Proceedings of IJCAI"},{"key":"ref8","article-title":"Speech Emotion Recognition using Deep Neural Network and Extreme Learning Machine","author":"han","year":"2014","journal-title":"Proceedings of Interspeech"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5947651"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2015.2462851"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2009.11.014"},{"key":"ref9","article-title":"Learning Representations of Affect from Speech","author":"ghosh","year":"2015"}],"event":{"name":"2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"New Orleans, LA","start":{"date-parts":[[2017,3,5]]},"end":{"date-parts":[[2017,3,9]]}},"container-title":["2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7943262\/7951776\/07953138.pdf?arnumber=7953138","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,8,29]],"date-time":"2017-08-29T18:46:29Z","timestamp":1504032389000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7953138\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,3]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/icassp.2017.7953138","relation":{},"subject":[],"published":{"date-parts":[[2017,3]]}}}