{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,11,28]],"date-time":"2024-11-28T05:06:58Z","timestamp":1732770418562,"version":"3.29.0"},"reference-count":61,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,8,26]],"date-time":"2024-08-26T00:00:00Z","timestamp":1724630400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,8,26]],"date-time":"2024-08-26T00:00:00Z","timestamp":1724630400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,8,26]]},"DOI":"10.1109\/ro-man60168.2024.10731355","type":"proceedings-article","created":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T17:45:45Z","timestamp":1730310345000},"page":"62-68","source":"Crossref","is-referenced-by-count":0,"title":["Sigh!!! There is more than just faces and verbal speech to recognize emotion in human-robot interaction"],"prefix":"10.1109","author":[{"given":"Rahul Singh","family":"Maharjan","sequence":"first","affiliation":[{"name":"University of Manchester,Manchester Centre for Robotics and AI,Manchester,United Kingdom"}]},{"given":"Marta","family":"Romeo","sequence":"additional","affiliation":[{"name":"Heriot-Watt University,Edinburgh,United Kingdom"}]},{"given":"Angelo","family":"Cangelosi","sequence":"additional","affiliation":[{"name":"University of Manchester,Manchester Centre for Robotics and AI,Manchester,United Kingdom"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1027\/\/1016-9040.6.2.79"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/S1071-5819(03)00018-1"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.4324\/9781315080918-15"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1561\/1100000005"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.4018\/978-1-60566-354-8.ch003"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ACIIW59127.2023.10388072"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-68504-3_1"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijhcs.2012.01.004"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.3301687"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/s11257-022-09337-8"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-022-00867-0"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TCE.2009.5278031"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/s12193-010-0053-1"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN53752.2022.9900634"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-1395"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-15-8395-7_19"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/S1364-6613(00)01816-7"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1037\/\/0033-2909.97.3.412"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/BF00992106"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/b978-0-12-057770-5.x5000-0"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.4103\/0976-9668.95933"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1038\/npre.2007.1356.1"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.0908239106"},{"volume-title":"Social perception","year":"1990","author":"Zebrowitz","key":"ref24"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1177\/0956797614531023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1037\/emo0000100"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1177\/0956797613517239"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"353","DOI":"10.3389\/fpsyg.2013.00353","article-title":"Crosscultural decoding of positive and negative non-linguistic emotion vocalizations","volume":"4","author":"Laukka","year":"2013","journal-title":"Frontiers in Psychology"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(02)00078-X"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1037\/amp0000399"},{"article-title":"The icml 2022 expressive vocalizations workshop and competition: Recognizing, generating, and personalizing vocal bursts","year":"2022","author":"Baird","key":"ref31"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ACIIW57231.2022.10086002"},{"article-title":"Emogator: A new open source vocal burst dataset with baseline machine learning classification methodologies","year":"2023","author":"Buhl","key":"ref33"},{"article-title":"An efficient multitask learning architecture for affective vocal burst analysis","year":"2022","author":"Hallmen","key":"ref34"},{"article-title":"Exploring speaker enrolment for few-shot personalisation in emotional vocalisation prediction","year":"2022","author":"Triantafyllopoulos","key":"ref35"},{"article-title":"Exploring the effectiveness of self-supervised learning and classifier chains in emotion recognition of nonverbal vocalizations","year":"2022","author":"Xin","key":"ref36"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096395"},{"article-title":"Self-supervised attention networks and uncertainty loss weighting for multi-task emotion recognition on vocal bursts","year":"2022","author":"Karas","key":"ref38"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10927"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095294"},{"key":"ref41","first-page":"12449","article-title":"wav2vec 2.0: A framework for self-supervised learning of speech representations","volume":"33","author":"Baevski","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref42","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International Conference on Machine Learning","author":"Radford"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1038\/s41562-022-01489-2"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/RAM.2013.6758580"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/s00146-010-0306-2"},{"article-title":"Detection of social signals for recognizing engagement in human-robot interaction","year":"2017","author":"Lala","key":"ref46"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.5772\/55406"},{"article-title":"Sparks of large audio models: A survey and outlook","year":"2023","author":"Latif","key":"ref48"},{"article-title":"Rethinking cnn models for audio classification","year":"2020","author":"Palanisamy","key":"ref49"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3188113"},{"article-title":"Audio recognition using mel spectrograms and convolution neural networks","year":"2019","author":"Thornton","key":"ref55"},{"article-title":"Decoupled weight decay regularization","year":"2017","author":"Loshchilov","key":"ref56"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/FG47880.2020.00110"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN47096.2020.9223564"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/ACIIW57231.2022.10086005"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN54540.2023.10191542"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-349"}],"event":{"name":"2024 33rd IEEE International Conference on Robot and Human Interactive Communication (ROMAN)","start":{"date-parts":[[2024,8,26]]},"location":"Pasadena, CA, USA","end":{"date-parts":[[2024,8,30]]}},"container-title":["2024 33rd IEEE International Conference on Robot and Human Interactive Communication (ROMAN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10731142\/10731137\/10731355.pdf?arnumber=10731355","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T04:21:38Z","timestamp":1732681298000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10731355\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,26]]},"references-count":61,"URL":"https:\/\/doi.org\/10.1109\/ro-man60168.2024.10731355","relation":{},"subject":[],"published":{"date-parts":[[2024,8,26]]}}}