{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T14:30:48Z","timestamp":1776090648602,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,11,4]],"date-time":"2024-11-04T00:00:00Z","timestamp":1730678400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"Swedish Research Council","award":["2021-05803"],"award-info":[{"award-number":["2021-05803"]}]},{"name":"Digital Futures"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,11,4]]},"DOI":"10.1145\/3678957.3685729","type":"proceedings-article","created":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T04:35:53Z","timestamp":1730262953000},"page":"469-478","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":8,"title":["Multimodal User Enjoyment Detection in Human-Robot Conversation: The Power of Large Language Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2428-0468","authenticated-orcid":false,"given":"Andre","family":"Pereira","sequence":"first","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1001-6415","authenticated-orcid":false,"given":"Lubos","family":"Marcinek","sequence":"additional","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-2058-0112","authenticated-orcid":false,"given":"Jura","family":"Miniota","sequence":"additional","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7556-5079","authenticated-orcid":false,"given":"Sofia","family":"Thunberg","sequence":"additional","affiliation":[{"name":"Link\u00f6ping University, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8937-8063","authenticated-orcid":false,"given":"Erik","family":"Lagerstedt","sequence":"additional","affiliation":[{"name":"School of Informatics, University of Sk\u00f6vde, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0397-6442","authenticated-orcid":false,"given":"Joakim","family":"Gustafson","sequence":"additional","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8579-1790","authenticated-orcid":false,"given":"Gabriel","family":"Skantze","sequence":"additional","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7983-079X","authenticated-orcid":false,"given":"Bahar","family":"Irfan","sequence":"additional","affiliation":[{"name":"KTH Royal Institute of Technology, Sweden"}]}],"member":"320","published-online":{"date-parts":[[2024,11,4]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"On the opportunities and risks of foundation models. arXiv preprint arXiv:2108.07258","author":"Bommasani Rishi","year":"2021","unstructured":"Rishi Bommasani, Drew\u00a0A Hudson, Ehsan Adeli, Russ Altman, Simran Arora, Sydney von Arx, Michael\u00a0S Bernstein, Jeannette Bohg, Antoine Bosselut, Emma Brunskill, 2021. On the opportunities and risks of foundation models. arXiv preprint arXiv:2108.07258 (2021)."},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/s42761-023-00191-4"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.sigdial-1.55"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids.2011.6100847"},{"key":"e_1_3_2_2_6_1","volume-title":"Flow and the foundations of positive psychology. Vol.\u00a010","author":"Csikszentmihalyi Mihaly","unstructured":"Mihaly Csikszentmihalyi, Reed Larson, 2014. Flow and the foundations of positive psychology. Vol.\u00a010. Springer."},{"key":"e_1_3_2_2_7_1","volume-title":"An argument for basic emotions. Cognition & emotion 6, 3-4","author":"Ekman Paul","year":"1992","unstructured":"Paul Ekman. 1992. An argument for basic emotions. Cognition & emotion 6, 3-4 (1992), 169\u2013200."},{"key":"e_1_3_2_2_8_1","volume-title":"Quality of Life Enjoyment and Satisfaction Questionnaire: a new measure.Psychopharmacology bulletin 29, 2","author":"Endicott Jean","year":"1993","unstructured":"Jean Endicott, John Nee, Wilma Harrison, and Richard Blumenthal. 1993. Quality of Life Enjoyment and Satisfaction Questionnaire: a new measure.Psychopharmacology bulletin 29, 2 (1993), 321\u2013326."},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2729095.2729097"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.14786\/flr.v8i3.623"},{"key":"e_1_3_2_2_11_1","unstructured":"Gemini team Google. 2024. Gemini 1.5: Unlocking multimodal understanding across millions of tokens of context. arXiv:https:\/\/storage.googleapis.com\/deepmind-media\/gemini\/gemini_v1_5_report.pdf"},{"key":"e_1_3_2_2_12_1","volume-title":"Gemini: A Family of Highly Capable Multimodal Models. arXiv:https:\/\/storage.googleapis.com\/deepmind-media\/gemini\/gemini_1_report.pdf","author":"Gemini","year":"2024","unstructured":"Gemini team, Google. 2024. Gemini: A Family of Highly Capable Multimodal Models. arXiv:https:\/\/storage.googleapis.com\/deepmind-media\/gemini\/gemini_1_report.pdf"},{"key":"e_1_3_2_2_13_1","volume-title":"20th Amsterdam Colloquium.","author":"Ginzburg Jonathan","unstructured":"Jonathan Ginzburg, Ellen Breitholtz, Robin Cooper, Julian Hough, and Ye Tian. 2015. Understanding laughter. In 20th Amsterdam Colloquium."},{"key":"e_1_3_2_2_14_1","volume-title":"Affective Computing for Human-Robot Interaction Research: Four Critical Lessons for the Hitchhiker. In 2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","author":"Gunes Hatice","unstructured":"Hatice Gunes and Nikhil Churamani. 2023. Affective Computing for Human-Robot Interaction Research: Four Critical Lessons for the Hitchhiker. In 2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN). IEEE, 1565\u20131572."},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.pragma.2010.01.010"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-010-0068-5"},{"key":"e_1_3_2_2_17_1","volume-title":"Long short-term memory. Neural computation 9, 8","author":"Hochreiter Sepp","year":"1997","unstructured":"Sepp Hochreiter and J\u00fcrgen Schmidhuber. 1997. Long short-term memory. Neural computation 9, 8 (1997), 1735\u20131780."},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/HRI.2013.6483605"},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3173386.3173389"},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"publisher","unstructured":"Bahar Irfan Sanna-Mari Kuoppam\u00e4ki and Gabriel Skantze. 2023. Between reality and delusion: challenges of applying large language models to companion robots for open-domain dialogues with older adults. (2023). https:\/\/doi.org\/10.21203\/rs.3.rs-2884789\/v1","DOI":"10.21203\/rs.3.rs-2884789"},{"key":"e_1_3_2_2_21_1","volume-title":"Human-Robot Interaction Conversational User Enjoyment Scale (HRI CUES). arXiv preprint arXiv:2405.01354","author":"Irfan Bahar","year":"2024","unstructured":"Bahar Irfan, Jura Miniota, Sofia Thunberg, Erik Lagerstedt, Sanna Kuoppam\u00e4ki, Gabriel Skantze, and Andr\u00e9 Pereira. 2024. Human-Robot Interaction Conversational User Enjoyment Scale (HRI CUES). arXiv preprint arXiv:2405.01354 (2024)."},{"key":"e_1_3_2_2_22_1","volume-title":"Towards Mitigating Hallucination in Large Language Models via Self-Reflection. arXiv preprint arXiv:2310.06271","author":"Ji Ziwei","year":"2023","unstructured":"Ziwei Ji, Tiezheng Yu, Yan Xu, Nayeon Lee, Etsuko Ishii, and Pascale Fung. 2023. Towards Mitigating Hallucination in Large Language Models via Self-Reflection. arXiv preprint arXiv:2310.06271 (2023)."},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-19-4453-6_2"},{"key":"e_1_3_2_2_24_1","volume-title":"Physical activity enjoyment scale: Two validation studies.Journal of sport & exercise psychology 13, 1","author":"Kendzierski Deborah","year":"1991","unstructured":"Deborah Kendzierski and Kenneth\u00a0J DeCarlo. 1991. Physical activity enjoyment scale: Two validation studies.Journal of sport & exercise psychology 13, 1 (1991)."},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/3568294.3580067"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-024-00820-y"},{"key":"e_1_3_2_2_27_1","volume-title":"Is it Fun?: Understanding Enjoyment in Non-Game HCI Research. arXiv preprint arXiv:2209.02308","author":"Kono Michinari","year":"2022","unstructured":"Michinari Kono and Koichi Araake. 2022. Is it Fun?: Understanding Enjoyment in Non-Game HCI Research. arXiv preprint arXiv:2209.02308 (2022)."},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1002\/mar.20196"},{"key":"e_1_3_2_2_29_1","volume-title":"Developing Social Robots with Empathetic Non-Verbal Cues Using Large Language Models. In 2023 32nd IEEE International Conference on Robot & Human Interactive Communication (RO-MAN).","author":"Lee Yoon\u00a0Kyung","year":"2023","unstructured":"Yoon\u00a0Kyung Lee, Yoonwon Jung, Gyuyi Kang, and Sowon Hahn. 2023. Developing Social Robots with Empathetic Non-Verbal Cues Using Large Language Models. In 2023 32nd IEEE International Conference on Robot & Human Interactive Communication (RO-MAN)."},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654924"},{"key":"e_1_3_2_2_31_1","unstructured":"Zhiwei Liu Kailai Yang Tianlin Zhang Qianqian Xie Zeping Yu and Sophia Ananiadou. 2024. EmoLLMs: A Series of Emotional Large Language Models and Annotation Tools for Comprehensive Affective Analysis. arxiv:2401.08508\u00a0[cs.CL]"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2019.8925463"},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3340555.3353747"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/2556288.2557078"},{"key":"e_1_3_2_2_35_1","volume-title":"Conversations with Misty the Robot. In 2022 17th ACM\/IEEE International Conference on Human-Robot Interaction (HRI). IEEE, 914\u2013918","author":"Miller Jordan","year":"2022","unstructured":"Jordan Miller and Troy McDaniel. 2022. I enjoyed the chance to meet you and I will always remember you: Healthy Older Adults\u2019 Conversations with Misty the Robot. In 2022 17th ACM\/IEEE International Conference on Human-Robot Interaction (HRI). IEEE, 914\u2013918."},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610977.3634941"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.3390\/app11062502"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/HSI.2018.8431348"},{"key":"e_1_3_2_2_39_1","volume-title":"The circumplex model of affect: an integrative approach to affective neuroscience, cognitive development, and psychopathology.Dev Psychopathol 17, 3 (Summer","author":"Posner Jonathan","year":"2005","unstructured":"Jonathan Posner, James\u00a0A Russell, and Bradley\u00a0S Peterson. 2005. The circumplex model of affect: an integrative approach to affective neuroscience, cognitive development, and psychopathology.Dev Psychopathol 17, 3 (Summer 2005), 715\u2013734."},{"key":"e_1_3_2_2_40_1","volume-title":"The Power of Fun: How to Feel Alive Again","author":"Price C.","unstructured":"C. Price. 2021. The Power of Fun: How to Feel Alive Again. Random House Publishing Group. https:\/\/books.google.se\/books?id=ZgclEAAAQBAJ"},{"key":"e_1_3_2_2_41_1","unstructured":"Alec Radford Jong\u00a0Wook Kim Tao Xu Greg Brockman Christine McLeavey and Ilya Sutskever. 2022. Robust Speech Recognition via Large-Scale Weak Supervision. arxiv:2212.04356\u00a0[eess.AS]"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3395035.3425966"},{"key":"e_1_3_2_2_43_1","volume-title":"A circumplex model of affect.Journal of personality and social psychology 39, 6","author":"Russell A","year":"1980","unstructured":"James\u00a0A Russell. 1980. A circumplex model of affect.Journal of personality and social psychology 39, 6 (1980), 1161."},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"crossref","unstructured":"Hesam Sagha Jun Deng and Bj\u00f6rn Schuller. 2017. The effect of personality trait age and gender on the performance of automatic speech valence recognition. In 2017 seventh international conference on affective computing and intelligent interaction (ACII). IEEE 86\u201391.","DOI":"10.1109\/ACII.2017.8273583"},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-74889-2_18"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2016.11.001"},{"key":"e_1_3_2_2_47_1","volume-title":"Consumer acceptance and use of information technology: extending the unified theory of acceptance and use of technology. MIS quarterly","author":"Venkatesh Viswanath","year":"2012","unstructured":"Viswanath Venkatesh, James\u00a0YL Thong, and Xin Xu. 2012. Consumer acceptance and use of information technology: extending the unified theory of acceptance and use of technology. MIS quarterly (2012), 157\u2013178."},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1006\/csla.1998.0110"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2015.7344604"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/3462244.3479928"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1145\/3531146.3533088"},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610977.3634962"},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"publisher","DOI":"10.1162\/coli_a_00502"}],"event":{"name":"ICMI '24: INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","location":"San Jose Costa Rica","acronym":"ICMI '24"},"container-title":["International Conference on Multimodel Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3678957.3685729","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3678957.3685729","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:10:12Z","timestamp":1750295412000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3678957.3685729"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,4]]},"references-count":53,"alternative-id":["10.1145\/3678957.3685729","10.1145\/3678957"],"URL":"https:\/\/doi.org\/10.1145\/3678957.3685729","relation":{},"subject":[],"published":{"date-parts":[[2024,11,4]]},"assertion":[{"value":"2024-11-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}