{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,16]],"date-time":"2025-12-16T21:10:27Z","timestamp":1765919427120,"version":"3.48.0"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,13]]},"DOI":"10.1145\/3747327.3763031","type":"proceedings-article","created":{"date-parts":[[2025,10,11]],"date-time":"2025-10-11T14:04:34Z","timestamp":1760191474000},"page":"1-6","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Multimodal Analysis of Listener\u2019s Active Listening Behaviors in Speed Dating Dialogues"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-2906-0326","authenticated-orcid":false,"given":"Asahi","family":"Ogushi","sequence":"first","affiliation":[{"name":"Graduate School of Integrated Basic Sciences, Nihon University, Setagaya-Ku, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-5653-3776","authenticated-orcid":false,"given":"Naoki","family":"Azuma","sequence":"additional","affiliation":[{"name":"Graduate School of Integrated Basic Sciences, Nihon University, Setagaya-Ku, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-9805-9212","authenticated-orcid":false,"given":"Daichi","family":"Shikama","sequence":"additional","affiliation":[{"name":"Graduate School of Integrated Basic Sciences, Nihon University, Setagaya-Ku, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-3849-1656","authenticated-orcid":false,"given":"Ryo","family":"Ishii","sequence":"additional","affiliation":[{"name":"Human Informatics Laboratories, NTT Corporation, Yokosuka-shi, Kanagawa, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-4604-5396","authenticated-orcid":false,"given":"Toshiki","family":"Onishi","sequence":"additional","affiliation":[{"name":"Human Informatics Laboratories, NTT Corporation, Yokosuka-shi, Kanagawa, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4010-9487","authenticated-orcid":false,"given":"Akihiro","family":"Miyata","sequence":"additional","affiliation":[{"name":"Nihon University, Tokyo, Japan"}]}],"member":"320","published-online":{"date-parts":[[2025,10,12]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330701"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"crossref","unstructured":"Michael Argyle Mark Cook and Duncan Cramer. 1994. Gaze and Mutual Gaze. British Journal of Psychiatry 165 6 (1994) 848\u2013850.","DOI":"10.1017\/S0007125000073980"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.1002\/per.768"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706599.3720028"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Jasmin Bergeron and Michel Laroche. 2009. The effects of perceived salesperson listening effectiveness in the financial industry. Journal of Financial Services Marketing 14 (2009) 6\u201325.","DOI":"10.1057\/fsm.2009.1"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1162\/REST_a_00416"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"crossref","unstructured":"Lep Breiman. 2001. Random Forests. Machine Learning 45 1 (2001) 5\u201332.","DOI":"10.1023\/A:1010933404324"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"Stephen Castleberry C. Shepherd and Rick Ridnour. 1999. Effective interpersonal listening in the personal selling environment: Conceptualization measurement and nomological validity. Journal of Marketing Theory and Practice 7 1 (1999) 30\u201338.","DOI":"10.1080\/10696679.1999.11501817"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"crossref","unstructured":"Herbert Clark and Meredyth Krych. 2004. Speaking While Monitoring Addressees for Understanding. Journal of Memory and Language 50 (2004) 62\u201381.","DOI":"10.1016\/j.jml.2003.08.004"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"Nathan Emery. 2000. The eyes have it: the neuroethology function and evolution of social gaze. Neuroscience & Biobehavioral Reviews 24 6 (2000) 581\u2013604.","DOI":"10.1016\/S0149-7634(00)00025-7"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","DOI":"10.1162\/qjec.2006.121.2.673"},{"key":"e_1_3_3_1_13_2","first-page":"540","volume-title":"Personality and Social Psychology Bulletin,","author":"Fletcher Garth J.\u00a0O.","year":"2014","unstructured":"Garth J.\u00a0O. Fletcher, Patrick S.\u00a0G. Kerr, Norman\u00a0P. Li, and Katherine\u00a0A. Valentine. 2014. Predicting Romantic Interest and Decisions in the Very Early Stages of Mate Selection:Standards, Accuracy, and Sex Differences. In Personality and Social Psychology Bulletin, , Vol.\u00a040:4. 540\u2013550."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-74997-4_12"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"crossref","unstructured":"Alexandra Hoffmann Sabrina Schiestl Philipp Sinske Matthias Gondan Pierre Sachse and Thomas Maran. 2024. Sharing and Receiving Eye-Contact Predicts Mate Choice After a 5-Minute Conversation: Evidence from a Speed-Dating Study. Archives of Sexual Behavior 53 (02 2024) 959\u2013968.","DOI":"10.1007\/s10508-023-02806-0"},{"key":"e_1_3_3_1_16_2","unstructured":"Yukiya Hono Kentaro Mitsui and Kei Sawada. 2023. rinna\/japanese-hubert-base. https:\/\/huggingface.co\/rinna\/japanese-hubert-base."},{"key":"e_1_3_3_1_17_2","first-page":"69","volume-title":"Human Communication,","author":"Houser Marian\u00a0L.","year":"2007","unstructured":"Marian\u00a0L. Houser, Sean\u00a0M. Horan, and Lisa\u00a0A. Furler. 2007. Predicting Relational Outcomes: An Investigation of Thin Slice Judgments in Speed Dating. In Human Communication, , Vol.\u00a010:2. 69\u201381."},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1177\/0265407508093787"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"Wei-Ning Hsu Benjamin Bolte Yao-Hung\u00a0Hubert Tsai Kushal Lakhotia Ruslan Salakhutdinov and Abdelrahman Mohamed. 2021. HuBERT: Self-Supervised Speech Representation Learning by Masked Prediction of Hidden Units. IEEE\/ACM Transactions on Audio Speech and Language Processing 29 (2021) 3451\u20133460.","DOI":"10.1109\/TASLP.2021.3122291"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-42293-5_71"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"crossref","unstructured":"Lamb James. 2018. To Boldly Go: Feedback as Digital Multimodal Dialogue. Multimodal Technologies and Interaction 2 3 (2018) 1\u201317.","DOI":"10.3390\/mti2030049"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.1002\/per.2040"},{"key":"e_1_3_3_1_23_2","first-page":"1478","volume-title":"Psychological Science,","author":"Joel Samantha","year":"2017","unstructured":"Samantha Joel, Paul\u00a0W. Eastwick, and Eli\u00a0J. Finkel. 2017. Is Romantic Desire Predictable? Machine Learning Applied to Initial Romantic Attraction. In Psychological Science, , Vol.\u00a028:10. 1478\u20131489."},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"crossref","unstructured":"Elizabeth Johnson and Kimberly Strauch. 2023. A mixed-methods pilot examination of Montana North Dakota nurse practitioner telepresence behaviors through web-camera eye-tracking and qualitative descriptive interviews. Journal of the American Association of Nurse Practitioners 36 (11 2023) 270\u2013278.","DOI":"10.1097\/JXX.0000000000000974"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"crossref","unstructured":"Hiroaki Kawamichi Kazufumi Yoshihara Akihiro Sasaki Sho Sugawara Hiroki Tanabe Ryoji Shinohara Yuka Sugisawa Kentaro Tokutake Yukiko Mochizuki Tokie Anme and Norihiro Sadato. 2015. Perceiving active listening activates the reward system and improves the impression of relevant experiences. Social Neuroscience 10 1 (2015) 16\u201326.","DOI":"10.1080\/17470919.2014.954732"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"crossref","unstructured":"Adom Kendon. 1967. Some functions of gaze-direction in social interaction. Acta Psychologica 26 (1967) 22\u201363.","DOI":"10.1016\/0001-6918(67)90005-4"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"crossref","unstructured":"Chris Kleinke. 1986. Gaze and Eye Contact. A Research Review. Psychological bulletin 100 (07 1986) 78\u2013100.","DOI":"10.1037\/\/0033-2909.100.1.78"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"crossref","unstructured":"Avraham Kluger and Thomas Malloy. 2019. Question Asking as a Dyadic Behavior. Journal of Personality and Social Psychology 117 (12 2019) 1127\u20131138.","DOI":"10.1037\/pspi0000156"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"crossref","unstructured":"Klaus Krippendorff. 2006. Reliability in Content Analysis: Some Common Misconceptions and Recommendations. Human Communication Research 30 3 (01 2006) 411\u2013433.","DOI":"10.1093\/hcr\/30.3.411"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/ACIIW59127.2023.10388172"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1037\/a0033777"},{"key":"e_1_3_3_1_32_2","unstructured":"Yinhan Liu Myle Ott Naman Goyal Jingfei Du Mandar Joshi Danqi Chen Omer Levy Mike Lewis Luke Zettlemoyer and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1907.11692 (2019) 1\u201313."},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1111\/j.1467-6494.2009.00570.x"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN60168.2024.10731275"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","DOI":"10.1177\/0146167210374238"},{"key":"e_1_3_3_1_37_2","first-page":"8121","volume-title":"Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC \u201918)","author":"Meng Zhao","year":"2018","unstructured":"Zhao Meng, Lili Mou, and Zhi Jin. 2018. Towards Neural Speaker Modeling in Multi-Party Conversation. In Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC \u201918). AAAI Press, Miyazaki, Japan, 8121\u20138122."},{"key":"e_1_3_3_1_38_2","first-page":"1","volume-title":"2024 IEEE International Conference on Electronics, Computing and Communication Technologies (CONECCT)","author":"Minu R\u00a0I","year":"2024","unstructured":"R\u00a0I Minu, Divya P, Ishita B, Anubhav P, Tanishq Kumar, Ramaprabha Jayaram, and Jyotirmoy Karjee. 2024. Emotion Detection in Multimodal Communication through Audio-Visual Gesture Analysis. In 2024 IEEE International Conference on Electronics, Computing and Communication Technologies (CONECCT). 1\u20135."},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/2993148.2993154"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"crossref","unstructured":"Soujanya Poria Navonil Majumderd Rada Mihalceae and Eduard Hovy. 2019. Emotion Recognition in Conversation: Research Challenges Datasets and Recent Advances. IEEE Access 7 (2019) 100943\u2013100953.","DOI":"10.1109\/ACCESS.2019.2929050"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"crossref","unstructured":"Lixiong Qin Mei Wang Chao Deng Ke Wang Xi Chen Jiani Hu and Weihong Deng. 2024. SwinFace: A Multi-Task Transformer for Face Recognition Expression Recognition Age Estimation and Attribute Estimation. IEEE Transactions on Circuits and Systems for Video Technology 34 (2024) 2223\u20132234.","DOI":"10.1109\/TCSVT.2023.3304724"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"crossref","unstructured":"Rosemary\u00a0P. Ramsey and Ravipreet\u00a0S. Sohi. 1997. Listening to your customers: The impact of perceived salesperson listening behavior on relationship outcomes. Journal of the Academy of Marketing Science 25 (1997) 127\u2013137.","DOI":"10.1007\/BF02894348"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"crossref","unstructured":"Harvey Sacks Emanuel Schegloff and Gail Jefferson. 1974. A simplest systematics for the organization of turn-taking for conversation. Language 50 4 (1974) 696\u2013735.","DOI":"10.1353\/lan.1974.0010"},{"key":"e_1_3_3_1_44_2","first-page":"13898","volume-title":"Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING \u201924)","author":"Sawada Kei","year":"2024","unstructured":"Kei Sawada, Tianyu Zhao, Makoto Shing, Kentaro Mitsui, Akio Kaga, Yukiya Hono, Toshiaki Wakatsuki, and Koh Mitsuda. 2024. Release of Pre-Trained Models for the Japanese Language. In Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING \u201924). ELRA and ICCL, Torino, Italia, 13898\u201313905."},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"crossref","unstructured":"Juncai Sun Tiantian Dong and Ping Liu. 2023. Holistic processing and visual characteristics of regulated and spontaneous expressions. Journal of vision 23 (03 2023) 6.","DOI":"10.1167\/jov.23.3.6"},{"key":"e_1_3_3_1_46_2","first-page":"199","volume-title":"Personal Relationships,","author":"Tidwell Natasha\u00a0D.","year":"2013","unstructured":"Natasha\u00a0D. Tidwell, Paul\u00a0W. Eastwick, and Eli\u00a0J. Finkel. 2013. Perceived, Not Actual, Similarity Predicts Initial Attraction in a Live Romantic Context: Evidence from the Speed-Dating Paradigm. In Personal Relationships, , Vol.\u00a020:2. 199\u2013215."},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"publisher","DOI":"10.1177\/0146167219855048"},{"key":"e_1_3_3_1_48_2","first-page":"1556","volume-title":"Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC \u201906)","author":"Wittenburg Peter","year":"2006","unstructured":"Peter Wittenburg, Hennie Brugman, Albert Russel, Alex Klassmann, and Han Sloetjes. 2006. ELAN: a professional framework for multimodality research. In Proceedings of the Fifth International Conference on Language Resources and Evaluation (LREC \u201906). European Language Resources Association, Genoa, Italy, 1556\u20131559."},{"key":"e_1_3_3_1_49_2","unstructured":"Tianyu Zhao and Kei Sawada. 2021. rinna\/japanese-roberta-base. https:\/\/huggingface.co\/rinna\/japanese-roberta-base."}],"event":{"name":"ICMI Companion '25: Companion Proceedings of the 27th International Conference on Multimodal Interaction","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"],"location":"Canberra Australia","acronym":"ICMI Companion '25"},"container-title":["Companion Proceedings of the 27th International Conference on Multimodal Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3747327.3763031","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,16]],"date-time":"2025-12-16T21:08:30Z","timestamp":1765919310000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3747327.3763031"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,12]]},"references-count":48,"alternative-id":["10.1145\/3747327.3763031","10.1145\/3747327"],"URL":"https:\/\/doi.org\/10.1145\/3747327.3763031","relation":{},"subject":[],"published":{"date-parts":[[2025,10,12]]},"assertion":[{"value":"2025-10-12","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}