{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T11:59:35Z","timestamp":1781006375902,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":126,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T00:00:00Z","timestamp":1776038400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/legalcode"}],"funder":[{"name":"The National Natural Science Foundation of China","award":["62332016"],"award-info":[{"award-number":["62332016"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,4,13]]},"DOI":"10.1145\/3772318.3790631","type":"proceedings-article","created":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T04:12:28Z","timestamp":1776053548000},"page":"1-24","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["FeelWave: Enabling Emotion-Aware Voice Interaction through Noise-Robust mmWave Emotion Sensing"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-5524-1025","authenticated-orcid":false,"given":"Lingyu","family":"Wang","sequence":"first","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-0769-2924","authenticated-orcid":false,"given":"You","family":"Zuo","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0877-4636","authenticated-orcid":false,"given":"Dequan","family":"Wang","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, HeFei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2330-3799","authenticated-orcid":false,"given":"Chenming","family":"He","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-4285-1905","authenticated-orcid":false,"given":"Chengzhen","family":"Meng","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-1589-4222","authenticated-orcid":false,"given":"Xinran","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6368-9250","authenticated-orcid":false,"given":"Xiaoran","family":"Fan","sequence":"additional","affiliation":[{"name":"Independent Researcher, Sunnyvale, California, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9046-798X","authenticated-orcid":false,"given":"Yanyong","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,4,13]]},"reference":[{"key":"e_1_3_3_2_2_2","first-page":"265","volume-title":"International Conference on Machine Learning (ICML)","author":"Aghajanyan Armen","year":"2023","unstructured":"Armen Aghajanyan, Lili Yu, Alexis Conneau, Wei-Ning Hsu, Karen Hambardzumyan, Susan Zhang, Stephen Roller, Naman Goyal, Omer Levy, and Luke Zettlemoyer. 2023. Scaling laws for generative mixed-modal language models. In International Conference on Machine Learning (ICML). 265\u2013279."},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"crossref","unstructured":"Foteini Agrafioti Dimitris Hatzinakos and Adam\u00a0K Anderson. 2011. ECG pattern analysis for emotion detection. IEEE Transactions on affective computing 3 1 (2011) 102\u2013115.","DOI":"10.1109\/T-AFFC.2011.28"},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"crossref","unstructured":"Naveed Ahmed Zaher Al\u00a0Aghbari and Shini Girija. 2023. A systematic survey on multimodal emotion recognition using learning algorithms. Intelligent Systems with Applications 17 (2023) 200171.","DOI":"10.1016\/j.iswa.2022.200171"},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"crossref","unstructured":"Icek Ajzen and Thomas\u00a0J Madden. 1986. Prediction of goal-directed behavior: Attitudes intentions and perceived behavioral control. Journal of experimental social psychology 22 5 (1986) 453\u2013474.","DOI":"10.1016\/0022-1031(86)90045-4"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"crossref","unstructured":"Paavo Alku. 1992. Glottal wave analysis with pitch synchronous iterative adaptive inverse filtering. Speech communication 11 2-3 (1992) 109\u2013118.","DOI":"10.1016\/0167-6393(92)90005-R"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3627673.3679832"},{"key":"e_1_3_3_2_8_2","unstructured":"Anthropic. 2024. Claude 3.5 Haiku. [Online]. https:\/\/www.anthropic.com\/claude\/haiku."},{"key":"e_1_3_3_2_9_2","unstructured":"Apple. 2024. Introducing Apple Intelligence the personal intelligence system that puts powerful generative models at the core of iPhone iPad and Mac. [Online]. https:\/\/www.apple.com\/newsroom\/2024\/06\/introducing-apple-intelligence-for-iphone-ipad-and-mac\/."},{"key":"e_1_3_3_2_10_2","unstructured":"Li Auto. 2024. Li Auto Introduces Fully Self-Developed MindGPT. [Online]. https:\/\/genaigazette.com\/li-auto-introduces-fully-self-developed-mind-gpt."},{"key":"e_1_3_3_2_11_2","unstructured":"Azcom CabinGuard. 2025. A Vehicle In-cabin Monitoring Solution. [Online]. https:\/\/www.azcomtech.com\/markets\/mmwave-radar-sensors\/automotive."},{"key":"e_1_3_3_2_12_2","unstructured":"Aaron Bangor Philip Kortum and James Miller. 2009. Determining what individual SUS scores mean: Adding an adjective rating scale. Journal of usability studies 4 3 (2009) 114\u2013123."},{"key":"e_1_3_3_2_13_2","unstructured":"John Brooke et\u00a0al. 1996. SUS-A quick and dirty usability scale. Usability evaluation in industry 189 194 (1996) 4\u20137."},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2005-446"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"publisher","DOI":"10.1145\/3636534.3649350"},{"key":"e_1_3_3_2_16_2","unstructured":"Jingyi Chen Zhimeng Guo Jiyun Chun Pichao Wang Andrew Perrault and Micha Elsner. 2025. Do Audio LLMs Really LISTEN or Just Transcribe? Measuring Lexical vs. Acoustic Emotion Cues Reliance. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.10444 (2025)."},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606741"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2025-1112"},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"crossref","unstructured":"Zebang Cheng Zhi-Qi Cheng Jun-Yan He Kai Wang Yuxiang Lin Zheng Lian Xiaojiang Peng and Alexander Hauptmann. 2024. Emotion-llama: Multimodal emotion recognition and reasoning with instruction tuning. Advances in Neural Information Processing Systems (NeurIPS) 37 (2024) 110805\u2013110853.","DOI":"10.52202\/079017-3518"},{"key":"e_1_3_3_2_20_2","unstructured":"Pedro Corr\u00eaa Jo\u00e3o Lima Victor Moreno and Paula Dornhofer\u00a0Paro Costa. 2025. Evaluating Emotion Recognition in Spoken Language Models on Emotionally Incongruent Speech. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.25054 (2025)."},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"crossref","unstructured":"Livija Cveticanin. 2012. Review on mathematical and mechanical models of the vocal cord. Journal of Applied Mathematics 2012 1 (2012) 928591.","DOI":"10.1155\/2012\/928591"},{"key":"e_1_3_3_2_22_2","unstructured":"Google DeepMind. 2024. Gemma: Lightweight Open Models for Responsible AI. [Online]. https:\/\/ai.google.dev\/gemma."},{"key":"e_1_3_3_2_23_2","unstructured":"Google DeepMind. 2025. Gemini 2.5 Pro. [Online]. https:\/\/blog.google\/products\/gemini\/gemini-2-5-pro-latest-preview\/."},{"key":"e_1_3_3_2_24_2","unstructured":"DeepSeek. 2024. DeepSeek V3. [Online]. https:\/\/github.com\/deepseek-ai\/DeepSeek-V3."},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"crossref","unstructured":"Han Ding Yizhan Wang Hao Li Cui Zhao Ge Wang Wei Xi and Jizhong Zhao. 2022. Ultraspeech: Speech enhancement by interaction between ultrasound and speech. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies (IMWUT) 6 3 (2022) 1\u201325.","DOI":"10.1145\/3550303"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"crossref","unstructured":"Thomas Drugman Paavo Alku Abeer Alwan and Bayya Yegnanarayana. 2014. Glottal source processing: From analysis to applications. Computer Speech & Language 28 5 (2014) 1117\u20131138.","DOI":"10.1016\/j.csl.2014.03.003"},{"key":"e_1_3_3_2_27_2","doi-asserted-by":"crossref","unstructured":"Moataz El\u00a0Ayadi Mohamed\u00a0S Kamel and Fakhri Karray. 2011. Survey on speech emotion recognition: Features classification schemes and databases. Pattern recognition 44 3 (2011) 572\u2013587.","DOI":"10.1016\/j.patcog.2010.09.020"},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10229085"},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671470"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713359"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/BHI62660.2024.10913781"},{"key":"e_1_3_3_2_32_2","unstructured":"Federal Communications Commission (FCC). 2021. RF Safety Guidelines. [Online]. https:\/\/www.fcc.gov\/general\/radio-frequency-safety-0."},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"crossref","unstructured":"Guy\u00a0William Fincham Clara Strauss Jesus Montero-Marin and Kate Cavanagh. 2023. Effect of breathwork on stress and mental health: A meta-analysis of randomised-controlled trials. Scientific Reports 13 1 (2023) 432.","DOI":"10.1038\/s41598-022-27247-y"},{"key":"e_1_3_3_2_34_2","unstructured":"Yaroslav Ganin Evgeniya Ustinova Hana Ajakan Pascal Germain Hugo Larochelle Fran\u00e7ois Laviolette Mario March and Victor Lempitsky. 2016. Domain-adversarial training of neural networks. Journal of machine learning research (JMLR) 17 59 (2016) 1\u201335."},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952261"},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"crossref","unstructured":"Swapna\u00a0Mol George and P\u00a0Muhamed Ilyas. 2024. A review on speech emotion recognition: A survey recent advances challenges and the influence of noise. Neurocomputing 568 (2024) 127015.","DOI":"10.1016\/j.neucom.2023.127015"},{"key":"e_1_3_3_2_37_2","unstructured":"Google. 2017. Webrtc-vad. [Online]. https:\/\/webrtc.org\/."},{"key":"e_1_3_3_2_38_2","unstructured":"Google. 2021. ok-google.io. [Online]. https:\/\/ok-google.io."},{"key":"e_1_3_3_2_39_2","unstructured":"Google. 2025. Speech-to-Text. [Online]. https:\/\/cloud.google.com\/speech-to-text."},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"crossref","unstructured":"Feiyu Han Panlong Yang You Zuo Fei Shang Fenglei Xu and Xiang-Yang Li. 2024. Earspeech: Exploring in-ear occlusion effect on earphones for data-efficient airborne speech enhancement. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies (IMWUT) 8 3 (2024) 1\u201330.","DOI":"10.1145\/3678594"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"crossref","unstructured":"Feiyu Han You Zuo Weiwei Jiang Dawei Yan Yuxin Zhao Panlong Yang and Yubo Yan. 2025. EAROE: Enabling Body-Channel Voice Interaction Interface on Earphones via Occlusion Effect. IEEE Internet of Things Journal (IoTJ) (2025).","DOI":"10.1109\/JIOT.2025.3529912"},{"key":"e_1_3_3_2_42_2","unstructured":"Hardso. 2025. AIBI Pocket. [Online]. https:\/\/www.hardso.com\/product\/2fea3b01-c2a1-4050-8e7e-f9d62f88de88."},{"key":"e_1_3_3_2_43_2","unstructured":"Hardso. 2025. PieX Pendant. [Online]. https:\/\/www.hardso.com\/product\/ea05912b-a7fc-4bd5-aee4-f43f8ac4d200."},{"key":"e_1_3_3_2_44_2","doi-asserted-by":"publisher","DOI":"10.1145\/3636534.3690658"},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.1145\/3680207.3765237"},{"key":"e_1_3_3_2_46_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952132"},{"key":"e_1_3_3_2_47_2","unstructured":"Geoffrey Hinton Oriol Vinyals and Jeff Dean. 2015. Distilling the knowledge in a neural network. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1503.02531 (2015)."},{"key":"e_1_3_3_2_48_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"crossref","unstructured":"Jiaxiong Hu Yun Huang Xiaozhu Hu and Yingqing Xu. 2022. The acoustically emotion-aware conversational agent with speech emotion recognition and empathetic responses. IEEE Transactions on Affective Computing 14 1 (2022) 17\u201330.","DOI":"10.1109\/TAFFC.2022.3205919"},{"key":"e_1_3_3_2_50_2","unstructured":"Infineon. 2020. Radar Development Kit. [Online]. https:\/\/www.infineon.com\/cms\/en\/design-support\/tools\/sdk\/radar-development-kit\/."},{"key":"e_1_3_3_2_51_2","unstructured":"Infineon. 2023. bgt60tr13c. [Online]. https:\/\/www.infineon.com\/cms\/en\/product\/sensor\/radar-sensors\/radar-sensors-for-iot\/60ghz-radar\/bgt60tr13c."},{"key":"e_1_3_3_2_52_2","unstructured":"Infineon. 2023. bgt60utr11aip. [Online]. https:\/\/www.infineon.com\/cms\/en\/product\/sensor\/radar-sensors\/radar-sensors-for-iot\/60ghz-radar\/bgt60utr11aip\/."},{"key":"e_1_3_3_2_53_2","unstructured":"Texas Instruments. 2020. IWR6843 intelligent mmWave sensor standard antenna plug-in module. [Online]. https:\/\/www.ti.com\/tool\/IWR6843ISK."},{"key":"e_1_3_3_2_54_2","unstructured":"Texas Instruments. 2024. IWR6843. [Online]. https:\/\/www.ti.com\/product\/IWR6843##order-quality."},{"key":"e_1_3_3_2_55_2","unstructured":"International Commission on Non-Ionizing Radiation Protection (ICNIRP). 2020. Guidelines for Limiting Exposure to Electromagnetic Fields (100 kHz to 300 GHz). [Online]. https:\/\/www.icnirp.org\/cms\/upload\/publications."},{"key":"e_1_3_3_2_56_2","unstructured":"Philip Jackson and SJUoSG Haq. 2014. Surrey audio-visual expressed emotion (savee) database. University of Surrey: Guildford UK (2014)."},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"publisher","DOI":"10.1109\/CSPA.2011.5759912"},{"key":"e_1_3_3_2_58_2","doi-asserted-by":"crossref","unstructured":"Samuel Kakuba and Dong\u00a0Seog Han. 2025. Addressing data scarcity in speech emotion recognition: A comprehensive review. ICT Express 11 1 (2025) 110\u2013123.","DOI":"10.1016\/j.icte.2024.11.003"},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/3399715.3399928"},{"key":"e_1_3_3_2_60_2","doi-asserted-by":"crossref","unstructured":"Adi Lausen and Kurt Hammerschmidt. 2020. Emotion recognition and confidence ratings predicted by vocal stimulus type and prosodic parameters. Humanities and Social Sciences Communications 7 1 (2020) 1\u201317.","DOI":"10.1057\/s41599-020-0499-z"},{"key":"e_1_3_3_2_61_2","unstructured":"Cheng Li Jindong Wang Yixuan Zhang Kaijie Zhu Wenxin Hou Jianxun Lian Fang Luo Qiang Yang and Xing Xie. 2023. Large language models understand and can be enhanced by emotional stimuli. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2307.11760 (2023)."},{"key":"e_1_3_3_2_62_2","unstructured":"Haitao Li Qian Dong Junjie Chen Huixue Su Yujia Zhou Qingyao Ai Ziyi Ye and Yiqun Liu. 2024. Llms-as-judges: a comprehensive survey on llm-based evaluation methods. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.05579 (2024)."},{"key":"e_1_3_3_2_63_2","unstructured":"Yuanchun Li Hao Wen Weijun Wang Xiangyu Li Yizhen Yuan Guohong Liu Jiacheng Liu Wenxing Xu Xiang Wang Yi Sun et\u00a0al. 2024. Personal llm agents: Insights and survey about the capability efficiency and security. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2401.05459 (2024)."},{"key":"e_1_3_3_2_64_2","unstructured":"Zaijing Li Gongwei Chen Rui Shao Yuquan Xie Dongmei Jiang and Liqiang Nie. 2024. Enhancing emotional generation capability of large language models via emotional chain-of-thought. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2401.06836 (2024)."},{"key":"e_1_3_3_2_65_2","volume-title":"Forty-second International Conference on Machine Learning (ICML)","author":"Lian Zheng","unstructured":"Zheng Lian, Haoyu Chen, Lan Chen, Haiyang Sun, Licai Sun, Yong Ren, Zebang Cheng, Bin Liu, Rui Liu, Xiaojiang Peng, et\u00a0al. [n. d.]. AffectGPT: A New Dataset, Model, and Benchmark for Emotion Understanding with Multimodal Large Language Models. In Forty-second International Conference on Machine Learning (ICML)."},{"key":"e_1_3_3_2_66_2","unstructured":"Yu-Xiang Lin Chih-Kai Yang Wei-Chih Chen Chen-An Li Chien-yu Huang Xuanjun Chen and Hung-yi Lee. 2025. A preliminary exploration with gpt-4o voice mode. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.09940 (2025)."},{"key":"e_1_3_3_2_67_2","doi-asserted-by":"publisher","DOI":"10.1145\/3485730.3485945"},{"key":"e_1_3_3_2_68_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606775"},{"key":"e_1_3_3_2_69_2","doi-asserted-by":"crossref","unstructured":"Steven\u00a0R Livingstone and Frank\u00a0A Russo. 2018. The Ryerson Audio-Visual Database of Emotional Speech and Song (RAVDESS): A dynamic multimodal set of facial and vocal expressions in North American English. PloS one 13 5 (2018) e0196391.","DOI":"10.1371\/journal.pone.0196391"},{"key":"e_1_3_3_2_70_2","doi-asserted-by":"crossref","unstructured":"Andrey Lovakov and Elena\u00a0R Agadullina. 2021. Empirically derived guidelines for effect size interpretation in social psychology. European Journal of Social Psychology 51 3 (2021) 485\u2013504.","DOI":"10.1002\/ejsp.2752"},{"key":"e_1_3_3_2_71_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651093"},{"key":"e_1_3_3_2_72_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.931"},{"key":"e_1_3_3_2_73_2","doi-asserted-by":"crossref","unstructured":"Brian McFee Justin Salamon and Juan\u00a0Pablo Bello. 2018. Adaptive pooling operators for weakly labeled sound event detection. IEEE\/ACM Transactions on Audio Speech and Language Processing (TASLP) 26 11 (2018) 2180\u20132193.","DOI":"10.1109\/TASLP.2018.2858559"},{"key":"e_1_3_3_2_74_2","doi-asserted-by":"crossref","unstructured":"Chengzhen Meng Yifan Duan Chenming He Dequan Wang Xiaoran Fan and Yanyong Zhang. 2024. mmPlace: Robust Place Recognition With Intermediate Frequency Signal of Low-Cost Single-Chip Millimeter Wave Radar. IEEE Robotics and Automation Letters (RAL) 9 6 (2024) 4878\u20134885.","DOI":"10.1109\/LRA.2024.3377562"},{"key":"e_1_3_3_2_75_2","doi-asserted-by":"crossref","unstructured":"Chengzhen Meng Chenming He Dequan Wang Yuxuan Xiao Lingyu Wang Xiaoran Fan Lu Zhang and Yanyong Zhang. 2025. Gr-fall: A fall detection system with gait recognition for indoor environments using siso mmwave radar. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies (IMWUT) 9 3 (2025) 1\u201326.","DOI":"10.1145\/3749471"},{"key":"e_1_3_3_2_76_2","unstructured":"Meta AI. 2024. Llama 3.1. [Online]. https:\/\/ai.meta.com\/blog\/meta-llama-3-1\/."},{"key":"e_1_3_3_2_77_2","unstructured":"ICLEGEND MICRO. 2024. 24GHz mmWave Sensor SoC. [Online]. https:\/\/www.iclegend.com\/zh-hans\/product\/category\/Sensor."},{"key":"e_1_3_3_2_78_2","unstructured":"NOVELIC. 2025. A Whole-Cabin Solution for Vehicle Safety and Comfort. [Online]. https:\/\/www.novelic.com\/acam-automotive-in-cabin-monitoring-radar\/."},{"key":"e_1_3_3_2_79_2","unstructured":"OpenAI. 2024. GPT-4o. [Online]. https:\/\/openai.com\/index\/hello-gpt-4o\/."},{"key":"e_1_3_3_2_80_2","unstructured":"OpenAI. 2024. GPT-4o Audio Preview. [Online]. https:\/\/platform.openai.com\/docs\/models\/gpt-4o-audio-preview."},{"key":"e_1_3_3_2_81_2","unstructured":"OpenAI. 2024. Introducing Our Next-Generation Audio Models. [Online]. https:\/\/openai.com\/index\/introducing-our-next-generation-audio-models\/."},{"key":"e_1_3_3_2_82_2","unstructured":"OpenAI. 2025. GPT-4o-mini. [Online]. https:\/\/platform.openai.com\/docs\/models\/gpt-4o-mini."},{"key":"e_1_3_3_2_83_2","unstructured":"OpenAI. 2025. GPT-4o-mini-TTS. [Online]. https:\/\/platform.openai.com\/docs\/models\/gpt-4o-mini-tts."},{"key":"e_1_3_3_2_84_2","unstructured":"OpenAI. 2025. GPT-4o-transcribe. [Online]. https:\/\/platform.openai.com\/docs\/models\/gpt-4o-transcribe."},{"key":"e_1_3_3_2_85_2","unstructured":"OpenAI. 2025. OpenAI Security and Privacy. [Online]. https:\/\/openai.com\/security-and-privacy\/?utm_source=chatgpt.com."},{"key":"e_1_3_3_2_86_2","volume-title":"Discrete-Time Signal Processing (3 ed.)","author":"Oppenheim Alan","year":"2013","unstructured":"Alan Oppenheim and Ronald Schafer. 2013. Discrete-Time Signal Processing (3 ed.). Pearson Deutschland."},{"key":"e_1_3_3_2_87_2","doi-asserted-by":"publisher","DOI":"10.1109\/SAS.2016.7479875"},{"key":"e_1_3_3_2_88_2","doi-asserted-by":"crossref","unstructured":"Muhammed\u00a0Zahid Ozturk Chenshu Wu Beibei Wang Min Wu and KJ\u00a0Ray Liu. 2023. Radio SES: mmWave-Based Audioradio Speech Enhancement and Separation System. IEEE\/ACM Transactions on Audio Speech and Language Processing (TASLP) 31 (2023) 1333\u20131347.","DOI":"10.1109\/TASLP.2023.3250846"},{"key":"e_1_3_3_2_89_2","doi-asserted-by":"crossref","unstructured":"Ashutosh Pandey and DeLiang Wang. 2019. A new framework for CNN-based speech enhancement in the time domain. IEEE\/ACM Transactions on Audio Speech and Language Processing (TASLP) 27 7 (2019) 1179\u20131188.","DOI":"10.1109\/TASLP.2019.2913512"},{"key":"e_1_3_3_2_90_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713726"},{"key":"e_1_3_3_2_91_2","doi-asserted-by":"publisher","DOI":"10.5555\/265013"},{"key":"e_1_3_3_2_92_2","volume-title":"The Thirteenth International Conference on Learning Representations (ICLR)","author":"Qi Zhenting","year":"2025","unstructured":"Zhenting Qi, Hongyin Luo, Xuliang Huang, Zhuokai Zhao, Yibo Jiang, Xiangjun Fan, Himabindu Lakkaraju, and James\u00a0R. Glass. 2025. Quantifying Generalization Complexity for Large Language Models. In The Thirteenth International Conference on Learning Representations (ICLR)."},{"key":"e_1_3_3_2_93_2","doi-asserted-by":"crossref","unstructured":"Maija Reblin and Bert\u00a0N Uchino. 2008. Social and emotional support and its implication for health. Current opinion in psychiatry 21 2 (2008) 201\u2013205.","DOI":"10.1097\/YCO.0b013e3282f3ad89"},{"key":"e_1_3_3_2_94_2","doi-asserted-by":"publisher","DOI":"10.1145\/3715014.3722082"},{"key":"e_1_3_3_2_95_2","unstructured":"Google Research. 2020. Soli Radar-based Perception and Interaction in Pixel 4. [Online]. https:\/\/research.google\/blog\/soli-radar-based-perception-and-interaction-in-pixel-4\/."},{"key":"e_1_3_3_2_96_2","unstructured":"RESEMBLE.AI. 2023. Introducing Resemble Enhance: Open Source Speech Super Resolution AI Model. [Online]. https:\/\/www.resemble.ai\/introducing-resemble-enhance\/."},{"key":"e_1_3_3_2_97_2","volume-title":"Fundamentals of Radar Signal Processing","author":"Richards Mark\u00a0A.","year":"2005","unstructured":"Mark\u00a0A. Richards. 2005. Fundamentals of Radar Signal Processing. McGraw-Hill."},{"key":"e_1_3_3_2_98_2","doi-asserted-by":"crossref","unstructured":"Chantel Ritter and Tara Vongpaisal. 2018. Multimodal and spectral degradation effects on speech and emotion recognition in adult listeners. Trends in Hearing 22 (2018).","DOI":"10.1177\/2331216518804966"},{"key":"e_1_3_3_2_99_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.326"},{"key":"e_1_3_3_2_100_2","unstructured":"Samsung. 2021. mmWave 5G: Past Present and Future. [Online]. https:\/\/www.samsung.com\/global\/business\/networks\/insights\/blog\/0218-mmwave-5g-past-present-and-future\/."},{"key":"e_1_3_3_2_101_2","doi-asserted-by":"crossref","unstructured":"Katja Schlegel Nils\u00a0R Sommer and Marcello Mortillaro. 2025. Large language models are proficient in solving and creating emotional intelligence tests. Communications Psychology 3 1 (2025) 80.","DOI":"10.1038\/s44271-025-00258-x"},{"key":"e_1_3_3_2_102_2","doi-asserted-by":"crossref","unstructured":"Katie Seaborn Norihisa\u00a0P Miyake Peter Pennefather and Mihoko Otake-Matsuura. 2021. Voice in human\u2013agent interaction: A survey. ACM Computing Surveys (CSUR) 54 4 (2021) 1\u201343.","DOI":"10.1145\/3386867"},{"key":"e_1_3_3_2_103_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1242"},{"key":"e_1_3_3_2_104_2","first-page":"37","volume-title":"Psychology of learning and motivation","author":"Sweller John","year":"2011","unstructured":"John Sweller. 2011. Cognitive load theory. In Psychology of learning and motivation. Vol.\u00a055. 37\u201376."},{"key":"e_1_3_3_2_105_2","doi-asserted-by":"crossref","unstructured":"Maya Tamir. 2016. Why do people regulate their emotions? A taxonomy of motives in emotion regulation. Personality and social psychology review 20 3 (2016) 199\u2013222.","DOI":"10.1177\/1088868315586325"},{"key":"e_1_3_3_2_106_2","unstructured":"Gemini Team Rohan Anil Sebastian Borgeaud Jean-Baptiste Alayrac Jiahui Yu Radu Soricut Johan Schalkwyk Andrew\u00a0M Dai Anja Hauth Katie Millican et\u00a0al. 2023. Gemini: a family of highly capable multimodal models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.11805 (2023)."},{"key":"e_1_3_3_2_107_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445536"},{"key":"e_1_3_3_2_108_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.1070"},{"key":"e_1_3_3_2_109_2","doi-asserted-by":"publisher","DOI":"10.1145\/3772318.3790623"},{"key":"e_1_3_3_2_110_2","doi-asserted-by":"crossref","unstructured":"Dequan Wang Xinran Zhang Kai Wang Lingyu Wang Xiaoran Fan and Yanyong Zhang. 2024. Rdgait: A mmwave based gait user recognition system for complex indoor environments using single-chip radar. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies (IMWUT) 8 3 (2024) 1\u201331.","DOI":"10.1145\/3678552"},{"key":"e_1_3_3_2_111_2","doi-asserted-by":"crossref","unstructured":"Xuena Wang Xueting Li Zi Yin Yue Wu and Jia Liu. 2023. Emotional intelligence of large language models. Journal of Pacific Rim Psychology 17 (2023).","DOI":"10.1177\/18344909231213958"},{"key":"e_1_3_3_2_112_2","unstructured":"Jason Wei Yi Tay Rishi Bommasani Colin Raffel Barret Zoph Sebastian Borgeaud Dani Yogatama Maarten Bosma Denny Zhou Donald Metzler et\u00a0al. 2022. Emergent abilities of large language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2206.07682 (2022)."},{"key":"e_1_3_3_2_113_2","doi-asserted-by":"crossref","unstructured":"Jason Wei Xuezhi Wang Dale Schuurmans Maarten Bosma Fei Xia Ed Chi Quoc\u00a0V Le Denny Zhou et\u00a0al. 2022. Chain-of-thought prompting elicits reasoning in large language models. Advances in neural information processing systems 35 (2022) 24824\u201324837.","DOI":"10.52202\/068431-1800"},{"key":"e_1_3_3_2_114_2","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2022\/320"},{"key":"e_1_3_3_2_115_2","unstructured":"Wikipedia. 2024. Voice frequency. [Online]. https:\/\/en.wikipedia.org\/wiki\/Voice_frequency."},{"key":"e_1_3_3_2_116_2","unstructured":"Wikipedia. 2025. Tukey window (cosine-tapered window). [Online]. https:\/\/en.wikipedia.org\/wiki\/Window_function."},{"key":"e_1_3_3_2_117_2","doi-asserted-by":"crossref","unstructured":"Mingyang Wu and DeLiang Wang. 2006. A two-stage algorithm for one-microphone reverberant speech enhancement. IEEE Transactions on Audio Speech and Language Processing (TASLP) 14 3 (2006) 774\u2013784.","DOI":"10.1109\/TSA.2005.858066"},{"key":"e_1_3_3_2_118_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-naacl.117"},{"key":"e_1_3_3_2_119_2","doi-asserted-by":"publisher","DOI":"10.1109\/PIC.2018.8706134"},{"key":"e_1_3_3_2_120_2","doi-asserted-by":"publisher","DOI":"10.1145\/3307334.3326073"},{"key":"e_1_3_3_2_121_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458864.3467679"},{"key":"e_1_3_3_2_122_2","doi-asserted-by":"crossref","unstructured":"Huanpu Yin Shuhui Yu Yingshuo Zhang Anfu Zhou Xin Wang Liang Liu Huadong Ma Jianhua Liu and Ning Yang. 2022. Let iot know you better: User identification and emotion recognition through millimeter-wave sensing. IEEE Internet of Things Journal (IoTJ) 10 2 (2022) 1149\u20131161.","DOI":"10.1109\/JIOT.2022.3204779"},{"key":"e_1_3_3_2_123_2","volume-title":"The blizzard challenge 2008 workshop","author":"Zhang JTFLM","year":"2008","unstructured":"JTFLM Zhang and Huibin Jia. 2008. Design of speech corpus for mandarin text to speech. In The blizzard challenge 2008 workshop."},{"key":"e_1_3_3_2_124_2","doi-asserted-by":"publisher","DOI":"10.1145\/3570361.3592515"},{"key":"e_1_3_3_2_125_2","doi-asserted-by":"publisher","DOI":"10.1145\/2973750.2973762"},{"key":"e_1_3_3_2_126_2","doi-asserted-by":"crossref","unstructured":"Running Zhao Jiangtao Yu Hang Zhao and Edith\u00a0CH Ngai. 2023. Radio2Text: Streaming Speech Recognition Using mmWave Radio Signals. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies (IMWUT) 7 3 (2023) 1\u201328.","DOI":"10.1145\/3610873"},{"key":"e_1_3_3_2_127_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2472"}],"event":{"name":"CHI 2026: CHI Conference on Human Factors in Computing Systems","location":"Barcelona Spain","acronym":"CHI '26","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3772318.3790631","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T11:18:42Z","timestamp":1781003922000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3772318.3790631"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4,13]]},"references-count":126,"alternative-id":["10.1145\/3772318.3790631","10.1145\/3772318"],"URL":"https:\/\/doi.org\/10.1145\/3772318.3790631","relation":{},"subject":[],"published":{"date-parts":[[2026,4,13]]},"assertion":[{"value":"2026-04-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}