{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,4]],"date-time":"2026-07-04T16:21:56Z","timestamp":1783182116254,"version":"3.54.6"},"publisher-location":"New York, NY, USA","reference-count":202,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T00:00:00Z","timestamp":1745539200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100000923","name":"Australian Research Council","doi-asserted-by":"publisher","award":["DP190102068, DP200102612, LP210200656"],"award-info":[{"award-number":["DP190102068, DP200102612, LP210200656"]}],"id":[{"id":"10.13039\/501100000923","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Core Industry IT Convergence Program, facilitated by the Ministry of Trade, Industry & Energy (MOTIE, Korea).","award":["20016243"],"award-info":[{"award-number":["20016243"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,4,26]]},"DOI":"10.1145\/3706598.3714161","type":"proceedings-article","created":{"date-parts":[[2025,4,28]],"date-time":"2025-04-28T14:16:17Z","timestamp":1745849777000},"page":"1-31","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":18,"title":["Vision-Based Multimodal Interfaces: A Survey and Taxonomy for Enhanced Context-Aware System Design"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1315-8969","authenticated-orcid":false,"given":"Yongquan \u2018Owen\u2019","family":"Hu","sequence":"first","affiliation":[{"name":"School of Computer Science and Engineering, University of New South Wales, Sydney, Australia"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-8259-8531","authenticated-orcid":false,"given":"Jingyu","family":"Tang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-6414-9351","authenticated-orcid":false,"given":"Xinya","family":"Gong","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, Southern University of Science and Technology, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1363-7313","authenticated-orcid":false,"given":"Zhongyi","family":"Zhou","sequence":"additional","affiliation":[{"name":"The University of Tokyo, Tokyo, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4145-117X","authenticated-orcid":false,"given":"Shuning","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8013-5989","authenticated-orcid":false,"given":"Don Samitha","family":"Elvitigala","sequence":"additional","affiliation":[{"name":"Exertion Games Lab, Department of Human-Centred Computing, Monash University, Melbourne, Australia"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6472-3476","authenticated-orcid":false,"given":"Florian \u2018Floyd\u2019","family":"Mueller","sequence":"additional","affiliation":[{"name":"Exertion Games Lab, Department of Human-Centred Computing, Monash University, Melbourne, Australia"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4076-1811","authenticated-orcid":false,"given":"Wen","family":"Hu","sequence":"additional","affiliation":[{"name":"School of Computer Science and Engineering, University of New South Wales, Syndey, Australia"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5274-6889","authenticated-orcid":false,"given":"Aaron J.","family":"Quigley","sequence":"additional","affiliation":[{"name":"CSIRO's Data61, Sydney, Australia and University of New South Wales, Sydney, Australia"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2025,4,25]]},"reference":[{"key":"e_1_3_3_3_2_2","doi-asserted-by":"publisher","unstructured":"2009. The PRISMA Statement for Reporting Systematic Reviews and Meta-Analyses of Studies That Evaluate Health Care Interventions: Explanation and Elaboration. Annals of Internal Medicine 151 4 (2009) W\u201365\u2013W\u201394. 10.7326\/0003-4819-151-4-200908180-00136PMID: 19622512.","DOI":"10.7326\/0003-4819-151-4-200908180-00136"},{"key":"e_1_3_3_3_3_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCOINS.2018.8510584"},{"key":"e_1_3_3_3_4_2","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-48157-5_29"},{"key":"e_1_3_3_3_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445582"},{"key":"e_1_3_3_3_6_2","doi-asserted-by":"crossref","unstructured":"Sheeraz Athar Gaurav Patel Zhengtong Xu Qiang Qiu and Yu She. 2023. VisTac Toward a Unified Multimodal Sensing Finger for Robotic Manipulation. IEEE Sensors Journal 23 (2023) 25440\u201325450. https:\/\/api.semanticscholar.org\/CorpusID:261599688","DOI":"10.1109\/JSEN.2023.3310918"},{"key":"e_1_3_3_3_7_2","doi-asserted-by":"crossref","unstructured":"Tadas Baltru\u0161aitis Chaitanya Ahuja and Louis-Philippe Morency. 2018. Multimodal machine learning: A survey and taxonomy. IEEE transactions on pattern analysis and machine intelligence 41 2 (2018) 423\u2013443.","DOI":"10.1109\/TPAMI.2018.2798607"},{"key":"e_1_3_3_3_8_2","doi-asserted-by":"crossref","unstructured":"Kimin Ban and Eui\u00a0S Jung. 2020. Ear shape categorization for ergonomic product design. International Journal of Industrial Ergonomics 80 (2020) 102962.","DOI":"10.1016\/j.ergon.2020.102962"},{"key":"e_1_3_3_3_9_2","doi-asserted-by":"crossref","unstructured":"Hyuntae Bang Jiyoung Min and Haemin Jeon. 2021. Deep Learning-Based Concrete Surface Damage Monitoring Method Using Structured Lights and Depth Camera. Sensors (Basel Switzerland) 21 (2021). https:\/\/api.semanticscholar.org\/CorpusID:233396089","DOI":"10.3390\/s21082759"},{"key":"e_1_3_3_3_10_2","doi-asserted-by":"crossref","unstructured":"Abdelkareem Bedri Richard Li Malcolm Haynes Raj\u00a0Prateek Kosaraju Ishaan Grover Temiloluwa Prioleau Min\u00a0Yan Beh Mayank Goel Thad Starner and Gregory Abowd. 2017. EarBit: using wearable sensors to detect eating episodes in unconstrained environments. Proceedings of the ACM on interactive mobile wearable and ubiquitous technologies 1 3 (2017) 1\u201320.","DOI":"10.1145\/3130902"},{"key":"e_1_3_3_3_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/1449715.1449729"},{"key":"e_1_3_3_3_12_2","doi-asserted-by":"publisher","DOI":"10.1145\/3472749.3474775"},{"key":"e_1_3_3_3_13_2","doi-asserted-by":"crossref","unstructured":"Anuraag Bodi Samuel Berweger Raied Caromi Jihoon Bang Jelena Senic and Camillo Gentile. 2024. AI-Based Environment Segmentation Using a Context-Aware Channel Sounder. 2024 18th European Conference on Antennas and Propagation (EuCAP) (2024) 1\u20135. https:\/\/api.semanticscholar.org\/CorpusID:269389651","DOI":"10.23919\/EuCAP60739.2024.10501743"},{"key":"e_1_3_3_3_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3355355.3361885"},{"key":"e_1_3_3_3_15_2","doi-asserted-by":"crossref","unstructured":"Cristiana Bolchini Carlo\u00a0A Curino Elisa Quintarelli Fabio\u00a0A Schreiber and Letizia Tanca. 2007. A data-oriented survey of context models. ACM Sigmod Record 36 4 (2007) 19\u201326.","DOI":"10.1145\/1361348.1361353"},{"key":"e_1_3_3_3_16_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2004.314"},{"key":"e_1_3_3_3_17_2","doi-asserted-by":"crossref","unstructured":"Jacob Bouchard-Roy Aidin Delnavaz and J\u00e9r\u00e9mie Voix. 2020. In-ear energy harvesting: Evaluation of the power capability of the temporomandibular joint. IEEE Sensors Journal 20 12 (2020) 6338\u20136345.","DOI":"10.1109\/JSEN.2020.2976925"},{"key":"e_1_3_3_3_18_2","unstructured":"John Brooke. 2013. SUS: a retrospective. Journal of Usability Studies 8 (01 2013) 29\u201340."},{"key":"e_1_3_3_3_19_2","doi-asserted-by":"crossref","unstructured":"Qiong Cai Hao Wang Zhenmin Li and Xiao Liu. 2019. A survey on multimodal data-driven smart healthcare systems: approaches and applications. IEEE Access 7 (2019) 133583\u2013133599.","DOI":"10.1109\/ACCESS.2019.2941419"},{"key":"e_1_3_3_3_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642320"},{"key":"e_1_3_3_3_21_2","doi-asserted-by":"crossref","unstructured":"Yanpeng Cao Baobei Xu Zhangyu Ye Jiangxin Yang Yanlong Cao Christel-Lo\u00efc Tisse and Xin Li. 2018. Depth and thermal sensor fusion to enhance 3D thermographic reconstruction. Optics express 26 7 (2018) 8179\u20138193. https:\/\/api.semanticscholar.org\/CorpusID:25437618","DOI":"10.1364\/OE.26.008179"},{"key":"e_1_3_3_3_22_2","doi-asserted-by":"crossref","unstructured":"Nitesh\u00a0V Chawla Kevin\u00a0W Bowyer Lawrence\u00a0O Hall and W\u00a0Philip Kegelmeyer. 2002. SMOTE: synthetic minority over-sampling technique. Journal of artificial intelligence research 16 (2002) 321\u2013357.","DOI":"10.1613\/jair.953"},{"key":"e_1_3_3_3_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606832"},{"key":"e_1_3_3_3_24_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR58804.2024.00073"},{"key":"e_1_3_3_3_25_2","doi-asserted-by":"crossref","unstructured":"Tuochao Chen Yaxuan Li Songyun Tao Hyunchul Lim Mose Sakashita Ruidong Zhang Fran\u00e7ois Guimbreti\u00e8re and Cheng Zhang. 2021. NeckFace: Continuously Tracking Full Facial Expressions on Neck-mounted Wearables. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 5 (2021) 1 \u2013 31. https:\/\/api.semanticscholar.org\/CorpusID:235631104","DOI":"10.1145\/3463511"},{"key":"e_1_3_3_3_26_2","doi-asserted-by":"crossref","unstructured":"Xiaoming Chen Zeke\u00a0Zexi Hu Guangxin Zhao Haisheng Li Vera Chung and Aaron Quigley. 2024. Video2Haptics: Converting Video Motion to Dynamic Haptic Feedback with Bio-Inspired Event Processing. IEEE Transactions on Visualization and Computer Graphics (2024).","DOI":"10.1109\/TVCG.2024.3360468"},{"key":"e_1_3_3_3_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3472749.3474750"},{"key":"e_1_3_3_3_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3173576"},{"key":"e_1_3_3_3_29_2","doi-asserted-by":"crossref","unstructured":"Chieh Chou Haifeng Li and Dezhen Song. 2020. Encoder-Camera-Ground Penetrating Radar Sensor Fusion: Bimodal Calibration and Subsurface Mapping. IEEE Transactions on Robotics 37 (2020) 67\u201381. https:\/\/api.semanticscholar.org\/CorpusID:225506468","DOI":"10.1109\/TRO.2020.3010640"},{"key":"e_1_3_3_3_30_2","doi-asserted-by":"publisher","DOI":"10.5555\/2889933.2889935"},{"key":"e_1_3_3_3_31_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642579"},{"key":"e_1_3_3_3_32_2","doi-asserted-by":"crossref","unstructured":"Aidin Delnavaz and J\u00e9r\u00e9mie Voix. 2013. Piezo-earpiece for micro-power generation from ear canal dynamic motion. Journal of Micromechanics and microengineering 23 11 (2013) 114001.","DOI":"10.1088\/0960-1317\/23\/11\/114001"},{"key":"e_1_3_3_3_33_2","doi-asserted-by":"crossref","unstructured":"Pengchao Deng Chenyang Ge Hao Wei Yuan Sun and Xin Qiao. 2023. Attention-Aware Dual-Stream Network for Multimodal Face Anti-Spoofing. IEEE Transactions on Information Forensics and Security 18 (2023) 4258\u20134271. https:\/\/api.semanticscholar.org\/CorpusID:259612172","DOI":"10.1109\/TIFS.2023.3293423"},{"key":"e_1_3_3_3_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVIDL58838.2023.10166260"},{"key":"e_1_3_3_3_35_2","doi-asserted-by":"crossref","unstructured":"Anind\u00a0K Dey Gregory\u00a0D Abowd and Daniel Salber. 2001. A conceptual framework and a toolkit for supporting the rapid prototyping of context-aware applications. Human\u2013Computer Interaction 16 2-4 (2001) 97\u2013166.","DOI":"10.1207\/S15327051HCI16234_02"},{"key":"e_1_3_3_3_36_2","doi-asserted-by":"crossref","unstructured":"Anind\u00a0K Dey and Jennifer Mankoff. 2005. Designing mediation for context-aware applications. ACM Transactions on Computer-Human Interaction (TOCHI) 12 1 (2005) 53\u201380.","DOI":"10.1145\/1057237.1057241"},{"key":"e_1_3_3_3_37_2","volume-title":"Human-computer interaction","author":"Dix Alan","year":"2004","unstructured":"Alan Dix. 2004. Human-computer interaction. Vol.\u00a01. Pearson Education."},{"key":"e_1_3_3_3_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3472749.3474733"},{"key":"e_1_3_3_3_39_2","doi-asserted-by":"crossref","unstructured":"Messaoud Doudou Abdelmadjid Bouabdallah and V\u00e9ronique Berge-Cherfaoui. 2019. Driver Drowsiness Measurement Technologies: Current Research Market Solutions and Challenges. International Journal of Intelligent Transportation Systems Research 18 (2019) 297 \u2013 319. https:\/\/api.semanticscholar.org\/CorpusID:203081957","DOI":"10.1007\/s13177-019-00199-w"},{"key":"e_1_3_3_3_40_2","doi-asserted-by":"crossref","unstructured":"Paul Dourish. 2004. What we talk about when we talk about context. Personal and ubiquitous computing 8 (2004) 19\u201330.","DOI":"10.1007\/s00779-003-0253-8"},{"key":"e_1_3_3_3_41_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-00437-7_1"},{"key":"e_1_3_3_3_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606738"},{"key":"e_1_3_3_3_43_2","doi-asserted-by":"crossref","unstructured":"Zachary Englhardt Chengqian Ma Margaret\u00a0E. Morris Chun-Cheng Chang Xuhai\u00a0Orson Xu Lianhui Qin Daniel McDuff Xin Liu Shwetak\u00a0N. Patel and Vikram Iyer. 2023. From Classification to Clinical Insights. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 (2023) 1 \u2013 25. https:\/\/api.semanticscholar.org\/CorpusID:265351685","DOI":"10.1145\/3659604"},{"key":"e_1_3_3_3_44_2","doi-asserted-by":"crossref","unstructured":"Eva Eriksson Thomas\u00a0Riisgaard Hansen and Andreas Lykke-Olesen. 2007. Movement-based interaction in camera spaces: a conceptual framework. Personal and Ubiquitous Computing 11 (2007) 621\u2013632.","DOI":"10.1007\/s00779-006-0134-z"},{"key":"e_1_3_3_3_45_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642129"},{"key":"e_1_3_3_3_46_2","doi-asserted-by":"publisher","DOI":"10.1145\/3279778.3279794"},{"key":"e_1_3_3_3_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300464"},{"key":"e_1_3_3_3_48_2","doi-asserted-by":"publisher","DOI":"10.1145\/2380296.2380338"},{"key":"e_1_3_3_3_49_2","doi-asserted-by":"crossref","unstructured":"Fang Fu and Yan Luximon. 2020. A systematic review on ear anthropometry and its industrial design applications. Human Factors and Ergonomics in Manufacturing & Service Industries 30 3 (2020) 176\u2013194.","DOI":"10.1002\/hfm.20832"},{"key":"e_1_3_3_3_50_2","doi-asserted-by":"publisher","DOI":"10.1145\/3532719.3543245"},{"key":"e_1_3_3_3_51_2","doi-asserted-by":"publisher","DOI":"10.5555\/1733343.1733606"},{"key":"e_1_3_3_3_52_2","doi-asserted-by":"crossref","unstructured":"Jens Grubert Tobias Langlotz Stefanie Zollmann and Holger Regenbrecht. 2017. Towards Pervasive Augmented Reality: Context-Awareness in Augmented Reality. IEEE Transactions on Visualization and Computer Graphics 23 (2017) 1706\u20131724. https:\/\/api.semanticscholar.org\/CorpusID:2560516","DOI":"10.1109\/TVCG.2016.2543720"},{"key":"e_1_3_3_3_53_2","doi-asserted-by":"publisher","DOI":"10.1145\/3399715.3399838"},{"key":"e_1_3_3_3_54_2","doi-asserted-by":"publisher","DOI":"10.1145\/3610549.3614596"},{"key":"e_1_3_3_3_55_2","first-page":"1903","volume-title":"31st USENIX Security Symposium (USENIX Security 22)","author":"Hallyburton R.\u00a0Spencer","year":"2022","unstructured":"R.\u00a0Spencer Hallyburton, Yupei Liu, Yulong Cao, Z.\u00a0Morley Mao, and Miroslav Pajic. 2022. Security Analysis of Camera-LiDAR Fusion Against Black-Box Attacks on Autonomous Vehicles. In 31st USENIX Security Symposium (USENIX Security 22). USENIX Association, Boston, MA, 1903\u20131920. https:\/\/www.usenix.org\/conference\/usenixsecurity22\/presentation\/hallyburton"},{"key":"e_1_3_3_3_56_2","doi-asserted-by":"crossref","unstructured":"Albert Haque Arnold Milstein and Li Fei-Fei. 2020. Illuminating the dark spaces of healthcare with ambient intelligence. Nature 585 7824 (2020) 193\u2013202.","DOI":"10.1038\/s41586-020-2669-y"},{"key":"e_1_3_3_3_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/1449715.1449761"},{"key":"e_1_3_3_3_58_2","doi-asserted-by":"publisher","unstructured":"Sandra\u00a0G. Hart. 2006. Nasa-Task Load Index (NASA-TLX); 20 Years Later. Proceedings of the Human Factors and Ergonomics Society Annual Meeting 50 9 (2006) 904\u2013908. 10.1177\/154193120605000909 arXiv:10.1177\/154193120605000909","DOI":"10.1177\/154193120605000909"},{"key":"e_1_3_3_3_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/313451.313476"},{"key":"e_1_3_3_3_60_2","doi-asserted-by":"publisher","DOI":"10.1109\/ACSAT.2012.37"},{"key":"e_1_3_3_3_61_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3650987"},{"key":"e_1_3_3_3_62_2","doi-asserted-by":"crossref","unstructured":"Haibo He and Edwardo\u00a0A Garcia. 2009. Learning from imbalanced data. IEEE Transactions on knowledge and data engineering 21 9 (2009) 1263\u20131284.","DOI":"10.1109\/TKDE.2008.239"},{"key":"e_1_3_3_3_63_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586182.3616646"},{"key":"e_1_3_3_3_64_2","doi-asserted-by":"crossref","unstructured":"Tom Heath Christian Bizer and J Hendler. 2011. Synthesis lectures on the Semantic Web: theory and technology. Linked data: Evolving the Web into a global data space 1 (2011) 1\u2013136.","DOI":"10.1007\/978-3-031-79432-2_1"},{"key":"e_1_3_3_3_65_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3650760"},{"key":"e_1_3_3_3_66_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640471.3686646"},{"key":"e_1_3_3_3_67_2","unstructured":"Yongquan Hu Black Sun Pengcheng An Zhuying Li Wen Hu and Aaron\u00a0J Quigley. 2024. MultiSurf-GPT: Facilitating Context-Aware Reasoning with Large-Scale Language Models for Multimodal Surface Sensing. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2408.07311 (2024)."},{"key":"e_1_3_3_3_68_2","doi-asserted-by":"crossref","unstructured":"Yongquan Hu Hui-Shyong Yeo Mingyue Yuan Haoran Fan Don\u00a0Samitha Elvitigala Wen Hu and Aaron Quigley. 2023. Microcam: Leveraging smartphone microscope camera for context-aware contact surface sensing. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 7 3 (2023) 1\u201328.","DOI":"10.1145\/3610921"},{"key":"e_1_3_3_3_69_2","unstructured":"Yongquan Hu Mingyue Yuan Kaiqi Xian Don\u00a0Samitha Elvitigala and Aaron Quigley. 2023. Exploring the design space of employing ai-generated content for augmented reality display. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2303.16593 (2023)."},{"key":"e_1_3_3_3_70_2","doi-asserted-by":"publisher","DOI":"10.1145\/3675094.3678494"},{"key":"e_1_3_3_3_71_2","volume-title":"Vision-based interaction","author":"Hua Gang","year":"2022","unstructured":"Gang Hua and Matthew Turk. 2022. Vision-based interaction. Springer Nature."},{"key":"e_1_3_3_3_72_2","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2016.7590669"},{"key":"e_1_3_3_3_73_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651031"},{"key":"e_1_3_3_3_74_2","doi-asserted-by":"publisher","DOI":"10.1145\/3379337.3415856"},{"key":"e_1_3_3_3_75_2","doi-asserted-by":"publisher","DOI":"10.1145\/2801040.2801058"},{"key":"e_1_3_3_3_76_2","doi-asserted-by":"crossref","unstructured":"Suphanut Jamonnak Ye Zhao Xinyi Huang and Md. Amiruzzaman. 2021. Geo-Context Aware Study of Vision-Based Autonomous Driving Models and Spatial Video Data. IEEE Transactions on Visualization and Computer Graphics PP (2021) 1\u20131. https:\/\/api.semanticscholar.org\/CorpusID:237592808","DOI":"10.1109\/TVCG.2021.3114853"},{"key":"e_1_3_3_3_77_2","unstructured":"Mingyu Jin Qinkai Yu Dong Shu Chong Zhang Lizhou Fan Wenyue Hua Suiyuan Zhu Yanda Meng Zhenting Wang Mengnan Du and Yongfeng Zhang. 2024. Health-LLM: Personalized Retrieval-Augmented Disease Prediction System. arxiv:https:\/\/arXiv.org\/abs\/2402.00746\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2402.00746"},{"key":"e_1_3_3_3_78_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581395"},{"key":"e_1_3_3_3_79_2","doi-asserted-by":"crossref","unstructured":"Ankur Joshi Saket Kale Satish Chandel and D\u00a0Kumar Pal. 2015. Likert scale: Explored and explained. British journal of applied science & technology 7 4 (2015) 396\u2013403.","DOI":"10.9734\/BJAST\/2015\/14975"},{"key":"e_1_3_3_3_80_2","doi-asserted-by":"publisher","DOI":"10.1109\/PIMRC.2005.1651849"},{"key":"e_1_3_3_3_81_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458709.3458963"},{"key":"e_1_3_3_3_82_2","doi-asserted-by":"crossref","unstructured":"Mohammad Kianpisheh Alex Mariakakis and Khai\u2010Nghi Truong. 2024. exHAR: An Interface for Helping Non-Experts Develop and Debug Knowledge-based Human Activity Recognition Systems. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 1 (2024) 1 \u2013 30. https:\/\/api.semanticscholar.org\/CorpusID:268286108","DOI":"10.1145\/3643500"},{"key":"e_1_3_3_3_83_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642067"},{"key":"e_1_3_3_3_84_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580975"},{"key":"e_1_3_3_3_85_2","doi-asserted-by":"publisher","DOI":"10.1109\/MOBIQ.2004.1331713"},{"key":"e_1_3_3_3_86_2","doi-asserted-by":"publisher","DOI":"10.1145\/3462244.3479938"},{"key":"e_1_3_3_3_87_2","doi-asserted-by":"publisher","DOI":"10.1145\/3027063.3053088"},{"key":"e_1_3_3_3_88_2","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.1994.407586"},{"key":"e_1_3_3_3_89_2","doi-asserted-by":"crossref","unstructured":"Alexander Kunze Steve\u00a0J. Summerskill Russell Marshall and Ashleigh\u00a0J. Filtness. 2019. Automation transparency: implications of uncertainty communication for human-automation interaction and interfaces. Ergonomics 62 (2019) 345 \u2013 360. https:\/\/api.semanticscholar.org\/CorpusID:54507824","DOI":"10.1080\/00140139.2018.1547842"},{"key":"e_1_3_3_3_90_2","doi-asserted-by":"publisher","DOI":"10.1145\/2856767.2856812"},{"key":"e_1_3_3_3_91_2","doi-asserted-by":"publisher","DOI":"10.5555\/2889933.2889934"},{"key":"e_1_3_3_3_92_2","doi-asserted-by":"crossref","unstructured":"Jeungchan Lee Ishtiaq Mawla Jieun Kim Marco\u00a0L Loggia Ana Ortiz Changjin Jung Suk-Tak Chan Jessica Gerber Vincent\u00a0J Schmithorst Robert\u00a0R Edwards et\u00a0al. 2019. Machine learning\u2013based prediction of clinical pain using multimodal neuroimaging and autonomic metrics. pain 160 3 (2019) 550\u2013560.","DOI":"10.1097\/j.pain.0000000000001417"},{"key":"e_1_3_3_3_93_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642230"},{"key":"e_1_3_3_3_94_2","unstructured":"John\u00a0D Lee Dary Fiorentino Michelle\u00a0L Reyes Timothy\u00a0L Brown Omar Ahmad James Fell Nic Ward and Robert Dufour. 2010. Assessing the feasibility of vehicle-based sensors to detect alcohol impairment. Washington DC: National Highway Traffic Safety Administration 1 2 (2010) 7."},{"key":"e_1_3_3_3_95_2","doi-asserted-by":"crossref","unstructured":"Wonsup Lee Xiaopeng Yang Hayoung Jung Ilgeun Bok Chulwoo Kim Ochae Kwon and Heecheon You. 2018. Anthropometric analysis of 3D ear scans of Koreans and Caucasians for ear product design. Ergonomics 61 11 (2018) 1480\u20131495.","DOI":"10.1080\/00140139.2018.1493150"},{"key":"e_1_3_3_3_96_2","doi-asserted-by":"crossref","unstructured":"Shengyu Li Xingxing Li Shuolong Chen Yuxuan Zhou and Shiwen Wang. 2023. Two-Step LiDAR\/Camera\/IMU Spatial and Temporal Calibration Based on Continuous-Time Trajectory Estimation. IEEE Transactions on Industrial Electronics 71 (2023) 3182\u20133191. https:\/\/api.semanticscholar.org\/CorpusID:258452547","DOI":"10.1109\/TIE.2023.3270506"},{"key":"e_1_3_3_3_97_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376498"},{"key":"e_1_3_3_3_98_2","doi-asserted-by":"publisher","DOI":"10.1145\/3489849.3489887"},{"key":"e_1_3_3_3_99_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642399"},{"key":"e_1_3_3_3_100_2","doi-asserted-by":"crossref","unstructured":"Yuanfeng Lian Xu Shi ShaoChen Shen and Jing Hua. 2024. Multitask learning for image translation and salient object detection from multimodal remote sensing images. The Visual Computer 40 3 (2024) 1395\u20131414.","DOI":"10.1007\/s00371-023-02857-3"},{"key":"e_1_3_3_3_101_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445624"},{"key":"e_1_3_3_3_102_2","doi-asserted-by":"publisher","unstructured":"Haicheng Liao Huanming Shen Zhenning Li Chengyue Wang Guofa Li Yiming Bie and Chengzhong Xu. 2024. GPT-4 enhanced multimodal grounding for autonomous driving: Leveraging cross-modal attention with large language models. Communications in Transportation Research 4 (2024) 100116. 10.1016\/j.commtr.2023.100116","DOI":"10.1016\/j.commtr.2023.100116"},{"key":"e_1_3_3_3_103_2","doi-asserted-by":"publisher","DOI":"10.1145\/3643834.3661631"},{"key":"e_1_3_3_3_104_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642846"},{"key":"e_1_3_3_3_105_2","doi-asserted-by":"crossref","unstructured":"Qing Lin and Youngjoon Han. 2014. A Context-Aware-Based Audio Guidance System for Blind People Using a Multimodal Profile Model. Sensors (Basel Switzerland) 14 (2014) 18670 \u2013 18700. https:\/\/api.semanticscholar.org\/CorpusID:1897887","DOI":"10.3390\/s141018670"},{"key":"e_1_3_3_3_106_2","unstructured":"Zihan Lin Francisco Cruz and Eduardo\u00a0Benitez Sandoval. 2024. Self context-aware emotion perception on human-robot interaction. arxiv:https:\/\/arXiv.org\/abs\/2401.10946\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/2401.10946"},{"key":"e_1_3_3_3_107_2","unstructured":"Xubo Liu Qiushi Huang Xinhao Mei Haohe Liu Qiuqiang Kong Jianyuan Sun Shengchen Li Tom Ko Yu Zhang Lilian\u00a0H. Tang Mark\u00a0D. Plumbley Volkan K\u0131l\u0131\u00e7 and Wenwu Wang. 2023. Visually-Aware Audio Captioning With Adaptive Audio-Visual Attention. arxiv:https:\/\/arXiv.org\/abs\/2210.16428\u00a0[eess.AS] https:\/\/arxiv.org\/abs\/2210.16428"},{"key":"e_1_3_3_3_108_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612268"},{"key":"e_1_3_3_3_109_2","unstructured":"Camillo Lugaresi Jiuqiang Tang Hadon Nash Chris McClanahan Esha Uboweja Michael Hays Fan Zhang Chuo-Ling Chang Ming\u00a0Guang Yong Juhyun Lee et\u00a0al. 2019. Mediapipe: A framework for building perception pipelines. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1906.08172 (2019)."},{"key":"e_1_3_3_3_110_2","doi-asserted-by":"publisher","DOI":"10.5772\/7743"},{"key":"e_1_3_3_3_111_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCPS54341.2022.00013"},{"key":"e_1_3_3_3_112_2","doi-asserted-by":"publisher","DOI":"10.1145\/3472749.3474820"},{"key":"e_1_3_3_3_113_2","doi-asserted-by":"publisher","DOI":"10.1145\/3267305.3267687"},{"key":"e_1_3_3_3_114_2","unstructured":"Daniel McDuff Kael Rowan Piali Choudhury Jessica Wolk ThuVan Pham and Mary Czerwinski. 2019. A Multimodal Emotion Sensing Platform for Building Emotion-Aware Applications. arxiv:https:\/\/arXiv.org\/abs\/1903.12133\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/1903.12133"},{"key":"e_1_3_3_3_115_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00261"},{"key":"e_1_3_3_3_116_2","doi-asserted-by":"crossref","unstructured":"Johannes Meyer Adrian Frank Thomas Schlebusch and Enkelejda Kasneci. 2021. A CNN-based Human Activity Recognition System Combining a Laser Feedback Interferometry Eye Movement Sensor and an IMU for Context-aware Smart Glasses. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 5 4 (2021) 1 \u2013 24. https:\/\/api.semanticscholar.org\/CorpusID:245568506","DOI":"10.1145\/3494998"},{"key":"e_1_3_3_3_117_2","doi-asserted-by":"crossref","unstructured":"Johannes Meyer Adrian Frank Thomas Schlebusch and Enkelejda Kasneci. 2022. U-har: A convolutional approach to human activity recognition combining head and eye movements for context-aware smart glasses. Proceedings of the ACM on Human-Computer Interaction 6 ETRA (2022) 1\u201319. https:\/\/api.semanticscholar.org\/CorpusID:248753659","DOI":"10.1145\/3530884"},{"key":"e_1_3_3_3_118_2","doi-asserted-by":"publisher","DOI":"10.1145\/3341163.3347716"},{"key":"e_1_3_3_3_119_2","doi-asserted-by":"crossref","unstructured":"Trisha Mittal Aniket Bera and Dinesh Manocha. 2021. Multimodal and Context-Aware Emotion Perception Model With Multiplicative Fusion. IEEE MultiMedia 28 (2021) 67\u201375. https:\/\/api.semanticscholar.org\/CorpusID:234228590","DOI":"10.1109\/MMUL.2021.3068387"},{"key":"e_1_3_3_3_120_2","doi-asserted-by":"publisher","DOI":"10.1145\/3637989.3638004"},{"key":"e_1_3_3_3_121_2","doi-asserted-by":"crossref","unstructured":"Colver Ken\u00a0Howe Ne Jameel Muzaffar Aakash Amlani and Manohar Bance. 2021. Hearables in-ear sensing devices for bio-signal acquisition: a narrative review. Expert Review of Medical Devices 18 sup1 (2021) 95\u2013128.","DOI":"10.1080\/17434440.2021.2014321"},{"key":"e_1_3_3_3_122_2","doi-asserted-by":"crossref","unstructured":"Ilpo Niskanen Guoyong Duan Erik Vartiainen Matti Immonen Lauri\u00a0W. Hallman Juha Kostamovaara and Rauno Heikkil\u00e4. 2024. Enhancing point cloud data fusion through 2D thermal infrared camera and 2D lidar scanning. Infrared Physics & Technology (2024). https:\/\/api.semanticscholar.org\/CorpusID:271042263","DOI":"10.1016\/j.infrared.2024.105432"},{"key":"e_1_3_3_3_123_2","doi-asserted-by":"crossref","unstructured":"Mina Nouredanesh Alan Godfrey Dylan Powell and James Tung. 2022. Egocentric vision-based detection of surfaces: towards context-aware free-living digital biomarkers for gait and fall risk assessment. Journal of neuroengineering and rehabilitation 19 1 (2022) 79.","DOI":"10.1186\/s12984-022-01022-6"},{"key":"e_1_3_3_3_124_2","first-page":"286","volume-title":"Multimodal interfaces","author":"Oviatt Sharon","year":"2002","unstructured":"Sharon Oviatt. 2002. Multimodal interfaces. L. Erlbaum Associates Inc., USA, 286\u2013304."},{"key":"e_1_3_3_3_125_2","doi-asserted-by":"crossref","unstructured":"Jos\u00e9\u00a0Ram\u00f3n Padilla-L\u00f3pez Alexandros\u00a0Andre Chaaraoui and Francisco Fl\u00f3rez-Revuelta. 2015. Visual privacy protection methods: A survey. Expert Systems with Applications 42 9 (2015) 4177\u20134195.","DOI":"10.1016\/j.eswa.2015.01.041"},{"key":"e_1_3_3_3_126_2","unstructured":"Frederik Pahde Mihai Puscas Tassilo Klein and Moin Nabi. 2020. Multimodal Prototypical Networks for Few-shot Learning. arxiv:https:\/\/arXiv.org\/abs\/2011.08899\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2011.08899"},{"key":"e_1_3_3_3_127_2","doi-asserted-by":"publisher","DOI":"10.1145\/2305484.2305500"},{"key":"e_1_3_3_3_128_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISSNIP.2013.6529836"},{"key":"e_1_3_3_3_129_2","doi-asserted-by":"publisher","DOI":"10.1145\/3625468.3652193"},{"key":"e_1_3_3_3_130_2","doi-asserted-by":"crossref","unstructured":"Yogesh\u00a0Singh Rawat and M. Kankanhalli. 2017. ClickSmart: A Context-Aware Viewpoint Recommendation System for Mobile Photography. IEEE Transactions on Circuits and Systems for Video Technology 27 (2017) 149\u2013158. https:\/\/api.semanticscholar.org\/CorpusID:9415762","DOI":"10.1109\/TCSVT.2016.2555658"},{"key":"e_1_3_3_3_131_2","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-374825-6.00010-1"},{"key":"e_1_3_3_3_132_2","doi-asserted-by":"publisher","DOI":"10.2312\/pt.20011318"},{"key":"e_1_3_3_3_133_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580924"},{"key":"e_1_3_3_3_134_2","volume-title":"Colloque sur la multimodalit\u00e9","author":"Salber Daniel","year":"2000","unstructured":"Daniel Salber. 2000. Context-awareness and multimodality. In Colloque sur la multimodalit\u00e9."},{"key":"e_1_3_3_3_135_2","doi-asserted-by":"publisher","DOI":"10.1145\/3625468.3652201"},{"key":"e_1_3_3_3_136_2","doi-asserted-by":"publisher","DOI":"10.1109\/WMCSA.1994.16"},{"key":"e_1_3_3_3_137_2","doi-asserted-by":"crossref","unstructured":"Albrecht Schmidt. 2000. Implicit human computer interaction through context. Personal technologies 4 (2000) 191\u2013199.","DOI":"10.1007\/BF01324126"},{"key":"e_1_3_3_3_138_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411763.3451753"},{"key":"e_1_3_3_3_139_2","doi-asserted-by":"publisher","DOI":"10.1145\/3462244.3479879"},{"key":"e_1_3_3_3_140_2","doi-asserted-by":"publisher","DOI":"10.1109\/IST59124.2023.10355731"},{"key":"e_1_3_3_3_141_2","doi-asserted-by":"crossref","unstructured":"Omer\u00a0Berat Sezer Erdogan Dogdu and Ahmet\u00a0Murat Ozbayoglu. 2017. Context-aware computing learning and big data in internet of things: a survey. IEEE Internet of Things Journal 5 1 (2017) 1\u201327.","DOI":"10.1109\/JIOT.2017.2773600"},{"key":"e_1_3_3_3_142_2","doi-asserted-by":"crossref","unstructured":"Rajeev Sharma Vladimir\u00a0I Pavlovic and Thomas\u00a0S Huang. 1998. Toward multimodal human-computer interface. Proc. IEEE 86 5 (1998) 853\u2013869.","DOI":"10.1109\/5.664275"},{"key":"e_1_3_3_3_143_2","doi-asserted-by":"crossref","unstructured":"Mali Shen Yun Gu Ning Liu and Guang-Zhong Yang. 2019. Context-Aware Depth and Pose Estimation for Bronchoscopic Navigation. IEEE Robotics and Automation Letters 4 (2019) 732\u2013739. https:\/\/api.semanticscholar.org\/CorpusID:59619567","DOI":"10.1109\/LRA.2019.2893419"},{"key":"e_1_3_3_3_144_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642225"},{"key":"e_1_3_3_3_145_2","unstructured":"Jingyu Shi Rahul Jain Hyungjun Doh Ryo Suzuki and Karthik Ramani. 2024. An HCI-Centric Survey and Taxonomy of Human-Generative-AI Interactions. arxiv:https:\/\/arXiv.org\/abs\/2310.07127\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/2310.07127"},{"key":"e_1_3_3_3_146_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCIT.2007.142"},{"key":"e_1_3_3_3_147_2","doi-asserted-by":"publisher","DOI":"10.1145\/3570945.3607317"},{"key":"e_1_3_3_3_148_2","doi-asserted-by":"crossref","unstructured":"Muhammad\u00a0Hameed Siddiqi Nabil Almashfi Amjad Ali Madallah Alruwaili Yousef Alhwaiti Saad\u00a0Awadh Alanazi and M.\u00a0M. Kamruzzaman. 2021. A Unified Approach for Patient Activity Recognition in Healthcare Using Depth Camera. IEEE Access 9 (2021) 92300\u201392317. https:\/\/api.semanticscholar.org\/CorpusID:235780004","DOI":"10.1109\/ACCESS.2021.3092403"},{"key":"e_1_3_3_3_149_2","doi-asserted-by":"crossref","unstructured":"Amit\u00a0Kumar Sikder Leonardo Babun Z\u00a0Berkay Celik Hidayet Aksu Patrick McDaniel Engin Kirda and A\u00a0Selcuk Uluagac. 2022. Who\u2019s controlling my device? Multi-user multi-device-aware access control system for shared smart home environment. ACM Transactions on Internet of Things 3 4 (2022) 1\u201339.","DOI":"10.1145\/3543513"},{"key":"e_1_3_3_3_150_2","doi-asserted-by":"publisher","DOI":"10.1145\/3611659.3615687"},{"key":"e_1_3_3_3_151_2","doi-asserted-by":"crossref","unstructured":"Dimitrios-Emmanuel Spanos Periklis Stavrou Nikolas Mitrou and Nikolas Konstantinou. 2012. SensorStream: A semantic real\u2013time stream management system. International Journal of Ad Hoc and Ubiquitous Computing 11 2-3 (2012) 178\u2013193.","DOI":"10.1504\/IJAHUC.2012.050252"},{"key":"e_1_3_3_3_152_2","unstructured":"Thad Starner. 1995. Visual recognition of american sign language using hidden markov models. Ph.\u00a0D. Dissertation. Massachusetts Institute of Technology."},{"key":"e_1_3_3_3_153_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3650927"},{"key":"e_1_3_3_3_154_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642140"},{"key":"e_1_3_3_3_155_2","doi-asserted-by":"publisher","DOI":"10.1145\/3448018.3458011"},{"key":"e_1_3_3_3_156_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW60793.2023.00459"},{"key":"e_1_3_3_3_157_2","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413734"},{"key":"e_1_3_3_3_158_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300243"},{"key":"e_1_3_3_3_159_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3517719"},{"key":"e_1_3_3_3_160_2","doi-asserted-by":"publisher","DOI":"10.1109\/IIAI-AAI.2019.00035"},{"key":"e_1_3_3_3_161_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCSP60870.2024.10543666"},{"key":"e_1_3_3_3_162_2","unstructured":"Shengbang Tong Ellis Brown Penghao Wu Sanghyun Woo Manoj Middepogu Sai\u00a0Charitha Akula Jihan Yang Shusheng Yang Adithya Iyer Xichen Pan Austin Wang Rob Fergus Yann LeCun and Saining Xie. 2024. Cambrian-1: A Fully Open Vision-Centric Exploration of Multimodal LLMs. arxiv:https:\/\/arXiv.org\/abs\/2406.16860\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2406.16860"},{"key":"e_1_3_3_3_163_2","unstructured":"Hsin-Ruey Tsai Shih-Kang Chiu and Bryan Wang. 2024. GazeNoter: Co-Piloted AR Note-Taking via Gaze Selection of LLM Suggestions to Match Users\u2019 Intentions. arxiv:https:\/\/arXiv.org\/abs\/2407.01161\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/2407.01161"},{"key":"e_1_3_3_3_164_2","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN57019.2023.10309404"},{"key":"e_1_3_3_3_165_2","doi-asserted-by":"crossref","unstructured":"Chongyang Wang Yuan Feng Lin\u00a0Xiao Zhong Siyi Zhu Chi Zhang Siqi Zheng Chen Liang Yuntao Wang Chen-Jun He Chun Yu and Yuanchun Shi. 2023. UbiPhysio: Support Daily Functioning Fitness and Rehabilitation with Action Understanding and Feedback in Natural Language. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 (2023) 1 \u2013 27. https:\/\/api.semanticscholar.org\/CorpusID:261049773","DOI":"10.1145\/3643552"},{"key":"e_1_3_3_3_166_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642231"},{"key":"e_1_3_3_3_167_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642878"},{"key":"e_1_3_3_3_168_2","doi-asserted-by":"publisher","DOI":"10.1145\/3379337.3415815"},{"key":"e_1_3_3_3_169_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642092"},{"key":"e_1_3_3_3_170_2","doi-asserted-by":"publisher","DOI":"10.1109\/PERCOMW.2004.1276898"},{"key":"e_1_3_3_3_171_2","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475414"},{"key":"e_1_3_3_3_172_2","doi-asserted-by":"crossref","unstructured":"Zeyu Wang Yuanchun Shi Yuntao Wang Yuchen Yao Kun Yan Yuhan Wang Lei Ji Xuhai Xu and Chun Yu. 2024. G-VOILA: Gaze-Facilitated Information Querying in Daily Scenarios. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 (2024) 1 \u2013 33. https:\/\/api.semanticscholar.org\/CorpusID:269758074","DOI":"10.1145\/3659623"},{"key":"e_1_3_3_3_173_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642235"},{"key":"e_1_3_3_3_174_2","doi-asserted-by":"crossref","unstructured":"Mark Weiser. 1999. The computer for the 21st century. ACM SIGMOBILE mobile computing and communications review 3 3 (1999) 3\u201311.","DOI":"10.1145\/329124.329126"},{"key":"e_1_3_3_3_175_2","doi-asserted-by":"crossref","unstructured":"Mark Weiser and John\u00a0Seely Brown. 1996. Designing calm technology. PowerGrid Journal 1 1 (1996) 75\u201385.","DOI":"10.1007\/978-1-4612-0685-9_6"},{"key":"e_1_3_3_3_176_2","unstructured":"Linda\u00a0Yilin Wen Cecily Morrison Martin Grayson Rita\u00a0Faia Marques Daniela Massiceti Camilla Longden and Edward Cutrell. 2024. Find My Things: Personalized Accessibility through Teachable AI for People who are Blind or Low Vision. Extended Abstracts of the CHI Conference on Human Factors in Computing Systems (2024). https:\/\/api.semanticscholar.org\/CorpusID:269748025"},{"key":"e_1_3_3_3_177_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642876"},{"key":"e_1_3_3_3_178_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642358"},{"key":"e_1_3_3_3_179_2","doi-asserted-by":"publisher","DOI":"10.1145\/3532719.3543197"},{"key":"e_1_3_3_3_180_2","doi-asserted-by":"crossref","unstructured":"Xinyu Xie Xiaozhi Zhang Dongping Xiong and Lijun Ouyang. 2023. MFA-DAF: Unsupervised Multimodal Medical Image Fusion via Multiscale Fourier Attention and Detail-Aware Fusion Strategy. 2023 International Conference on Image Processing Computer Vision and Machine Learning (ICICML) (2023) 208\u2013214. https:\/\/api.semanticscholar.org\/CorpusID:267659859","DOI":"10.1109\/ICICML60161.2023.10424785"},{"key":"e_1_3_3_3_181_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642103"},{"key":"e_1_3_3_3_182_2","doi-asserted-by":"publisher","unstructured":"Xuhai Xu Bingsheng Yao Yuanzhe Dong Saadia Gabriel Hong Yu James Hendler Marzyeh Ghassemi Anind\u00a0K. Dey and Dakuo Wang. 2024. Mental-LLM: Leveraging Large Language Models for Mental Health Prediction via Online Text Data. Proc. ACM Interact. Mob. Wearable Ubiquitous Technol. 8 1 Article 31 (March 2024) 32\u00a0pages. 10.1145\/3643540","DOI":"10.1145\/3643540"},{"key":"e_1_3_3_3_183_2","volume-title":"British Machine Vision Conference","author":"Xu Yating","year":"2022","unstructured":"Yating Xu, Conghui Hu, and Gim\u00a0Hee Lee. 2022. Motion and Context-Aware Audio-Visual Conditioned Video Prediction. In British Machine Vision Conference. https:\/\/api.semanticscholar.org\/CorpusID:254536032"},{"key":"e_1_3_3_3_184_2","doi-asserted-by":"publisher","unstructured":"Zhenyu Xu Hailin Xu Zhouyang Lu Yingying Zhao Rui Zhu Yujiang Wang Mingzhi Dong Yuhu Chang Qin Lv Robert\u00a0P Dick et\u00a0al. 2024. Can Large Language Models Be Good Companions? An LLM-Based Eyewear System with Conversational Common Ground. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 2 Article 87 (May 2024) 41\u00a0pages. 10.1145\/3659600","DOI":"10.1145\/3659600"},{"key":"e_1_3_3_3_185_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3611765"},{"key":"e_1_3_3_3_186_2","doi-asserted-by":"publisher","DOI":"10.1145\/2380116.2380137"},{"key":"e_1_3_3_3_187_2","doi-asserted-by":"publisher","DOI":"10.1145\/3524273.3528189"},{"key":"e_1_3_3_3_188_2","doi-asserted-by":"publisher","DOI":"10.1145\/3098279.3098541"},{"key":"e_1_3_3_3_189_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642013"},{"key":"e_1_3_3_3_190_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR58804.2024.00090"},{"key":"e_1_3_3_3_191_2","doi-asserted-by":"crossref","unstructured":"Watcharaphong Yookwan Krisana Chinnasarn C. So-In and Paramate Horkaew. 2022. Multimodal Fusion of Deeply Inferred Point Clouds for 3D Scene Reconstruction Using Cross-Entropy ICP. IEEE Access 10 (2022) 77123\u201377136. https:\/\/api.semanticscholar.org\/CorpusID:250976713","DOI":"10.1109\/ACCESS.2022.3192869"},{"key":"e_1_3_3_3_192_2","doi-asserted-by":"crossref","unstructured":"Xenophon Zabulis Haris Baltzakis and Antonis\u00a0A Argyros. 2009. Vision-Based Hand Gesture Recognition for Human-Computer Interaction. The universal access handbook 34 (2009) 30.","DOI":"10.1201\/9781420064995-c34"},{"key":"e_1_3_3_3_193_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642426"},{"key":"e_1_3_3_3_194_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642647"},{"key":"e_1_3_3_3_195_2","doi-asserted-by":"crossref","unstructured":"Xiyuxing Zhang Yuntao Wang Yuxuan Han Chen Liang Ishan Chatterjee Jiankai Tang Xin Yi Shwetak Patel and Yuanchun Shi. 2024. The EarSAVAS Dataset: Enabling Subject-Aware Vocal Activity Sensing on Earables. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 8 2 (2024) 1\u201326.","DOI":"10.1145\/3659616"},{"key":"e_1_3_3_3_196_2","doi-asserted-by":"publisher","unstructured":"Fei Zhao Chengcui Zhang and Baocheng Geng. 2024. Deep Multimodal Data Fusion. ACM Comput. Surv. 56 9 Article 216 (April 2024) 36\u00a0pages. 10.1145\/3649447","DOI":"10.1145\/3649447"},{"key":"e_1_3_3_3_197_2","doi-asserted-by":"crossref","unstructured":"Nan Zhao Elena Kodama and Joseph\u00a0A. Paradiso. 2022. Mediated Atmosphere Table (MAT): Adaptive Multimodal Media System for Stress Restoration. IEEE Internet of Things Journal 9 (2022) 23614\u201323625. https:\/\/api.semanticscholar.org\/CorpusID:250564158","DOI":"10.1109\/JIOT.2022.3190929"},{"key":"e_1_3_3_3_198_2","doi-asserted-by":"crossref","unstructured":"Y. Zheng Yuejie Zhang Rui Feng Tao Zhang and Weiguo Fan. 2021. Stacked Multimodal Attention Network for Context-Aware Video Captioning. IEEE Transactions on Circuits and Systems for Video Technology 32 (2021) 31\u201342. https:\/\/api.semanticscholar.org\/CorpusID:236657677","DOI":"10.1109\/TCSVT.2021.3058626"},{"key":"e_1_3_3_3_199_2","doi-asserted-by":"crossref","unstructured":"Dingfu Zhou Xibin Song Jin Fang Yuchao Dai Hongdong Li and Liangjun Zhang. 2022. Context-Aware 3D Object Detection From a Single Image in Autonomous Driving. IEEE Transactions on Intelligent Transportation Systems 23 (2022) 18568\u201318580. https:\/\/api.semanticscholar.org\/CorpusID:247339223","DOI":"10.1109\/TITS.2022.3154022"},{"key":"e_1_3_3_3_200_2","unstructured":"Zhongyi Zhou Jing Jin Vrushank Phadnis Xiuxiu Yuan Jun Jiang Xun Qian Jingtao Zhou Yiyi Huang Zheng Xu Yinda Zhang et\u00a0al. 2023. InstructPipe: Building Visual Programming Pipelines with Human Instructions. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.09672 (2023)."},{"key":"e_1_3_3_3_201_2","doi-asserted-by":"publisher","DOI":"10.1145\/3526113.3545648"},{"key":"e_1_3_3_3_202_2","doi-asserted-by":"crossref","unstructured":"Rongrong Zhu Liang Shi Yunpeng Song and Zhongmin Cai. 2023. Integrating Gaze and Mouse Via Joint Cross-Attention Fusion Net for Students\u2019 Activity Recognition in E-learning. Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies 7 (2023) 1 \u2013 35. https:\/\/api.semanticscholar.org\/CorpusID:263153323","DOI":"10.1145\/3610876"},{"key":"e_1_3_3_3_203_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491101.3503552"}],"event":{"name":"CHI 2025: CHI Conference on Human Factors in Computing Systems","location":"Yokohama Japan","acronym":"CHI '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714161","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3706598.3714161","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T05:21:49Z","timestamp":1751606509000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714161"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,25]]},"references-count":202,"alternative-id":["10.1145\/3706598.3714161","10.1145\/3706598"],"URL":"https:\/\/doi.org\/10.1145\/3706598.3714161","relation":{},"subject":[],"published":{"date-parts":[[2025,4,25]]},"assertion":[{"value":"2025-04-25","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}