{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T15:39:54Z","timestamp":1775230794807,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":65,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T00:00:00Z","timestamp":1745539200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,4,26]]},"DOI":"10.1145\/3706598.3714310","type":"proceedings-article","created":{"date-parts":[[2025,4,24]],"date-time":"2025-04-24T04:45:58Z","timestamp":1745469958000},"page":"1-20","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Gesture and Audio-Haptic Guidance Techniques to Direct Conversations with Intelligent Voice Interfaces"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7645-4488","authenticated-orcid":false,"given":"Shwetha","family":"Rajaram","sequence":"first","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6616-2895","authenticated-orcid":false,"given":"Hemant Bhaskar","family":"Surale","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-4546-229X","authenticated-orcid":false,"given":"Codie","family":"McConkey","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7527-1479","authenticated-orcid":false,"given":"Carine","family":"Rognon","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Redmond, Washington, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-5627-5822","authenticated-orcid":false,"given":"Hrim","family":"Mehta","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7969-5025","authenticated-orcid":false,"given":"Michael","family":"Glueck","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4520-7000","authenticated-orcid":false,"given":"Christopher","family":"Collins","sequence":"additional","affiliation":[{"name":"Reality Labs Research, Meta, Toronto, Ontario, Canada"}]}],"member":"320","published-online":{"date-parts":[[2025,4,25]]},"reference":[{"key":"e_1_3_3_3_2_2","first-page":"1","volume-title":"Proc. of the 5th Int. Conf. on Conversational User Interfaces","author":"Aylett Matthew\u00a0Peter","year":"2023","unstructured":"Matthew\u00a0Peter Aylett and Marta Romeo. 2023. You don\u2019t need to speak, you need to liste: Robot interaction and human-like turn-taking. In Proc. of the 5th Int. Conf. on Conversational User Interfaces. 1\u20135."},{"key":"e_1_3_3_3_3_2","first-page":"13","volume-title":"Informatics","author":"Azofeifa Jose\u00a0Daniel","year":"2022","unstructured":"Jose\u00a0Daniel Azofeifa, Julieta Noguez, Sergio Ruiz, Jos\u00e9\u00a0Mart\u00edn Molina-Espinosa, Alejandra\u00a0J Magana, and Bedrich Benes. 2022. Systematic review of multimodal human-computer interaction. In Informatics , Vol.\u00a09. MDPI, 13."},{"key":"e_1_3_3_3_4_2","doi-asserted-by":"publisher","unstructured":"Alan Baddeley. 1992. Working memory. Science 255 5044 (1992) 556\u2013559. 10.1126\/science.1736359","DOI":"10.1126\/science.1736359"},{"key":"e_1_3_3_3_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3517638"},{"key":"e_1_3_3_3_6_2","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3531926"},{"key":"e_1_3_3_3_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/800250.807503"},{"key":"e_1_3_3_3_8_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642320"},{"key":"e_1_3_3_3_9_2","doi-asserted-by":"crossref","unstructured":"P.\u00a0A. Chandler and J. Sweller. 1992. The split-attention effect as a factor in the design of instruction. British Journal of Educational Psychology 62 (1992) 233\u2013246.","DOI":"10.1111\/j.2044-8279.1992.tb01017.x"},{"key":"e_1_3_3_3_10_2","doi-asserted-by":"crossref","unstructured":"Neila Chettaoui Ayman Atia and Med\u00a0Salim Bouhlel. 2022. Exploring the impact of interaction modality on students\u2019 learning performance. J. Educational Computing Research 60 1 (2022) 4\u201327.","DOI":"10.1177\/07356331211027297"},{"key":"e_1_3_3_3_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/266180.266328"},{"key":"e_1_3_3_3_12_2","doi-asserted-by":"publisher","DOI":"10.1145\/2207676.2208589"},{"key":"e_1_3_3_3_13_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-00437-7_1"},{"key":"e_1_3_3_3_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642491"},{"key":"e_1_3_3_3_15_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-39209-2_5"},{"key":"e_1_3_3_3_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3517684"},{"key":"e_1_3_3_3_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/1866029.1866036"},{"key":"e_1_3_3_3_18_2","doi-asserted-by":"publisher","unstructured":"Kate Hone Ub Ph Robert Graham and Alencon Link. 2000. Towards a tool for the subjective assessment of speech system interfaces (SASSI). Natural Language Engineering 6 (07 2000). 10.1017\/S1351324900002497","DOI":"10.1017\/S1351324900002497"},{"key":"e_1_3_3_3_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606737"},{"key":"e_1_3_3_3_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606713"},{"key":"e_1_3_3_3_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/1294211.1294256"},{"key":"e_1_3_3_3_22_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376863"},{"key":"e_1_3_3_3_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/3357251.3357581"},{"key":"e_1_3_3_3_24_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445094"},{"key":"e_1_3_3_3_25_2","doi-asserted-by":"publisher","unstructured":"Jung Kim Hyun Kim Boon\u00a0K. Tay Manivannan Muniyandi Joel Jordan Jesper Mortensen Manuel Oliveira Mel Slater and Mandayam\u00a0A. Srinivasan. 2004. Transatlantic Touch: A study of haptic collaboration over long distances. Presence Teleoperators Virtual Environ. 13 3 (2004) 328\u2013337. 10.1162\/1054746041422370","DOI":"10.1162\/1054746041422370"},{"key":"e_1_3_3_3_26_2","unstructured":"Tae\u00a0Soo Kim Arghya Sarkar Yoonjoo Lee Minsuk Chang and Juho Kim. 2023. LMCanvas: Object-oriented interaction to personalize large language mode-powered writing environments. arxiv:https:\/\/arXiv.org\/abs\/2303.15125\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/2303.15125"},{"key":"e_1_3_3_3_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640543.3645148"},{"key":"e_1_3_3_3_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3340555.3353727"},{"key":"e_1_3_3_3_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445312"},{"key":"e_1_3_3_3_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642230"},{"key":"e_1_3_3_3_31_2","volume-title":"Designing for People: An Introduction to Human Factors Engineering","author":"Lee John","year":"2017","unstructured":"John Lee, Christopher Wickens, Yili Liu, and Linda Boyle. 2017. Designing for People: An Introduction to Human Factors Engineering. CreateSpace. 159\u2013161 pages."},{"key":"e_1_3_3_3_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642068"},{"key":"e_1_3_3_3_33_2","doi-asserted-by":"publisher","DOI":"10.1145\/2858036.2858288"},{"key":"e_1_3_3_3_34_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642462"},{"key":"e_1_3_3_3_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/2470654.2466142"},{"key":"e_1_3_3_3_36_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISWC.2005.47"},{"key":"e_1_3_3_3_37_2","doi-asserted-by":"crossref","unstructured":"Anja\u00a0B Naumann Ina Wechsung and J\u00f6rn Hurtienne. 2010. Multimodal interaction: A suitable strategy for including older users? Interacting with Computers 22 6 (2010) 465\u2013474.","DOI":"10.1016\/j.intcom.2010.08.005"},{"key":"e_1_3_3_3_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/2858036.2858048"},{"key":"e_1_3_3_3_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3229434.3229463"},{"key":"e_1_3_3_3_40_2","doi-asserted-by":"crossref","unstructured":"Sharon Oviatt. 2003. User-centered modeling and evaluation of multimodal interfaces. Proc. of the IEEE 91 9 (2003) 1457\u20131468.","DOI":"10.1109\/JPROC.2003.817127"},{"key":"e_1_3_3_3_41_2","doi-asserted-by":"publisher","unstructured":"Sharon\u00a0L. Oviatt. 1999. Ten myths of multimodal interaction. Commun. ACM 42 11 (1999) 74\u201381. 10.1145\/319382.319398","DOI":"10.1145\/319382.319398"},{"key":"e_1_3_3_3_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/503376.503428"},{"key":"e_1_3_3_3_43_2","doi-asserted-by":"publisher","unstructured":"Peter Pirolli and Stuart Card. 1999. Information Foraging. Psychological Review 106 (10 1999) 643\u2013675. 10.1037\/0033-295X.106.4.643","DOI":"10.1037\/0033-295X.106.4.643"},{"key":"e_1_3_3_3_44_2","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3174214"},{"key":"e_1_3_3_3_45_2","volume-title":"The humane interface: New directions for designing interactive systems","author":"Raskin Jeff","year":"2000","unstructured":"Jeff Raskin. 2000. The humane interface: New directions for designing interactive systems. Addison-Wesley."},{"key":"e_1_3_3_3_46_2","doi-asserted-by":"publisher","DOI":"10.1145\/302979.303005"},{"key":"e_1_3_3_3_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/288392.288597"},{"key":"e_1_3_3_3_48_2","doi-asserted-by":"crossref","unstructured":"Raymond Scupin. 1997. The KJ Method: A technique for analyzing data derived from Japanese ethnology. Human Organization 56 2 (1997) 233\u2013237.","DOI":"10.17730\/humo.56.2.x335923511444655"},{"key":"e_1_3_3_3_49_2","doi-asserted-by":"crossref","unstructured":"Abigail\u00a0J Sellen Gordon\u00a0P Kurtenbach and William\u00a0AS Buxton. 1992. The prevention of mode errors through sensory feedback. Human-Computer Interaction 7 2 (1992) 141\u2013164.","DOI":"10.1207\/s15327051hci0702_1"},{"key":"e_1_3_3_3_50_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3501972"},{"key":"e_1_3_3_3_51_2","doi-asserted-by":"publisher","unstructured":"R. Sharma V.I. Pavlovic and T.S. Huang. 1998. Toward multimodal human-computer interface. Proc. of the IEEE 86 5 (1998) 853\u2013869. 10.1109\/5.664275","DOI":"10.1109\/5.664275"},{"key":"e_1_3_3_3_52_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642400"},{"key":"e_1_3_3_3_53_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606756"},{"key":"e_1_3_3_3_54_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300243"},{"key":"e_1_3_3_3_55_2","doi-asserted-by":"publisher","unstructured":"Hong\u00a0Z. Tan Seungmoon Choi Frances W.\u00a0Y. Lau and Freddy Abnousi. 2020. Methodology for maximizing information transmission of haptic devices: A survey. Proc. of the IEEE 108 6 (2020) 945\u2013965. 10.1109\/JPROC.2020.2992561","DOI":"10.1109\/JPROC.2020.2992561"},{"key":"e_1_3_3_3_56_2","doi-asserted-by":"publisher","unstructured":"Michael Terry Chinmay Kulkarni Martin Wattenberg Lucas Dixon and Meredith\u00a0Ringel Morris. 2023. AI alignment in the design of interactive AI: Specification alignment process alignment and evaluation support. CoRR abs\/2311.00710 (2023). 10.48550\/ARXIV.2311.00710 arXiv:https:\/\/arXiv.org\/abs\/2311.00710","DOI":"10.48550\/ARXIV.2311.00710"},{"key":"e_1_3_3_3_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3308561.3353773"},{"key":"e_1_3_3_3_58_2","doi-asserted-by":"publisher","unstructured":"Nina\u00a0Zhuxiaona Wei and James\u00a0A. Landay. 2018. Evaluating speech-based smart devices using new usability heuristics. IEEE Pervasive Comput. 17 2 (2018) 84\u201396. 10.1109\/MPRV.2018.022511249","DOI":"10.1109\/MPRV.2018.022511249"},{"key":"e_1_3_3_3_59_2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-1250"},{"key":"e_1_3_3_3_60_2","doi-asserted-by":"publisher","DOI":"10.1145\/3643834.3660691"},{"key":"e_1_3_3_3_61_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642735"},{"key":"e_1_3_3_3_62_2","doi-asserted-by":"publisher","DOI":"10.1145\/3332165.3347869"},{"key":"e_1_3_3_3_63_2","doi-asserted-by":"publisher","DOI":"10.1145\/2858036.2858082"},{"key":"e_1_3_3_3_64_2","doi-asserted-by":"publisher","DOI":"10.1145\/1240624.1240836"},{"key":"e_1_3_3_3_65_2","doi-asserted-by":"publisher","DOI":"10.1145\/3643834.3660683"},{"key":"e_1_3_3_3_66_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376233"}],"event":{"name":"CHI 2025: CHI Conference on Human Factors in Computing Systems","location":"Yokohama Japan","acronym":"CHI '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714310","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3706598.3714310","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T05:47:09Z","timestamp":1751608029000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714310"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,25]]},"references-count":65,"alternative-id":["10.1145\/3706598.3714310","10.1145\/3706598"],"URL":"https:\/\/doi.org\/10.1145\/3706598.3714310","relation":{},"subject":[],"published":{"date-parts":[[2025,4,25]]},"assertion":[{"value":"2025-04-25","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}