{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T07:58:06Z","timestamp":1776931086824,"version":"3.51.2"},"publisher-location":"New York, NY, USA","reference-count":66,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,10]]},"DOI":"10.1145\/3694907.3765913","type":"proceedings-article","created":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T10:20:37Z","timestamp":1761387637000},"page":"1-12","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["A Comparative Study of Speech-and-Pointing and Disocclusion Mini-Map Techniques for Object Selection in Virtual Reality"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7375-6525","authenticated-orcid":false,"given":"Junlong","family":"Chen","sequence":"first","affiliation":[{"name":"University of Cambridge, Cambridge, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3858-2961","authenticated-orcid":false,"given":"Jens","family":"Grubert","sequence":"additional","affiliation":[{"name":"Coburg University of Applied Sciences and Arts, Coburg, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7139-871X","authenticated-orcid":false,"given":"Per Ola","family":"Kristensson","sequence":"additional","affiliation":[{"name":"University of Cambridge, Cambridge, United Kingdom"}]}],"member":"320","published-online":{"date-parts":[[2025,11,9]]},"reference":[{"key":"e_1_3_3_3_2_2","doi-asserted-by":"crossref","unstructured":"Ferran Argelaguet and Carlos Andujar. 2013. A survey of 3D object selection techniques for virtual environments. Computers & Graphics 37 3 (2013) 121\u2013136.","DOI":"10.1016\/j.cag.2012.12.003"},{"key":"e_1_3_3_3_3_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300331"},{"key":"e_1_3_3_3_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445193"},{"key":"e_1_3_3_3_5_2","doi-asserted-by":"publisher","unstructured":"Richard\u00a0A. Bolt. 1980. \u201cPut-that-there\u201d: Voice and gesture at the graphics interface. SIGGRAPH Comput. Graph. 14 3 (July 1980) 262\u2013270. 10.1145\/965105.807503","DOI":"10.1145\/965105.807503"},{"key":"e_1_3_3_3_6_2","doi-asserted-by":"crossref","unstructured":"Doug\u00a0A Bowman and Larry\u00a0F Hodges. 1999. Formalizing the design evaluation and application of interaction techniques for immersive virtual environments. Journal of Visual Languages & Computing 10 1 (1999) 37\u201353.","DOI":"10.1006\/jvlc.1998.0111"},{"key":"e_1_3_3_3_7_2","unstructured":"John Brooke et\u00a0al. 1996. SUS-A quick and dirty usability scale. Usability evaluation in industry 189 194 (1996) 4\u20137."},{"key":"e_1_3_3_3_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDSCA53499.2021.9650256"},{"key":"e_1_3_3_3_9_2","doi-asserted-by":"publisher","DOI":"10.1109\/COLCOM.2006.361859"},{"key":"e_1_3_3_3_10_2","doi-asserted-by":"publisher","DOI":"10.1145\/3611659.3615693"},{"key":"e_1_3_3_3_11_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR59515.2025.00045"},{"key":"e_1_3_3_3_12_2","doi-asserted-by":"crossref","unstructured":"Jin Chen Zheng Liu Xu Huang Chenwang Wu Qi Liu Gangwei Jiang Yuanhao Pu Yuxuan Lei Xiaolong Chen Xingmei Wang et\u00a0al. 2024. When large language models meet personalization: Perspectives of challenges and opportunities. World Wide Web 27 4 (2024) 42.","DOI":"10.1007\/s11280-024-01276-1"},{"key":"e_1_3_3_3_13_2","unstructured":"Qian Chen Zhu Zhuo and Wen Wang. 2019. BERT for Joint Intent Classification and Slot Filling. arxiv:https:\/\/arXiv.org\/abs\/1902.10909\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/1902.10909"},{"key":"e_1_3_3_3_14_2","doi-asserted-by":"crossref","unstructured":"Leigh Clark Philip Doyle Diego Garaialde Emer Gilmartin Stephan Schl\u00f6gl Jens Edlund Matthew Aylett Jo\u00e3o Cabral Cosmin Munteanu Justin Edwards et\u00a0al. 2019. The state of speech in HCI: Trends themes and challenges. Interacting with computers 31 4 (2019) 349\u2013371.","DOI":"10.1093\/iwc\/iwz016"},{"key":"e_1_3_3_3_15_2","series-title":"(EGVE\u201905)","first-page":"201","volume-title":"Proceedings of the 11th Eurographics Conference on Virtual Environments","author":"Haan Gerwin de","year":"2005","unstructured":"Gerwin de Haan, Michal Koutek, and Frits\u00a0H. Post. 2005. IntenSelect: using dynamic object rating for assisting 3D object selection. In Proceedings of the 11th Eurographics Conference on Virtual Environments (Aalborg, Denmark) (EGVE\u201905). Eurographics Association, Goslar, DEU, 201\u2013209."},{"key":"e_1_3_3_3_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642579"},{"key":"e_1_3_3_3_17_2","unstructured":"Jacob Devlin Ming-Wei Chang Kenton Lee and Kristina Toutanova. 2018. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1810.04805 (2018)."},{"key":"e_1_3_3_3_18_2","doi-asserted-by":"publisher","DOI":"10.1145\/3611659.3615716"},{"key":"e_1_3_3_3_19_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR58804.2024.00078"},{"key":"e_1_3_3_3_20_2","doi-asserted-by":"crossref","unstructured":"Emanuela Guglielmi Giovanni Rosa Simone Scalabrino Gabriele Bavota and Rocco Oliveto. 2024. Help Them Understand: Testing and Improving Voice User Interfaces. ACM Transactions on Software Engineering and Methodology 33 6 (2024) 1\u201333.","DOI":"10.1145\/3654438"},{"key":"e_1_3_3_3_21_2","doi-asserted-by":"publisher","DOI":"10.1016\/S0166-4115(08)62386-9"},{"key":"e_1_3_3_3_22_2","doi-asserted-by":"publisher","unstructured":"Yahya Hmaiti Mykola Maslych Amirpouya Ghasemaghaei Ryan\u00a0K Ghamandi and Joseph\u00a0J. LaViola. 2024. Visual Perceptual Confidence: Exploring Discrepancies Between Self-reported and Actual Distance Perception In Virtual Reality. IEEE Transactions on Visualization and Computer Graphics 30 11 (Nov. 2024) 7245\u20137254. 10.1109\/TVCG.2024.3456165","DOI":"10.1109\/TVCG.2024.3456165"},{"key":"e_1_3_3_3_23_2","doi-asserted-by":"crossref","unstructured":"Yidi Jiang Bidisha Sharma Maulik Madhavi and Haizhou Li. 2021. Knowledge Distillation from BERT Transformer to Speech Transformer for Intent Classification.","DOI":"10.21437\/Interspeech.2021-402"},{"key":"e_1_3_3_3_24_2","doi-asserted-by":"crossref","unstructured":"Joo\u00a0Chan Kim Teemu\u00a0H Laine and Christer \u00c5hlund. 2021. Multimodal interaction systems based on internet of things and augmented reality: A systematic literature review. Applied Sciences 11 4 (2021) 1738.","DOI":"10.3390\/app11041738"},{"key":"e_1_3_3_3_25_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445579"},{"key":"e_1_3_3_3_26_2","doi-asserted-by":"publisher","unstructured":"Marcel Kruger Tim Gerrits Timon Romer Torsten Kuhlen and Tim Weissker. 2024. IntenSelect+: Enhancing Score-Based Selection in Virtual Reality. IEEE Transactions on Visualization & Computer Graphics 30 05 (May 2024) 2829\u20132838. 10.1109\/TVCG.2024.3372077","DOI":"10.1109\/TVCG.2024.3372077"},{"key":"e_1_3_3_3_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376698"},{"key":"e_1_3_3_3_28_2","doi-asserted-by":"crossref","unstructured":"Yuan Li Ibrahim\u00a0A Tahmid Feiyu Lu and Doug\u00a0A Bowman. 2022. Evaluation of pointing ray techniques for distant object referencing in model-free outdoor collaborative augmented reality. IEEE Transactions on Visualization and Computer Graphics 28 11 (2022) 3896\u20133906.","DOI":"10.1109\/TVCG.2022.3203094"},{"key":"e_1_3_3_3_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/3371300.3383343"},{"key":"e_1_3_3_3_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR55154.2023.00061"},{"key":"e_1_3_3_3_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISMAR62088.2024.00115"},{"key":"e_1_3_3_3_32_2","unstructured":"Mark\u00a0R Mine. 1995. Virtual environment interaction techniques. UNC Chapel Hill CS Dept (1995)."},{"key":"e_1_3_3_3_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISMAR59233.2023.00116"},{"key":"e_1_3_3_3_34_2","doi-asserted-by":"publisher","DOI":"10.1145\/1040830.1040900"},{"key":"e_1_3_3_3_35_2","unstructured":"OpenAI Josh Achiam Steven Adler Sandhini Agarwal Lama Ahmad Ilge Akkaya Florencia\u00a0Leoni Aleman Diogo Almeida Janko Altenschmidt Sam Altman Shyamal Anadkat et\u00a0al. 2024. GPT-4 Technical Report. arxiv:https:\/\/arXiv.org\/abs\/2303.08774\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2303.08774"},{"key":"e_1_3_3_3_36_2","doi-asserted-by":"crossref","unstructured":"Sharon Oviatt. 1999. Ten myths of multimodal interaction. Commun. ACM 42 11 (1999) 74\u201381.","DOI":"10.1145\/319382.319398"},{"key":"e_1_3_3_3_37_2","doi-asserted-by":"publisher","DOI":"10.1145\/1027933.1027957"},{"key":"e_1_3_3_3_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3174107"},{"key":"e_1_3_3_3_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3359996.3364264"},{"key":"e_1_3_3_3_40_2","doi-asserted-by":"crossref","unstructured":"St\u00e9phanie Philippe Alexis\u00a0D Souchet Petros Lameras Panagiotis Petridis Julien Caporal Gildas Coldeboeuf and Hadrien Duzan. 2020. Multimodal teaching learning and training in virtual reality: a review and case study. Virtual Reality & Intelligent Hardware 2 5 (2020) 421\u2013442.","DOI":"10.1016\/j.vrih.2020.07.008"},{"key":"e_1_3_3_3_41_2","doi-asserted-by":"crossref","unstructured":"Ivan Poupyrev and Tadao Ichikawa. 1999. Manipulating objects in virtual worlds: Categorization and empirical evaluation of interaction techniques. Journal of Visual Languages & Computing 10 1 (1999) 19\u201335.","DOI":"10.1006\/jvlc.1998.0112"},{"key":"e_1_3_3_3_42_2","doi-asserted-by":"crossref","unstructured":"Ismo Rakkolainen Ahmed Farooq Jari Kangas Jaakko Hakulinen Jussi Rantala Markku Turunen and Roope Raisamo. 2021. Technologies for multimodal interaction in extended reality\u2014a scoping review. Multimodal Technologies and Interaction 5 12 (2021) 81.","DOI":"10.3390\/mti5120081"},{"key":"e_1_3_3_3_43_2","doi-asserted-by":"crossref","unstructured":"Leah\u00a0M Reeves Jennifer Lai James\u00a0A Larson Sharon Oviatt TS Balaji St\u00e9phanie Buisine Penny Collings Phil Cohen Ben Kraal Jean-Claude Martin et\u00a0al. 2004. Guidelines for multimodal user interface design. Commun. ACM 47 1 (2004) 57\u201359.","DOI":"10.1145\/962081.962106"},{"key":"e_1_3_3_3_44_2","doi-asserted-by":"crossref","unstructured":"Martin Schrepp Andreas Hinderks and J\u00f6rg Thomaschewski. 2017. Design and evaluation of a short version of the user experience questionnaire (UEQ-S). International Journal of Interactive Multimedia and Artificial Intelligence 4 (6) 103-108. (2017).","DOI":"10.9781\/ijimai.2017.09.001"},{"key":"e_1_3_3_3_45_2","doi-asserted-by":"crossref","unstructured":"Felix Sch\u00fcssel Frank Honold and Michael Weber. 2013. Influencing factors on multimodal interaction during selection tasks. Journal on Multimodal User Interfaces 7 (2013) 299\u2013310.","DOI":"10.1007\/s12193-012-0117-5"},{"key":"e_1_3_3_3_46_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544549.3585615"},{"key":"e_1_3_3_3_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376438"},{"key":"e_1_3_3_3_48_2","unstructured":"F\u00e1bio Souza Rodrigo Nogueira and Roberto Lotufo. 2019. Portuguese named entity recognition using BERT-CRF. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1909.10649 (2019)."},{"key":"e_1_3_3_3_49_2","doi-asserted-by":"crossref","unstructured":"Anthony Steed and Chris Parker. 2005. Evaluating effectiveness of interaction techniques across immersive virtual environmental systems. Presence 14 5 (2005) 511\u2013527.","DOI":"10.1162\/105474605774918750"},{"key":"e_1_3_3_3_50_2","doi-asserted-by":"crossref","unstructured":"Bernhard Suhm Brad Myers and Alex Waibel. 2001. Multimodal error correction for speech user interfaces. ACM transactions on computer-human interaction (TOCHI) 8 1 (2001) 60\u201398.","DOI":"10.1145\/371127.371166"},{"key":"e_1_3_3_3_51_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3714224"},{"key":"e_1_3_3_3_52_2","doi-asserted-by":"crossref","unstructured":"Laura\u00a0A Thompson and Dominic\u00a0W Massaro. 1986. Evaluation and integration of speech and pointing gestures during referential understanding. Journal of experimental child psychology 42 1 (1986) 144\u2013168.","DOI":"10.1016\/0022-0965(86)90020-2"},{"key":"e_1_3_3_3_53_2","doi-asserted-by":"crossref","unstructured":"Matthew Turk. 2014. Multimodal interaction: A review. Pattern recognition letters 36 (2014) 189\u2013195.","DOI":"10.1016\/j.patrec.2013.07.003"},{"key":"e_1_3_3_3_54_2","doi-asserted-by":"publisher","DOI":"10.1109\/3DUI.2007.340783"},{"key":"e_1_3_3_3_55_2","doi-asserted-by":"crossref","unstructured":"Lode Vanacken Tovi Grossman and Karin Coninx. 2009. Multimodal selection techniques for dense and occluded 3D virtual environments. International Journal of Human-Computer Studies 67 3 (2009) 237\u2013255.","DOI":"10.1016\/j.ijhcs.2008.09.001"},{"key":"e_1_3_3_3_56_2","doi-asserted-by":"crossref","unstructured":"Uta Wagner Matthias Albrecht Andreas\u00a0Asferg Jacobsen Haopeng Wang Hans Gellersen and Ken Pfeuffer. 2024. Gaze Wall and Racket: Combining Gaze and Hand-Controlled Plane for 3D Selection in Virtual Reality. Proceedings of the ACM on Human-Computer Interaction 8 ISS (2024) 189\u2013213.","DOI":"10.1145\/3698134"},{"key":"e_1_3_3_3_57_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR50410.2021.00045"},{"key":"e_1_3_3_3_58_2","doi-asserted-by":"publisher","DOI":"10.1109\/CW.2018.00021"},{"key":"e_1_3_3_3_59_2","doi-asserted-by":"crossref","unstructured":"Ren\u00e9 Weller Waldemar Wegele Christoph Schr\u00f6der and Gabriel Zachmann. 2021. LenSelect: Object selection in virtual environments by dynamic object scaling. Frontiers in Virtual Reality 2 (2021) 684677.","DOI":"10.3389\/frvir.2021.684677"},{"key":"e_1_3_3_3_60_2","doi-asserted-by":"publisher","DOI":"10.1145\/1978942.1978963"},{"key":"e_1_3_3_3_61_2","doi-asserted-by":"publisher","unstructured":"Huiyue Wu Xiaoxuan Sun Huawei Tu and Xiaolong Zhang. 2024. ClockRay: A Wrist-Rotation Based Technique for Occluded-Target Selection in Virtual Reality. IEEE Transactions on Visualization and Computer Graphics 30 7 (July 2024) 3767\u20133778. 10.1109\/TVCG.2023.3239951","DOI":"10.1109\/TVCG.2023.3239951"},{"key":"e_1_3_3_3_62_2","doi-asserted-by":"publisher","DOI":"10.1109\/VR58804.2024.00090"},{"key":"e_1_3_3_3_63_2","unstructured":"Difeng Yu Hai-Ning Liang Feiyu Lu Vijayakumar Nanjappan Konstantinos Papangelis Wei Wang et\u00a0al. 2018. Target Selection in Head-Mounted Display Virtual Reality Environments. J. Univers. Comput. Sci. 24 9 (2018) 1217\u20131243."},{"key":"e_1_3_3_3_64_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445343"},{"key":"e_1_3_3_3_65_2","doi-asserted-by":"crossref","unstructured":"Difeng Yu Qiushi Zhou Joshua Newn Tilman Dingler Eduardo Velloso and Jorge Goncalves. 2020. Fully-occluded target selection in virtual reality. IEEE transactions on visualization and computer graphics 26 12 (2020) 3402\u20133413.","DOI":"10.1109\/TVCG.2020.3023606"},{"key":"e_1_3_3_3_66_2","doi-asserted-by":"crossref","unstructured":"Haiyan Zhao Hanjie Chen Fan Yang Ninghao Liu Huiqi Deng Hengyi Cai Shuaiqiang Wang Dawei Yin and Mengnan Du. 2024. Explainability for large language models: A survey. ACM Transactions on Intelligent Systems and Technology 15 2 (2024) 1\u201338.","DOI":"10.1145\/3639372"},{"key":"e_1_3_3_3_67_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376639"}],"event":{"name":"SUI '25: ACM Symposium on Spatial User Interaction","location":"Montreal QC Canada","acronym":"SUI '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction","SIGGRAPH ACM Special Interest Group on Computer Graphics and Interactive Techniques"]},"container-title":["Proceedings of the 2025 ACM Symposium on Spatial User Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3694907.3765913","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T19:25:42Z","timestamp":1767986742000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3694907.3765913"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,9]]},"references-count":66,"alternative-id":["10.1145\/3694907.3765913","10.1145\/3694907"],"URL":"https:\/\/doi.org\/10.1145\/3694907.3765913","relation":{},"subject":[],"published":{"date-parts":[[2025,11,9]]},"assertion":[{"value":"2025-11-09","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}