{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,7]],"date-time":"2026-05-07T15:13:27Z","timestamp":1778166807100,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":59,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,11]],"date-time":"2024-10-11T00:00:00Z","timestamp":1728604800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/https:\/\/doi.org\/10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DGE1745016"],"award-info":[{"award-number":["DGE1745016"]}],"id":[{"id":"10.13039\/https:\/\/doi.org\/10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,13]]},"DOI":"10.1145\/3654777.3676401","type":"proceedings-article","created":{"date-parts":[[2024,10,11]],"date-time":"2024-10-11T10:50:36Z","timestamp":1728643836000},"page":"1-18","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":33,"title":["VoicePilot: Harnessing LLMs as Speech Interfaces for Physically Assistive Robots"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8603-8146","authenticated-orcid":false,"given":"Akhil","family":"Padmanabha","sequence":"first","affiliation":[{"name":"Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-5314-3224","authenticated-orcid":false,"given":"Jessie","family":"Yuan","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7536-1685","authenticated-orcid":false,"given":"Janavi","family":"Gupta","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-4234-3513","authenticated-orcid":false,"given":"Zulekha","family":"Karachiwalla","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6469-9645","authenticated-orcid":false,"given":"Carmel","family":"Majidi","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1796-2196","authenticated-orcid":false,"given":"Henny","family":"Admoni","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6760-6213","authenticated-orcid":false,"given":"Zackory","family":"Erickson","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, United States"}]}],"member":"320","published-online":{"date-parts":[[2024,10,11]]},"reference":[{"key":"e_1_3_2_2_1_1","unstructured":"[n. d.]. ATLAS.ti | The #1 Software for Qualitative Data Analysis. https:\/\/atlasti.com\/"},{"key":"e_1_3_2_2_2_1","unstructured":"[n. d.]. Obi Feeding Robot. https:\/\/meetobi.com\/"},{"key":"e_1_3_2_2_3_1","unstructured":"[n. d.]. OpenAI API - GPT-3.5 Turbo. https:\/\/platform.openai.com\/docs\/models\/gpt-3-5-turbo"},{"key":"e_1_3_2_2_4_1","unstructured":"[n. d.]. OpenAI API - Whisper. https:\/\/platform.openai.com\/docs\/models\/whisper"},{"key":"e_1_3_2_2_5_1","unstructured":"[n. d.]. Porcupine Wake Word Python API. https:\/\/picovoice.ai\/docs\/api\/porcupine-python\/"},{"key":"e_1_3_2_2_6_1","volume-title":"Autort: Embodied foundation models for large scale orchestration of robotic agents. arXiv preprint arXiv:2401.12963","author":"Ahn Michael","year":"2024","unstructured":"Michael Ahn, Debidatta Dwibedi, Chelsea Finn, Montse\u00a0Gonzalez Arenas, Keerthana Gopalakrishnan, Karol Hausman, Brian Ichter, Alex Irpan, Nikhil Joshi, Ryan Julian, 2024. Autort: Embodied foundation models for large scale orchestration of robotic agents. arXiv preprint arXiv:2401.12963 (2024)."},{"key":"e_1_3_2_2_7_1","unstructured":"Montserrat\u00a0Gonzalez Arenas Ted Xiao Sumeet Singh Vidhi Jain Allen\u00a0Z Ren Quan Vuong Jake Varley Alexander Herzog Isabel Leal Sean Kirmani 2023. How to prompt your robot: A promptbook for manipulation skills with code as policies. In Towards Generalist Robots: Learning Paradigms for Scalable Skill Acquisition@ CoRL2023."},{"key":"e_1_3_2_2_8_1","volume-title":"Prevalence and causes of paralysis\u2014United States","author":"Armour S","year":"2013","unstructured":"Brian\u00a0S Armour, Elizabeth\u00a0A Courtney-Long, Michael\u00a0H Fox, Heidi Fredine, and Anthony Cahill. 2016. Prevalence and causes of paralysis\u2014United States, 2013. American journal of public health 106, 10 (2016), 1855\u20131857."},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812332"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3308561.3353803"},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3319502.3374818"},{"key":"e_1_3_2_2_12_1","volume-title":"Rt-2: Vision-language-action models transfer web knowledge to robotic control. arXiv preprint arXiv:2307.15818","author":"Brohan Anthony","year":"2023","unstructured":"Anthony Brohan, Noah Brown, Justice Carbajal, Yevgen Chebotar, Xi Chen, Krzysztof Choromanski, Tianli Ding, Danny Driess, Avinava Dubey, Chelsea Finn, 2023. Rt-2: Vision-language-action models transfer web knowledge to robotic control. arXiv preprint arXiv:2307.15818 (2023)."},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/RO-MAN50785.2021.9515511"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/MRA.2012.2229950"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385907"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCST.2019.2952317"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.2196\/10410"},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1682\/JRRD.2004.08.0100"},{"key":"e_1_3_2_2_19_1","volume-title":"Health implications of physical activity in individuals with spinal cord injury: a literature review.Journal of health and human services administration 30 4","author":"Fernhall Bo","year":"2008","unstructured":"Bo Fernhall, Kevin\u00a0S Heffernan, Sae\u00a0Young Jae, and Bradley\u00a0N. Hedrick. 2008. Health implications of physical activity in individuals with spinal cord injury: a literature review.Journal of health and human services administration 30 4 (2008), 468\u2013502."},{"key":"e_1_3_2_2_20_1","volume-title":"Foundation models in robotics: Applications, challenges, and the future. arXiv preprint arXiv:2312.07843","author":"Firoozi Roya","year":"2023","unstructured":"Roya Firoozi, Johnathan Tucker, Stephen Tian, Anirudha Majumdar, Jiankai Sun, Weiyu Liu, Yuke Zhu, Shuran Song, Ashish Kapoor, Karol Hausman, 2023. Foundation models in robotics: Applications, challenges, and the future. arXiv preprint arXiv:2312.07843 (2023)."},{"key":"e_1_3_2_2_21_1","volume-title":"Behavioral adaptation and late-life disability: a new spectrum for assessing public health impacts. American journal of public health 104, 2","author":"Freedman A","year":"2014","unstructured":"Vicki\u00a0A Freedman, Judith\u00a0D Kasper, Brenda\u00a0C Spillman, Emily\u00a0M Agree, Vincent Mor, Robert\u00a0B Wallace, and Douglas\u00a0A Wolf. 2014. Behavioral adaptation and late-life disability: a new spectrum for assessing public health impacts. American journal of public health 104, 2 (2014), e88\u2013e94."},{"key":"e_1_3_2_2_22_1","volume-title":"Quality of life in adults with multiple sclerosis: a systematic review. BMJ open 10, 11","author":"Gil-Gonz\u00e1lez Irene","year":"2020","unstructured":"Irene Gil-Gonz\u00e1lez, Agust\u00edn Mart\u00edn-Rodr\u00edguez, Rupert Conrad, and Mar\u00eda\u00a0\u00c1ngeles P\u00e9rez-San-Gregorio. 2020. Quality of life in adults with multiple sclerosis: a systematic review. BMJ open 10, 11 (2020), e041249."},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610978.3641085"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2020.101998"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/CIRAT.2014.7009736"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/1518701.1518731"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3360020"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1177\/0278364918776060"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610977.3634975"},{"key":"e_1_3_2_2_30_1","volume-title":"Real-World Robot Applications of Foundation Models: A Review. arXiv preprint arXiv:2402.05741","author":"Kawaharazuka Kento","year":"2024","unstructured":"Kento Kawaharazuka, Tatsuya Matsushima, Andrew Gambardella, Jiaxian Guo, Chris Paxton, and Andy Zeng. 2024. Real-World Robot Applications of Foundation Models: A Review. arXiv preprint arXiv:2402.05741 (2024)."},{"key":"e_1_3_2_2_31_1","volume-title":"Can an LLM-Powered Socially Assistive Robot Effectively and Safely Deliver Cognitive Behavioral Therapy? A Study With University Students. arXiv preprint arXiv:2402.17937","author":"Kian J","year":"2024","unstructured":"Mina\u00a0J Kian, Mingyu Zong, Katrin Fischer, Abhyuday Singh, Anna-Maria Velentza, Pau Sang, Shriya Upadhyay, Anika Gupta, Misha\u00a0A Faruki, Wallace Browning, 2024. Can an LLM-Powered Socially Assistive Robot Effectively and Safely Deliver Cognitive Behavioral Therapy? A Study With University Students. arXiv preprint arXiv:2402.17937 (2024)."},{"key":"e_1_3_2_2_32_1","volume-title":"Understanding Large-Language Model (LLM)-powered Human-Robot Interaction. arXiv preprint arXiv:2401.03217","author":"Kim Y","year":"2024","unstructured":"Callie\u00a0Y Kim, Christine\u00a0P Lee, and Bilge Mutlu. 2024. Understanding Large-Language Model (LLM)-powered Human-Robot Interaction. arXiv preprint arXiv:2401.03217 (2024)."},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.3109\/17483107.2011.615374"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICORR.2017.8009380"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160591"},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610978.3640671"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610977.3634999"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3568162.3576988"},{"key":"e_1_3_2_2_39_1","volume-title":"Physically Assistive Robots: A Systematic Review of Mobile and Manipulator Robots That Physically Assist People with Disabilities. Annual Review of Control, Robotics, and Autonomous Systems 7","author":"Nanavati Amal","year":"2023","unstructured":"Amal Nanavati, Vinitha Ranganeni, and Maya Cakmak. 2023. Physically Assistive Robots: A Systematic Review of Mobile and Manipulator Robots That Physically Assist People with Disabilities. Annual Review of Control, Robotics, and Autonomous Systems 7 (2023)."},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610977.3634964"},{"key":"e_1_3_2_2_41_1","volume-title":"HAT: Head-Worn Assistive Teleoperation of Mobile Manipulators. In 2023 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 12542\u201312548","author":"Padmanabha Akhil","year":"2023","unstructured":"Akhil Padmanabha, Qin Wang, Daphne Han, Jashkumar Diyora, Kriti Kacker, Hamza Khalid, Liang-Jung Chen, Carmel Majidi, and Zackory Erickson. 2023. HAT: Head-Worn Assistive Teleoperation of Mobile Manipulators. In 2023 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 12542\u201312548."},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.3390\/robotics12040097"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2801475"},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICORR.2019.8779524"},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/BIOROB.2018.8487200"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/3610978.3638359"},{"key":"e_1_3_2_2_47_1","volume-title":"Evaluating Customization of Remote Tele-operation Interfaces for Assistive Robots. In 2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN). IEEE, 1633\u20131640","author":"Ranganeni Vinitha","year":"2023","unstructured":"Vinitha Ranganeni, Noah Ponto, and Maya Cakmak. 2023. Evaluating Customization of Remote Tele-operation Interfaces for Assistive Robots. In 2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN). IEEE, 1633\u20131640."},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2016.7759067"},{"key":"e_1_3_2_2_49_1","volume-title":"Defining aging in place: The intersectionality of space, person, and time. Innovation in aging 4, 4","author":"Rogers A","year":"2020","unstructured":"Wendy\u00a0A Rogers, Widya\u00a0A Ramadhani, and Maurita\u00a0T Harris. 2020. Defining aging in place: The intersectionality of space, person, and time. Innovation in aging 4, 4 (2020), igaa036."},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1038\/sc.2009.93"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161317"},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-022-00914-w"},{"key":"e_1_3_2_2_53_1","volume-title":"Chatgpt for robotics: Design principles and model abilities. arXiv preprint arXiv:2306.17582","author":"Vemprala Sai","year":"2023","unstructured":"Sai Vemprala, Rogerio Bonatti, Arthur Bucker, and Ashish Kapoor. 2023. Chatgpt for robotics: Design principles and model abilities. arXiv preprint arXiv:2306.17582 (2023)."},{"key":"e_1_3_2_2_54_1","volume-title":"Grid: A platform for general robot intelligence development. arXiv preprint arXiv:2310.00887","author":"Vemprala Sai","year":"2023","unstructured":"Sai Vemprala, Shuhang Chen, Abhinav Shukla, Dinesh Narayanan, and Ashish Kapoor. 2023. Grid: A platform for general robot intelligence development. arXiv preprint arXiv:2310.00887 (2023)."},{"key":"e_1_3_2_2_55_1","volume-title":"LaMI: Large Language Models for Multi-Modal Human-Robot Interaction. In Extended Abstracts of the CHI Conference on Human Factors in Computing Systems. 1\u201310","author":"Wang Chao","year":"2024","unstructured":"Chao Wang, Stephan Hasler, Daniel Tanneberg, Felix Ocker, Frank Joublin, Antonello Ceravola, Joerg Deigmoeller, and Michael Gienger. 2024. LaMI: Large Language Models for Multi-Modal Human-Robot Interaction. In Extended Abstracts of the CHI Conference on Human Factors in Computing Systems. 1\u201310."},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-023-10139-z"},{"key":"e_1_3_2_2_57_1","volume-title":"High-density Electromyography for Effective Gesture-based Control of Physically Assistive Mobile Manipulators. arXiv preprint arXiv:2312.07745","author":"Yang Jehan","year":"2023","unstructured":"Jehan Yang, Kent Shibata, Douglas Weber, and Zackory Erickson. 2023. High-density Electromyography for Effective Gesture-based Control of Physically Assistive Mobile Manipulators. arXiv preprint arXiv:2312.07745 (2023)."},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.birob.2023.100131"},{"key":"e_1_3_2_2_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10342363"}],"event":{"name":"UIST '24: The 37th Annual ACM Symposium on User Interface Software and Technology","location":"Pittsburgh PA USA","acronym":"UIST '24"},"container-title":["Proceedings of the 37th Annual ACM Symposium on User Interface Software and Technology"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3654777.3676401","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3654777.3676401","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,4]],"date-time":"2025-08-04T21:13:19Z","timestamp":1754341999000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3654777.3676401"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,11]]},"references-count":59,"alternative-id":["10.1145\/3654777.3676401","10.1145\/3654777"],"URL":"https:\/\/doi.org\/10.1145\/3654777.3676401","relation":{},"subject":[],"published":{"date-parts":[[2024,10,11]]},"assertion":[{"value":"2024-10-11","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}