{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,13]],"date-time":"2026-06-13T07:22:15Z","timestamp":1781335335046,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":100,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,26]]},"DOI":"10.1145\/3663547.3746319","type":"proceedings-article","created":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T16:33:49Z","timestamp":1761150829000},"page":"1-14","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":9,"title":["Probing the Gaps in ChatGPT's Live Video Chat for Real-World Assistance for People who are Blind or Visually Impaired"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7545-4136","authenticated-orcid":false,"given":"Ruei-Che","family":"Chang","sequence":"first","affiliation":[{"name":"Computer Science and Engineering, University of Michigan, Ann Arbor, Michigan, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8912-7627","authenticated-orcid":false,"given":"Rosiana","family":"Natalie","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, Michigan, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-1822-0652","authenticated-orcid":false,"given":"Wenqian","family":"Xu","sequence":"additional","affiliation":[{"name":"Human AI Lab, University of Michigan, Ann Arbor, Michigan, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-0933-2878","authenticated-orcid":false,"given":"Jovan Zheng Feng","family":"Yap","sequence":"additional","affiliation":[{"name":"Computer Science and Engineering, University of Michigan, Ann Arbor, Michigan, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4447-7818","authenticated-orcid":false,"given":"Anhong","family":"Guo","sequence":"additional","affiliation":[{"name":"Computer Science and Engineering, University of Michigan, Ann Arbor, Michigan, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2025,10,22]]},"reference":[{"key":"e_1_3_3_2_2_2","unstructured":"2025. Aira. https:\/\/aira.io\/"},{"key":"e_1_3_3_2_3_2","unstructured":"2025. BeMyEyes. https:\/\/www.bemyeyes.com\/"},{"key":"e_1_3_3_2_4_2","unstructured":"2025. ChatGPT can now see hear and speak. https:\/\/openai.com\/index\/chatgpt-can-now-see-hear-and-speak\/"},{"key":"e_1_3_3_2_5_2","unstructured":"2025. Envision AI. https:\/\/www.letsenvision.com\/"},{"key":"e_1_3_3_2_6_2","unstructured":"2025. Introducing Be My AI (formerly Virtual Volunteer) for People who are Blind or Have Low Vision Powered by OpenAI\u2019s GPT-4. https:\/\/www.bemyeyes.com\/blog\/introducing-be-my-eyes-virtual-volunteer"},{"key":"e_1_3_3_2_7_2","unstructured":"2025. Orcam: Empowering Accessibility with AI. https:\/\/www.orcam.com\/en-us\/home?srsltid=AfmBOoqOElsZ58Z5kmCs_LDgPW7eq4WRpLVMbFGtydZn4aqayDxc7wxR"},{"key":"e_1_3_3_2_8_2","unstructured":"2025. PiccyBot. https:\/\/www.piccybot.com\/"},{"key":"e_1_3_3_2_9_2","unstructured":"2025. SeeingAI. https:\/\/www.seeingai.com\/"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"publisher","DOI":"10.1145\/2935334.2935361"},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"publisher","unstructured":"Rahaf Alharbi Robin\u00a0N. Brewer and Sarita Schoenebeck. 2022. Understanding Emerging Obfuscation Technologies in Visual Description Services for Blind and Low Vision People. Proc. ACM Hum.-Comput. Interact. 6 CSCW2 Article 469 (Nov. 2022) 33\u00a0pages. 10.1145\/3555570","DOI":"10.1145\/3555570"},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"publisher","DOI":"10.1145\/3663548.3675659"},{"key":"e_1_3_3_2_13_2","doi-asserted-by":"publisher","DOI":"10.1109\/SCOReD.2013.7002560"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300233"},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"crossref","unstructured":"Aries Arditi Emily Holmes Peter Reedijk and Roger Whitehouse. 1999. Interactive tactile maps visual disability and accessibility of building interiors. Visual Impairment Research 1 1 (1999) 11\u201321.","DOI":"10.1076\/vimr.1.1.11.4456"},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"crossref","unstructured":"Masatoshi Arikawa Shin\u2019ichi Konomi and Keisuke Ohnishi. 2007. Navitime: Supporting pedestrian navigation in the real world. IEEE Pervasive Computing 6 3 (2007) 21\u201329.","DOI":"10.1109\/MPRV.2007.61"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/2910674.2935839"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"crossref","unstructured":"Tita\u00a0Alissa Bach Amna Khan Harry Hallock Gabriela Beltr\u00e3o and Sonia Sousa. 2024. A systematic literature review of user trust in AI-enabled systems: An HCI perspective. International Journal of Human\u2013Computer Interaction 40 5 (2024) 1251\u20131266.","DOI":"10.1080\/10447318.2022.2138826"},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290607.3313008"},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaaiss.v3i1.31232"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/1866029.1866080"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2010.5543821"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/2470654.2481291"},{"key":"e_1_3_3_2_24_2","doi-asserted-by":"publisher","DOI":"10.1145\/2441776.2441915"},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-94-017-1400-6_33"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676375"},{"key":"e_1_3_3_2_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3663548.3675599"},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"crossref","unstructured":"Hyesun Choung Prabu David and Arun Ross. 2023. Trust in AI and its role in the acceptance of AI technologies. International Journal of Human\u2013Computer Interaction 39 9 (2023) 1727\u20131739.","DOI":"10.1080\/10447318.2022.2050543"},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPIN.2012.6418882"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/DSAA.2018.00018"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.1145\/3597638.3614548"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642211"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"crossref","unstructured":"Christina Granquist Susan\u00a0Y Sun Sandra\u00a0R Montezuma Tu\u00a0M Tran Rachel Gage and Gordon\u00a0E Legge. 2021. Evaluation and comparison of artificial intelligence vision aids: Orcam myeye 1 and seeing ai. Journal of Visual Impairment & Blindness 115 4 (2021) 277\u2013285.","DOI":"10.1177\/0145482X211027492"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"publisher","DOI":"10.1145\/3308561.3353771"},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580688"},{"key":"e_1_3_3_2_36_2","volume-title":"The UX Book: Process and Guidelines for Ensuring a Quality User Experience","author":"Hartson R.","year":"2012","unstructured":"R. Hartson and P.S. Pyla. 2012. The UX Book: Process and Guidelines for Ensuring a Quality User Experience. Elsevier Science. https:\/\/books.google.ca\/books?id=w4I3Y64SWLoC"},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581249"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"crossref","unstructured":"Nicole Holmes and Kelly Prentice. 2015. iPhone video link as an orientation tool: Remote O&M for people with vision impairment. Vision Rehabilitation International 7 1 (2015) 60\u201367.","DOI":"10.21307\/ijom-2017-057"},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3517428.3544824"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3663548.3675635"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"crossref","unstructured":"Karst\u00a0MP Hoogsteen Sarit Szpiro Gabriel Kreiman and Eli Peli. 2022. Beyond the cane: describing urban scenes to blind people for mobility tasks. ACM Transactions on Accessible Computing (TACCESS) 15 3 (2022) 1\u201329.","DOI":"10.1145\/3522757"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025899"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"crossref","unstructured":"Amy\u00a0A Kalia Gordon\u00a0E Legge Rudrava Roy and Advait Ogale. 2010. Assessment of indoor route-finding technology for people who are visually impaired. Journal of visual impairment & blindness 104 3 (2010) 135\u2013147.","DOI":"10.1177\/0145482X1010400303"},{"key":"e_1_3_3_2_44_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376823"},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"crossref","unstructured":"Hyung\u00a0Nam Kim. 2022. User experience of assistive apps among people with visual impairment. Technology and Disability 34 3 (2022) 165\u2013174.","DOI":"10.3233\/TAD-220377"},{"key":"e_1_3_3_2_46_2","doi-asserted-by":"crossref","unstructured":"Elisa Kreiss Cynthia Bennett Shayan Hooshmand Eric Zelikman Meredith\u00a0Ringel Morris and Christopher Potts. 2022. Context matters for image descriptions for accessibility: Challenges for referenceless evaluation metrics. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2205.10646 (2022).","DOI":"10.18653\/v1\/2022.emnlp-main.309"},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"crossref","unstructured":"Vladimir Kulyukin Chaitanya Gharpure John Nicholson and Grayson Osborne. 2006. Robot-assisted wayfinding for the visually impaired in structured indoor environments. Autonomous robots 21 (2006) 29\u201341.","DOI":"10.1007\/s10514-006-7223-8"},{"key":"e_1_3_3_2_48_2","unstructured":"Elizabeth Kupferstein Yuhang Zhao Shiri Azenkot and Hathaitorn Rojnirun. 2020. Understanding the use of artificial intelligence based visual aids for people with visual impairments. Investigative Ophthalmology & Visual Science 61 7 (2020) 932\u2013932."},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"crossref","unstructured":"Masaki Kuribayashi Kohei Uehara Allan Wang Shigeo Morishima and Chieko Asakawa. 2025. WanderGuide: Indoor Map-less Robotic Guide for Exploration by Blind People. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.08906 (2025).","DOI":"10.1145\/3706598.3713788"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"crossref","unstructured":"Nancy\u00a0K Lankton D\u00a0Harrison McKnight and John Tripp. 2015. Technology humanness and trust: Rethinking trust in technology. Journal of the Association for Information Systems 16 10 (2015) 1.","DOI":"10.17705\/1jais.00411"},{"key":"e_1_3_3_2_51_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3501966"},{"key":"e_1_3_3_2_52_2","doi-asserted-by":"crossref","unstructured":"John\u00a0D Lee and Katrina\u00a0A See. 2004. Trust in automation: Designing for appropriate reliance. Human factors 46 1 (2004) 50\u201380.","DOI":"10.1518\/hfes.46.1.50.30392"},{"key":"e_1_3_3_2_53_2","doi-asserted-by":"publisher","DOI":"10.1145\/3308561.3353799"},{"key":"e_1_3_3_2_54_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300566"},{"key":"e_1_3_3_2_55_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411763.3451806"},{"key":"e_1_3_3_2_56_2","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093353"},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"crossref","unstructured":"Kyungjun Lee Abhinav Shrivastava and Hernisa Kacorri. 2021. Leveraging hand-object interactions in assistive egocentric vision. IEEE Transactions on Pattern Analysis and Machine Intelligence 45 6 (2021) 6820\u20136831.","DOI":"10.1109\/TPAMI.2021.3123303"},{"key":"e_1_3_3_2_58_2","unstructured":"Sooyeon Lee Madison Reddie Krish Gurdasani Xiying Wang Jordan Beck Mary\u00a0Beth Rosson and John\u00a0M Carroll. 2018. Conversations for Vision: Remote Sighted Assistants Helping People with Visual Impairments. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1812.00148 (2018)."},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376591"},{"key":"e_1_3_3_2_60_2","doi-asserted-by":"crossref","unstructured":"Yue Lian De-er Liu and Wei-zhen Ji. 2024. Survey and analysis of the current status of research in the field of outdoor navigation for the blind. Disability and Rehabilitation: Assistive Technology 19 4 (2024) 1657\u20131675.","DOI":"10.1080\/17483107.2023.2227224"},{"key":"e_1_3_3_2_61_2","doi-asserted-by":"crossref","unstructured":"Zachary\u00a0C Lipton. 2018. The mythos of model interpretability: In machine learning the concept of interpretability is both important and slippery. Queue 16 3 (2018) 31\u201357.","DOI":"10.1145\/3236386.3241340"},{"key":"e_1_3_3_2_62_2","unstructured":"Hanchao Liu Wenyuan Xue Yifei Chen Dapeng Chen Xiutian Zhao Ke Wang Liping Hou Rongjun Li and Wei Peng. 2024. A survey on hallucination in large vision-language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.00253 (2024)."},{"key":"e_1_3_3_2_63_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713760"},{"key":"e_1_3_3_2_64_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642939"},{"key":"e_1_3_3_2_65_2","doi-asserted-by":"crossref","unstructured":"Jack\u00a0M Loomis Reginald\u00a0G Golledge and Roberta\u00a0L Klatzky. 1998. Navigation system for the blind: Auditory display modes and guidance. Presence 7 2 (1998) 193\u2013203.","DOI":"10.1162\/105474698565677"},{"key":"e_1_3_3_2_66_2","doi-asserted-by":"publisher","DOI":"10.1145\/2858036.2858288"},{"key":"e_1_3_3_2_67_2","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025814"},{"key":"e_1_3_3_2_68_2","doi-asserted-by":"publisher","DOI":"10.1145\/3597638.3608395"},{"key":"e_1_3_3_2_69_2","doi-asserted-by":"crossref","unstructured":"Annika Muehlbradt and Shaun\u00a0K Kane. 2022. What\u2019s in an ALT Tag? Exploring Caption Content Priorities through Collaborative Captioning. ACM Transactions on Accessible Computing (TACCESS) 15 1 (2022) 1\u201332.","DOI":"10.1145\/3507659"},{"key":"e_1_3_3_2_70_2","doi-asserted-by":"publisher","DOI":"10.1109\/PERCOM.2018.8444593"},{"key":"e_1_3_3_2_71_2","doi-asserted-by":"publisher","DOI":"10.1007\/11788713_187"},{"key":"e_1_3_3_2_72_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581302"},{"key":"e_1_3_3_2_73_2","doi-asserted-by":"crossref","unstructured":"Brian\u00a0J Nguyen William\u00a0S Chen Allison\u00a0J Chen Andrew Utt Emily Hill Ryan Apgar and Daniel\u00a0L Chao. 2019. Large-scale assessment of needs in low vision individuals using the Aira assistive technology. Clinical ophthalmology (2019) 1853\u20131868.","DOI":"10.2147\/OPTH.S215658"},{"key":"e_1_3_3_2_74_2","doi-asserted-by":"crossref","unstructured":"Brian\u00a0J Nguyen Yeji Kim Kathryn Park Allison\u00a0J Chen Scarlett Chen Donald Van\u00a0Fossan and Daniel\u00a0L Chao. 2018. Improvement in patient-reported quality of life outcomes in severely visually impaired individuals using the Aira assistive technology system. Translational vision science & technology 7 5 (2018) 30\u201330.","DOI":"10.1167\/tvst.7.5.30"},{"key":"e_1_3_3_2_75_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606763"},{"key":"e_1_3_3_2_76_2","doi-asserted-by":"crossref","unstructured":"Ricardo E\u00a0Gonzalez Penuela Ruiying Hu Sharon Lin Tanisha Shende and Shiri Azenkot. 2025. Towards Understanding the Use of MLLM-Enabled Applications for Visual Interpretation by Blind and Low Vision People. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.05899 (2025).","DOI":"10.1145\/3706599.3719714"},{"key":"e_1_3_3_2_77_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.847"},{"key":"e_1_3_3_2_78_2","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3173677"},{"key":"e_1_3_3_2_79_2","doi-asserted-by":"publisher","DOI":"10.1109\/PERCOM.2004.1276842"},{"key":"e_1_3_3_2_80_2","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939778"},{"key":"e_1_3_3_2_81_2","doi-asserted-by":"crossref","unstructured":"Omar Shaikh Shardul Sapkota Shan Rizvi Eric Horvitz Joon\u00a0Sung Park Diyi Yang and Michael\u00a0S Bernstein. 2025. Creating General User Models from Computer Use. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2505.10831 (2025).","DOI":"10.1145\/3746059.3747722"},{"key":"e_1_3_3_2_82_2","doi-asserted-by":"crossref","unstructured":"Donghee Shin. 2021. The effects of explainability and causability on perception trust and acceptance: Implications for explainable AI. International journal of human-computer studies 146 (2021) 102551.","DOI":"10.1016\/j.ijhcs.2020.102551"},{"key":"e_1_3_3_2_83_2","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.1994.351166"},{"key":"e_1_3_3_2_84_2","doi-asserted-by":"publisher","DOI":"10.1145\/3597638.3608402"},{"key":"e_1_3_3_2_85_2","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376404"},{"key":"e_1_3_3_2_86_2","doi-asserted-by":"publisher","DOI":"10.1145\/3441852.3471233"},{"key":"e_1_3_3_2_87_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20074-8_33"},{"key":"e_1_3_3_2_88_2","doi-asserted-by":"crossref","unstructured":"Jianyuan Wang Minghao Chen Nikita Karaev Andrea Vedaldi Christian Rupprecht and David Novotny. 2025. VGGT: Visual Geometry Grounded Transformer. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.11651 (2025).","DOI":"10.1109\/CVPR52734.2025.00499"},{"key":"e_1_3_3_2_89_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPIN.2012.6418894"},{"key":"e_1_3_3_2_90_2","doi-asserted-by":"publisher","unstructured":"Jacob\u00a0O. Wobbrock Shaun\u00a0K. Kane Krzysztof\u00a0Z. Gajos Susumu Harada and Jon Froehlich. 2011. Ability-Based Design: Concept Principles and Examples. ACM Trans. Access. Comput. 3 3 Article 9 (April 2011) 27\u00a0pages. 10.1145\/1952383.1952384","DOI":"10.1145\/1952383.1952384"},{"key":"e_1_3_3_2_91_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICICS.2003.1292553"},{"key":"e_1_3_3_2_92_2","unstructured":"Jingyi Xie Rui Yu He Zhang Syed\u00a0Masum Billah Sooyeon Lee and John\u00a0M Carroll. 2025. Beyond Visual Perception: Insights from Smartphone Interaction of Visually Impaired Users with Large Multimodal Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.16098 (2025)."},{"key":"e_1_3_3_2_93_2","doi-asserted-by":"publisher","unstructured":"Andi Xu Minyu Cai Dier Hou Ruei-Che Chang and Anhong Guo. 2024. ImageExplorer Deployment: Understanding Text-Based and Touch-Based Image Exploration in the Wild(W4A \u201924). Association for Computing Machinery New York NY USA. 10.1145\/3677846.3677861","DOI":"10.1145\/3677846.3677861"},{"key":"e_1_3_3_2_94_2","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676336"},{"key":"e_1_3_3_2_95_2","doi-asserted-by":"publisher","DOI":"10.1109\/FMSys62467.2024.00010"},{"key":"e_1_3_3_2_96_2","doi-asserted-by":"crossref","unstructured":"Jianing Yang Alexander Sax Kevin\u00a0J Liang Mikael Henaff Hao Tang Ang Cao Joyce Chai Franziska Meier and Matt Feiszli. 2025. Fast3R: Towards 3D Reconstruction of 1000+ Images in One Forward Pass. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2501.13928 (2025).","DOI":"10.1109\/CVPR52734.2025.02042"},{"key":"e_1_3_3_2_97_2","doi-asserted-by":"crossref","unstructured":"Yuncong Yang Han Yang Jiachen Zhou Peihao Chen Hongxin Zhang Yilun Du and Chuang Gan. 2024. 3D-Mem: 3D Scene Memory for Embodied Exploration and Reasoning. arxiv:https:\/\/arXiv.org\/abs\/2411.17735\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2411.17735","DOI":"10.1109\/CVPR52734.2025.01612"},{"key":"e_1_3_3_2_98_2","doi-asserted-by":"crossref","unstructured":"Rui Yu Sooyeon Lee Jingyi Xie Syed\u00a0Masum Billah and John\u00a0M Carroll. 2024. Human\u2013AI collaboration for remote sighted assistance: Perspectives from the LLM era. Future internet 16 7 (2024) 254.","DOI":"10.3390\/fi16070254"},{"key":"e_1_3_3_2_99_2","doi-asserted-by":"publisher","DOI":"10.1145\/3688828.3699636"},{"key":"e_1_3_3_2_100_2","unstructured":"Zeyu Zhang Xiaohe Bo Chen Ma Rui Li Xu Chen Quanyu Dai Jieming Zhu Zhenhua Dong and Ji-Rong Wen. 2024. A survey on the memory mechanism of large language model based agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.13501 (2024)."},{"key":"e_1_3_3_2_101_2","doi-asserted-by":"publisher","DOI":"10.1145\/2702123.2702437"}],"event":{"name":"ASSETS '25: The 27th International ACM SIGACCESS Conference on Computers and Accessibility","location":"Denver Colorado USA","acronym":"ASSETS '25","sponsor":["SIGACCESS ACM Special Interest Group on Accessible Computing"]},"container-title":["Proceedings of the 27th International ACM SIGACCESS Conference on Computers and Accessibility"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3663547.3746319","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T17:59:03Z","timestamp":1767981543000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3663547.3746319"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,22]]},"references-count":100,"alternative-id":["10.1145\/3663547.3746319","10.1145\/3663547"],"URL":"https:\/\/doi.org\/10.1145\/3663547.3746319","relation":{},"subject":[],"published":{"date-parts":[[2025,10,22]]},"assertion":[{"value":"2025-10-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}