{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T07:59:54Z","timestamp":1776931194880,"version":"3.51.2"},"publisher-location":"New York, NY, USA","reference-count":142,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,4,13]]},"DOI":"10.1145\/3772318.3790696","type":"proceedings-article","created":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T06:44:21Z","timestamp":1776062661000},"page":"1-19","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Characterizing Unintended Consequences of GUI Agents For Web Browsing"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4145-117X","authenticated-orcid":false,"given":"Shuning","family":"Zhang","sequence":"first","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-1606-5780","authenticated-orcid":false,"given":"Jingruo","family":"Chen","sequence":"additional","affiliation":[{"name":"Information Science, Cornell University, Ithaca, New York, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-4898-2521","authenticated-orcid":false,"given":"Zhiqi","family":"Gao","sequence":"additional","affiliation":[{"name":"School of Data Science, The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-6135-4714","authenticated-orcid":false,"given":"Jiajing","family":"Gao","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology, Hongkong, 
China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8041-7962","authenticated-orcid":false,"given":"Xin","family":"Yi","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6331-6542","authenticated-orcid":false,"given":"Hewu","family":"Li","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2026,4,13]]},"reference":[{"key":"e_1_3_3_2_2_2","unstructured":"Saaket Agashe Kyle Wong Vincent Tu Jiachen Yang Ang Li and Xin\u00a0Eric Wang. 2025. Agent s2: A compositional generalist-specialist framework for computer use agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.00906 (2025)."},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"crossref","unstructured":"Damiano Angeletti Enrico Giunchiglia Massimo Narizzano Alessandra Puddu and Salvatore Sabina. 2010. Using bounded model checking for coverage analysis of safety-critical software in an industrial setting. Journal of Automated Reasoning 45 4 (2010) 397\u2013414.","DOI":"10.1007\/s10817-010-9172-3"},{"key":"e_1_3_3_2_4_2","unstructured":"Anthropic. 2025. Computer use (beta). https:\/\/docs.anthropic.com\/en\/docs\/build-with-claude\/computer-use\/ Accessed: 2025-02-19."},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642180"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"publisher","DOI":"10.1145\/3658644.3690350"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"crossref","unstructured":"Michael Bailey David Dittrich Erin Kenneally and Doug Maughan. 2012. The menlo report. IEEE Security & Privacy 10 2 (2012) 71\u201375.","DOI":"10.1109\/MSP.2012.52"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"crossref","unstructured":"Tom\u00a0L Beauchamp et\u00a0al. 2008. The belmont report. 
The Oxford textbook of clinical research ethics (2008) 149\u2013155.","DOI":"10.1093\/oso\/9780195168655.003.0015"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"Virginia Braun and Victoria Clarke. 2019. Reflecting on reflexive thematic analysis. Qualitative research in sport exercise and health 11 4 (2019) 589\u2013597.","DOI":"10.1080\/2159676X.2019.1628806"},{"key":"e_1_3_3_2_10_2","first-page":"7187","volume-title":"Encyclopedia of quality of life and well-being research","author":"Braun Virginia","year":"2024","unstructured":"Virginia Braun and Victoria Clarke. 2024. Thematic analysis. In Encyclopedia of quality of life and well-being research. Springer, 7187\u20137193."},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"publisher","DOI":"10.1145\/3678884.3689133"},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/4398.001.0001"},{"key":"e_1_3_3_2_13_2","doi-asserted-by":"publisher","unstructured":"Ada Chen Yongjiang Wu Junyuan Zhang Jingyu Xiao Shu Yang Jen tse Huang Kun Wang Wenxuan Wang and Shuai Wang. 2025. A Survey on the Safety and Security Threats of Computer-Using Agents: JARVIS or Ultron?10.48550\/arXiv.2505.10924 arxiv:https:\/\/arXiv.org\/abs\/2505.10924\u00a0[cs.CL]","DOI":"10.48550\/arXiv.2505.10924"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3746059.3747798"},{"key":"e_1_3_3_2_15_2","unstructured":"Chaoran Chen Zhiping Zhang Bingcan Guo Shang Ma Ibrahim Khalilov Simret\u00a0A Gebreegziabher Yanfang Ye Ziang Xiao Yaxing Yao Tianshi Li et\u00a0al. 2025. The Obvious Invisible Threat: LLM-Powered GUI Agents\u2019 Vulnerability to Fine-Print Injections. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.11281 (2025)."},{"key":"e_1_3_3_2_16_2","unstructured":"Chaoran Chen Zhiping Zhang Ibrahim Khalilov Bingcan Guo Simret\u00a0A Gebreegziabher Yanfang Ye Ziang Xiao Yaxing Yao Tianshi Li and Toby Jia-Jun Li. 2025. 
Toward a Human-Centered Evaluation Framework for Trustworthy LLM-powered GUI Agents. HEAL workshop of CHI 25 (2025)."},{"key":"e_1_3_3_2_17_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Chen Dongping","year":"2024","unstructured":"Dongping Chen, Yue Huang, Siyuan Wu, Jingyu Tang, Huichi Zhou, Qihui Zhang, Zhigang He, Yilin Bai, Chujie Gao, Liuyi Chen, et\u00a0al. 2024. GUI-World: A Video Benchmark and Dataset for Multimodal GUI-oriented Understanding. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_18_2","first-page":"5901","volume-title":"Proceedings of the IEEE\/CVF International Conference on Computer Vision","author":"Chen Gongwei","year":"2025","unstructured":"Gongwei Chen, Xurui Zhou, Rui Shao, Yibo Lyu, Kaiwen Zhou, Shuai Wang, Wentao Li, Yinchuan Li, Zhongang Qi, and Liqiang Nie. 2025. Less is more: Empowering gui agent with context-aware simplification. In Proceedings of the IEEE\/CVF International Conference on Computer Vision. 5901\u20135911."},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606720"},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3714135"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/3678884.3681852"},{"key":"e_1_3_3_2_22_2","unstructured":"Zichen Chen Jiaao Chen Jianda Chen and Misha Sra. 2025. Position: Standard Benchmarks Fail\u2013LLM Agents Present Overlooked Risks for Financial Applications. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.15865 (2025)."},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.505"},{"key":"e_1_3_3_2_24_2","doi-asserted-by":"publisher","unstructured":"Anh-Hoang Dang Vu Tran and Le-Minh Nguyen. 2025. Survey and analysis of hallucinations in large language models: attribution to prompting strategies or model behavior. Frontiers in Artificial Intelligence 8 (2025) 1622292. 
10.3389\/frai.2025.1622292","DOI":"10.3389\/frai.2025.1622292"},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1145\/1125451.1125753"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"crossref","unstructured":"Michela Del\u00a0Vicario Alessandro Bessi Fabiana Zollo Fabrizio Petroni Antonio Scala Guido Caldarelli H.\u00a0Eugene Stanley and Walter Quattrociocchi. 2016. The spreading of misinformation online. Proceedings of the National Academy of Sciences 113 3 (2016) 554\u2013559.","DOI":"10.1073\/pnas.1517441113"},{"key":"e_1_3_3_2_27_2","doi-asserted-by":"crossref","unstructured":"Zehang Deng Yongjian Guo Changzhou Han Wanlun Ma Junwu Xiong Sheng Wen and Yang Xiang. 2025. Ai agents under threat: A survey of key security challenges and future pathways. Comput. Surveys 57 7 (2025) 1\u201336.","DOI":"10.1145\/3716628"},{"key":"e_1_3_3_2_28_2","unstructured":"Cedric Faas Sophie Kerstan Richard Uth Markus Langer and Anna\u00a0Maria Feit. 2025. Design Considerations for Human Oversight of AI: Insights from Co-Design Workshops and Work Design Theory. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.19512 (2025)."},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"crossref","unstructured":"Don Fallis. 2015. What is disinformation? Library trends 63 3 (2015) 401\u2013426.","DOI":"10.1353\/lib.2015.0014"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1145\/1473018.1473028"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.12"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.12"},{"key":"e_1_3_3_2_33_2","volume-title":"NeurIPS 2025 Workshop on Regulatable ML","author":"Feng Kevin","year":"2025","unstructured":"Kevin Feng, Tae\u00a0Soo Kim, Rock\u00a0Yuren Pang, Faria Huq, Tal August, and Amy\u00a0X Zhang. 2025. On the Regulatory Potential of User Interfaces for AI Agent Governance. 
In NeurIPS 2025 Workshop on Regulatable ML."},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"crossref","unstructured":"Casey Fiesler Michael Zimmer Nicholas Proferes Sarah Gilbert and Naiyan Jones. 2024. Remember the human: A systematic review of ethical considerations in reddit research. Proceedings of the ACM on Human-Computer Interaction 8 GROUP (2024) 1\u201333.","DOI":"10.1145\/3633070"},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01262"},{"key":"e_1_3_3_2_36_2","unstructured":"Boyu Gou Zanming Huang Yuting Ning Yu Gu Michael Lin Weijian Qi Andrei Kopanev Botao Yu Bernal\u00a0Jim\u00e9nez Guti\u00e9rrez Yiheng Shu et\u00a0al. 2025. Mind2Web 2: Evaluating Agentic Search with Agent-as-a-Judge. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2506.21506 (2025)."},{"key":"e_1_3_3_2_37_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Gou Boyu","year":"2024","unstructured":"Boyu Gou, Ruohan Wang, Boyuan Zheng, Yanan Xie, Cheng Chang, Yiheng Shu, Huan Sun, and Yu Su. 2024. Navigating the Digital World as Humans Do: Universal Visual Grounding for GUI Agents. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3650948"},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/3730567.3732922"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.371"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/3272973.3274059"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICSC65596.2025.11140447"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"crossref","unstructured":"Zhiyuan Hu Chumin Liu Xidong Feng Yilun Zhao See-Kiong Ng Anh\u00a0Tuan Luu Junxian He Pang Wei\u00a0W Koh and Bryan Hooi. 2024. Uncertainty of thoughts: Uncertainty-aware planning enhances information seeking in llms. 
Advances in Neural Information Processing Systems 37 (2024) 24181\u201324215.","DOI":"10.52202\/079017-0762"},{"key":"e_1_3_3_2_44_2","unstructured":"Tian Huang Chun Yu Weinan Shi Zijian Peng David Yang Weiqi Sun and Yuanchun Shi. [n. d.]. Prompt2Task: Automating UI Tasks on Smartphones from Textual Prompts. ACM Transactions on Computer-Human Interaction ([n. d.])."},{"key":"e_1_3_3_2_45_2","unstructured":"Ziwei Ji Nayeon Lee Rita Frieske Tiezheng Yu Dan Su Yan Xu Etsuko Ishii Yvette Bang Andrea Madotto and Pascale Fung. 2023. Survey of Hallucination in Natural Language Generation. Comput. Surveys (2023). https:\/\/arxiv.org\/abs\/2202.03629 arXiv:https:\/\/arXiv.org\/abs\/2202.03629."},{"key":"e_1_3_3_2_46_2","doi-asserted-by":"crossref","unstructured":"Ziwei Ji Nayeon Lee Rita Frieske Tiezheng Yu Dan Su Yan Xu Etsuko Ishii Ye\u00a0Jin Bang Andrea Madotto and Pascale Fung. 2023. Survey of hallucination in natural language generation. Comput. Surveys 55 12 (2023) 1\u201338.","DOI":"10.1145\/3571730"},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"publisher","unstructured":"Haitao Jia Ming He Zimo Yin Likang Wu Jianping Fan and Jitao Sang. 2025. ReInAgent: A Context-Aware GUI Agent Enabling Human-in-the-Loop Mobile Task Navigation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.07988 (2025). 10.48550\/arXiv.2510.07988","DOI":"10.48550\/arXiv.2510.07988"},{"key":"e_1_3_3_2_48_2","doi-asserted-by":"crossref","unstructured":"Shian Jia Xinbo Wang Mingli Song and Gang Chen. 2024. Agent Centric Operating System\u2013a Comprehensive Review and Outlook for Operating System. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2411.17710 (2024).","DOI":"10.32388\/XPJYHO"},{"key":"e_1_3_3_2_49_2","unstructured":"Wenjia Jiang Yangyang Zhuang Chenxi Song Xu Yang Joey\u00a0Tianyi Zhou and Chi Zhang. 2025. Appagentx: Evolving gui agents as proficient smartphone users. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.02268 (2025)."},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"publisher","DOI":"10.1109\/PerComWorkshops65533.2025.00138"},{"key":"e_1_3_3_2_51_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-65630-9_12"},{"key":"e_1_3_3_2_52_2","doi-asserted-by":"publisher","DOI":"10.1145\/3584931.3606960"},{"key":"e_1_3_3_2_53_2","doi-asserted-by":"crossref","unstructured":"Jacek\u00a0A Kopec and John\u00a0M Esdaile. 1990. Bias in case-control studies. A review. Journal of epidemiology and community health 44 3 (1990) 179.","DOI":"10.1136\/jech.44.3.179"},{"key":"e_1_3_3_2_54_2","doi-asserted-by":"publisher","unstructured":"Thomas Kuntz Agatha Duzan Hao Zhao Francesco Croce J.\u00a0Zico Kolter Nicolas Flammarion and Maksym Andriushchenko. 2025. OS-Harm: A Benchmark for Measuring Safety of Computer Use Agents. 10.48550\/arXiv.2506.14866 arxiv:https:\/\/arXiv.org\/abs\/2506.14866\u00a0[cs.SE]","DOI":"10.48550\/arXiv.2506.14866"},{"key":"e_1_3_3_2_55_2","unstructured":"Jungjae Lee Dongjae Lee Chihun Choi Youngmin Im Jaeyoung Wi Kihong Heo Sangeun Oh Sunjae Lee and Insik Shin. 2025. Safeguarding mobile gui agent via logic-based action verification. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.18492 (2025)."},{"key":"e_1_3_3_2_56_2","doi-asserted-by":"publisher","DOI":"10.1145\/3746027.3755688"},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"crossref","unstructured":"Wei Li William\u00a0E Bishop Alice Li Christopher Rawles Folawiyo Campbell-Ajala Divya Tyamagundlu and Oriana Riva. 2024. On the effects of data scale on ui control agents. Advances in Neural Information Processing Systems 37 (2024) 92130\u201392154.","DOI":"10.52202\/079017-2925"},{"key":"e_1_3_3_2_58_2","doi-asserted-by":"publisher","DOI":"10.1109\/DTPI61353.2024.10778901"},{"key":"e_1_3_3_2_59_2","unstructured":"Yuanchun Li Hao Wen Weijun Wang Xiangyu Li Yizhen Yuan Guohong Liu Jiacheng Liu Wenxing Xu Xiang Wang Yi Sun et\u00a0al. 2024. 
Personal llm agents: Insights and survey about the capability efficiency and security. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2401.05459 (2024)."},{"key":"e_1_3_3_2_60_2","unstructured":"Siyuan Liang Tianmeng Fang Zhe Liu Aishan Liu Yan Xiao Jinyuan He Ee-Chien Chang and Xiaochun Cao. 2025. SafeMobile: Chain-level Jailbreak Detection and Automated Evaluation for Multimodal Mobile Agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2507.00841 (2025)."},{"key":"e_1_3_3_2_61_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Liao Zeyi","year":"2024","unstructured":"Zeyi Liao, Lingbo Mo, Chejian Xu, Mintong Kang, Jiawei Zhang, Chaowei Xiao, Yuan Tian, Bo Li, and Huan Sun. 2024. EIA: Environmental injection attack on generalist web agents for privacy leakage. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_62_2","unstructured":"Zhixin Lin Jungang Li Shidong Pan Yibo Shi Yue Yao and Dongliang Xu. 2025. Mind the third eye! benchmarking privacy awareness in mllm-powered smartphone agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2508.19493 (2025)."},{"key":"e_1_3_3_2_63_2","unstructured":"Guangyi Liu Pengxiang Zhao Liang Liu Zhiming Chen Yuxiang Chai Shuai Ren Hao Wang Shibo He and Wenchao Meng. 2025. Learnact: Few-shot mobile gui agent with a unified demonstration benchmark. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.13805 (2025)."},{"key":"e_1_3_3_2_64_2","unstructured":"Zikang Liu Junyi Li Wayne\u00a0Xin Zhao Dawei Gao Yaliang Li and Ji-rong Wen. 2025. PAL-UI: Planning with Active Look-back for Vision-Based GUI Agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.00413 (2025)."},{"key":"e_1_3_3_2_65_2","unstructured":"Xing\u00a0Han L\u00f9 Gaurav Kamath Marius Mosbach and Siva Reddy. 2025. Build the web for agents not agents for the web. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2506.10953 (2025)."},{"key":"e_1_3_3_2_66_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445467"},{"key":"e_1_3_3_2_67_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713540"},{"key":"e_1_3_3_2_68_2","first-page":"159","volume-title":"Twelfth Symposium on Usable Privacy and Security (SOUPS 2016)","author":"Marques Diogo","year":"2016","unstructured":"Diogo Marques, Ildar Muslukhov, Tiago Guerreiro, Lu\u00eds Carri\u00e7o, and Konstantin Beznosov. 2016. Snooping on mobile phones: Prevalence and trends. In Twelfth Symposium on Usable Privacy and Security (SOUPS 2016). 159\u2013174."},{"key":"e_1_3_3_2_69_2","doi-asserted-by":"crossref","unstructured":"Nora McDonald Sarita Schoenebeck and Andrea Forte. 2019. Reliability and inter-rater reliability in qualitative research: Norms and guidelines for CSCW and HCI practice. Proceedings of the ACM on human-computer interaction 3 CSCW (2019) 1\u201323.","DOI":"10.1145\/3359174"},{"key":"e_1_3_3_2_70_2","doi-asserted-by":"crossref","unstructured":"Siddharth Mehrotra Carolina\u00a0Centeio Jorge Catholijn\u00a0M Jonker and Myrthe\u00a0L Tielman. 2024. Integrity-based explanations for fostering appropriate trust in AI agents. ACM Transactions on Interactive Intelligent Systems 14 1 (2024) 1\u201336.","DOI":"10.1145\/3610578"},{"key":"e_1_3_3_2_71_2","doi-asserted-by":"publisher","DOI":"10.1145\/2493190.2493223"},{"key":"e_1_3_3_2_72_2","unstructured":"Dang Nguyen Jian Chen Yu Wang Gang Wu Namyong Park Zhengmian Hu Hanjia Lyu Junda Wu Ryan Aponte Yu Xia et\u00a0al. 2024. Gui agents: A survey. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.13501 (2024)."},{"key":"e_1_3_3_2_73_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-acl.1158"},{"key":"e_1_3_3_2_74_2","doi-asserted-by":"publisher","DOI":"10.1145\/3711896.3736555"},{"key":"e_1_3_3_2_75_2","doi-asserted-by":"crossref","unstructured":"Michelle O\u2019Reilly and Nikki Kiyimba. 2015. Advanced qualitative research: A guide to using theory. (2015).","DOI":"10.4135\/9781529622782"},{"key":"e_1_3_3_2_76_2","volume-title":"The mobile phone-A medium in itself","author":"Oksman Virpi","year":"2010","unstructured":"Virpi Oksman. 2010. The mobile phone-A medium in itself. VTT."},{"key":"e_1_3_3_2_77_2","unstructured":"OpenAI. 2024. Introducing ChatGPT Agents. https:\/\/openai.com\/index\/introducing-chatgpt-agent\/. Accessed: 2025-01-29."},{"key":"e_1_3_3_2_78_2","unstructured":"OpenAI. 2025. Introducing Operator. https:\/\/openai.com\/index\/introducing-operator\/ Accessed: 2025-02-19."},{"key":"e_1_3_3_2_79_2","doi-asserted-by":"crossref","unstructured":"Michelle O\u2019Reilly Nikki Kiyimba and Alison Drewett. 2021. Mixing qualitative methods versus methodologies: A critical reflection on communication and power in inpatient care. Counselling and psychotherapy research 21 1 (2021) 66\u201376.","DOI":"10.1002\/capr.12365"},{"key":"e_1_3_3_2_80_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-acl.326"},{"key":"e_1_3_3_2_81_2","doi-asserted-by":"publisher","DOI":"10.5555\/3692070.3693659"},{"key":"e_1_3_3_2_82_2","unstructured":"Ayush Pandey Jai Bardhan Ishita Jain Ramya\u00a0S Hebbalaguppe Rohan\u00a0Raju Dhanakshirur and Lovekesh Vig. 2025. Refine and Align: Confidence Calibration through Multi-Agent Interaction in VQA. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2511.11169 (2025)."},{"key":"e_1_3_3_2_83_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713726"},{"key":"e_1_3_3_2_84_2","volume-title":"The Thirty-ninth Annual Conference on Neural Information Processing Systems","author":"Papoudakis Georgios","year":"2025","unstructured":"Georgios Papoudakis, Thomas Coste, Jun Wang, Kun Shao, et\u00a0al. 2025. Succeed or Learn Slowly: Sample Efficient Off-Policy Reinforcement Learning for Mobile App Control. In The Thirty-ninth Annual Conference on Neural Information Processing Systems."},{"key":"e_1_3_3_2_85_2","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606763"},{"key":"e_1_3_3_2_86_2","doi-asserted-by":"crossref","unstructured":"Samir Passi. 2025. Agentic AI has a Human Oversight Problem. Available at SSRN 5529058 (2025).","DOI":"10.2139\/ssrn.5529058"},{"key":"e_1_3_3_2_87_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-89424-4_15"},{"key":"e_1_3_3_2_88_2","doi-asserted-by":"crossref","unstructured":"Nicholas Proferes Naiyan Jones Sarah Gilbert Casey Fiesler and Michael Zimmer. 2021. Studying reddit: A systematic overview of disciplines approaches methods and ethics. Social Media+ Society 7 2 (2021) 20563051211019004.","DOI":"10.1177\/20563051211019004"},{"key":"e_1_3_3_2_89_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.810"},{"key":"e_1_3_3_2_90_2","doi-asserted-by":"publisher","unstructured":"Cheng Qian Zuxin Liu Akshara Prabhakar Zhiwei Liu Jianguo Zhang Haolin Chen Heng Ji Weiran Yao Shelby Heinecke Silvio Savarese Caiming Xiong and Huan Wang. 2025. UserBench: An Interactive Gym Environment for User-Centric Agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2507.22034 (2025). 
10.48550\/arXiv.2507.22034","DOI":"10.48550\/arXiv.2507.22034"},{"key":"e_1_3_3_2_91_2","doi-asserted-by":"publisher","unstructured":"Subhey\u00a0Sadi Rahman Md.\u00a0Adnanul Islam Md.\u00a0Mahbub Alam Musarrat Zeba Md.\u00a0Abdur Rahman Sadia\u00a0Sultana Chowa Mohaimenul Azam\u00a0Khan Raiaan and Sami Azam. 2025. Hallucination to Truth: A Review of Fact-Checking and Factuality Evaluation in Large Language Models. (2025). 10.48550\/arXiv.2508.03860arXiv:https:\/\/arXiv.org\/abs\/2508.03860.","DOI":"10.48550\/arXiv.2508.03860"},{"key":"e_1_3_3_2_92_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Rawles Christopher","year":"2024","unstructured":"Christopher Rawles, Sarah Clinckemaillie, Yifan Chang, Jonathan Waltz, Gabrielle Lau, Marybeth Fair, Alice Li, William\u00a0E Bishop, Wei Li, Folawiyo Campbell-Ajala, et\u00a0al. 2024. AndroidWorld: A Dynamic Benchmarking Environment for Autonomous Agents. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_93_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Rawles Christopher","year":"2024","unstructured":"Christopher Rawles, Sarah Clinckemaillie, Yifan Chang, Jonathan Waltz, Gabrielle Lau, Marybeth Fair, Alice Li, William\u00a0E Bishop, Wei Li, Folawiyo Campbell-Ajala, et\u00a0al. 2024. AndroidWorld: A Dynamic Benchmarking Environment for Autonomous Agents. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_94_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-77772-2_7"},{"key":"e_1_3_3_2_95_2","doi-asserted-by":"publisher","unstructured":"Zeyu Rong Tianxi Ji Jiazhao Zhang Tong Qu Jingling Li and Qiang Ma. 2025. RecAgent: Uncertainty-Aware GUI Agent. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2508.04025 (2025). 
10.48550\/arXiv.2508.04025","DOI":"10.48550\/arXiv.2508.04025"},{"key":"e_1_3_3_2_96_2","unstructured":"Yangjun Ruan Honghua Dong Andrew Wang Silviu Pitis Yongchao Zhou Jimmy Ba Yann Dubois Chris\u00a0J Maddison and Tatsunori Hashimoto. 2023. Identifying the risks of lm agents with an lm-emulated sandbox. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2309.15817 (2023)."},{"key":"e_1_3_3_2_97_2","first-page":"2421","volume-title":"34th USENIX Security Symposium (USENIX Security 25)","author":"Russinovich Mark","year":"2025","unstructured":"Mark Russinovich, Ahmed Salem, and Ronen Eldan. 2025. Great, now write an article about that: The crescendo Multi-Turn LLM jailbreak attack. In 34th USENIX Security Symposium (USENIX Security 25). 2421\u20132440."},{"key":"e_1_3_3_2_98_2","unstructured":"Huawen Shen Chang Liu Gengluo Li Xinlong Wang Yu Zhou Can Ma and Xiangyang Ji. 2024. Falcon-ui: Understanding gui before following user instructions. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.09362 (2024)."},{"key":"e_1_3_3_2_99_2","unstructured":"Yucheng Shi Wenhao Yu Wenlin Yao Wenhu Chen and Ninghao Liu. 2025. Towards trustworthy gui agents: A survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.23434 (2025)."},{"key":"e_1_3_3_2_100_2","doi-asserted-by":"crossref","unstructured":"Ben Shneiderman. 2002. Promoting universal usability with multi-layer interface design. ACM SIGCAPH computers and the physically handicapped 73-74 (2002) 1\u20138.","DOI":"10.1145\/960201.957206"},{"key":"e_1_3_3_2_101_2","unstructured":"Junhao Su Yuanliang Wan Junwei Yang Hengyu Shi Tianyang Han Junfeng Luo and Yurui Qiu. 2025. Failure Makes the Agent Stronger: Enhancing Accuracy through Structured Reflection for Reliable Tool Interactions. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2509.18847 (2025)."},{"key":"e_1_3_3_2_102_2","unstructured":"Qiushi Sun Mukai Li Zhoumianze Liu Zhihui Xie Fangzhi Xu Zhangyue Yin Kanzhi Cheng Zehao Li Zichen Ding Qi Liu et\u00a0al. 2025. 
OS-Sentinel: Towards Safety-Enhanced Mobile GUI Agents via Hybrid Validation in Realistic Workflows. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.24411 (2025)."},{"key":"e_1_3_3_2_103_2","unstructured":"Xiangru Tang Qiao Jin Kunlun Zhu Tongxin Yuan Yichi Zhang Wangchunshu Zhou Meng Qu Yilun Zhao Jian Tang Zhuosheng Zhang et\u00a0al. 2024. Prioritizing safeguarding over autonomy: Risks of llm agents for science. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.04247 (2024)."},{"key":"e_1_3_3_2_104_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-emnlp.1268"},{"key":"e_1_3_3_2_105_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300542"},{"key":"e_1_3_3_2_106_2","doi-asserted-by":"publisher","DOI":"10.1145\/3462204.3481724"},{"key":"e_1_3_3_2_107_2","unstructured":"Shuai Wang Weiwen Liu Jingxuan Chen Yuqi Zhou Weinan Gan Xingshan Zeng Yuhan Che Shuai Yu Xinlong Hao Kun Shao et\u00a0al. 2024. Gui agents with foundation models: A comprehensive survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2411.04890 (2024)."},{"key":"e_1_3_3_2_108_2","doi-asserted-by":"crossref","unstructured":"Alexander Wei Nika Haghtalab and Jacob Steinhardt. 2023. Jailbroken: How does llm safety training fail? Advances in Neural Information Processing Systems 36 (2023) 80079\u201380110.","DOI":"10.52202\/075280-3508"},{"key":"e_1_3_3_2_109_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Williams Marcus","year":"2025","unstructured":"Marcus Williams, Micah Carroll, Adhyyan Narang, Constantin Weisser, Brendan Murphy, and Anca Dragan. 2025. On Targeted Manipulation and Deception when Optimizing LLMs for User Feedback. 
In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_2_110_2","doi-asserted-by":"publisher","DOI":"10.14722\/ndss.2025.241131"},{"key":"e_1_3_3_2_111_2","unstructured":"Zhe Wu Hongjin Lu Junliang Xing Changhao Zhang Yin Zhu Yuhao Yang Yuheng Jing Kai Li Kun Shao Jianye Hao et\u00a0al. 2025. Hi-Agent: Hierarchical Vision-Language Agents for Mobile Device Control. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2510.14388 (2025)."},{"key":"e_1_3_3_2_112_2","unstructured":"Jiannan Xiang Yun Zhu Lei Shu Maria Wang Lijun Yu Gabriel Barcik James Lyon Srinivas Sunkara and Jindong Chen. 2025. UISim: An Interactive Image-Based UI Simulator for Dynamic Mobile Environments. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2509.21733 (2025)."},{"key":"e_1_3_3_2_113_2","doi-asserted-by":"publisher","unstructured":"Hongwei Xiao Yongqi Sun Zhenghao Duan Yunxiang Huo Jingze Liu Mingyu Luo Yanhui Li and Yingchao Zhang. 2024. A Study of Model Iterations of Fitts\u2019 Law and Its Application to Human\u2013Computer Interactions. Applied Sciences 14 16 (2024) 7386. 10.3390\/app14167386","DOI":"10.3390\/app14167386"},{"key":"e_1_3_3_2_114_2","unstructured":"Bin Xie Rui Shao Gongwei Chen Kaiwen Zhou Yinchuan Li Jie Liu Min Zhang and Liqiang Nie. 2025. Gui-explorer: Autonomous exploration and mining of transition-aware knowledge for gui agent. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2505.16827 (2025)."},{"key":"e_1_3_3_2_115_2","unstructured":"Tianci Xue Weijian Qi Tianneng Shi Chan\u00a0Hee Song Boyu Gou Dawn Song Huan Sun and Yu Su. 2025. An illusion of progress? assessing the current state of web agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.01382 (2025)."},{"key":"e_1_3_3_2_116_2","unstructured":"Jingyi Yang Shuai Shao Dongrui Liu and Jing Shao. 2025. RiOSWorld: Benchmarking the Risk of Multimodal Computer-Use Agents. 
arxiv:https:\/\/arXiv.org\/abs\/2506.00618\u00a0[cs.AI] https:\/\/arxiv.org\/abs\/2506.00618"},{"key":"e_1_3_3_2_117_2","unstructured":"Jingqi Yang Zhilong Song Jiawei Chen Mingli Song Sheng Zhou Xiaogang Ouyang Chun Chen Can Wang et\u00a0al. 2025. GUI-Robust: A Comprehensive Dataset for Testing GUI Agent Robustness in Real-World Anomalies. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2506.14477 (2025)."},{"key":"e_1_3_3_2_118_2","unstructured":"Pei Yang Hai Ci and Mike\u00a0Zheng Shou. 2025. macOSWorld: A Multilingual Interactive Benchmark for GUI Agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2506.04135 (2025)."},{"key":"e_1_3_3_2_119_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713493"},{"key":"e_1_3_3_2_120_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.505"},{"key":"e_1_3_3_2_121_2","unstructured":"Chaoyun Zhang Shilin He Liqun Li Si Qin Yu Kang Qingwei Lin Saravan Rajmohan and Dongmei Zhang. 2025. Api agents vs. gui agents: Divergence and convergence. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2503.11069 (2025)."},{"key":"e_1_3_3_2_122_2","unstructured":"Chaoyun Zhang Shilin He Jiaxu Qian Bowen Li Liqun Li Si Qin Yu Kang Minghua Ma Guyue Liu Qingwei Lin et\u00a0al. 2024. Large language model-brained gui agents: A survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2411.18279 (2024)."},{"key":"e_1_3_3_2_123_2","unstructured":"Chi Zhang Zhao Yang Jiaxuan Liu Yucheng Han Xin Chen Zebiao Huang Bin Fu and Gang Yu. 2023. AppAgent: Multimodal Agents as Smartphone Users. arxiv:https:\/\/arXiv.org\/abs\/2312.13771\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2312.13771"},{"key":"e_1_3_3_2_124_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713600"},{"key":"e_1_3_3_2_125_2","unstructured":"Kaiyuan Zhang Zian Su Pin-Yu Chen Elisa Bertino Xiangyu Zhang and Ninghui Li. 2025. LLM Agents Should Employ Security Principles. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2505.24019 (2025)."},{"key":"e_1_3_3_2_126_2","doi-asserted-by":"publisher","DOI":"10.1145\/3584931.3607008"},{"key":"e_1_3_3_2_127_2","unstructured":"Muru Zhang Ofir Press William Merrill Alisa Liu and Noah\u00a0A Smith. 2023. How language model hallucinations can snowball. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2305.13534 (2023)."},{"key":"e_1_3_3_2_128_2","doi-asserted-by":"publisher","DOI":"10.1145\/3733816.3760752"},{"key":"e_1_3_3_2_129_2","doi-asserted-by":"crossref","unstructured":"Shuning Zhang Hui Wang and Xin Yi. 2025. Exploring collaboration patterns and strategies in human-ai co-creation through the lens of agency: A scoping review of the top-tier hci literature. Proceedings of the ACM on Human-Computer Interaction 9 7 (2025) 1\u201343.","DOI":"10.1145\/3757594"},{"key":"e_1_3_3_2_130_2","unstructured":"Shuning Zhang Lyumanshan Ye Xin Yi Jingyu Tang Bo Shui Haobin Xing Pengfei Liu and Hewu Li. 2024. \" Ghost of the past\": identifying and resolving privacy leakage from LLM\u2019s memory through proactive user interaction. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.14931 (2024)."},{"key":"e_1_3_3_2_131_2","doi-asserted-by":"publisher","DOI":"10.1145\/3706598.3713928"},{"key":"e_1_3_3_2_132_2","unstructured":"Shuning Zhang Xin Yi Haobin Xing Lyumanshan Ye Yongquan Hu and Hewu Li. 2024. Adanonymizer: Interactively Navigating and Balancing the Duality of Privacy and Output Performance in Human-LLM Interaction. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.15044 (2024)."},{"key":"e_1_3_3_2_133_2","doi-asserted-by":"publisher","unstructured":"Wan Zhang and Jing Zhang. 2025. Hallucination Mitigation for Retrieval-Augmented Large Language Models: A Review. Mathematics 13 5 (2025) 856. 
10.3390\/math13050856","DOI":"10.3390\/math13050856"},{"key":"e_1_3_3_2_134_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.636"},{"key":"e_1_3_3_2_135_2","doi-asserted-by":"publisher","DOI":"10.1145\/3351095.3372852"},{"key":"e_1_3_3_2_136_2","unstructured":"Zeyu Zhang Xiaohe Bo Chen Ma Rui Li Xu Chen Quanyu Dai Jieming Zhu Zhenhua Dong and Ji-Rong Wen. 2024. A survey on the memory mechanism of large language model based agents. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.13501 (2024)."},{"key":"e_1_3_3_2_137_2","unstructured":"Zhisong Zhang Tianqing Fang Kaixin Ma Wenhao Yu Hongming Zhang Haitao Mi and Dong Yu. 2025. Enhancing web agents with explicit rollback mechanisms. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.11788 (2025)."},{"key":"e_1_3_3_2_138_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642385"},{"key":"e_1_3_3_2_139_2","doi-asserted-by":"publisher","DOI":"10.1145\/3708359.3712153"},{"key":"e_1_3_3_2_140_2","unstructured":"Kangjia Zhao Jiahui Song Leigang Sha Haozhan Shen Zhi Chen Tiancheng Zhao Xiubo Liang and Jianwei Yin. 2024. Gui testing arena: A unified benchmark for advancing autonomous gui testing agent. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.18426 (2024)."},{"key":"e_1_3_3_2_141_2","first-page":"61349","volume-title":"International Conference on Machine Learning","author":"Zheng Boyuan","year":"2024","unstructured":"Boyuan Zheng, Boyu Gou, Jihyung Kil, Huan Sun, and Yu Su. 2024. GPT-4V (ision) is a Generalist Web Agent, if Grounded. In International Conference on Machine Learning. PMLR, 61349\u201361385."},{"key":"e_1_3_3_2_142_2","unstructured":"Shuyan Zhou Frank\u00a0F Xu Hao Zhu Xuhui Zhou Robert Lo Abishek Sridhar Xianyi Cheng Tianyue Ou Yonatan Bisk Daniel Fried et\u00a0al. 2023. Webarena: A realistic web environment for building autonomous agents. 
arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2307.13854 (2023)."},{"key":"e_1_3_3_2_143_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-naacl.205"}],"event":{"name":"CHI 2026: CHI Conference on Human Factors in Computing Systems","location":"Barcelona Spain","acronym":"CHI '26","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3772318.3790696","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,17]],"date-time":"2026-04-17T09:01:24Z","timestamp":1776416484000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3772318.3790696"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4,13]]},"references-count":142,"alternative-id":["10.1145\/3772318.3790696","10.1145\/3772318"],"URL":"https:\/\/doi.org\/10.1145\/3772318.3790696","relation":{},"subject":[],"published":{"date-parts":[[2026,4,13]]},"assertion":[{"value":"2026-04-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}