{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T15:07:30Z","timestamp":1774883250030,"version":"3.50.1"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T00:00:00Z","timestamp":1770940800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T00:00:00Z","timestamp":1770940800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100007052","name":"Universit\u00e0 degli Studi di Verona","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100007052","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Empir Software Eng"],"published-print":{"date-parts":[[2026,5]]},"DOI":"10.1007\/s10664-026-10816-4","type":"journal-article","created":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T07:52:18Z","timestamp":1770969138000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["VLM-Fuzz: Vision language model assisted recursive depth-first search exploration for effective GUI testing of android apps"],"prefix":"10.1007","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5369-5235","authenticated-orcid":false,"given":"Biniam Fisseha","family":"Demissie","sequence":"first","affiliation":[]},{"given":"Yan Naing","family":"Tun","sequence":"additional","affiliation":[]},{"given":"Lwin Khin","family":"Shar","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7325-0316","authenticated-orcid":false,"given":"Mariano","family":"Ceccato","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,13]]},"reference":[{"key":"10816_CR1","doi-asserted-by":"crossref","unstructured":"Amalfitano D, Fasolino AR, Tramontana P, De\u00a0Carmine S, Memon AM (2012) Using gui ripping for automated testing of android applications. In Proceedings of the 27th IEEE\/ACM International Conference on Automated Software Engineering, pages 258\u2013261","DOI":"10.1145\/2351676.2351717"},{"issue":"5","key":"10816_CR2","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1109\/MS.2014.55","volume":"32","author":"D Amalfitano","year":"2014","unstructured":"Amalfitano D, Fasolino AR, Tramontana P, Ta BD, Memon AM (2014) Mobiguitar: Automated model-based testing of mobile apps. IEEE Softw 32(5):53\u201359","journal-title":"IEEE Softw"},{"key":"10816_CR3","doi-asserted-by":"crossref","unstructured":"Anand S, Naik M, Harrold MJ, Yang H (2012) Automated concolic testing of smartphone apps. In Proceedings of the ACM SIGSOFT 20th International Symposium on the Foundations of Software Engineering, pages 1\u201311","DOI":"10.1145\/2393596.2393666"},{"key":"10816_CR4","unstructured":"Android (2024a) Android uiautomator. https:\/\/developer.android.com\/training\/testing\/other-components\/ui-automator##ui-automator"},{"key":"10816_CR5","unstructured":"Android (2024b) Ui\/application exerciser monkey. https:\/\/developer.android.com\/studio\/test\/other-testing-tools\/monkey"},{"key":"10816_CR6","doi-asserted-by":"crossref","unstructured":"Azim T, Neamtiu I (2013) Targeted and depth-first exploration for systematic testing of android apps. In: Proceedings of the 2013 ACM SIGPLAN international conference on Object oriented programming systems languages & applications, pages 641\u2013660","DOI":"10.1145\/2509136.2509549"},{"issue":"9","key":"10816_CR7","first-page":"4248","volume":"12","author":"K Choi","year":"2018","unstructured":"Choi K, Ko M, Chang B-M (2018) A practical intent fuzzing tool for robustness of inter-component communication in android apps. KSII Transactions on Internet & Information Systems 12(9):4248\u20134270","journal-title":"KSII Transactions on Internet & Information Systems"},{"issue":"10","key":"10816_CR8","doi-asserted-by":"publisher","first-page":"623","DOI":"10.1145\/2544173.2509552","volume":"48","author":"W Choi","year":"2013","unstructured":"Choi W, Necula G, Sen K (2013) Guided gui testing of android apps with minimal restart and approximate learning. Acm Sigplan Notices 48(10):623\u2013640","journal-title":"Acm Sigplan Notices"},{"key":"10816_CR9","doi-asserted-by":"crossref","unstructured":"Choudhary SR, Gorla A, Orso A (2015) Automated test input generation for android: Are we there yet?(e). In: 2015 30th IEEE\/ACM International Conference on Automated Software Engineering (ASE), pages 429\u2013440. IEEE","DOI":"10.1109\/ASE.2015.89"},{"issue":"4","key":"10816_CR10","doi-asserted-by":"publisher","first-page":"2438","DOI":"10.1007\/s10664-019-09701-0","volume":"24","author":"L Cruz","year":"2019","unstructured":"Cruz L, Abreu R, Lo D (2019) To the attention of mobile software developers: guess what, test your app! Empir Softw Eng 24(4):2438\u20132468","journal-title":"Empir Softw Eng"},{"issue":"6","key":"10816_CR11","doi-asserted-by":"publisher","first-page":"5084","DOI":"10.1007\/s10664-020-09879-8","volume":"25","author":"BF Demissie","year":"2020","unstructured":"Demissie BF, Ceccato M, Shar LK (2020) Security analysis of permission re-delegation vulnerabilities in android apps. Empir Softw Eng 25(6):5084\u20135136","journal-title":"Empir Softw Eng"},{"key":"10816_CR12","doi-asserted-by":"crossref","unstructured":"Dong Z, B\u00f6hme M, Cojocaru L, Roychoudhury A (2020) Time-travel testing of android apps. In: Proceedings of the ACM\/IEEE 42nd International Conference on Software Engineering, pages 481\u2013492","DOI":"10.1145\/3377811.3380402"},{"key":"10816_CR13","doi-asserted-by":"crossref","unstructured":"Du X, Liu M, Wang K, Wang H, Liu J, Chen Y, Feng J, Sha C, Peng X, Lou Y (2024) Evaluating large language models in class-level code generation. In: Proceedings of the IEEE\/ACM 46th International Conference on Software Engineering, pages 1\u201313","DOI":"10.1145\/3597503.3639219"},{"key":"10816_CR14","doi-asserted-by":"crossref","unstructured":"Feng S, Chen C (2024) Prompting is all you need: Automated android bug replay with large language models. In: Proceedings of the IEEE\/ACM 46th International Conference on Software Engineering, ICSE \u201924, New York, NY, USA. Association for Computing Machinery","DOI":"10.1145\/3597503.3608137"},{"key":"10816_CR15","unstructured":"Google (2025) Espresso. https:\/\/developer.android.com\/training\/testing\/espresso"},{"key":"10816_CR16","doi-asserted-by":"crossref","unstructured":"Gu T, Sun C, Ma X, Cao C, Xu C, Yao Y, Zhang Q, Lu J, Su Z (2019) Practical gui testing of android applications via model abstraction and refinement. In: 2019 IEEE\/ACM 41st International Conference on Software Engineering (ICSE), pages 269\u2013280. IEEE","DOI":"10.1109\/ICSE.2019.00042"},{"key":"10816_CR17","doi-asserted-by":"crossref","unstructured":"Hao S, Liu B, Nath S, Halfond WGJ, Govindan R (2014) Puma: Programmable ui-automation for large-scale dynamic analysis of mobile apps. In: Proceedings of the 12th annual international conference on Mobile systems, applications, and services, pages 204\u2013217","DOI":"10.1145\/2594368.2594390"},{"key":"10816_CR18","unstructured":"Hugging Face (2024) Wildvision arena : Benchmarking multimodal llms in the wild. https:\/\/huggingface.co\/spaces\/WildVision\/vision-arena"},{"key":"10816_CR19","doi-asserted-by":"crossref","unstructured":"Kochhar PS, Thung F, Nagappan N, Zimmermann T, Lo D (2015) Understanding the test automation culture of app developers. In 2015 IEEE 8th International Conference on Software Testing, Verification and Validation (ICST), pages 1\u201310. IEEE","DOI":"10.1109\/ICST.2015.7102609"},{"issue":"1","key":"10816_CR20","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1109\/TR.2018.2865733","volume":"68","author":"P Kong","year":"2018","unstructured":"Kong P, Li L, Gao J, Liu K, Bissyand\u00e9 TF, Klein J (2018) Automated testing of android apps: A systematic literature review. IEEE Trans Reliab 68(1):45\u201366","journal-title":"IEEE Trans Reliab"},{"key":"10816_CR21","doi-asserted-by":"crossref","unstructured":"Lai D, Rubin J (2019) Goal-driven exploration for android applications. In: 2019 34th IEEE\/ACM International Conference on Automated Software Engineering (ASE), pages 115\u2013127. IEEE","DOI":"10.1109\/ASE.2019.00021"},{"key":"10816_CR22","doi-asserted-by":"crossref","unstructured":"Li Y, Yang Z, Guo Y, Chen X (2017) Droidbot: a lightweight ui-guided test input generator for android. In 2017 IEEE\/ACM 39th International Conference on Software Engineering Companion (ICSE-C), pages 23\u201326. IEEE","DOI":"10.1109\/ICSE-C.2017.8"},{"key":"10816_CR23","doi-asserted-by":"crossref","unstructured":"Li Y, Yang Z, Guo Y, Chen X (2019) Humanoid: A deep learning-based approach to automated black-box android app testing. In: 2019 34th IEEE\/ACM International Conference on Automated Software Engineering (ASE), pages 1070\u20131073. IEEE","DOI":"10.1109\/ASE.2019.00104"},{"key":"10816_CR24","doi-asserted-by":"crossref","unstructured":"Liu Z, Chen C, Wang J, Chen M, Wu B, Che X, Wang D, Wang Q (2024) Make llm a testing expert: Bringing human-like interaction to mobile gui testing via functionality-aware decisions. In: Proceedings of the IEEE\/ACM 46th International Conference on Software Engineering, pages 1\u201313","DOI":"10.1145\/3597503.3639180"},{"key":"10816_CR25","unstructured":"Liu Z, Li C, Chen C, Wang J, Wu B, Wang Y, Hu J, Wang Q (2024) Vision-driven automated mobile gui testing via multimodal large language model. arXiv:2407.03037"},{"key":"10816_CR26","doi-asserted-by":"crossref","unstructured":"Machiry A, Tahiliani R, Naik M (2013) Dynodroid: An input generation system for android apps. In: Proceedings of the 2013 9th Joint Meeting on Foundations of Software Engineering, pages 224\u2013234","DOI":"10.1145\/2491411.2491450"},{"key":"10816_CR27","doi-asserted-by":"crossref","unstructured":"Mahmood R, Mirzaei N, Malek S (2014) Evodroid: Segmented evolutionary testing of android apps. In: Proceedings of the 22nd ACM SIGSOFT International Symposium on Foundations of Software Engineering, pages 599\u2013609","DOI":"10.1145\/2635868.2635896"},{"key":"10816_CR28","doi-asserted-by":"crossref","unstructured":"Mao K, Harman M, Jia Y (2016) Sapienz: Multi-objective automated testing for android applications. In: Proceedings of the 25th international symposium on software testing and analysis, pages 94\u2013105","DOI":"10.1145\/2931037.2931054"},{"key":"10816_CR29","doi-asserted-by":"crossref","unstructured":"Moran K, Linares-V\u00e1squez M, Bernal-C\u00e1rdenas C, Vendome C, Poshyvanyk D (2017) Crashscope: A practical tool for automated testing of android applications. In: 2017 IEEE\/ACM 39th International Conference on Software Engineering Companion (ICSE-C), pages 15\u201318. IEEE","DOI":"10.1109\/ICSE-C.2017.16"},{"key":"10816_CR30","unstructured":"OpenAI (2024) Gpt-4-vision. https:\/\/help.openai.com\/en\/articles\/8555496-gpt-4-vision-api"},{"key":"10816_CR31","doi-asserted-by":"crossref","unstructured":"Pan M,\u00a0Huang A, Wang G, Zhang T, Li X (2020) Reinforcement learning based curiosity-driven testing of android applications. In: Proceedings of the 29th ACM SIGSOFT International Symposium on Software Testing and Analysis, pages 153\u2013164","DOI":"10.1145\/3395363.3397354"},{"key":"10816_CR32","doi-asserted-by":"crossref","unstructured":"Peng C, Zhang Z, Lv Z, Yang P (2022) Mubot: Learning to test large-scale commercial android apps like a human. In: 2022 IEEE International Conference on Software Maintenance and Evolution (ICSME), pages 543\u2013552. IEEE","DOI":"10.1109\/ICSME55016.2022.00074"},{"issue":"4","key":"10816_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3502868","volume":"31","author":"A Romdhana","year":"2022","unstructured":"Romdhana A, Merlo A, Ceccato M, Tonella P (2022) Deep reinforcement learning for black-box testing of android apps. ACM Transactions on Software Engineering and Methodology (TOSEM) 31(4):1\u201329","journal-title":"ACM Transactions on Software Engineering and Methodology (TOSEM)"},{"key":"10816_CR34","unstructured":"Rubtsov V (2006) Emma: Java code coverage tool"},{"key":"10816_CR35","doi-asserted-by":"crossref","unstructured":"Ryan G, Jain S, Shang M, Wang S, Ma X, Ramanathan MK, Ray B (2024) Code-aware prompting: A study of coverage-guided test generation in regression setting using llm. Proceedings of the ACM on Software Engineering, 1(FSE):951\u2013971","DOI":"10.1145\/3643769"},{"key":"10816_CR36","doi-asserted-by":"crossref","unstructured":"Sasnauskas R, Regehr J (2014) Intent fuzzer: crafting intents of death. In Proceedings of the 2014 Joint International Workshop on Dynamic Analysis (WODA) and Software and System Performance Testing, Debugging, and Analytics (PERTEA), pages 1\u20135","DOI":"10.1145\/2632168.2632169"},{"key":"10816_CR37","doi-asserted-by":"crossref","unstructured":"Su T, Meng G, Chen Y,\u00a0Wu K, Yang W, Yao Y, Pu G, Liu Y, Su Z (2017) Guided, stochastic model-based gui testing of android apps. In: Proceedings of the 2017 11th Joint Meeting on Foundations of Software Engineering, pages 245\u2013256","DOI":"10.1145\/3106237.3106298"},{"key":"10816_CR38","doi-asserted-by":"crossref","unstructured":"Su T, Wang J, Su Z (2021) Benchmarking automated gui testing for android against real-world bugs. In: Proceedings of the 29th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering, ESEC\/FSE 2021, page 119\u2013130, New York, NY, USA. Association for Computing Machinery","DOI":"10.1145\/3468264.3468620"},{"key":"10816_CR39","unstructured":"VLM-Fuzz (2025) Replication package of vlm-fuzz. https:\/\/bit.ly\/VLM-Fuzz"},{"key":"10816_CR40","doi-asserted-by":"crossref","unstructured":"Yang W, Prasad MR, Xie T (2013) A grey-box approach for automated gui-model generation of mobile applications. In: International Conference on Fundamental Approaches to Software Engineering, pages 250\u2013265. Springer","DOI":"10.1007\/978-3-642-37057-1_19"},{"key":"10816_CR41","doi-asserted-by":"crossref","unstructured":"YazdaniBanafsheDaragh F, Malek S (2021) Deep gui: Black-box gui input generation with deep learning. In: 2021 36th IEEE\/ACM International Conference on Automated Software Engineering (ASE), pages 905\u2013916. IEEE","DOI":"10.1109\/ASE51524.2021.9678778"},{"key":"10816_CR42","doi-asserted-by":"crossref","unstructured":"Ye H, Cheng S, Zhang L, Jiang F (2013) Droidfuzzer: Fuzzing the android apps with intent-filter tag. In: Proceedings of International Conference on Advances in Mobile Computing & Multimedia, pages 68\u201374","DOI":"10.1145\/2536853.2536881"},{"key":"10816_CR43","unstructured":"Zhang C, Yang Z, Liu J, Han Y, Chen X, Huang Z, Fu B, Yu G (2023) Appagent: Multimodal agents as smartphone users. arXiv:2312.13771"}],"container-title":["Empirical Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-026-10816-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10664-026-10816-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-026-10816-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T14:35:19Z","timestamp":1774881319000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10664-026-10816-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,13]]},"references-count":43,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2026,5]]}},"alternative-id":["10816"],"URL":"https:\/\/doi.org\/10.1007\/s10664-026-10816-4","relation":{},"ISSN":["1382-3256","1573-7616"],"issn-type":[{"value":"1382-3256","type":"print"},{"value":"1573-7616","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,13]]},"assertion":[{"value":"6 March 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The empirical evaluation presented in this submission is not subject to ethical approval in the organizations where the authors work.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed consent"}},{"value":"The authors of this submission certify that they have NO affiliations with or involvement in any organization or entity with any financial interest (such as honoraria; educational grants; participation in speakers\u2019 bureaus; membership, employment, consultancies, stock ownership, or other equity interest; and expert testimony or patent-licensing arrangements), or non-financial interest (such as personal or professional relationships, affiliations, knowledge or beliefs) in the subject matter or materials discussed in this manuscript.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}},{"value":"Clinical trial number: not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Clinical Trial Number"}}],"article-number":"76"}}