{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T14:34:50Z","timestamp":1776090890784,"version":"3.50.1"},"publisher-location":"Cham","reference-count":52,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032050045","type":"print"},{"value":"9783032050052","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-05005-2_20","type":"book-chapter","created":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T04:41:02Z","timestamp":1757306462000},"page":"381-402","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Can GPT-4o Evaluate Usability Like Human Experts? A Comparative Study on\u00a0Issue Identification in\u00a0Heuristic Evaluation"],"prefix":"10.1007","author":[{"given":"Guilherme","family":"Guerino","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luiz","family":"Rodrigues","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bruna","family":"Capeleti","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rafael Ferreira","family":"Mello","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andr\u00e9","family":"Freire","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luciana","family":"Zaina","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,9,9]]},"reference":[{"key":"20_CR1","doi-asserted-by":"crossref","unstructured":"Alkaissi, H., McFarlane, S.I.: Artificial hallucinations in ChatGPT: implications in scientific writing. Cureus 15(2) (2023)","DOI":"10.7759\/cureus.35179"},{"key":"20_CR2","doi-asserted-by":"crossref","unstructured":"Barambones, J., Moral, C., de\u00a0Antonio, A., Imbert, R., Mart\u00ednez, L., Villalba-Mora, E.: ChatGPT for learning HCI techniques: a case study on interviews for personas. IEEE Trans. Learn. Technol. (2024)","DOI":"10.1109\/TLT.2024.3386095"},{"key":"20_CR3","doi-asserted-by":"publisher","unstructured":"Brade, S., Wang, B., Sousa, M., Oore, S., Grossman, T.: Promptify: text-to-image generation through interactive prompt exploration with large language models. In: Proceedings of the 36th Annual ACM Symposium on User Interface Software and Technology, UIST \u201923, Association for Computing Machinery, New York, NY, USA (2023). https:\/\/doi.org\/10.1145\/3586183.3606725","DOI":"10.1145\/3586183.3606725"},{"key":"20_CR4","doi-asserted-by":"crossref","unstructured":"Braun, V., Clarke, V.: Thematic analysis. In: Encyclopedia of Quality of Life and Well-Being Research, pp. 7187\u20137193. Springer (2024)","DOI":"10.1007\/978-3-031-17299-1_3470"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"Capeleti, B.S.: Human-data interaction in geoprocessing applications: design recommendations from inspections, user evaluations and expert experiences. Master\u2019s thesis. Federal University of Lavras (2023)","DOI":"10.5753\/sbsi_estendido.2023.229402"},{"key":"20_CR6","doi-asserted-by":"publisher","unstructured":"Chang, Y., et al.: A survey on evaluation of large language models. ACM Trans. Intell. Syst. Technol. 15(3) (2024). https:\/\/doi.org\/10.1145\/3641289","DOI":"10.1145\/3641289"},{"key":"20_CR7","unstructured":"Chen, B., Zhang, Z., Langren\u00e9, N., Zhu, S.: Unleashing the potential of prompt engineering in large language models: a comprehensive review. arXiv preprint arXiv:2310.14735 (2023)"},{"key":"20_CR8","doi-asserted-by":"crossref","unstructured":"De\u00a0Paoli, S.: Can large language models emulate an inductive thematic analysis of semi-structured interviews? An exploration and provocation on the limits of the approach and the model. arXiv preprint arXiv:2305.13014 (2023)","DOI":"10.1177\/08944393231220483"},{"key":"20_CR9","doi-asserted-by":"publisher","unstructured":"Duan, P., Warner, J., Li, Y., Hartmann, B.: Generating automatic feedback on UI mockups with large language models. In: Proceedings of the 2024 CHI Conference on Human Factors in Computing Systems, CHI \u201924. Association for Computing Machinery, New York, NY, USA (2024). https:\/\/doi.org\/10.1145\/3613904.3642782","DOI":"10.1145\/3613904.3642782"},{"key":"20_CR10","first-page":"30","volume":"6","author":"ML Edwards","year":"2014","unstructured":"Edwards, M.L., Smith, B.C.: The effects of the neutral response option on the extremeness of participant responses. J. Undergraduate Sch. 6, 30 (2014)","journal-title":"J. Undergraduate Sch."},{"key":"20_CR11","doi-asserted-by":"publisher","unstructured":"Freitas, J.A.d., et al.: Sensation in gamification: a qualitative investigation of background music in gamified learning. J. Interact. Sys. 15(1), 810\u2013822 (2024). https:\/\/doi.org\/10.5753\/jis.2024.4501. https:\/\/journals-sol.sbc.org.br\/index.php\/jis\/article\/view\/4501","DOI":"10.5753\/jis.2024.4501"},{"key":"20_CR12","doi-asserted-by":"crossref","unstructured":"Giray, L.: Prompt engineering with ChatGPT: a guide for academic writers. Ann. Biomed. Eng., 1\u20135 (2023)","DOI":"10.1007\/s10439-023-03272-4"},{"key":"20_CR13","doi-asserted-by":"crossref","unstructured":"Girotra, K., Meincke, L., Terwiesch, C., Ulrich, K.T.: Ideas are dimes a dozen: large language models for idea generation in innovation. Available at SSRN 4526071 (2023)","DOI":"10.2139\/ssrn.4526071"},{"key":"20_CR14","doi-asserted-by":"publisher","unstructured":"Gorlewicz, J.L., et al.: Design guidelines and recommendations for multimodal, touchscreen-based graphics. ACM Trans. Access. Comput. 13(3) (2020). https:\/\/doi.org\/10.1145\/3403933","DOI":"10.1145\/3403933"},{"key":"20_CR15","doi-asserted-by":"crossref","unstructured":"H\u00e4m\u00e4l\u00e4inen, P., Tavast, M., Kunnari, A.: Evaluating large language models in generating synthetic HCI research data: a case study. In: Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems, pp. 1\u201319 (2023)","DOI":"10.1145\/3544548.3580688"},{"key":"20_CR16","unstructured":"ISO9241-11: Ergonomics of human-system interaction \u2014 part 11: usability: definitions and concepts (2018). https:\/\/www.iso.org\/obp\/ui\/#iso:std:iso:9241:-11:ed-2:v1:en"},{"issue":"12","key":"20_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3571730","volume":"55","author":"Z Ji","year":"2023","unstructured":"Ji, Z., et al.: Survey of hallucination in natural language generation. ACM Comput. Surv. 55(12), 1\u201338 (2023)","journal-title":"ACM Comput. Surv."},{"key":"20_CR18","doi-asserted-by":"publisher","unstructured":"Karmaker\u00a0Santu, S.K., Feng, D.: TELeR: a general taxonomy of LLM prompts for benchmarking complex tasks. In: Bouamor, H., Pino, J., Bali, K. (eds.) Findings of the Association for Computational Linguistics, EMNLP 2023, pp. 14197\u201314203. Association for Computational Linguistics, Singapore, December 2023. https:\/\/doi.org\/10.18653\/v1\/2023.findings-emnlp.946. https:\/\/aclanthology.org\/2023.findings-emnlp.946","DOI":"10.18653\/v1\/2023.findings-emnlp.946"},{"key":"20_CR19","doi-asserted-by":"publisher","unstructured":"Konopatzki, G.E., Valentim, N.C., Guerino, G.C.: A qualitative study and improvement on UX and usability evaluation questionnaire focused on multi-touch systems. In: Proceedings of the XXIII Brazilian Symposium on Software Quality, SBQS \u201924, pp. 362\u2013372. Association for Computing Machinery, New York, NY, USA (2024). https:\/\/doi.org\/10.1145\/3701625.3701674","DOI":"10.1145\/3701625.3701674"},{"key":"20_CR20","unstructured":"Lazar, J., Feng, J.H., Hochheiser, H.: Research Methods in Human-Computer Interaction. Morgan Kaufmann (2017)"},{"key":"20_CR21","unstructured":"Leiker, D., Finnigan, S., Gyllen, A.R., Cukurova, M.: Prototyping the use of large language models (LLMs) for adult learning content creation at scale. arXiv preprint arXiv:2306.01815 (2023)"},{"key":"20_CR22","unstructured":"Lewis, J., Sauro, J.: Does removing the neutral response option affect rating behavior? (2023). https:\/\/measuringu.com\/removing-the-neutral-response-option\/. Accessed 2 Feb 2025"},{"key":"20_CR23","unstructured":"Liu, Y., Sharma, P., Oswal, M.J., Xia, H., Huang, Y.: PersonaFlow: boosting research ideation with LLM-simulated expert personas. arXiv preprint arXiv:2409.12538 (2024)"},{"key":"20_CR24","doi-asserted-by":"crossref","unstructured":"Lu, Y., Zhang, C., Zhang, I., Li, T.J.J.: Bridging the gap between ux practitioners\u2019 work practices and ai-enabled design support tools. In: CHI Conference on Human Factors in Computing Systems Extended Abstracts, pp.\u00a01\u20137 (2022)","DOI":"10.1145\/3491101.3519809"},{"key":"20_CR25","doi-asserted-by":"crossref","unstructured":"McKnight, P.E., Najab, J.: Mann-Whitney U test. In: The Corsini Encyclopedia of Psychology, p.\u00a01 (2010)","DOI":"10.1002\/9780470479216.corpsy0524"},{"key":"20_CR26","doi-asserted-by":"crossref","unstructured":"Meinecke, A., Heidrich, D., Dworatzyk, K., Theis, S.: A comparative heuristic evaluation of Kadi4Mat through human evaluators and GPT-4. In: International Conference on Human-Computer Interaction, pp. 91\u2013108. Springer (2024)","DOI":"10.1007\/978-3-031-76821-7_8"},{"key":"20_CR27","doi-asserted-by":"publisher","unstructured":"Mello, R., et al.: Prompt engineering for automatic short answer grading in Brazilian Portuguese. In: Anais do XXXV Simp\u00f3sio Brasileiro de Inform\u00e1tica na Educa\u00e7\u00e3o, pp. 1730\u20131743. SBC, Porto Alegre, RS, Brasil (2024). https:\/\/doi.org\/10.5753\/sbie.2024.242424. https:\/\/sol.sbc.org.br\/index.php\/sbie\/article\/view\/31353","DOI":"10.5753\/sbie.2024.242424"},{"key":"20_CR28","doi-asserted-by":"publisher","unstructured":"Mi, N., Cavuoto, L.A., Benson, K., Smith-Jackson, T., Nussbaum, M.A.: A heuristic checklist for an accessible smartphone interface design. Univers. Access Inf. Soc. 13(4), 351\u2013365 (2014). https:\/\/doi.org\/10.1007\/s10209-013-0321-4","DOI":"10.1007\/s10209-013-0321-4"},{"issue":"3","key":"20_CR29","doi-asserted-by":"publisher","first-page":"338","DOI":"10.1145\/77481.77486","volume":"33","author":"R Molich","year":"1990","unstructured":"Molich, R., Nielsen, J.: Improving a human-computer dialogue. Commun. ACM 33(3), 338\u2013348 (1990)","journal-title":"Commun. ACM"},{"key":"20_CR30","unstructured":"Moran, K.: Usability (user) testing 101 (2019). https:\/\/www.nngroup.com\/articles\/usability-testing-101\/"},{"key":"20_CR31","unstructured":"Nielsen, J.: Heuristic evaluation. In: Usability Inspection Methods, pp. 25\u201362. Wiley (1994)"},{"issue":"3","key":"20_CR32","doi-asserted-by":"publisher","first-page":"319","DOI":"10.1086\/344431","volume":"29","author":"SM Nowlis","year":"2002","unstructured":"Nowlis, S.M., Kahn, B.E., Dhar, R.: Coping with ambivalence: the effect of removing a neutral option on consumer attitude and preference judgments. J. Consum. Res. 29(3), 319\u2013334 (2002)","journal-title":"J. Consum. Res."},{"key":"20_CR33","unstructured":"OpenAI: GPT-4 technical report (2023)"},{"key":"20_CR34","unstructured":"Panda, S.: LLMs\u2019 ways of seeing user personas. arXiv preprint arXiv:2409.14858 (2024)"},{"key":"20_CR35","doi-asserted-by":"crossref","unstructured":"Pearson, K.: X. on the criterion that a given system of deviations from the probable in the case of a correlated system of variables is such that it can be reasonably supposed to have arisen from random sampling. London Edinburgh Dublin Philos. Mag. J. Sci. 50(302), 157\u2013175 (1900)","DOI":"10.1080\/14786440009463897"},{"key":"20_CR36","doi-asserted-by":"crossref","unstructured":"Pereira\u00a0J\u00fanior, C., Rodrigues, L., Costa, N., Macario\u00a0Filho, V., Mello, R.: Can VLM understand children\u2019s handwriting? An analysis on handwritten mathematical equation recognition. In: Olney, A.M., Chounta, I.A., Liu, Z., Santos, O.C., Bittencourt, I.I. (eds.) Artificial Intelligence in Education. Posters and Late Breaking Results, Workshops and Tutorials, Industry and Innovation Tracks, Practitioners, Doctoral Consortium and Blue Sky, pp. 321\u2013328. Springer, Cham (2024)","DOI":"10.1007\/978-3-031-64315-6_28"},{"key":"20_CR37","doi-asserted-by":"crossref","unstructured":"Petridis, S., Terry, M., Cai, C.J.: Promptinfuser: bringing user interface mock-ups to life with large language models. In: Extended Abstracts of the 2023 CHI Conference on Human Factors in Computing Systems, pp.\u00a01\u20136 (2023)","DOI":"10.1145\/3544549.3585628"},{"key":"20_CR38","unstructured":"Petrie, H., Buykx, L.: Collaborative heuristic evaluation: improving the effectiveness of heuristic evaluation. In: Proceedings of UPA 2010 International Conference (2010)"},{"key":"20_CR39","doi-asserted-by":"publisher","unstructured":"Rodrigues, L., Dwan Pereira, F., Cabral, L., Ga\u0161evi\u0107, D., Ramalho, G., Ferreira Mello, R.: Assessing the quality of automatic-generated short answers using GPT-4. Comput. Educ. Artif. Intell. 7, 100248 (2024). https:\/\/doi.org\/10.1016\/j.caeai.2024.100248. https:\/\/www.sciencedirect.com\/science\/article\/pii\/S2666920X24000511","DOI":"10.1016\/j.caeai.2024.100248"},{"key":"20_CR40","doi-asserted-by":"crossref","unstructured":"Saavedra, M., Rusu, C., Qui\u00f1ones, D., Roncagliolo, S.: A set of usability and user experience heuristics for social networks. In: Meiselwitz, G. (ed.) Social Computing and Social Media. Design, Human Behavior and Analytics - 11th International Conference, SCSM 2019, Held as Part of the 21st HCI International Conference, HCII 2019, Orlando, FL, USA, July 26-31, 2019, Proceedings, Part I. LNCS, vol. 11578, pp. 128\u2013139. Springer (2019)","DOI":"10.1007\/978-3-030-21902-4_10"},{"key":"20_CR41","unstructured":"Sahoo, P., Singh, A.K., Saha, S., Jain, V., Mondal, S., Chadha, A.: A systematic survey of prompt engineering in large language models: techniques and applications. arXiv preprint arXiv:2402.07927 (2024)"},{"key":"20_CR42","doi-asserted-by":"crossref","unstructured":"Stephanidis, C., Salvendy, G.: User Experience Methods and Tools in Human-Computer Interaction, 1st edn. CRC Press (2024)","DOI":"10.1201\/9781003495161"},{"key":"20_CR43","doi-asserted-by":"crossref","unstructured":"Suh, S., Chen, M., Min, B., Li, T.J.J., Xia, H.: Luminate: structured generation and exploration of design space with large language models for human-AI co-creation. In: Proceedings of the CHI Conference on Human Factors in Computing Systems, pp. 1\u201326 (2024)","DOI":"10.1145\/3613904.3642400"},{"key":"20_CR44","doi-asserted-by":"publisher","unstructured":"Takaffoli, M., Li, S., M\u00e4kel\u00e4, V.: Generative AI in user experience design and research: how do UX practitioners, teams, and companies use Genai in industry? In: Proceedings of the 2024 ACM Designing Interactive Systems Conference, DIS \u201924, pp. 1579\u20131593. Association for Computing Machinery, New York, NY, USA (2024). https:\/\/doi.org\/10.1145\/3643834.3660720","DOI":"10.1145\/3643834.3660720"},{"key":"20_CR45","doi-asserted-by":"crossref","unstructured":"Tavast, M., Kunnari, A., H\u00e4m\u00e4l\u00e4inen, P.: Language models can generate human-like self-reports of emotion. In: Companion Proceedings of the 27th International Conference on Intelligent User Interfaces, pp. 69\u201372 (2022)","DOI":"10.1145\/3490100.3516464"},{"key":"20_CR46","unstructured":"Tullis, T., Albert, W.: Measuring the User Experience: Collecting, Analyzing, and Presenting Usability Metrics, 2nd edn. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA (2013)"},{"key":"20_CR47","doi-asserted-by":"publisher","DOI":"10.1007\/s43681-024-00583-7","author":"Z Wang","year":"2024","unstructured":"Wang, Z., Chu, Z., Viet Doan, T., Ni, S., Yang, M., Zhang, W.: History, development, and principles of large language models-an introductory survey. AI Ethics (2024). https:\/\/doi.org\/10.1007\/s43681-024-00583-7","journal-title":"AI Ethics"},{"key":"20_CR48","first-page":"24824","volume":"35","author":"J Wei","year":"2022","unstructured":"Wei, J., et al.: Chain-of-thought prompting elicits reasoning in large language models. Adv. Neural. Inf. Process. Syst. 35, 24824\u201324837 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"20_CR49","unstructured":"White, J., et al.: A prompt pattern catalog to enhance prompt engineering with chatgpt. arXiv preprint arXiv:2302.11382 (2023)"},{"key":"20_CR50","doi-asserted-by":"publisher","unstructured":"Yan, L., et al.: Practical and ethical challenges of large language models in education: a systematic scoping review. British J. Educ. Technol. (2023). https:\/\/doi.org\/10.1111\/bjet.13370","DOI":"10.1111\/bjet.13370"},{"key":"20_CR51","unstructured":"Zhong, R., Hsieh, G., McDonald, D.W.: How can LLMs support UX practitioners with image-related tasks? In: GenAICHI: CHI 2024 Workshop on Generative AI and HCI, pp.\u00a01\u20136 (2024)"},{"key":"20_CR52","unstructured":"Ziyu, Z., et al.: Through the lens of core competency: survey on evaluation of large language models. In: Zhang, J. (ed.) Proceedings of the 22nd Chinese National Conference on Computational Linguistics (Volume 2: Frontier Forum), pp. 88\u2013109. Chinese Information Processing Society of China, Harbin, China, August 2023. https:\/\/aclanthology.org\/2023.ccl-2.8"}],"container-title":["Lecture Notes in Computer Science","Human-Computer Interaction \u2013 INTERACT 2025"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-05005-2_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T04:41:37Z","timestamp":1757306497000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-05005-2_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,9]]},"ISBN":["9783032050045","9783032050052"],"references-count":52,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-05005-2_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,9]]},"assertion":[{"value":"9 September 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"INTERACT","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"IFIP Conference on Human-Computer Interaction","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Belo Horizonte","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Brazil","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 September 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"interact2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ifip-tc13.org\/interact2025\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}