{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T04:08:05Z","timestamp":1750824485726,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":82,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,23]]},"DOI":"10.1145\/3715275.3732021","type":"proceedings-article","created":{"date-parts":[[2025,6,23]],"date-time":"2025-06-23T17:01:18Z","timestamp":1750698078000},"page":"296-311","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Understanding the Effects of Explaining Predictive but Unintuitive Features in Human-XAI Interaction"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4460-5637","authenticated-orcid":false,"given":"Jiaming","family":"Qu","sequence":"first","affiliation":[{"name":"University of North Carolina at Chapel Hill, Chapel Hill, North Carolina, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7645-0556","authenticated-orcid":false,"given":"Jaime","family":"Arguello","sequence":"additional","affiliation":[{"name":"University of North Carolina at Chapel Hill, Chapel Hill, North Carolina, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0278-2347","authenticated-orcid":false,"given":"Yue","family":"Wang","sequence":"additional","affiliation":[{"name":"University of North Carolina at Chapel Hill, Chapel Hill, North Carolina, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,6,23]]},"reference":[{"unstructured":"Josh Achiam Steven Adler Sandhini Agarwal Lama Ahmad Ilge Akkaya Florencia\u00a0Leoni Aleman Diogo Almeida Janko Altenschmidt Sam Altman Shyamal Anadkat et\u00a0al. 2023. Gpt-4 technical report. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2303.08774 (2023).","key":"e_1_3_3_1_2_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_3_2","DOI":"10.1145\/3411764.3445717"},{"key":"e_1_3_3_1_4_2","volume-title":"Natural language processing with Python: analyzing text with the natural language toolkit","author":"Bird Steven","year":"2009","unstructured":"Steven Bird, Ewan Klein, and Edward Loper. 2009. Natural language processing with Python: analyzing text with the natural language toolkit. \" O\u2019Reilly Media, Inc.\"."},{"doi-asserted-by":"crossref","unstructured":"Charles\u00a0F Bond\u00a0Jr and Bella\u00a0M DePaulo. 2006. Accuracy of deception judgments. Personality and social psychology Review 10 3 (2006) 214\u2013234.","key":"e_1_3_3_1_5_2","DOI":"10.1207\/s15327957pspr1003_2"},{"unstructured":"Sebastian Bordt Ben Lengerich Harsha Nori and Rich Caruana. 2024. Data Science with LLMs and Interpretable Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.14474 (2024).","key":"e_1_3_3_1_6_2"},{"unstructured":"Vadim Borisov and Gjergji Kasneci. 2022. Relational Local Explanations. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2212.12374 (2022).","key":"e_1_3_3_1_7_2"},{"unstructured":"John Brooke. 2013. SUS: a retrospective. Journal of usability studies 8 2 (2013) 29\u201340.","key":"e_1_3_3_1_8_2"},{"unstructured":"Tom Brown Benjamin Mann Nick Ryder Melanie Subbiah Jared\u00a0D Kaplan Prafulla Dhariwal Arvind Neelakantan Pranav Shyam Girish Sastry Amanda Askell et\u00a0al. 2020. Language models are few-shot learners. Advances in neural information processing systems 33 (2020) 1877\u20131901.","key":"e_1_3_3_1_9_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_10_2","DOI":"10.1145\/3377325.3377498"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_11_2","DOI":"10.1145\/3290605.3300234"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_12_2","DOI":"10.1609\/icwsm.v14i1.7282"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_13_2","DOI":"10.1145\/2783258.2788613"},{"doi-asserted-by":"crossref","unstructured":"Valerie Chen Q\u00a0Vera Liao Jennifer Wortman\u00a0Vaughan and Gagan Bansal. 2023. Understanding the role of human intuition on reliance in human-AI decision-making with explanations. Proceedings of the ACM on Human-computer Interaction 7 CSCW2 (2023) 1\u201332.","key":"e_1_3_3_1_14_2","DOI":"10.1145\/3610219"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_15_2","DOI":"10.1145\/3613904.3641904"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_16_2","DOI":"10.1145\/3290605.3300789"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_17_2","DOI":"10.18653\/v1\/2023.acl-long.870"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_18_2","DOI":"10.1145\/3397481.3450644"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_19_2","DOI":"10.4324\/9780203771587"},{"unstructured":"Ian Covert Scott\u00a0M Lundberg and Su-In Lee. 2020. Understanding global feature contributions with additive importance measures. Advances in Neural Information Processing Systems 33 (2020) 17212\u201317223.","key":"e_1_3_3_1_20_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_21_2","DOI":"10.1145\/3377325.3377512"},{"unstructured":"Finale Doshi-Velez and Been Kim. 2017. Towards A Rigorous Science of Interpretable Machine Learning. arXiv (2017). https:\/\/arxiv.org\/abs\/1702.08608","key":"e_1_3_3_1_22_2"},{"doi-asserted-by":"crossref","unstructured":"Charles\u00a0W Dunnett. 1955. A multiple comparison procedure for comparing several treatments with a control. J. Amer. Statist. Assoc. 50 272 (1955) 1096\u20131121.","key":"e_1_3_3_1_23_2","DOI":"10.1080\/01621459.1955.10501294"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_24_2","DOI":"10.1145\/3491101.3503727"},{"doi-asserted-by":"crossref","unstructured":"Donald\u00a0E Farrar and Robert\u00a0R Glauber. 1967. Multicollinearity in regression analysis: the problem revisited. The Review of Economic and Statistics (1967) 92\u2013107.","key":"e_1_3_3_1_25_2","DOI":"10.2307\/1937887"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_26_2","DOI":"10.18653\/v1\/2023.nlrse-1.4"},{"unstructured":"Aaron Fisher Cynthia Rudin and Francesca Dominici. 2019. All models are wrong but many are useful: Learning a variable\u2019s importance by studying an entire class of prediction models simultaneously. Journal of Machine Learning Research 20 177 (2019) 1\u201381.","key":"e_1_3_3_1_27_2"},{"unstructured":"Ronald\u00a0A Fisher. 1949. The design of experiments. (1949).","key":"e_1_3_3_1_28_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_29_2","DOI":"10.1145\/3313831.3376316"},{"unstructured":"Tanya Goyal Junyi\u00a0Jessy Li and Greg Durrett. 2022. News summarization and evaluation in the era of gpt-3. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2209.12356 (2022).","key":"e_1_3_3_1_30_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_31_2","DOI":"10.1016\/S0166-4115(08)62386-9"},{"unstructured":"Dan Hendrycks Collin Burns Steven Basart Andy Zou Mantas Mazeika Dawn Song and Jacob Steinhardt. 2021. Measuring Massive Multitask Language Understanding. Proceedings of the International Conference on Learning Representations (ICLR) (2021).","key":"e_1_3_3_1_32_2"},{"doi-asserted-by":"crossref","unstructured":"Samuel Himmelfarb. 1975. What do you do when the control group doesn\u2019t fit into the factorial design? Psychological Bulletin 82 3 (1975) 363.","key":"e_1_3_3_1_33_2","DOI":"10.1037\/\/0033-2909.82.3.363"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_34_2","DOI":"10.18653\/v1\/2023.acl-long.230"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_35_2","DOI":"10.18653\/v1\/2023.findings-acl.750"},{"unstructured":"Joseph\u00a0D Janizek Pascal Sturmfels and Su-In Lee. 2021. Explaining explanations: Axiomatic feature interactions for deep networks. Journal of Machine Learning Research 22 104 (2021) 1\u201354.","key":"e_1_3_3_1_36_2"},{"doi-asserted-by":"crossref","unstructured":"Gary\u00a0M Kaufmann and Terry\u00a0A Beehr. 1986. Interactions between job stressors and social support: Some counterintuitive results. Journal of applied psychology 71 3 (1986) 522.","key":"e_1_3_3_1_37_2","DOI":"10.1037\/\/0021-9010.71.3.522"},{"doi-asserted-by":"crossref","unstructured":"Jenia Kim Henry Maathuis and Danielle Sent. 2024. Human-centered evaluation of explainable AI applications: a systematic review. Frontiers in Artificial Intelligence 7 (2024) 1456486.","key":"e_1_3_3_1_38_2","DOI":"10.3389\/frai.2024.1456486"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_39_2","DOI":"10.1145\/3630106.3658941"},{"key":"e_1_3_3_1_40_2","first-page":"193","volume-title":"Proceedings of the 24th Annual Conference of the European Association for Machine Translation","author":"Kocmi Tom","year":"2023","unstructured":"Tom Kocmi and Christian Federmann. 2023. Large Language Models Are State-of-the-Art Evaluators of Translation Quality. In Proceedings of the 24th Annual Conference of the European Association for Machine Translation. 193\u2013203."},{"key":"e_1_3_3_1_41_2","first-page":"1885","volume-title":"International conference on machine learning","author":"Koh Pang\u00a0Wei","year":"2017","unstructured":"Pang\u00a0Wei Koh and Percy Liang. 2017. Understanding black-box predictions via influence functions. In International conference on machine learning. PMLR, 1885\u20131894."},{"unstructured":"Nicholas Kroeger Dan Ley Satyapriya Krishna Chirag Agarwal and Himabindu Lakkaraju. 2023. Are Large Language Models Post Hoc Explainers? arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2310.05797 (2023).","key":"e_1_3_3_1_42_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_43_2","DOI":"10.1145\/2678025.2701399"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_44_2","DOI":"10.1145\/3593013.3594087"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_45_2","DOI":"10.1145\/3313831.3376873"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_46_2","DOI":"10.1145\/3287560.3287590"},{"unstructured":"Benjamin\u00a0J Lengerich Sebastian Bordt Harsha Nori Mark\u00a0E Nunnally Yin Aphinyanaphongs Manolis Kellis and Rich Caruana. 2023. LLMs understand glass-box models discover surprises and suggest repairs. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2308.01157 (2023).","key":"e_1_3_3_1_47_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_48_2","DOI":"10.18653\/v1\/D13-1199"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_49_2","DOI":"10.3115\/v1\/P14-1147"},{"unstructured":"Q\u00a0Vera Liao and Kush\u00a0R Varshney. 2021. Human-centered explainable ai (xai): From algorithms to user experiences. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2110.10790 (2021).","key":"e_1_3_3_1_50_2"},{"doi-asserted-by":"crossref","unstructured":"Zhuoran Lu Dakuo Wang and Ming Yin. 2024. Does more advice help? the effects of second opinions in AI-assisted decision making. Proceedings of the ACM on Human-Computer Interaction 8 CSCW1 (2024) 1\u201331.","key":"e_1_3_3_1_51_2","DOI":"10.1145\/3653708"},{"unstructured":"Scott\u00a0M Lundberg and Su-In Lee. 2017. A unified approach to interpreting model predictions. Advances in neural information processing systems 30 (2017).","key":"e_1_3_3_1_52_2"},{"unstructured":"David Martens James Hinns Camille Dams Mark Vergouwen and Theodoros Evgeniou. 2023. Tell me a story! narrative-driven xai with large language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2309.17057 (2023).","key":"e_1_3_3_1_53_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_54_2","DOI":"10.18653\/v1\/2023.findings-emnlp.568"},{"key":"e_1_3_3_1_55_2","first-page":"497","volume-title":"Proceedings of the 2013 conference of the north american chapter of the association for computational linguistics: human language technologies","author":"Ott Myle","year":"2013","unstructured":"Myle Ott, Claire Cardie, and Jeffrey\u00a0T Hancock. 2013. Negative deceptive opinion spam. In Proceedings of the 2013 conference of the north american chapter of the association for computational linguistics: human language technologies. 497\u2013501."},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_56_2","DOI":"10.5555\/2002472.2002512"},{"unstructured":"Bo Pan Zhen Xiong Guanchen Wu Zheng Zhang Yifei Zhang and Liang Zhao. 2024. TAGExplainer: Narrating Graph Explanations for Text-Attributed Graph Learning Models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.15268 (2024).","key":"e_1_3_3_1_57_2"},{"doi-asserted-by":"crossref","unstructured":"Raja Parasuraman and Victor Riley. 1997. Humans and automation: Use misuse disuse abuse. Human factors 39 2 (1997) 230\u2013253.","key":"e_1_3_3_1_58_2","DOI":"10.1518\/001872097778543886"},{"unstructured":"Fabian Pedregosa Ga\u00ebl Varoquaux Alexandre Gramfort Vincent Michel Bertrand Thirion Olivier Grisel Mathieu Blondel Peter Prettenhofer Ron Weiss Vincent Dubourg et\u00a0al. 2011. Scikit-learn: Machine learning in Python. the Journal of machine Learning research 12 (2011) 2825\u20132830.","key":"e_1_3_3_1_59_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_60_2","DOI":"10.1145\/3459637.3482409"},{"key":"e_1_3_3_1_61_2","volume-title":"ACM SIGIR Conference On Human Information Interaction And Retrieval","author":"Qu Jiaming","year":"2023","unstructured":"Jiaming Qu, Jaime Arguello, and Yue Wang. 2023. Understanding the Cognitive Influences of Interpretability Features on How Users Scrutinize Machine-Predicted Categories. In ACM SIGIR Conference On Human Information Interaction And Retrieval."},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_62_2","DOI":"10.1145\/3630106.3658547"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_63_2","DOI":"10.1145\/2939672.2939778"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_64_2","DOI":"10.1609\/aaai.v32i1.11491"},{"doi-asserted-by":"crossref","unstructured":"John\u00a0TE Richardson. 2011. Eta squared and partial eta squared as measures of effect size in educational research. Educational research review 6 2 (2011) 135\u2013147.","key":"e_1_3_3_1_65_2","DOI":"10.1016\/j.edurev.2010.12.001"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_66_2","DOI":"10.1145\/3581641.3584066"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_67_2","DOI":"10.1145\/3531146.3533127"},{"unstructured":"Rita Sevastjanova and Mennatallah El-Assady. 2022. Beware the rationalization trap! when language model explainability diverges from our mental models of language. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2207.06897 (2022).","key":"e_1_3_3_1_68_2"},{"unstructured":"Philipp Spitzer Niklas K\u00fchl Marc Goutier Manuel Kaschura and Gerhard Satzger. 2024. Transferring Domain Knowledge with (X) AI-Based Learning Systems. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.01329 (2024).","key":"e_1_3_3_1_69_2"},{"key":"e_1_3_3_1_70_2","first-page":"3319","volume-title":"International conference on machine learning","author":"Sundararajan Mukund","year":"2017","unstructured":"Mukund Sundararajan, Ankur Taly, and Qiqi Yan. 2017. Axiomatic attribution for deep networks. In International conference on machine learning. PMLR, 3319\u20133328."},{"key":"e_1_3_3_1_71_2","first-page":"4149","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)","author":"Talmor Alon","year":"2019","unstructured":"Alon Talmor, Jonathan Herzig, Nicholas Lourie, and Jonathan Berant. 2019. CommonsenseQA: A Question Answering Challenge Targeting Commonsense Knowledge. In Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers). 4149\u20134158."},{"doi-asserted-by":"crossref","unstructured":"Sule Tekkesinoglu and Lars Kunze. 2024. From Feature Importance to Natural Language Explanations Using LLMs with RAG. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2407.20990 (2024).","key":"e_1_3_3_1_72_2","DOI":"10.2139\/ssrn.4910800"},{"unstructured":"Michael Tsang Sirisha Rambhatla and Yan Liu. 2020. How does this interaction affect me? interpretable attribution for feature interactions. Advances in neural information processing systems 33 (2020) 6147\u20136159.","key":"e_1_3_3_1_73_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_74_2","DOI":"10.1145\/3290605.3300831"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_75_2","DOI":"10.18653\/v1\/2023.newsum-1.1"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_76_2","DOI":"10.24963\/ijcai.2023\/343"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_77_2","DOI":"10.1145\/3377325.3377480"},{"unstructured":"Chih-Kuan Yeh Joon Kim Ian En-Hsu Yen and Pradeep\u00a0K Ravikumar. 2018. Representer point selection for explaining deep neural networks. Advances in neural information processing systems 31 (2018).","key":"e_1_3_3_1_78_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_79_2","DOI":"10.18653\/v1\/D19-1404"},{"unstructured":"Wayne\u00a0Xin Zhao Kun Zhou Junyi Li Tianyi Tang Xiaolei Wang Yupeng Hou Yingqian Min Beichen Zhang Junjie Zhang Zican Dong et\u00a0al. 2023. A survey of large language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2303.18223 (2023).","key":"e_1_3_3_1_80_2"},{"doi-asserted-by":"crossref","unstructured":"Jianlong Zhou Amir\u00a0H Gandomi Fang Chen and Andreas Holzinger. 2021. Evaluating the quality of machine learning explanations: A survey on methods and metrics. Electronics 10 5 (2021) 593.","key":"e_1_3_3_1_81_2","DOI":"10.3390\/electronics10050593"},{"doi-asserted-by":"crossref","unstructured":"Caleb Ziems William Held Omar Shaikh Jiaao Chen Zhehao Zhang and Diyi Yang. 2024. Can Large Language Models Transform Computational Social Science? Computational Linguistics 50 1 (2024) 237\u2013291.","key":"e_1_3_3_1_82_2","DOI":"10.1162\/coli_a_00502"},{"unstructured":"Alexandra Zytek Sara Pid\u00f2 and Kalyan Veeramachaneni. 2024. LLMs for XAI: Future Directions for Explaining Explanations. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2405.06064 (2024).","key":"e_1_3_3_1_83_2"}],"event":{"acronym":"FAccT '25","name":"FAccT '25: The 2025 ACM Conference on Fairness, Accountability, and Transparency","location":"Athens Greece"},"container-title":["Proceedings of the 2025 ACM Conference on Fairness, Accountability, and Transparency"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3715275.3732021","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T11:14:43Z","timestamp":1750763683000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3715275.3732021"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,23]]},"references-count":82,"alternative-id":["10.1145\/3715275.3732021","10.1145\/3715275"],"URL":"https:\/\/doi.org\/10.1145\/3715275.3732021","relation":{},"subject":[],"published":{"date-parts":[[2025,6,23]]},"assertion":[{"value":"2025-06-23","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}