{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T16:59:00Z","timestamp":1777741140771,"version":"3.51.4"},"reference-count":236,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,12,14]],"date-time":"2024-12-14T00:00:00Z","timestamp":1734134400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,14]],"date-time":"2024-12-14T00:00:00Z","timestamp":1734134400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100018693","name":"HORIZON EUROPE Framework Programme","doi-asserted-by":"publisher","award":["860621"],"award-info":[{"award-number":["860621"]}],"id":[{"id":"10.13039\/100018693","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Ethics Inf Technol"],"published-print":{"date-parts":[[2025,3]]},"DOI":"10.1007\/s10676-024-09800-7","type":"journal-article","created":{"date-parts":[[2024,12,14]],"date-time":"2024-12-14T00:27:23Z","timestamp":1734136043000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Nullius in Explanans: an ethical risk assessment for explainable AI"],"prefix":"10.1007","volume":"27","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4733-9760","authenticated-orcid":false,"given":"Luca","family":"Nannini","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Diletta","family":"Huyskes","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Enrico","family":"Panai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giada","family":"Pistilli","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0382-3083","authenticated-orcid":false,"given":"Alessio","family":"Tartaro","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,12,14]]},"reference":[{"key":"9800_CR1","doi-asserted-by":"publisher","first-page":"52138","DOI":"10.1109\/ACCESS.2018.2870052","volume":"6","author":"A Adadi","year":"2018","unstructured":"Adadi, A., & Berrada, M. (2018). Peeking inside the black-box: A survey on explainable artificial intelligence (XAI). IEEE Access, 6, 52138\u201352160. https:\/\/doi.org\/10.1109\/ACCESS.2018.2870052","journal-title":"IEEE Access"},{"key":"9800_CR2","unstructured":"Adebayo, J., Gilmer, J., Muelly, M., Goodfellow, I. J., Hardt, M., & Kim, B. (2018). Sanity checks for saliency maps. In S. Bengio, H. M. Wallach, H. Larochelle, K. Grauman, N. Cesa-Bianchi, & R. Garnett (Eds.), Advances in neural information processing systems 31: Annual conference on neural information processing systems 2018, NeurIPS 2018, December 3-8, 2018, Montr\u00e9al, Canada (pp. 9525\u20139536). https:\/\/proceedings.neurips.cc\/paper\/2018\/hash\/294a8ed24b1ad22ec2e7efea049b8737-Abstract.html"},{"key":"9800_CR3","unstructured":"Adebayo, J., Muelly, M., Abelson, H., & Kim, B. (2022). Post hoc explanations may be ineffective for detecting unknown spurious correlation. In The tenth international conference on learning representations, ICLR 2022, virtual event, April 25-29, 2022. OpenReview.net. https:\/\/openreview.net\/forum?id=xNOVfCCvDpM"},{"key":"9800_CR4","unstructured":"Adebayo, J., Muelly, M., Liccardi, I., & Kim, B. (2020). Debugging tests for model explanations. In H. Larochelle, M. Ranzato, R. Hadsell, M.-F. Balcan, & H.-T. Lin (Eds.), Advances in neural information processing systems 33: Annual conference on neural information processing systems 2020, NeurIPS 2020, December 6-12, 2020, virtual. https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/075b051ec3d22dac7b33f788da631fd4-Abstract.html"},{"key":"9800_CR5","unstructured":"Agarwal, C., Zitnik, M., & Lakkaraju, H. (2022). Probing GNN explainers: A rigorous theoretical and empirical analysis of GNN explanation methods. In G. Camps-Valls, F. J. R. Ruiz, & I. Valera (Eds.), International conference on artificial intelligence and statistics, AISTATS 2022, 28-30 March 2022, virtual event, proceedings of machine learning research (Vol. 151, pp. 8969\u20138996). PMLR. https:\/\/proceedings.mlr.press\/v151\/agarwal22b.html"},{"key":"9800_CR6","doi-asserted-by":"publisher","unstructured":"Agre, P. E. (2014). Toward a critical technical practice: Lessons learned in trying to reform AI. In Social science, technical systems, and cooperative work (pp. 131\u2013157). Psychology Press. https:\/\/doi.org\/10.4324\/9781315805849","DOI":"10.4324\/9781315805849"},{"key":"9800_CR7","unstructured":"A\u00efvodji, U., Arai, H., Fortineau, O., Gambs, S., Hara, S., & Tapp, A. (2019). Fairwashing: The risk of rationalization. In K. Chaudhuri, & R. Salakhutdinov (Eds.), Proceedings of the 36th international conference on machine learning, ICML 2019, 9-15 June 2019, Long Beach, California, USA, proceedings of machine learning research (Vol.\u00a097, pp. 161\u2013170). PMLR. http:\/\/proceedings.mlr.press\/v97\/aivodji19a.html"},{"key":"9800_CR8","unstructured":"A\u00efvodji, U., Arai, H., Gambs, S., & Hara, S. (2021). Characterizing the risk of fairwashing. In M. Ranzato, A. Beygelzimer, Y. N. Dauphin, P. Liang, & J. W. Vaughan (Eds.), Advances in neural information processing systems 34: Annual conference on neural information processing systems 2021, NeurIPS 2021, December 6-14, 2021, virtual (pp. 14822-14834). https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/7caf5e22ea3eb8175ab518429c8589a4-Abstract.html"},{"key":"9800_CR9","unstructured":"Alvarez-Melis, D., & Jaakkola, T. S. (2018). Towards robust interpretability with self-explaining neural networks. In S. Bengio, H. M. Wallach, H. Larochelle, K. Grauman, N. Cesa-Bianchi, & R. Garnett (Eds.), Advances in neural information processing systems 31: Annual conference on neural information processing systems 2018, NeurIPS 2018, December 3-8, 2018, Montr\u00e9al, Canada (pp. 7786\u20137795). https:\/\/proceedings.neurips.cc\/paper\/2018\/hash\/3e9f0fc9b2f89e043bc6233994dfcf76-Abstract.html"},{"issue":"6","key":"9800_CR10","doi-asserted-by":"publisher","first-page":"373","DOI":"10.1016\/0950-7051(96)81920-4","volume":"8","author":"R Andrews","year":"1995","unstructured":"Andrews, R., Diederich, J., & Tickle, A. B. (1995). Survey and critique of techniques for extracting rules from trained artificial neural networks. Knowledge-Based Systems, 8(6), 373\u2013389. https:\/\/doi.org\/10.1016\/0950-7051(96)81920-4","journal-title":"Knowledge-Based Systems"},{"key":"9800_CR11","doi-asserted-by":"crossref","unstructured":"Angwin, J., Larson, J., Mattu, S., & Kirchner, L. (2016). Machine bias. In Ethics of data and analytics (pp. 254\u2013264). Auerbach Publications.","DOI":"10.1201\/9781003278290-37"},{"key":"9800_CR12","doi-asserted-by":"publisher","unstructured":"Arnold, M., Bellamy, R. K. E., Hind, M., Houde, S., Mehta, S., Mojsilovic, A., Nair, R., Ramamurthy, K. N., Olteanu, A., Piorkowski, D., Reimer, D., Richards, J. T., Tsay, J., & Varshney, K. R. (2019). Factsheets: Increasing trust in AI services through supplier\u2019s declarations of conformity. IBM Journal of Research and Development, 63(4\/5), 6:1\u20136:13. https:\/\/doi.org\/10.1147\/JRD.2019.2942288","DOI":"10.1147\/JRD.2019.2942288"},{"key":"9800_CR13","doi-asserted-by":"crossref","unstructured":"Arora, S., Pruthi, D., Sadeh, N. M., Cohen, W. W., Lipton, Z. C., & Neubig, G. (2022). Explain, edit, and understand: Rethinking user study design for evaluating model explanations. In Thirty-sixth AAAI conference on artificial intelligence, AAAI 2022, thirty-fourth conference on innovative applications of artificial intelligence, IAAI 2022, the twelveth symposium on educational advances in artificial intelligence, EAAI 2022 virtual event, February 22-March 1, 2022 (pp. 5277\u20135285). AAAI Press. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/20464","DOI":"10.1609\/aaai.v36i5.20464"},{"key":"9800_CR14","doi-asserted-by":"publisher","unstructured":"Balagopalan, A., Zhang, H., Hamidieh, K., Hartvigsen, T., Rudzicz, E., & Ghassemi, M. (2022). The road to explainability is paved with bias: Measuring the fairness of explanations. In FAccT \u201922: 2022 ACM conference on fairness, accountability, and transparency, Seoul, Republic of Korea, June 21-24, 2022 (pp. 1194\u20131206). ACM. https:\/\/doi.org\/10.1145\/3531146.3533179","DOI":"10.1145\/3531146.3533179"},{"key":"9800_CR15","doi-asserted-by":"publisher","unstructured":"Baniecki, H., & Biecek, P. (2022). Manipulating SHAP via adversarial data perturbations (student abstract). In Thirty-sixth AAAI conference on artificial intelligence, AAAI 2022, thirty-fourth conference on innovative applications of artificial intelligence, IAAI 2022, the twelveth symposium on educational advances in artificial intelligence, EAAI 2022 virtual event, February 22-March 1, 2022 (pp. 12907\u201312908). AAAI Press. https:\/\/doi.org\/10.1609\/AAAI.V36I11.21590.","DOI":"10.1609\/AAAI.V36I11.21590"},{"key":"9800_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2024.102303","volume":"107","author":"H Baniecki","year":"2024","unstructured":"Baniecki, H., & Biecek, P. (2024). Adversarial attacks and defenses in explainable artificial intelligence: A survey. Information Fusion, 107, 102303. https:\/\/doi.org\/10.1016\/j.inffus.2024.102303","journal-title":"Information Fusion"},{"key":"9800_CR17","doi-asserted-by":"publisher","unstructured":"Baniecki, H., Kretowicz, W., & Biecek, P. (2022). Fooling partial dependence via data poisoning. In M. Amini, S. Canu, A. Fischer, T. Guns, P. K. Novak, & G. Tsoumakas (Eds.), Machine learning and knowledge discovery in databases\u2014European conference, ECML PKDD 2022, Grenoble, France, September 19-23, 2022, proceedings, part III, lecture notes in computer science (Vol. 13715, pp. 121\u2013136). Springer. https:\/\/doi.org\/10.1007\/978-3-031-26409-2_8","DOI":"10.1007\/978-3-031-26409-2_8"},{"key":"9800_CR18","doi-asserted-by":"publisher","unstructured":"Bekker, S. (2020). Fundamental rights in digital welfare states: The case of SyRI in the Netherlands, T.M.C. Netherlands Yearbook of International Law (pp. 289\u2013307). Asser Press.https:\/\/doi.org\/10.1007\/978-94-6265-403-7_24","DOI":"10.1007\/978-94-6265-403-7_24"},{"key":"9800_CR19","doi-asserted-by":"publisher","unstructured":"Bertrand, A., Belloum, R., Eagan, J. R., & Maxwell, W. (2022). How cognitive biases affect XAI-assisted decision-making: A systematic review. In V. Conitzer, J. Tasioulas, M. Scheutz, R. Calo, M. Mara, & A. Zimmermann (Eds.), AIES \u201922: AAAI\/ACM conference on AI, ethics, and society, Oxford, United Kingdom, May 19-21, 2021 (pp. 78\u201391). ACM.https:\/\/doi.org\/10.1145\/3514094.3534164","DOI":"10.1145\/3514094.3534164"},{"key":"9800_CR20","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1016\/j.patcog.2018.07.023","volume":"84","author":"B Biggio","year":"2018","unstructured":"Biggio, B., & Roli, F. (2018). Wild patterns: Ten years after the rise of adversarial machine learning. Pattern Recognition, 84, 317\u2013331. https:\/\/doi.org\/10.1016\/j.patcog.2018.07.023","journal-title":"Pattern Recognition"},{"key":"9800_CR21","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1191\/1478088706qp063oa","volume":"3","author":"V Braun","year":"2006","unstructured":"Braun, V., & Clarke, V. (2006). Using thematic analysis in psychology. Qualitative Research in Psychology, 3, 77\u2013101. https:\/\/doi.org\/10.1191\/1478088706qp063oa","journal-title":"Qualitative Research in Psychology"},{"key":"9800_CR22","doi-asserted-by":"publisher","unstructured":"Brown, D., & Kvinge, H. (2023). Making corgis important for honeycomb classification: Adversarial attacks on concept-based explainability tools. In IEEE\/CVF conference on computer vision and pattern recognition, CVPR 2023\u2014Workshops, Vancouver, BC, Canada, June 17-24, 2023 (pp. 620\u2013627). IEEE. https:\/\/doi.org\/10.1109\/CVPRW59228.2023.00069,","DOI":"10.1109\/CVPRW59228.2023.00069"},{"issue":"1","key":"9800_CR23","doi-asserted-by":"publisher","first-page":"205395172098386","DOI":"10.1177\/2053951720983865","volume":"8","author":"S Brown","year":"2021","unstructured":"Brown, S., Davidovic, J., & Hasan, A. (2021). The algorithm audit: Scoring the algorithms that score us. Big Data & Society, 8(1), 2053951720983865. https:\/\/doi.org\/10.1177\/2053951720983865","journal-title":"Big Data & Society"},{"key":"9800_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.118888","volume":"213","author":"F Cabitza","year":"2023","unstructured":"Cabitza, F., Campagner, A., Malgieri, G., Natali, C., Schneeberger, D., Stoeger, K., & Holzinger, A. (2023). Quod erat demonstrandum?\u2013Towards a typology of the concept of explanation for the design of explainable AI. Expert Systems with Applications, 213, 118888. https:\/\/doi.org\/10.1016\/j.eswa.2022.118888","journal-title":"Expert Systems with Applications"},{"key":"9800_CR25","doi-asserted-by":"publisher","unstructured":"Carlini, N., & Wagner, D. A. (2017a). Adversarial examples are not easily detected: Bypassing ten detection methods. In B. Thuraisingham, B. Biggio, D. M. Freeman, B. Miller, & A. Sinha (Eds.), Proceedings of the 10th ACM workshop on artificial intelligence and security, AISec@CCS 2017, Dallas, TX, USA, November 3, 2017 (pp. 3\u201314). ACM. https:\/\/doi.org\/10.1145\/3128572.3140444","DOI":"10.1145\/3128572.3140444"},{"key":"9800_CR26","doi-asserted-by":"publisher","unstructured":"Carlini, N., & Wagner, D. A. (2017b). Towards evaluating the robustness of neural networks. In 2017 IEEE symposium on security and privacy, SP 2017, San Jose, CA, USA, May 22-26, 2017 (pp. 39\u201357). IEEE Computer Society. https:\/\/doi.org\/10.1109\/SP.2017.49","DOI":"10.1109\/SP.2017.49"},{"key":"9800_CR27","doi-asserted-by":"publisher","unstructured":"Carmichael, Z., & Scheirer, W. J. (2023). Unfooling perturbation-based post hoc explainers. In B. Williams, Y Chen, & J. Neville (Eds.), Thirty-seventh AAAI conference on artificial intelligence, AAAI 2023, thirty-fifth conference on innovative applications of artificial intelligence, IAAI 2023, thirteenth symposium on educational advances in artificial intelligence, EAAI 2023, Washington, DC, USA, February 7-14, 2023 (pp. 6925\u20136934). AAAI Press. https:\/\/doi.org\/10.1609\/AAAI.V37I6.25847","DOI":"10.1609\/AAAI.V37I6.25847"},{"key":"9800_CR28","unstructured":"Chen, J., Wu, X., Rastogi, V., Liang, Y., & Jha, S. (2019). Robust attribution regularization. In: [214] (pp. 14300\u201314310). https:\/\/proceedings.neurips.cc\/paper\/2019\/hash\/172ef5a94b4dd0aa120c6878fc29f70c-Abstract.html"},{"issue":"CSCW2","key":"9800_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3610219","volume":"7","author":"V Chen","year":"2023","unstructured":"Chen, V., Liao, Q. V., Vaughan, J. W., & Bansal, G. (2023). Understanding the role of human intuition on reliance in human-AI decision-making with explanations. Proceedings of the ACM on Human-Computer Interaction, 7(CSCW2), 1\u201332. https:\/\/doi.org\/10.1145\/3610219","journal-title":"Proceedings of the ACM on Human-Computer Interaction"},{"key":"9800_CR30","unstructured":"Chen, X., Liu, C., Li, B., Lu, K., & Song, D. (2017). Targeted backdoor attacks on deep learning systems using data poisoning. CoRR abs\/1712.05526. http:\/\/arxiv.org\/abs\/1712.05526"},{"key":"9800_CR31","doi-asserted-by":"publisher","unstructured":"Cheng, H. F., Wang, R., Zhang, Z., O\u2019Connell, F., Gray, T., Harper, F. M., & Zhu, H. (2019). Explaining decision-making algorithms through UI: Strategies to help non-expert stakeholders. In S. A. Brewster, G. Fitzpatrick, A. L. Cox, & V. Kostakos (Eds.), Proceedings of the 2019 CHI conference on human factors in computing systems, CHI 2019, Glasgow, Scotland, UK, May 04-09, 2019 (p. 559). ACM. https:\/\/doi.org\/10.1145\/3290605.3300789","DOI":"10.1145\/3290605.3300789"},{"key":"9800_CR32","doi-asserted-by":"publisher","unstructured":"Clark, H. H., & Brennan, S. E. (1991). Grounding in communication. In L. Resnick, B. L, M. John, & S. D. Teasley (Eds.), Perspectives on socially shared cognition (pp. 13\u20131991). American Psychological Association. https:\/\/doi.org\/10.1037\/10096-006","DOI":"10.1037\/10096-006"},{"key":"9800_CR33","doi-asserted-by":"publisher","unstructured":"Cobbe, J., Veale, M., & Singh, J. (2023). Understanding accountability in algorithmic supply chains. In Proceedings of the 2023 ACM conference on fairness, accountability, and transparency, FAccT 2023, Chicago, IL, USA, June 12-15, 2023 (pp. 1186\u20131197). ACM. https:\/\/doi.org\/10.1145\/3593013.3594073","DOI":"10.1145\/3593013.3594073"},{"key":"9800_CR34","unstructured":"Cohen, J. M., Rosenfeld, E., & Kolter, J. Z. (2019). Certified adversarial robustness via randomized smoothing. In K. Chaudhuri, & R. Salakhutdinov (Eds.), Proceedings of the 36th international conference on machine learning, ICML 2019, 9-15 June 2019, Long Beach, California, USA, proceedings of machine learning research (Vol.\u00a097, pp. 1310\u20131320). PMLR. http:\/\/proceedings.mlr.press\/v97\/cohen19c.html"},{"key":"9800_CR35","doi-asserted-by":"publisher","DOI":"10.1002\/WIDM.1391","author":"R Confalonieri","year":"2021","unstructured":"Confalonieri, R., Coba, L., Wagner, B., & Besold, T. R. (2021). A historical perspective of explainable artificial intelligence. WIREs Data Mining and Knowledge Discovery. https:\/\/doi.org\/10.1002\/WIDM.1391","journal-title":"WIREs Data Mining and Knowledge Discovery"},{"key":"9800_CR36","unstructured":"Craven, M. W., & Shavlik, J. W. (1995). Extracting tree-structured representations of trained networks. In D. S. Touretzky, M. Mozer, & M. E. Hasselmo (Eds.), Advances in neural information processing systems 8, NIPS, Denver, CO, USA, November 27-30, 1995 (pp. 24\u201330). MIT Press. http:\/\/papers.nips.cc\/paper\/1152-extracting-tree-structured-representations-of-trained-networks"},{"key":"9800_CR37","doi-asserted-by":"publisher","unstructured":"Dai, J., Upadhyay, S., A\u00efvodji, U., Bach, S. H., & Lakkaraju, H. (2022). Fairness via explanation quality: Evaluating disparities in the quality of post hoc explanations. In V. Conitzer, J. Tasioulas, M. Scheutz, R. Calo, M. Mara, & A. Zimmermann (Eds.), AIES \u201922: AAAI\/ACM conference on AI, ethics, and society, Oxford, United Kingdom, May 19-21, 2021 (pp. 203\u2013214). ACM. https:\/\/doi.org\/10.1145\/3514094.3534159","DOI":"10.1145\/3514094.3534159"},{"key":"9800_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/J.ARTINT.2021.103525","volume":"299","author":"R Dazeley","year":"2021","unstructured":"Dazeley, R., Vamplew, P., Foale, C., Young, C., Aryal, S., & Cruz, F. (2021). Levels of explainable artificial intelligence for human-aligned conversational explanations. Artificial Intelligence, 299, 103525. https:\/\/doi.org\/10.1016\/J.ARTINT.2021.103525","journal-title":"Artificial Intelligence"},{"issue":"2","key":"9800_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/J.GIQ.2021.101666","volume":"39","author":"H de Bruijn","year":"2022","unstructured":"de Bruijn, H., Warnier, M., & Janssen, M. (2022). The perils and pitfalls of explainable AI: Strategies for explaining algorithmic decision-making. Government Information Quarterly, 39(2), 101666. https:\/\/doi.org\/10.1016\/J.GIQ.2021.101666","journal-title":"Government Information Quarterly"},{"key":"9800_CR40","volume-title":"Dissemination","author":"J Derrida","year":"2016","unstructured":"Derrida, J. (2016). Dissemination. Bloomsbury Publishing."},{"issue":"1","key":"9800_CR41","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1037\/0022-3514.56.1.5","volume":"56","author":"PG Devine","year":"1989","unstructured":"Devine, P. G. (1989). Stereotypes and prejudice: Their automatic and controlled components. Journal of Personality and Social Psychology, 56(1), 5. https:\/\/doi.org\/10.1037\/0022-3514.56.1.5","journal-title":"Journal of Personality and Social Psychology"},{"key":"9800_CR42","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M., Lee, K., & Toutanova, K. (2019). BERT: Pre-training of deep bidirectional transformers for language understanding. In J. Burstein, C. Doran, & T. Solorio (Eds.), Proceedings of the 2019 conference of the North American chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2019, Minneapolis, MN, USA, June 2-7, 2019, volume 1 (long and short papers) (pp. 4171\u20134186). Association for Computational Linguistics. https:\/\/doi.org\/10.18653\/V1\/N19-1423","DOI":"10.18653\/V1\/N19-1423"},{"key":"9800_CR43","doi-asserted-by":"crossref","unstructured":"Dimanov, B., Bhatt, U., Jamnik, M., & Weller, A. (2020). You shouldn\u2019t trust me: Learning models which conceal unfairness from multiple explanation methods. In H. Espinoza, J. Hern\u00e1ndez-Orallo, X. C. Chen, S. S. \u00d3h\u00c9igeartaigh, X. Huang, M. Castillo-Effen, R. Mallah, & J. A. McDermid (Eds.), Proceedings of the workshop on artificial intelligence safety, co-located with 34th AAAI conference on artificial intelligence, SafeAI@AAAI 2020, New York City, NY, USA, February 7, 2020, CEUR workshop proceedings (Vol. 2560, pp. 63\u201373). CEUR-WS.org. https:\/\/ceur-ws.org\/Vol-2560\/paper8.pdf","DOI":"10.3233\/FAIA200380"},{"key":"9800_CR44","unstructured":"Dombrowski, A., Alber, M., Anders, C. J., Ackermann, M., M\u00fcller, K., & Kessel, P. (2019). Explanations can be manipulated and geometry is to blame. In: [214] (pp. 13567-13578). https:\/\/proceedings.neurips.cc\/paper\/2019\/hash\/bb836c01cdc9120a9c984c525e4b1a4a-Abstract.html"},{"key":"9800_CR45","doi-asserted-by":"publisher","DOI":"10.1016\/J.PATCOG.2021.108194","volume":"121","author":"A Dombrowski","year":"2022","unstructured":"Dombrowski, A., Anders, C. J., M\u00fcller, K., & Kessel, P. (2022). Towards robust explanations for deep neural networks. Pattern Recognition, 121, 108194. https:\/\/doi.org\/10.1016\/J.PATCOG.2021.108194","journal-title":"Pattern Recognition"},{"key":"9800_CR46","doi-asserted-by":"publisher","unstructured":"Dong, Y., Yang, X., Deng, Z., Pang, T., Xiao, Z., Su, H., & Zhu, J. (2021). Black-box detection of backdoor attacks with limited information and data. In 2021 IEEE\/CVF international conference on computer vision, ICCV 2021, Montreal, QC, Canada, October 10-17, 2021 (pp. 16462\u201316471). IEEE. https:\/\/doi.org\/10.1109\/ICCV48922.2021.01617","DOI":"10.1109\/ICCV48922.2021.01617"},{"key":"9800_CR47","doi-asserted-by":"publisher","unstructured":"Duddu, V., & Boutet, A. (2022). Inferring sensitive attributes from model explanations. In M. A. Hasan, & L. Xiong (Eds.), Proceedings of the 31st ACM international conference on information & knowledge management, Atlanta, GA, USA, October 17-21, 2022 (pp. 416\u2013425). ACM. https:\/\/doi.org\/10.1145\/3511808.3557362","DOI":"10.1145\/3511808.3557362"},{"key":"9800_CR48","doi-asserted-by":"publisher","unstructured":"Dwork, C. (2006). Differential privacy. In M. Bugliesi, B. Preneel, V. Sassone, I., & Wegener (Eds.), Automata, languages and programming (pp. 1\u201312). Springer Berlin Heidelberg. https:\/\/doi.org\/10.1007\/11787006_1","DOI":"10.1007\/11787006_1"},{"key":"9800_CR49","doi-asserted-by":"publisher","unstructured":"Ehsan, U., Wintersberger, P., Liao, Q. V., Watkins, E. A., Manger, C., Daum\u00e9 III, H., Riener, A., & Riedl, M. O. (2022). Human-centered explainable AI (HCXAI): Beyond opening the black-box of AI. In Extended abstracts of the 2022 CHI conference on human factors in computing systems. Association for Computing Machinery, New York, NY, USA, CHI EA \u201922.https:\/\/doi.org\/10.1145\/3491101.3503727,","DOI":"10.1145\/3491101.3503727"},{"key":"9800_CR50","volume-title":"Automating inequality: How high-tech tools profile, police, and punish the poor","author":"V Eubanks","year":"2018","unstructured":"Eubanks, V. (2018). Automating inequality: How high-tech tools profile, police, and punish the poor. St: Martin\u2019s Press."},{"key":"#cr-split#-9800_CR51.1","unstructured":"European Commission. (2016). Regulation"},{"key":"#cr-split#-9800_CR51.2","unstructured":"(EU) 2016\/679 of the European Parliament and of the Council of 27 April 2016 on the protection of natural persons with regard to the processing of personal data and on the free movement of such data, and repealing Directive 95\/46\/EC (General Data Protection Regulation) (Text with EEA relevance). https:\/\/eur-lex.europa.eu\/eli\/reg\/2016\/679\/oj"},{"key":"9800_CR52","doi-asserted-by":"publisher","unstructured":"Ferry, J., A\u00efvodji, U., Gambs, S., Huguet, M., & Siala, M. (2022). Exploiting fairness to enhance sensitive attributes reconstruction. CoRR abs\/2209.01215. https:\/\/doi.org\/10.48550\/ARXIV.2209.01215","DOI":"10.48550\/ARXIV.2209.01215"},{"key":"9800_CR53","unstructured":"Fisher, A., Rudin, C., & Dominici, F. (2019). All models are wrong, but many are useful: Learning a variable\u2019s importance by studying an entire class of prediction models simultaneously. Journal of Machine Learning Research, 20, 177:1\u2013177:81."},{"key":"9800_CR54","doi-asserted-by":"publisher","first-page":"727","DOI":"10.1007\/s11948-012-9413-4","volume":"19","author":"L Floridi","year":"2013","unstructured":"Floridi, L. (2013). Distributed morality in an information society. Science and Engineering Ethics, 19, 727\u2013743. https:\/\/doi.org\/10.1007\/s11948-012-9413-4","journal-title":"Science and Engineering Ethics"},{"key":"9800_CR55","doi-asserted-by":"publisher","unstructured":"Floridi, L. (2016a). Faultless responsibility: On the nature and allocation of moral responsibility for distributed moral actions. Philosophical Transactions of the Royal Society A: Mathematical, Physical and Engineering Sciences, 374(2083), 20160112. https:\/\/doi.org\/10.1098\/rsta.2016.0112","DOI":"10.1098\/rsta.2016.0112"},{"key":"9800_CR56","doi-asserted-by":"crossref","unstructured":"Floridi, L. (2016b). Tolerant paternalism: Pro-ethical design as a resolution of the dilemma of toleration. Science and Engineering Ethics, 22(6), 1669\u20131688.","DOI":"10.1007\/s11948-015-9733-2"},{"key":"9800_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s13347-018-0303-9","volume":"31","author":"L Floridi","year":"2018","unstructured":"Floridi, L. (2018). Soft ethics and the governance of the digital. Philosophy & Technology, 31, 1\u20138. https:\/\/doi.org\/10.1007\/s13347-018-0303-9","journal-title":"Philosophy & Technology"},{"issue":"1","key":"9800_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2594473.2594475","volume":"15","author":"AA Freitas","year":"2013","unstructured":"Freitas, A. A. (2013). Comprehensible classification models: A position paper. SIGKDD Explorations, 15(1), 1\u201310. https:\/\/doi.org\/10.1145\/2594473.2594475","journal-title":"SIGKDD Explorations"},{"key":"9800_CR59","unstructured":"Friedman, B., & Kahn, P. H. (2002). Human values, ethics, and design. In The human-computer interaction handbook: Fundamentals, evolving technologies and emerging applications (pp. 1177\u20131201). L. Erlbaum Associates Inc."},{"issue":"5","key":"9800_CR60","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1214\/aos\/1013203451","volume":"29","author":"JH Friedman","year":"2001","unstructured":"Friedman, J. H. (2001). Greedy function approximation: A gradient boosting machine. The Annals of Statistics, 29(5), 1189\u20131232. https:\/\/doi.org\/10.1214\/aos\/1013203451","journal-title":"The Annals of Statistics"},{"key":"9800_CR61","doi-asserted-by":"crossref","unstructured":"Fukuchi, K., Hara, S., & Maehara, T. (2020). Faking fairness via stealthily biased sampling. In The thirty-fourth AAAI conference on artificial intelligence, AAAI 2020, the thirty-second innovative applications of artificial intelligence conference, IAAI 2020, the tenth AAAI symposium on educational advances in artificial intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 (pp. 412\u2013419). AAAI Press. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/5377","DOI":"10.1609\/aaai.v34i01.5377"},{"key":"9800_CR62","volume-title":"Dialogue concerning the two chief world systems","author":"G Galilei","year":"1953","unstructured":"Galilei, G. (1953). Dialogue concerning the two chief world systems. Ptolemaic and Copernican: University of California Press."},{"key":"9800_CR63","doi-asserted-by":"publisher","unstructured":"Gan, Y., Mao, Y., Zhang, X., Ji, S., Pu, Y., Han, M., Yin, J., & Wang, T. (2022). \u201cis your explanation stable?\u201d: A robustness evaluation framework for feature attribution. In H. Yin, A. Stavrou, C. Cremers, & E. Shi (Eds.), Proceedings of the 2022 ACM SIGSAC conference on computer and communications security, CCS 2022, Los Angeles, CA, USA, November 7-11, 2022 (pp. 1157\u20131171). ACM. https:\/\/doi.org\/10.1145\/3548606.3559392","DOI":"10.1145\/3548606.3559392"},{"key":"9800_CR64","doi-asserted-by":"publisher","unstructured":"Gao, Y., Xu, C., Wang, D., Chen, S., Ranasinghe, D.C., & Nepal, S. (2019). STRIP: A defence against Trojan attacks on deep neural networks. In D. Balenson (Eds.), Proceedings of the 35th annual computer security applications conference, ACSAC 2019, San Juan, PR, USA, December 09-13, 2019 (pp. 113\u2013125). ACM. https:\/\/doi.org\/10.1145\/3359789.3359790","DOI":"10.1145\/3359789.3359790"},{"key":"9800_CR65","doi-asserted-by":"publisher","unstructured":"Gebru, T., Morgenstern, J., Vecchione, B., Vaughan, J. W., Wallach, H. M., Daum\u00e9, H., III., & Crawford, K. (2021). Datasheets for datasets. Communications of the ACM, 64(12), 86\u201392. https:\/\/doi.org\/10.1145\/3458723","DOI":"10.1145\/3458723"},{"key":"9800_CR66","unstructured":"Ghalebikesabi, S., Ter-Minassian, L., DiazOrdaz, K., & Holmes, C.C (2021) On locality of local explanation models. In M. Ranzato, A. Beygelzimer, Y. N. Dauphin, P. Liang, & J. W. Vaughan (Eds.), Advances in neural information processing systems 34: Annual conference on neural information processing systems 2021, NeurIPS 2021, December 6-14, 2021, virtual (pp. 18395-18407). https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/995665640dc319973d3173a74a03860c-Abstract.html"},{"key":"9800_CR67","doi-asserted-by":"publisher","unstructured":"Ghorbani, A., Abid, A, & Zou, J. Y. (2019). Interpretation of neural networks is fragile. In The thirty-third AAAI conference on artificial intelligence, AAAI 2019, the thirty-first innovative applications of artificial intelligence conference, IAAI 2019, the ninth AAAI symposium on educational advances in artificial intelligence, EAAI 2019, Honolulu, Hawaii, USA, January 27-February 1, 2019 (pp. 3681\u20133688). AAAI Press. https:\/\/doi.org\/10.1609\/aaai.v33i01.33013681","DOI":"10.1609\/aaai.v33i01.33013681"},{"issue":"1","key":"9800_CR68","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1080\/10618600.2014.907095","volume":"24","author":"A Goldstein","year":"2015","unstructured":"Goldstein, A., Kapelner, A., Bleich, J., & Pitkin, E. (2015). Peeking inside the black box: Visualizing statistical learning with plots of individual conditional expectation. Journal of Computational and Graphical Statistics, 24(1), 44\u201365. https:\/\/doi.org\/10.1080\/10618600.2014.907095","journal-title":"Journal of Computational and Graphical Statistics"},{"key":"9800_CR69","unstructured":"Goodfellow, I. J., Shlens, J., & Szegedy, C. (2015). Explaining and harnessing adversarial examples. In Y. Bengio, & Y. LeCun (Eds.), 3rd international conference on learning representations, ICLR 2015, San Diego, CA, USA, May 7-9, 2015, conference track proceedings. http:\/\/arxiv.org\/abs\/1412.6572"},{"issue":"1","key":"9800_CR70","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1023\/A:1008290415597","volume":"8","author":"A Gopnik","year":"1998","unstructured":"Gopnik, A. (1998). Explanation as orgasm. Minds and Machines, 8(1), 101\u2013118. https:\/\/doi.org\/10.1023\/A:1008290415597","journal-title":"Minds and Machines"},{"issue":"5","key":"9800_CR71","doi-asserted-by":"crossref","first-page":"620","DOI":"10.1037\/0012-1649.37.5.620","volume":"37","author":"A Gopnik","year":"2001","unstructured":"Gopnik, A., Sobel, D. M., Schulz, L. E., & Glymour, C. (2001). Causal learning mechanisms in very young children: Two-, three-, and four-year-olds infer causal relations from patterns of variation and covariation. Developmental Psychology, 37(5), 620.","journal-title":"Developmental Psychology"},{"key":"9800_CR72","doi-asserted-by":"publisher","first-page":"47230","DOI":"10.1109\/ACCESS.2019.2909068","volume":"7","author":"T Gu","year":"2019","unstructured":"Gu, T., Liu, K., Dolan-Gavitt, B., & Garg, S. (2019). BadNets: Evaluating backdooring attacks on deep neural networks. IEEE Access, 7, 47230\u201347244. https:\/\/doi.org\/10.1109\/ACCESS.2019.2909068","journal-title":"IEEE Access"},{"key":"9800_CR73","doi-asserted-by":"publisher","unstructured":"Guidotti, R., Monreale, A., Ruggieri, S., Turini, F., Giannotti, F., & Pedreschi, D. (2019). A survey of methods for explaining black box models. ACM Computing Surveys, 51(5), 93:1\u201393:42. https:\/\/doi.org\/10.1145\/3236009","DOI":"10.1145\/3236009"},{"issue":"2","key":"9800_CR74","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1609\/AIMAG.V40I2.2850","volume":"40","author":"D Gunning","year":"2019","unstructured":"Gunning, D., & Aha, D. W. (2019). Darpa\u2019s explainable artificial intelligence (XAI) program. AI Magazine, 40(2), 44\u201358. https:\/\/doi.org\/10.1609\/AIMAG.V40I2.2850","journal-title":"AI Magazine"},{"key":"9800_CR75","doi-asserted-by":"publisher","unstructured":"Hacker, P., & Passoth, J. H. (2022). Varieties of\u00a0AI explanations under the\u00a0law. From\u00a0the\u00a0GDPR to\u00a0the\u00a0AIA, and\u00a0beyond. In A. Holzinger, R. Goebel, R. Fong, T. Moon, K. M\u00fcller, & W. Samek (Eds.), xxAI\u2014Beyond explainable AI: International workshop, held in conjunction with ICML 2020, July 18, 2020, Vienna, Austria, revised and extended papers. Lecture notes in computer science (pp. 343\u2013373). Springer International Publishing. https:\/\/doi.org\/10.1007\/978-3-031-04083-2_17","DOI":"10.1007\/978-3-031-04083-2_17"},{"issue":"4","key":"9800_CR76","first-page":"609","volume":"13","author":"D Hadwick","year":"2021","unstructured":"Hadwick, D., & Lan, S. (2021). Lessons to be learned from the Dutch childcare allowance scandal: A comparative review of algorithmic governance by tax administrations in the Netherlands. France and Germany. World Tax Journal-Amsterdam, 13(4), 609\u2013645.","journal-title":"France and Germany. World Tax Journal-Amsterdam"},{"key":"9800_CR77","unstructured":"Hagendorff, T. (2019). The ethics of AI ethics\u2014An evaluation of guidelines. CoRR abs\/1903.03425. http:\/\/arxiv.org\/abs\/1903.03425"},{"issue":"2","key":"9800_CR78","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1177\/1745691611400240","volume":"6","author":"U Hahn","year":"2011","unstructured":"Hahn, U. (2011). The problem of circularity in evidence, argument, and explanation. Perspectives on Psychological Science, 6(2), 172\u2013182. https:\/\/doi.org\/10.1177\/1745691611400240","journal-title":"Perspectives on Psychological Science"},{"key":"9800_CR79","doi-asserted-by":"publisher","DOI":"10.4324\/9781410605290","author":"DF Halpern","year":"2000","unstructured":"Halpern, D. F. (2000). Sex differences in cognitive abilities. Psychology Press. https:\/\/doi.org\/10.4324\/9781410605290","journal-title":"Psychology Press"},{"key":"9800_CR80","volume-title":"Whose science? Whose knowledge?: Thinking from women\u2019s lives","author":"S Harding","year":"1991","unstructured":"Harding, S. (1991). Whose science? Whose knowledge?: Thinking from women\u2019s lives. Cornell University Press."},{"issue":"1","key":"9800_CR81","doi-asserted-by":"crossref","first-page":"88","DOI":"10.2307\/2183532","volume":"74","author":"GH Harman","year":"1965","unstructured":"Harman, G. H. (1965). The inference to the best explanation. The Philosophical Review, 74(1), 88\u201395.","journal-title":"The Philosophical Review"},{"issue":"2","key":"9800_CR82","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1007\/s44206-022-00017-z","volume":"1","author":"A Hasan","year":"2022","unstructured":"Hasan, A., Brown, S., Davidovic, J., Lange, B., & Regan, M. (2022). Algorithmic bias and risk assessments: Lessons from practice. Digital Society, 1(2), 14. https:\/\/doi.org\/10.1007\/s44206-022-00017-z","journal-title":"Digital Society"},{"issue":"1","key":"9800_CR83","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1348\/014466600164363","volume":"39","author":"N Haslam","year":"2000","unstructured":"Haslam, N., Rothschild, L., & Ernst, D. (2000). Essentialist beliefs about social categories. British Journal of social psychology, 39(1), 113\u2013127. https:\/\/doi.org\/10.1348\/014466600164363","journal-title":"British Journal of social psychology"},{"issue":"2","key":"9800_CR84","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1207\/S15326969ECO1502_4","volume":"15","author":"H Heft","year":"2003","unstructured":"Heft, H. (2003). Affordances, dynamic experience, and the challenge of reification. Ecological Psychology, 15(2), 149\u2013180. https:\/\/doi.org\/10.1207\/S15326969ECO1502_4","journal-title":"Ecological Psychology"},{"issue":"2","key":"9800_CR85","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1086\/286983","volume":"15","author":"CG Hempel","year":"1948","unstructured":"Hempel, C. G., & Oppenheim, P. (1948). Studies in the logic of explanation. Philosophy of Science, 15(2), 135\u2013175. https:\/\/doi.org\/10.1086\/286983","journal-title":"Philosophy of Science"},{"key":"9800_CR86","unstructured":"Heo, J., Joo, S., & Moon, T. (2019). Fooling neural network interpretations via adversarial model manipulation. In H. M. Wallach, H. Larochelle, A. Beygelzimer, F. d\u2019Alch\u00e9-Buc, E. B. Fox, & R. Garnett (Eds.), Advances in neural information processing systems 32: Annual conference on neural information processing systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada (pp. 2921\u20132932). https:\/\/proceedings.neurips.cc\/paper\/2019\/hash\/7fea637fd6d02b8f0adf6f7dc36aed93-Abstract.html"},{"issue":"1","key":"9800_CR87","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1007\/s43681-020-00008-1","volume":"1","author":"M Hickok","year":"2021","unstructured":"Hickok, M. (2021). Lessons learned from AI ethics principles for future actions. AI Ethics, 1(1), 41\u201347. https:\/\/doi.org\/10.1007\/s43681-020-00008-1","journal-title":"AI Ethics"},{"key":"9800_CR88","unstructured":"Hooker, S., Erhan, D., Kindermans, P., & Kim B. (2019). A benchmark for interpretability methods in deep neural networks. In H. M. Wallach, H. Larochelle, A. Beygelzimer, F. d\u2019Alch\u00e9-Buc, E. B. Fox, & R. Garnett (Eds.), Advances in neural information processing systems 32: Annual conference on neural information processing systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada (pp. 9734\u20139745). https:\/\/proceedings.neurips.cc\/paper\/2019\/hash\/fe4b8556000d0f0cae99daa5c5c5a410-Abstract.html"},{"issue":"1","key":"9800_CR89","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1016\/0010-0277(96)81418-1","volume":"59","author":"WS Horton","year":"1996","unstructured":"Horton, W. S., & Keysar, B. (1996). When do speakers take into account common ground? Cognition, 59(1), 91\u2013117. https:\/\/doi.org\/10.1016\/0010-0277(96)81418-1","journal-title":"Cognition"},{"key":"9800_CR90","doi-asserted-by":"publisher","DOI":"10.3389\/frai.2022.903875","author":"T Huber","year":"2022","unstructured":"Huber, T., Limmer, B., & Andr\u00e9, E. (2022). Benchmarking perturbation-based saliency maps for explaining atari agents. Frontiers in Artificial Intelligence. https:\/\/doi.org\/10.3389\/frai.2022.903875","journal-title":"Frontiers in Artificial Intelligence"},{"key":"9800_CR91","unstructured":"Human\u00a0Rights Watch. (2023). Automated neglect\u2014hrw.org. Retrieved June 27, 2023, from https:\/\/www.hrw.org\/report\/2023\/06\/13\/automated-neglect\/how-world-banks-push-allocate-cash-assistance-using-algorithms"},{"key":"9800_CR92","doi-asserted-by":"publisher","unstructured":"Hyman, S. E. (2010). The diagnosis of mental disorders: The problem of reification. Annual Review of Clinical Psychology, 6(Volume 6, 2010):155\u2013179. https:\/\/doi.org\/10.1146\/annurev.clinpsy.3.022806.091532","DOI":"10.1146\/annurev.clinpsy.3.022806.091532"},{"key":"9800_CR93","unstructured":"Ilyas, A., Engstrom, L., Athalye, A., & Lin, J. (2018). Black-box adversarial attacks with limited queries and information. In J. G. Dy, & A. Krause (Eds.), Proceedings of the 35th international conference on machine learning, ICML 2018, Stockholmsm\u00e4ssan, Stockholm, Sweden, July 10-15, 2018, proceedings of machine learning research (Vol.\u00a080, pp. 2142-2151). PMLR. http:\/\/proceedings.mlr.press\/v80\/ilyas18a.html"},{"issue":"5","key":"9800_CR94","doi-asserted-by":"publisher","first-page":"496","DOI":"10.1177\/1745691612448792","volume":"7","author":"Y Inbar","year":"2012","unstructured":"Inbar, Y., & Lammers, J. (2012). Political diversity in social and personality psychology. Perspectives on Psychological Science, 7(5), 496\u2013503. https:\/\/doi.org\/10.1177\/1745691612448792","journal-title":"Perspectives on Psychological Science"},{"key":"9800_CR95","doi-asserted-by":"publisher","unstructured":"Jagielski, M., Oprea, A., Biggio, B., Liu, C., Nita-Rotaru, C., & Li, B. (2018). Manipulating machine learning: Poisoning attacks and countermeasures for regression learning. In 2018 IEEE symposium on security and privacy, SP 2018, proceedings, 21-23 May 2018, San Francisco, California, USA (pp. 19\u201335). IEEE Computer Society. https:\/\/doi.org\/10.1109\/SP.2018.00057","DOI":"10.1109\/SP.2018.00057"},{"issue":"2","key":"9800_CR96","doi-asserted-by":"publisher","first-page":"478","DOI":"10.1177\/0894439320980118","volume":"40","author":"M Janssen","year":"2022","unstructured":"Janssen, M., Hartog, M., Matheus, R., Ding, A. I., & Kuk, G. (2022). Will algorithms blind people? The effect of explainable AI and decision-makers\u2019 experience on AI-supported decision-making in government. Social Science Computer Review, 40(2), 478\u2013493. https:\/\/doi.org\/10.1177\/0894439320980118","journal-title":"Social Science Computer Review"},{"key":"9800_CR97","doi-asserted-by":"publisher","unstructured":"Jia, J., Liu, Y., & Gong, N. Z. (2022). Badencoder: Backdoor attacks to pre-trained encoders in self-supervised learning. In 43rd IEEE symposium on security and privacy, SP 2022, San Francisco, CA, USA, May 22-26, 2022 (pp. 2043\u20132059). IEEE. https:\/\/doi.org\/10.1109\/SP46214.2022.9833644","DOI":"10.1109\/SP46214.2022.9833644"},{"issue":"1","key":"9800_CR98","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1080\/1369118X.2021.1934069","volume":"26","author":"RF J\u00f8rgensen","year":"2023","unstructured":"J\u00f8rgensen, R. F. (2023). Data and rights in the digital welfare state: The case of Denmark. Information, Communication & Society, 26(1), 123\u2013138. https:\/\/doi.org\/10.1080\/1369118X.2021.1934069","journal-title":"Information, Communication & Society"},{"issue":"3","key":"9800_CR99","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1016\/0010-0285(72)90016-3","volume":"3","author":"D Kahneman","year":"1972","unstructured":"Kahneman, D., & Tversky, A. (1972). Subjective probability: A judgment of representativeness. Cognitive Psychology, 3(3), 430\u2013454. https:\/\/doi.org\/10.1016\/0010-0285(72)90016-3","journal-title":"Cognitive Psychology"},{"issue":"4","key":"9800_CR100","doi-asserted-by":"publisher","first-page":"341","DOI":"10.1037\/0003-066X.39.4.341","volume":"39","author":"D Kahneman","year":"1984","unstructured":"Kahneman, D., & Tversky, A. (1984). Choices, values, and frames. American Psychologist, 39(4), 341. https:\/\/doi.org\/10.1037\/0003-066X.39.4.341","journal-title":"American Psychologist"},{"key":"9800_CR101","doi-asserted-by":"publisher","unstructured":"Kaur, H., Nori, H., Jenkins, S., Caruana, R., Wallach, H., & Jennifer, W. V. (2020). Interpreting interpretability: Understanding data scientists\u2019 use of interpretability tools for machine learning. In Proceedings of the 2020 CHI conference on human factors in computing systems. Association for Computing Machinery, New York, NY, USA, CHI \u201920 (pp. 1\u201314). https:\/\/doi.org\/10.1145\/3313831.3376219","DOI":"10.1145\/3313831.3376219"},{"key":"9800_CR102","doi-asserted-by":"publisher","unstructured":"Keane, M. T., Kenny, E. M., Delaney, E., & Smyth, B. (2021). If only we had better counterfactual explanations: Five key deficits to rectify in the evaluation of counterfactual XAI techniques. In Z. Zhou (Ed.), Proceedings of the thirtieth international joint conference on artificial intelligence, IJCAI 2021, Virtual Event \/ Montreal, Canada, 19-27 August 2021 (pp. 4466\u20134474). ijcai.org.https:\/\/doi.org\/10.24963\/ijcai.2021\/609","DOI":"10.24963\/ijcai.2021\/609"},{"key":"9800_CR103","doi-asserted-by":"publisher","unstructured":"Keane, M. T., & Smyth, B. (2020). Good counterfactuals and where to find them: A case-based technique for generating counterfactuals for explainable AI (XAI). In I. Watson, R. O. Weber (Eds.), Case-based reasoning research and development\u201428th International conference, ICCBR 2020, Salamanca, Spain, June 8-12, 2020, proceedings, lecture notes in computer science (Vol. 12311, pp. 163\u2013178). Springer. https:\/\/doi.org\/10.1007\/978-3-030-58342-2_11","DOI":"10.1007\/978-3-030-58342-2_11"},{"key":"9800_CR104","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1146\/annurev.psych.57.102904.190100","volume":"57","author":"FC Keil","year":"2006","unstructured":"Keil, F. C. (2006). Explanation and understanding. Annual Review of Psychology, 57, 227\u2013254. https:\/\/doi.org\/10.1146\/annurev.psych.57.102904.190100","journal-title":"Annual Review of Psychology"},{"key":"9800_CR105","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/2930.001.0001","volume-title":"Explanation and cognition","author":"FC Keil","year":"2000","unstructured":"Keil, F. C., Wilson, R. A., & Wilson, R. A. (2000). Explanation and cognition. MIT Press."},{"key":"9800_CR106","doi-asserted-by":"crossref","unstructured":"Kenny, E. M., & Keane, M. T. (2021). On generating plausible counterfactual and semi-factual explanations for deep learning. In Thirty-fifth AAAI conference on artificial intelligence, AAAI 2021, thirty-third conference on innovative applications of artificial intelligence, IAAI 2021, the eleventh symposium on educational advances in artificial intelligence, EAAI 2021, virtual event, February 2-9, 2021 (pp. 11575\u201311585). AAAI Press. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/17377","DOI":"10.1609\/aaai.v35i13.17377"},{"issue":"1","key":"9800_CR107","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1006\/jmla.1995.1005","volume":"34","author":"B Keysar","year":"1995","unstructured":"Keysar, B., & Bly, B. (1995). Intuitions of the transparency of idioms: Can one keep a secret by spilling the beans? Journal of Memory and Language, 34(1), 89\u2013109. https:\/\/doi.org\/10.1006\/jmla.1995.1005","journal-title":"Journal of Memory and Language"},{"key":"9800_CR108","unstructured":"Kim, B., Wattenberg, M., Gilmer, J., Cai, C. J., Wexler, J., Vi\u00e9gas, F. B., & Sayres, R. (2018). Interpretability beyond feature attribution: Quantitative testing with concept activation vectors (TCAV). In J. G. Dy, A. Krause (Eds.), Proceedings of the 35th international conference on machine learning, ICML 2018, Stockholmsm\u00e4ssan, Stockholm, Sweden, July 10-15, 2018, proceedings of machine learning research (Vol.\u00a080, pp. 2673\u20132682). PMLR. http:\/\/proceedings.mlr.press\/v80\/kim18d.html"},{"key":"9800_CR109","unstructured":"Kim, J. S., Plumb, G., & Talwalkar, A. (2022). Sanity simulations for saliency methods. In K. Chaudhuri, S. Jegelka, L. Song, C. Szepesv\u00e1ri, G. Niu, & S. Sabato (Eds.), International conference on machine learning, ICML 2022, 17-23 July 2022, Baltimore, Maryland, USA, proceedings of machine learning research (Vol. 162, pp. 11173\u201311200). PMLR. https:\/\/proceedings.mlr.press\/v162\/kim22h.html"},{"key":"9800_CR110","doi-asserted-by":"publisher","first-page":"1121","DOI":"10.1037\/0022-3514.77.6.1121","volume":"77","author":"J Kruger","year":"2000","unstructured":"Kruger, J., & Dunning, D. (2000). Unskilled and unaware of it: How difficulties in recognizing one\u2019s own incompetence lead to inflated self-assessments. Journal of Personality and Social Psychology, 77, 1121\u201334. https:\/\/doi.org\/10.1037\/0022-3514.77.6.1121","journal-title":"Journal of Personality and Social Psychology"},{"key":"9800_CR111","doi-asserted-by":"publisher","first-page":"395","DOI":"10.1037\/0033-2909.106.3.395","volume":"106","author":"A Kruglanski","year":"1989","unstructured":"Kruglanski, A. (1989). The psychology of being right: The problem of accuracy in social perception and cognition. Psychological Bulletin, 106, 395\u2013409. https:\/\/doi.org\/10.1037\/0033-2909.106.3.395","journal-title":"Psychological Bulletin"},{"key":"9800_CR112","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1016\/S0065-2601(05)37006-7","volume":"37","author":"A Kruglanski","year":"2005","unstructured":"Kruglanski, A., Raviv, A., Bar-Tal, D., Raviv, A., Sharvit, K., Ellis, S., Bar, R., Pierro, A., & Mannetti, L. (2005). Says who?: Epistemic authority effects in social judgment. Advances in Experimental Social Psychology, 37, 345\u2013392. https:\/\/doi.org\/10.1016\/S0065-2601(05)37006-7","journal-title":"Advances in Experimental Social Psychology"},{"key":"9800_CR113","doi-asserted-by":"publisher","unstructured":"Kuhl, U., Artelt, A., & Hammer, B. (2022). Keep your friends close and your counterfactuals closer: Improved learning from closest rather than plausible counterfactual explanations in an abstract setting. In FAccT \u201922: 2022 ACM conference on fairness, accountability, and transparency, Seoul, Republic of Korea, June 21-24, 2022 (pp. 2125\u20132137). ACM. https:\/\/doi.org\/10.1145\/3531146.3534630","DOI":"10.1145\/3531146.3534630"},{"key":"9800_CR114","unstructured":"Kuhn, T. S. (1981). textitObjectivity, value judgment, and theory choice (pp. 320\u2013339). Duke University Press."},{"key":"9800_CR115","doi-asserted-by":"publisher","unstructured":"Kuppa, A., & Le-Khac, N. (2020). Black box attacks on explainable artificial intelligence (XAI) methods in cyber security. In 2020 international joint conference on neural networks, IJCNN 2020, Glasgow, United Kingdom, July 19-24, 2020 (pp. 1\u20138). IEEE. https:\/\/doi.org\/10.1109\/IJCNN48605.2020.9206780","DOI":"10.1109\/IJCNN48605.2020.9206780"},{"key":"9800_CR116","doi-asserted-by":"publisher","unstructured":"Laberge, G., A\u00efvodji, U., & Hara, S. (2022). Fooling SHAP with stealthily biased sampling. CoRR abs\/2205.15419. https:\/\/doi.org\/10.48550\/arXiv.2205.15419","DOI":"10.48550\/arXiv.2205.15419"},{"key":"9800_CR117","unstructured":"Lakkaraju, H., Arsov, N., & Bastani, O. (2020). Robust and stable black box explanations. In Proceedings of the 37th international conference on machine learning, ICML 2020, 13-18 July 2020, virtual event, proceedings of machine learning research (Vol. 119, pp. 5628\u20135638). PMLR. http:\/\/proceedings.mlr.press\/v119\/lakkaraju20a.html"},{"key":"9800_CR118","unstructured":"Lakoff, G. (2008). Women, fire, and dangerous things: What categories reveal about the mind. University of Chicago Press."},{"issue":"4","key":"9800_CR119","first-page":"631","volume":"25","author":"G Lakoff","year":"1999","unstructured":"Lakoff, G., Johnson, M., & Sowa, J. F. (1999). Review of philosophy in the flesh: The embodied mind and its challenge to western thought. Computational Linguistics, 25(4), 631\u2013634.","journal-title":"Computational Linguistics"},{"key":"9800_CR120","doi-asserted-by":"publisher","DOI":"10.1016\/J.ARTINT.2021.103473","volume":"296","author":"M Langer","year":"2021","unstructured":"Langer, M., Oster, D., Speith, T., Hermanns, H., K\u00e4stner, L., Schmidt, E., Sesing, A., & Baum, K. (2021). What do we want from explainable artificial intelligence (XAI)?\u2013A stakeholder perspective on XAI and a conceptual model guiding interdisciplinary XAI research. Artificial Intelligence, 296, 103473. https:\/\/doi.org\/10.1016\/J.ARTINT.2021.103473","journal-title":"Artificial Intelligence"},{"key":"9800_CR121","first-page":"155","volume":"10","author":"B Latour","year":"1988","unstructured":"Latour, B. (1988). The politics of explanation: An alternative. Knowledge and Reflexivity: New Frontiers in the Sociology of Knowledge, 10, 155\u2013176.","journal-title":"Knowledge and Reflexivity: New Frontiers in the Sociology of Knowledge"},{"key":"9800_CR122","doi-asserted-by":"publisher","unstructured":"Leventi-Peetz, A., & Weber, K. (2022). Rashomon effect and consistency in explainable artificial intelligence (XAI). In K. Arai (Ed.), Proceedings of the future technologies conference, FTC 2022, virtual event, 20-21 October 2022, Volume 1, lecture notes in networks and systems (Vol. 559, pp. 796\u2013808). Springer. https:\/\/doi.org\/10.1007\/978-3-031-18461-1_52","DOI":"10.1007\/978-3-031-18461-1_52"},{"key":"9800_CR123","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/5526.001.0001","author":"SC Levinson","year":"2000","unstructured":"Levinson, S. C. (2000). Presumptive meanings: The theory of generalized conversational implicature. MIT Press. https:\/\/doi.org\/10.7551\/mitpress\/5526.001.0001","journal-title":"MIT Press"},{"key":"9800_CR124","unstructured":"Liao, Q. V., & Varshney, K. R. (2021). Human-centered explainable AI (XAI): From algorithms to user experiences. CoRR abs\/2110.10790. http:\/\/arxiv.org\/abs\/2110.10790"},{"key":"9800_CR125","doi-asserted-by":"publisher","unstructured":"Lipton, P. (2017). Inference to the best explanation. In: W. H. Newton-Smith (Ed.), A companion to the philosophy of science (pp. 184\u2013193). Blackwell. https:\/\/doi.org\/10.1002\/9781405164481.ch29","DOI":"10.1002\/9781405164481.ch29"},{"issue":"3","key":"9800_CR126","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1145\/3236386.3241340","volume":"16","author":"ZC Lipton","year":"2018","unstructured":"Lipton, Z. C. (2018). The mythos of model interpretability: In machine learning, the concept of interpretability is both important and slippery. Queue, 16(3), 31\u201357. https:\/\/doi.org\/10.1145\/3236386.3241340","journal-title":"Queue"},{"key":"9800_CR127","doi-asserted-by":"publisher","DOI":"10.1016\/j.artint.2022.103787","volume":"313","author":"A Liu","year":"2022","unstructured":"Liu, A., Chen, X., Liu, S., Xia, L., & Gan, C. (2022). Certifiably robust interpretation via R\u00e9nyi differential privacy. Artificial Intelligence, 313, 103787. https:\/\/doi.org\/10.1016\/j.artint.2022.103787","journal-title":"Artificial Intelligence"},{"key":"9800_CR128","doi-asserted-by":"crossref","unstructured":"Liu, Y., Ma, S., Aafer, Y., Lee, W., Zhai, J., Wang, W., & Zhang, X. (2018). Trojaning attack on neural networks. In 25th annual network and distributed system security symposium, NDSS 2018, San Diego, California, USA, February 18-21, 2018. The Internet Society. http:\/\/wp.internetsociety.org\/ndss\/wp-content\/uploads\/sites\/25\/2018\/02\/ndss2018_03A-5_Liu_paper.pdf","DOI":"10.14722\/ndss.2018.23291"},{"key":"9800_CR129","doi-asserted-by":"publisher","unstructured":"L\u00f6fstr\u00f6m, H., Hammar, K., & Johansson U. (2022). A meta survey of quality evaluation criteria in explanation methods. In: J. D. Weerdt, & A. Polyvyanyy (Eds.), Intelligent information systems\u2014CAiSE forum 2022, Leuven, Belgium, June 6-10, 2022, proceedings, lecture notes in business information processing (Vol. 452, pp. 55\u201363). Springer. https:\/\/doi.org\/10.1007\/978-3-031-07481-3_7","DOI":"10.1007\/978-3-031-07481-3_7"},{"issue":"8","key":"9800_CR130","doi-asserted-by":"publisher","first-page":"539","DOI":"10.1111\/j.1747-9991.2011.00413.x","volume":"6","author":"T Lombrozo","year":"2011","unstructured":"Lombrozo, T. (2011). The instrumental value of explanations. Philosophy Compass, 6(8), 539\u2013551. https:\/\/doi.org\/10.1111\/j.1747-9991.2011.00413.x","journal-title":"Philosophy Compass"},{"key":"9800_CR131","doi-asserted-by":"publisher","DOI":"10.1093\/oxfordhb\/9780199734689.013.0014","author":"T Lombrozo","year":"2012","unstructured":"Lombrozo, T. (2012). Explanation and abductive inference. The Oxford Handbook of Thinking and Reasoning. https:\/\/doi.org\/10.1093\/oxfordhb\/9780199734689.013.0014","journal-title":"The Oxford Handbook of Thinking and Reasoning"},{"key":"9800_CR132","unstructured":"Lundberg, S. M., & Lee, S. (2017). A unified approach to interpreting model predictions. In I. Guyon, U. von Luxburg, S. Bengio, H. M. Wallach, R. Fergus, S. V. N. Vishwanathan, & R. Garnett (Eds.), Advances in neural information processing systems 30: Annual conference on neural information processing systems 2017, December 4-9, 2017, Long Beach, CA, USA (pp. 4765\u20134774). https:\/\/proceedings.neurips.cc\/paper\/2017\/hash\/8a20a8621978632d76c43dfd28b67767-Abstract.html"},{"key":"9800_CR133","unstructured":"Madry, A., Makelov, A., Schmidt, L., Tsipras, D., & Vladu, A. (2018). Towards deep learning models resistant to adversarial attacks. In 6th international conference on learning representations, ICLR 2018, Vancouver, BC, Canada, April 30-May 3, 2018, conference track proceedings. OpenReview.net. https:\/\/openreview.net\/forum?id=rJzIBfZAb"},{"key":"9800_CR134","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511489877","author":"CE McGarty","year":"2002","unstructured":"McGarty, C. E., Yzerbyt, V. Y., & Spears, R. E. (2002). Stereotypes as explanations: The formation of meaningful beliefs about social groups. Cambridge University Press. https:\/\/doi.org\/10.1017\/CBO9780511489877","journal-title":"Cambridge University Press"},{"issue":"1","key":"9800_CR135","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1098\/rsnr.1960.0001","volume":"15","author":"D McKie","year":"1960","unstructured":"McKie, D. (1960). The origins and foundation of the Royal Society of London. Notes and Records of the Royal Society of London, 15(1), 1\u201337. https:\/\/doi.org\/10.1098\/rsnr.1960.0001","journal-title":"Notes and Records of the Royal Society of London"},{"issue":"12","key":"9800_CR136","doi-asserted-by":"publisher","first-page":"1469","DOI":"10.1037\/0003-066X.44.12.1469","volume":"44","author":"DL Medin","year":"1989","unstructured":"Medin, D. L. (1989). Concepts and conceptual structure. American Psychologist, 44(12), 1469. https:\/\/doi.org\/10.1037\/0003-066X.44.12.1469","journal-title":"American Psychologist"},{"key":"9800_CR137","doi-asserted-by":"publisher","unstructured":"Medin, D., & Ortony, A. (1989). Comments on part I: Psychological essentialism (pp. 179\u2013196). Cambridge University Press. https:\/\/doi.org\/10.1017\/CBO9780511529863.009","DOI":"10.1017\/CBO9780511529863.009"},{"key":"9800_CR138","doi-asserted-by":"publisher","unstructured":"Mehrabi, N., Morstatter, F., Saxena, N., Lerman, K., & Galstyan, A. (2022). A survey on bias and fairness in machine learning. ACM Computing Surveys, 54(6), 115:1\u2013115:35. https:\/\/doi.org\/10.1145\/3457607","DOI":"10.1145\/3457607"},{"issue":"10","key":"9800_CR139","doi-asserted-by":"publisher","first-page":"8930","DOI":"10.1609\/aaai.v35i10.17080","volume":"35","author":"N Mehrabi","year":"2021","unstructured":"Mehrabi, N., Naveed, M., Morstatter, F., & Galstyan, A. (2021). Exacerbating algorithmic bias through fairness attacks. Proceedings of the AAAI Conference on Artificial Intelligence, 35(10), 8930\u20138938. https:\/\/doi.org\/10.1609\/aaai.v35i10.17080","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"3","key":"9800_CR140","doi-asserted-by":"crossref","first-page":"439","DOI":"10.1075\/pc.16.3.02mei","volume":"16","author":"J Meibauer","year":"2008","unstructured":"Meibauer, J. (2008). Tautology as presumptive meaning. Pragmatics & Cognition, 16(3), 439\u2013470.","journal-title":"Pragmatics & Cognition"},{"issue":"9","key":"9800_CR141","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/s42256-020-0216-z","volume":"2","author":"EL Merrer","year":"2020","unstructured":"Merrer, E. L., & Tr\u00e9dan, G. (2020). Remote explainability faces the bouncer problem. Nature Machine Intelligence, 2(9), 529\u2013539. https:\/\/doi.org\/10.1038\/s42256-020-0216-z","journal-title":"Nature Machine Intelligence"},{"issue":"1","key":"9800_CR142","doi-asserted-by":"publisher","first-page":"205395171665021","DOI":"10.1177\/2053951716650211","volume":"3","author":"J Metcalf","year":"2016","unstructured":"Metcalf, J., & Crawford, K. (2016). Where are human subjects in big data research? The emerging ethics divide. Big Data & Society, 3(1), 205395171665021. https:\/\/doi.org\/10.1177\/2053951716650211","journal-title":"Big Data & Society"},{"key":"9800_CR143","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.artint.2018.07.007","volume":"267","author":"T Miller","year":"2019","unstructured":"Miller, T. (2019). Explanation in artificial intelligence: Insights from the social sciences. Artificial Intelligence, 267, 1\u201338. https:\/\/doi.org\/10.1016\/j.artint.2018.07.007","journal-title":"Artificial Intelligence"},{"key":"9800_CR144","unstructured":"Miller, T., Howe, P., & Sonenberg, L. (2017). Explainable AI: Beware of inmates running the asylum or: How I learnt to stop worrying and love the social and behavioural sciences. CoRR abs\/1712.00547. http:\/\/arxiv.org\/abs\/1712.00547"},{"key":"9800_CR145","unstructured":"Mishra, S., Dutta, S., Long, J., & Magazzeni, D. (2021). A survey on the robustness of feature importance and counterfactual explanations. CoRR abs\/2111.00358. http:\/\/arxiv.org\/abs\/2111.00358"},{"key":"9800_CR146","doi-asserted-by":"crossref","unstructured":"Mitchell, M., Wu, S., Zaldivar, A., Barnes, P., Vasserman, L., Hutchinson, B., Spitzer, E., Raji, I. D., & Gebru, T. (2018). Model cards for model reporting. In Proceedings of the conference on fairness, accountability, and transparency.","DOI":"10.1145\/3287560.3287596"},{"key":"9800_CR147","unstructured":"Mohseni, S., Zarei, N., & Ragan, E. D. (2018). A survey of evaluation methods and measures for interpretable machine learning. CoRR abs\/1811.11839. http:\/\/arxiv.org\/abs\/1811.11839"},{"key":"9800_CR148","doi-asserted-by":"publisher","DOI":"10.1145\/3387166","author":"S Mohseni","year":"2021","unstructured":"Mohseni, S., Zarei, N., & Ragan, E. D. (2021). A multidisciplinary survey and framework for design and evaluation of explainable AI systems. ACM Transactions on Interactive Intelligent Systems. https:\/\/doi.org\/10.1145\/3387166","journal-title":"ACM Transactions on Interactive Intelligent Systems"},{"key":"9800_CR149","doi-asserted-by":"publisher","DOI":"10.1007\/s43681-022-00191-3","author":"J M\u00f6kander","year":"2022","unstructured":"M\u00f6kander, J., & Floridi, L. (2022). Operationalising AI governance through ethics-based auditing: An industry case study. AI and Ethics. https:\/\/doi.org\/10.1007\/s43681-022-00191-3","journal-title":"AI and Ethics"},{"issue":"1","key":"9800_CR150","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1007\/S00146-021-01308-8","volume":"38","author":"J Morley","year":"2023","unstructured":"Morley, J., Kinsey, L., Elhalal, A., Garcia, F., Ziosi, M., & Floridi, L. (2023). Operationalising AI ethics: Barriers, enablers and next steps. AI & Society, 38(1), 411\u2013423. https:\/\/doi.org\/10.1007\/S00146-021-01308-8","journal-title":"AI & Society"},{"key":"9800_CR151","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.3877437","author":"E Moss","year":"2021","unstructured":"Moss, E., Watkins, E. A., Singh, R., Elish, M. C., & Metcalf, J. (2021). Assembling accountability: Algorithmic impact assessment for the public interest. SSRN. https:\/\/doi.org\/10.2139\/ssrn.3877437","journal-title":"SSRN"},{"key":"9800_CR152","doi-asserted-by":"publisher","unstructured":"Nanda, V., Dooley, S., Singla, S., Feizi, S., & Dickerson, J. P. (2021). Fairness through robustness: Investigating robustness disparity in deep learning. In Proceedings of the 2021 ACM conference on fairness, accountability, and transparency. Association for Computing Machinery, New York, NY, USA, FAccT \u201921 (pp. 466-477). https:\/\/doi.org\/10.1145\/3442188.3445910","DOI":"10.1145\/3442188.3445910"},{"key":"9800_CR153","doi-asserted-by":"crossref","unstructured":"Nannini, L. (2024). Habemus a right to an explanation: So what?\u2014A framework on transparency-explainability functionality and tensions in the EU AI act. In Proceedings of the AAAI\/ACM conference on AI, ethics, and society (pp. 1023-1035). https:\/\/ojs.aaai.org\/index.php\/AIES\/article\/download\/31700\/33867\/35764","DOI":"10.1609\/aies.v7i1.31700"},{"key":"9800_CR154","doi-asserted-by":"publisher","unstructured":"Nannini, L., Balayn, A., & Smith, A. L. (2023). Explainability in AI policies: A critical review of communications, reports, regulations, and standards in the EU, US, and UK. In Proceedings of the 2023 ACM conference on fairness, accountability, and transparency, FAccT 2023, Chicago, IL, USA, June 12-15, 2023 (pp. 1198\u20131212). ACM. https:\/\/doi.org\/10.1145\/3593013.3594074","DOI":"10.1145\/3593013.3594074"},{"key":"9800_CR155","unstructured":"Nast, C. (2023). Inside the suspicion machine. wired.com. Retrieved June 27, 2023, from, https:\/\/www.wired.com\/story\/welfare-state-algorithms\/"},{"issue":"2","key":"9800_CR156","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1037\/1089-2680.2.2.175","volume":"2","author":"RS Nickerson","year":"1998","unstructured":"Nickerson, R. S. (1998). Confirmation bias: A ubiquitous phenomenon in many guises. Review of General Psychology, 2(2), 175\u2013220. https:\/\/doi.org\/10.1037\/1089-2680.2.2.175","journal-title":"Review of General Psychology"},{"issue":"1","key":"9800_CR157","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1007\/s42979-020-00390-x","volume":"2","author":"A Noack","year":"2021","unstructured":"Noack, A., Ahern, I., Dou, D., & Li, B. (2021). An empirical study on the relation between network interpretability and adversarial robustness. SN Computer Science, 2(1), 32. https:\/\/doi.org\/10.1007\/s42979-020-00390-x","journal-title":"SN Computer Science"},{"key":"9800_CR158","doi-asserted-by":"publisher","unstructured":"Noppel, M., Peter, L., & Wressnegger, C. (2023). Disguising attacks with explanation-aware backdoors. In 2023 2023 IEEE symposium on security and privacy (SP) (SP) (pp. 664\u2013681). Los Alamitos, CA, USA: IEEE Computer Society. https:\/\/doi.org\/10.1109\/SP46215.2023.00057","DOI":"10.1109\/SP46215.2023.00057"},{"key":"9800_CR159","doi-asserted-by":"publisher","unstructured":"Oh, S. J., Schiele, B., & Fritz, M. (2019). Towards reverse-engineering black-box neural networks. In W. Samek, G. Montavon, A. Vedaldi, L. K. Hansen & K. M\u00fcller (Eds.), Explainable AI: Interpreting, explaining and visualizing deep learning, lecture notes in computer science (Vol. 11700, pp. 121-144). Springer. https:\/\/doi.org\/10.1007\/978-3-030-28954-6_7","DOI":"10.1007\/978-3-030-28954-6_7"},{"key":"9800_CR160","doi-asserted-by":"publisher","unstructured":"Papernot, N., McDaniel, P. D., Goodfellow, I. J., Jha, S., Celik, Z. B., & Swami, A. (2017). Practical black-box attacks against machine learning. In R. Karri, O. Sinanoglu, A. Sadeghi, & X. Yi (Eds.), Proceedings of the 2017 ACM on Asia conference on computer and communications security, AsiaCCS 2017, Abu Dhabi, United Arab Emirates, April 2-6, 2017 (pp. 506\u2013519). ACM. https:\/\/doi.org\/10.1145\/3052973.3053009","DOI":"10.1145\/3052973.3053009"},{"key":"9800_CR161","doi-asserted-by":"publisher","unstructured":"Papernot, N., McDaniel, P. D., Wu, X., Jha, S., & Swami, A. (2016). Distillation as a defense to adversarial perturbations against deep neural networks. In IEEE symposium on security and privacy, SP 2016, San Jose, CA, USA, May 22-26, 2016 (pp. 582\u2013597). IEEE Computer Society.https:\/\/doi.org\/10.1109\/SP.2016.41","DOI":"10.1109\/SP.2016.41"},{"key":"9800_CR162","doi-asserted-by":"publisher","unstructured":"Patel, N., Shokri, R., & Zick, Y. (2022). Model explanations with differential privacy. In FAccT \u201922: 2022 ACM conference on fairness, accountability, and transparency, Seoul, Republic of Korea, June 21-24, 2022 (pp. 1895\u20131904). ACM. https:\/\/doi.org\/10.1145\/3531146.3533235","DOI":"10.1145\/3531146.3533235"},{"key":"9800_CR163","unstructured":"Pawelczyk, M., Datta, T., van\u00a0den Heuvel, J., Kasneci, G., & Lakkaraju, H. (2023). Probabilistically robust recourse: Navigating the trade-offs between costs and robustness in algorithmic recourse. In The eleventh international conference on learning representations, ICLR 2023, Kigali, Rwanda, May 1-5, 2023. OpenReview.net. https:\/\/openreview.net\/pdf?id=sC-PmTsiTB"},{"key":"9800_CR164","doi-asserted-by":"crossref","unstructured":"Popper, K. (2014). Conjectures and refutations: The growth of scientific knowledge. Routledge.","DOI":"10.4324\/9780203538074"},{"key":"9800_CR165","doi-asserted-by":"publisher","unstructured":"Quan, P., Chakraborty, S., Jeyakumar, J. V., & Srivastava, M. B. (2022). On the amplification of security and privacy risks by post-hoc explanations in machine learning models. CoRR abs\/2206.14004. https:\/\/doi.org\/10.48550\/arXiv.2206.14004","DOI":"10.48550\/arXiv.2206.14004"},{"key":"9800_CR166","doi-asserted-by":"publisher","DOI":"10.1177\/1461444819876115","author":"A Rahman","year":"2020","unstructured":"Rahman, A. (2020). Algorithms of oppression: How search engines reinforce racism. New Media & Society. https:\/\/doi.org\/10.1177\/1461444819876115","journal-title":"New Media & Society"},{"key":"9800_CR167","doi-asserted-by":"publisher","unstructured":"Raji, I. D., Smart, A., White, R. N., Mitchell, M., Gebru, T., Hutchinson, B., Smith-Loud, J., Theron, D., & Barnes, P. (2020). Closing the AI accountability gap: Defining an end-to-end framework for internal algorithmic auditing. In M. Hildebrandt, C. Castillo, L. E. Celis, S. Ruggieri, L. Taylor, & G. Zanfir-Fortuna (Eds.), FAT* \u201920: Conference on fairness, accountability, and transparency, Barcelona, Spain, January 27-30, 2020 (pp. 33\u201344). ACM. https:\/\/doi.org\/10.1145\/3351095.3372873","DOI":"10.1145\/3351095.3372873"},{"key":"9800_CR168","doi-asserted-by":"publisher","DOI":"10.1016\/j.jlp.2022.104734","volume":"76","author":"A Raveendran","year":"2022","unstructured":"Raveendran, A., Renjith, V., & Madhu, G. (2022). A comprehensive review on dynamic risk analysis methodologies. Journal of Loss Prevention in the Process Industries, 76, 104734. https:\/\/doi.org\/10.1016\/j.jlp.2022.104734","journal-title":"Journal of Loss Prevention in the Process Industries"},{"key":"9800_CR169","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/bs.acdb.2020.05.001","volume":"59","author":"M Rhodes","year":"2020","unstructured":"Rhodes, M., & Moty, K. (2020). What is social essentialism and how does it develop? Advances in Child Development and Behavior, 59, 1\u201330. https:\/\/doi.org\/10.1016\/bs.acdb.2020.05.001","journal-title":"Advances in Child Development and Behavior"},{"key":"9800_CR170","doi-asserted-by":"publisher","unstructured":"Ribeiro, M. T., Singh, S., & Guestrin, C. (2016). \u201cwhy should I trust you?\u201d: Explaining the predictions of any classifier. In B. Krishnapuram, M. Shah, A. J. Smola, C. C. Aggarwal, D. Shen, & R. Rastogi (Eds.), Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining, San Francisco, CA, USA, August 13-17, 2016 (pp. 1135\u20131144). ACM. https:\/\/doi.org\/10.1145\/2939672.2939778","DOI":"10.1145\/2939672.2939778"},{"key":"9800_CR171","unstructured":"Rieger, L., & Hansen, L. K. (2020). A simple defense against adversarial attacks on heatmap explanations. CoRR abs\/2007.06381. http:\/\/arxiv.org\/abs\/2007.06381"},{"issue":"4","key":"9800_CR172","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1007\/S11023-019-09509-3","volume":"29","author":"S Robbins","year":"2019","unstructured":"Robbins, S. (2019). A misdirected principle with a catch: Explicability for AI. Minds and Machines, 29(4), 495\u2013514. https:\/\/doi.org\/10.1007\/S11023-019-09509-3","journal-title":"Minds and Machines"},{"key":"9800_CR173","doi-asserted-by":"publisher","unstructured":"Ronnow-Rasmussen, T. (2015). Intrinsic and extrinsic value. In The Oxford handbook of value theory (pp. 29\u201343). Oxford University Press. https:\/\/doi.org\/10.1093\/oxfordhb\/9780199959303.013.0003","DOI":"10.1093\/oxfordhb\/9780199959303.013.0003"},{"issue":"1","key":"9800_CR174","first-page":"1","volume":"1","author":"S Rossnan","year":"2006","unstructured":"Rossnan, S. (2006). Overcoming math anxiety. Mathitudes, 1(1), 1\u20134.","journal-title":"Overcoming math anxiety. Mathitudes"},{"issue":"5","key":"9800_CR175","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1207\/s15516709cog2605_1","volume":"26","author":"L Rozenblit","year":"2002","unstructured":"Rozenblit, L., & Keil, F. (2002). The misunderstood limits of folk science: An illusion of explanatory depth. Cognitive Science, 26(5), 521\u2013562. https:\/\/doi.org\/10.1207\/s15516709cog2605_1","journal-title":"Cognitive Science"},{"issue":"5","key":"9800_CR176","doi-asserted-by":"publisher","first-page":"206","DOI":"10.1038\/s42256-019-0048-x","volume":"1","author":"C Rudin","year":"2019","unstructured":"Rudin, C. (2019). Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead. Nature Machine Intelligence, 1(5), 206\u2013215. https:\/\/doi.org\/10.1038\/s42256-019-0048-x","journal-title":"Nature Machine Intelligence"},{"key":"9800_CR177","volume-title":"Scientific explanation and the causal structure of the world","author":"WC Salmon","year":"1984","unstructured":"Salmon, W. C. (1984). Scientific explanation and the causal structure of the world. Princeton University Press."},{"key":"9800_CR178","first-page":"3","volume":"13","author":"WC Salmon","year":"1989","unstructured":"Salmon, W. C. (1989). Four decades of scientific explanation. Minnesota Studies in the Philosophy of Science, 13, 3\u2013219.","journal-title":"Minnesota Studies in the Philosophy of Science"},{"key":"9800_CR179","doi-asserted-by":"publisher","unstructured":"Sambasivan, N., Kapania, S., Highfill, H., Akrong, D., Paritosh, P., & Aroyo, L. M. (2021). \u201ceveryone wants to do the model work, not the data work\u201d: Data cascades in high-stakes ai. In Proceedings of the 2021 CHI conference on human factors in computing systems. Association for Computing Machinery, New York, NY, USA, CHI \u201921. https:\/\/doi.org\/10.1145\/3411764.3445518","DOI":"10.1145\/3411764.3445518"},{"key":"9800_CR180","doi-asserted-by":"crossref","DOI":"10.4324\/9781410610386","volume-title":"Making minds less well educated than our own","author":"RC Schank","year":"2004","unstructured":"Schank, R. C. (2004). Making minds less well educated than our own. Routledge."},{"key":"9800_CR181","doi-asserted-by":"publisher","unstructured":"Schemmer, M., Hemmer, P., Nitsche, M., K\u00fchl, N., & V\u00f6ssing, M. (2022). A meta-analysis of the utility of explainable artificial intelligence in human-AI decision-making. In Proceedings of the 2022 AAAI\/ACM conference on AI, ethics, and society. Association for Computing Machinery, New York, NY, USA, AIES \u201922 (pp. 617\u2013626). https:\/\/doi.org\/10.1145\/3514094.3534128","DOI":"10.1145\/3514094.3534128"},{"key":"9800_CR182","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511609213","author":"JR Searle","year":"1979","unstructured":"Searle, J. R. (1979). Expression and meaning: Studies in the theory of speech acts. Cambridge University Press. https:\/\/doi.org\/10.1017\/CBO9780511609213","journal-title":"Cambridge University Press"},{"key":"9800_CR183","unstructured":"Selbst. A. D. (2021). An institutional view of algorithmic impact assessments. Harvard Journal of Law & Technology, 35(1). https:\/\/ssrn.com\/abstract=3867634"},{"key":"9800_CR184","unstructured":"Severi, G., Meyer, J., Coull, S. E., & Oprea, A. (2021). Explanation-guided backdoor poisoning attacks against malware classifiers. In M. Bailey, & R. Greenstadt (Eds.), 30th USENIX security symposium, USENIX security 2021, August 11-13, 2021 (pp. 1487\u20131504). USENIX Association. https:\/\/www.usenix.org\/conference\/usenixsecurity21\/presentation\/severi"},{"key":"9800_CR185","unstructured":"Shafahi, A., Huang, W. R., Najibi, M., Suciu, O., Studer, C., Dumitras, T., & Goldstein, T. (2018) Poison frogs! Targeted clean-label poisoning attacks on neural networks. In S. Bengio, H. M. Wallach, H. Larochelle, K. Grauman, N. Cesa-Bianchi, & R. Garnett (Eds.), Advances in neural information processing systems 31: Annual conference on neural information processing systems 2018, NeurIPS 2018, December 3-8, 2018, Montr\u00e9al, Canada (pp. 6106\u20136116). https:\/\/proceedings.neurips.cc\/paper\/2018\/hash\/22722a343513ed45f14905eb07621686-Abstract.html"},{"key":"9800_CR186","unstructured":"Shafahi, A., Najibi, M., Ghiasi, A., Xu, Z., Dickerson, J. P., Studer, C., Davis, L. S., Taylor, G., & Goldstein, T. (2019). Adversarial training for free! In H. M. Wallach, H. Larochelle, A. Beygelzimer, F. d\u2019Alch\u00e9-Buc, E. B. Fox, & R. Garnett (Eds.), Advances in neural information processing systems 32: Annual conference on neural information processing systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada (pp. 3353\u20133364). https:\/\/proceedings.neurips.cc\/paper\/2019\/hash\/7503cfacd12053d309b6bed5c89de212-Abstract.html"},{"key":"9800_CR187","doi-asserted-by":"publisher","unstructured":"Shokri, R., Strobel, M., & Zick, Y. (2021). On the privacy risks of model explanations. In M. Fourcade, B. Kuipers, S. Lazar, & D. K. Mulligan (Eds.), AIES \u201921: AAAI\/ACM conference on AI, ethics, and society, virtual event, USA, May 19-21, 2021. ACM, pp. 231\u2013241. https:\/\/doi.org\/10.1145\/3461702.3462533.","DOI":"10.1145\/3461702.3462533"},{"key":"9800_CR188","doi-asserted-by":"publisher","unstructured":"Sinha, S., Chen, H., Sekhon, A., Ji, Y., & Qi, Y. (2021). Perturbing inputs for fragile interpretations in deep natural language processing. In J. Bastings, Y. Belinkov, E. Dupoux, M. Giulianelli, D. Hupkes, Y. Pinter, & H. Sajjad (Eds.), Proceedings of the fourth BlackboxNLP workshop on analyzing and interpreting neural networks for NLP, BlackboxNLP@EMNLP 2021, Punta Cana, Dominican Republic, November 11, 2021 (pp. 420\u2013434). Association for Computational Linguistics. https:\/\/doi.org\/10.18653\/v1\/2021.blackboxnlp-1.33","DOI":"10.18653\/v1\/2021.blackboxnlp-1.33"},{"key":"9800_CR189","doi-asserted-by":"publisher","unstructured":"Sinha, S., Huai, M., Sun, J., & Zhang A. (2022). Understanding and enhancing robustness of concept-based models. CoRR abs\/2211.16080. https:\/\/doi.org\/10.48550\/arXiv.2211.16080","DOI":"10.48550\/arXiv.2211.16080"},{"key":"9800_CR190","doi-asserted-by":"publisher","unstructured":"Slack, D., Hilgard, S., Jia, E., Singh, S., & Lakkaraju, H. (2020) Fooling lime and shap: Adversarial attacks on post hoc explanation methods. In Proceedings of the AAAI\/ACM conference on AI, ethics, and society. Association for Computing Machinery, New York, NY, USA, AIES \u201920 (pp. 180\u2013186). https:\/\/doi.org\/10.1145\/3375627.3375830","DOI":"10.1145\/3375627.3375830"},{"key":"9800_CR191","unstructured":"Slack, D., Hilgard, A., Lakkaraju, H., & Singh S. (2021a). Counterfactual explanations can be manipulated. In M. Ranzato, A. Beygelzimer, Y. N. Dauphin, P. Liang & J. W. Vaughan (Eds.), Advances in neural information processing systems 34: Annual conference on neural information processing systems 2021, NeurIPS 2021, December 6-14, 2021, virtual (pp. 62-75). https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/009c434cab57de48a31f6b669e7ba266-Abstract.html"},{"key":"9800_CR192","unstructured":"Slack, D., Hilgard, A., Singh, S., & Lakkaraju, H. (2021b) Reliable post hoc explanations: Modeling uncertainty in explainability. In M. Ranzato, A. Beygelzimer, Y. N. Dauphin, P. Liang & J. W. Vaughan (Eds.), Advances in neural information processing systems 34: Annual conference on neural information processing systems 2021, NeurIPS 2021, December 6-14, 2021, virtual (pp. 9391-9404). https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/4e246a381baf2ce038b3b0f82c7d6fb4-Abstract.html"},{"key":"9800_CR193","doi-asserted-by":"publisher","unstructured":"Sokol, K., & Flach, P. (2020). Explainability fact sheets: A framework for systematic assessment of explainable approaches. In Proceedings of the 2020 conference on fairness, accountability, and transparency. Association for Computing Machinery, New York, NY, USA, FAT* \u201920 (pp. 56-67). https:\/\/doi.org\/10.1145\/3351095.3372870","DOI":"10.1145\/3351095.3372870"},{"key":"9800_CR194","doi-asserted-by":"publisher","unstructured":"Solans, D., Biggio, B., & Castillo, C. (2020). Poisoning attacks on algorithmic fairness. In F. Hutter, K. Kersting, J. Lijffijt, & I. Valera (Eds.), Machine learning and knowledge discovery in databases\u2014European conference, ECML PKDD 2020, Ghent, Belgium, September 14-18, 2020, proceedings, part I, lecture notes in computer science (Vol. 12457, pp. 162\u2013177). Springer. https:\/\/doi.org\/10.1007\/978-3-030-67658-2_10","DOI":"10.1007\/978-3-030-67658-2_10"},{"key":"9800_CR195","doi-asserted-by":"publisher","unstructured":"Sorokina, D., Caruana, R., Riedewald, M., & Fink, D. (2008). Detecting statistical interactions with additive groves of trees. In W. W. Cohen, McCallum, A., & S. T. Roweis (Eds.), Machine learning, proceedings of the twenty-fifth international conference (ICML 2008), Helsinki, Finland, June 5-9, 2008, ACM international conference proceeding series (Vol. 307, pp. 1000-1007). ACM.https:\/\/doi.org\/10.1145\/1390156.1390282","DOI":"10.1145\/1390156.1390282"},{"key":"9800_CR196","doi-asserted-by":"publisher","DOI":"10.1093\/0195174089.001.0001","author":"PK Stanford","year":"2006","unstructured":"Stanford, P. K. (2006). Exceeding our grasp: Science, history, and the problem of unconceived alternatives. Oxford University Press. https:\/\/doi.org\/10.1093\/0195174089.001.0001","journal-title":"Oxford University Press"},{"key":"9800_CR197","doi-asserted-by":"publisher","first-page":"11974","DOI":"10.1109\/ACCESS.2021.3051315","volume":"9","author":"I Stepin","year":"2021","unstructured":"Stepin, I., Alonso, J. M., Catal\u00e1, A., & Pereira-Fari\u00f1a, M. (2021). A survey of contrastive and counterfactual explanation generation methods for explainable artificial intelligence. IEEE Access, 9, 11974\u201312001. https:\/\/doi.org\/10.1109\/ACCESS.2021.3051315","journal-title":"IEEE Access"},{"key":"9800_CR198","unstructured":"Szegedy, C., Zaremba, W., Sutskever, I., Bruna, J., Erhan, D., Goodfellow, I. J., & Fergus, R. (2014). Intriguing properties of neural networks. In: Y. Bengio & Y. LeCun (Eds.), 2nd international conference on learning representations, ICLR 2014, Banff, AB, Canada, April 14-16, 2014, conference track proceedings. http:\/\/arxiv.org\/abs\/1312.6199"},{"key":"9800_CR199","doi-asserted-by":"publisher","DOI":"10.3389\/fdata.2022.704203","volume":"5","author":"R Tang","year":"2022","unstructured":"Tang, R., Liu, N., Yang, F., Zou, N., & Hu, X. (2022). Defense against explanation manipulation. Frontiers Big Data, 5, 704203. https:\/\/doi.org\/10.3389\/fdata.2022.704203","journal-title":"Frontiers Big Data"},{"key":"9800_CR200","doi-asserted-by":"publisher","DOI":"10.1007\/s43681-023-00401-6","author":"A Tartaro","year":"2024","unstructured":"Tartaro, A., Panai, E., & Cocchiaro, M. Z. (2024). Ai risk assessment using ethical dimensions. AI and Ethics. https:\/\/doi.org\/10.1007\/s43681-023-00401-6","journal-title":"AI and Ethics"},{"key":"9800_CR201","unstructured":"The Royal Society. (1662). First charter. History of the Royal Society. https:\/\/royalsociety.org\/about-us\/who-we-are\/history\/"},{"key":"9800_CR202","doi-asserted-by":"crossref","unstructured":"Tomsett, R., Harborne, D., Chakraborty, S., Gurram, P., & Preece, A. D. (2020). Sanity checks for saliency metrics. In The thirty-fourth AAAI conference on artificial intelligence, AAAI 2020, the thirty-second innovative applications of artificial intelligence conference, IAAI 2020, the tenth AAAI symposium on educational advances in artificial intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 (pp. 6021\u20136029). AAAI Press. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/6064","DOI":"10.1609\/aaai.v34i04.6064"},{"key":"9800_CR203","unstructured":"Tram\u00e8r, F., Carlini, N., Brendel, W., & Madry A. (2020). On adaptive attacks to adversarial example defenses. In: H. Larochelle, M. Ranzato, R. Hadsell, M. Balcan & H. Lin (Eds.), Advances in neural information processing systems 33: Annual conference on neural information processing systems 2020, NeurIPS 2020, December 6-12, 2020, virtual. https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/11f38f8ecd71867b42433548d1078e38-Abstract.html"},{"issue":"2","key":"9800_CR204","doi-asserted-by":"publisher","first-page":"212","DOI":"10.1086\/341050","volume":"69","author":"JD Trout","year":"2002","unstructured":"Trout, J. D. (2002). Scientific explanation and the sense of understanding. Philosophy of Science, 69(2), 212\u2013233. https:\/\/doi.org\/10.1086\/341050","journal-title":"Philosophy of Science"},{"issue":"2","key":"9800_CR205","first-page":"452","volume":"65","author":"RM Tubbs","year":"1990","unstructured":"Tubbs, R. M., Messier, W. F., & Knechel, W. R. (1990). Recency effects in the auditor\u2019s belief-revision process. The Accounting Review, 65(2), 452\u2013460.","journal-title":"The Accounting Review"},{"issue":"2","key":"9800_CR206","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1016\/0010-0285(73)90033-9","volume":"5","author":"A Tversky","year":"1973","unstructured":"Tversky, A., & Kahneman, D. (1973). Availability: A heuristic for judging frequency and probability. Cognitive Psychology, 5(2), 207\u2013232. https:\/\/doi.org\/10.1016\/0010-0285(73)90033-9","journal-title":"Cognitive Psychology"},{"key":"9800_CR207","doi-asserted-by":"publisher","unstructured":"Vandenberghe, F. (2015). Reification: History of the concept (pp. 203\u2013206). https:\/\/doi.org\/10.1016\/B978-0-08-097086-8.03109-3","DOI":"10.1016\/B978-0-08-097086-8.03109-3"},{"issue":"CSCW1","key":"9800_CR208","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3579605","volume":"7","author":"H Vasconcelos","year":"2023","unstructured":"Vasconcelos, H., J\u00f6rke, M., Grunde-McLaughlin, M., Gerstenberg, T., Bernstein, M. S., & Krishna, R. (2023). Explanations can reduce overreliance on AI systems during decision-making. Proceedings of the ACM on Human-Computer Interaction, 7(CSCW1), 1\u201338. https:\/\/doi.org\/10.1145\/3579605","journal-title":"Proceedings of the ACM on Human-Computer Interaction"},{"key":"9800_CR209","doi-asserted-by":"publisher","unstructured":"Veldanda, A. K., Liu, K., Tan, B., Krishnamurthy, P., Khorrami, F., Karri, R., Dolan-Gavitt, B., & Garg, S. (2021). Nnoculation: Catching badnets in the wild. In N. Carlini, A. Demontis, & Y. Chen, (Eds.), AISec@CCS 2021: Proceedings of the 14th ACM workshop on artificial intelligence and security, virtual event, Republic of Korea, 15 November 2021 (pp. 49\u201360). ACM. https:\/\/doi.org\/10.1145\/3474369.3486874","DOI":"10.1145\/3474369.3486874"},{"key":"9800_CR210","doi-asserted-by":"publisher","DOI":"10.1016\/j.artint.2022.103840","volume":"316","author":"M Virgolin","year":"2023","unstructured":"Virgolin, M., & Fracaros, S. (2023). On the robustness of sparse counterfactual explanations to adverse perturbations. Artificial Intelligence, 316, 103840. https:\/\/doi.org\/10.1016\/j.artint.2022.103840","journal-title":"Artificial Intelligence"},{"key":"9800_CR211","doi-asserted-by":"publisher","DOI":"10.1007\/s10618-022-00900-w","author":"D Vre\u0161","year":"2022","unstructured":"Vre\u0161, D., & Robnik-\u0160ikonja, M. (2022). Preventing deception with explanation methods using focused sampling. Data Mining and Knowledge Discovery. https:\/\/doi.org\/10.1007\/s10618-022-00900-w","journal-title":"Data Mining and Knowledge Discovery"},{"key":"9800_CR212","doi-asserted-by":"crossref","unstructured":"Wachter, S., Mittelstadt, B. D., & Russell, C. (2017). Counterfactual explanations without opening the black box: Automated decisions and the GDPR. CoRR abs\/1711.00399. http:\/\/arxiv.org\/abs\/1711.00399","DOI":"10.2139\/ssrn.3063289"},{"key":"9800_CR213","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1037\/0278-7393.26.1.53","volume":"26","author":"M Waldmann","year":"2000","unstructured":"Waldmann, M. (2000). Competition among causes but not effects in predictive and diagnostic learning. Journal of Experimental Psychology Learning Memory and Cognition, 26, 53\u201376. https:\/\/doi.org\/10.1037\/0278-7393.26.1.53","journal-title":"Journal of Experimental Psychology Learning Memory and Cognition"},{"key":"9800_CR214","unstructured":"Wallach, H. M., Larochelle, H., Beygelzimer, A., d\u2019Alch\u00e9-Buc, F., Fox, E. B., & Garnett, R (Eds.). (2019). Advances in neural information processing systems 32: Annual conference on neural information processing systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada. https:\/\/proceedings.neurips.cc\/paper\/2019"},{"issue":"1","key":"9800_CR215","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1007\/bf01063922","volume":"100","author":"DN Walton","year":"1994","unstructured":"Walton, D. N. (1994). Begging the question as a pragmatic fallacy. Synthese, 100(1), 95\u2013131. https:\/\/doi.org\/10.1007\/bf01063922","journal-title":"Synthese"},{"key":"9800_CR216","unstructured":"Walton, D. (2008). Informal logic: A pragmatic approach. Cambridge University Press."},{"key":"9800_CR217","unstructured":"Walton, D. (2010). The place of emotion in argument. Penn State Press."},{"key":"9800_CR218","doi-asserted-by":"publisher","unstructured":"Warnecke, A., Arp, D., Wressnegger, C., & Rieck, K. (2020). Evaluating explanation methods for deep learning in security. In IEEE European symposium on security and privacy, EuroS &P 2020, Genoa, Italy, September 7-11, 2020 (pp. 158\u2013174). IEEE. https:\/\/doi.org\/10.1109\/EuroSP48549.2020.00018","DOI":"10.1109\/EuroSP48549.2020.00018"},{"issue":"3","key":"9800_CR219","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1007\/s11023-019-09506-6","volume":"29","author":"DS Watson","year":"2019","unstructured":"Watson, D. S. (2019). The rhetoric and reality of anthropomorphism in artificial intelligence. Minds and Machines, 29(3), 417\u2013440. https:\/\/doi.org\/10.1007\/s11023-019-09506-6","journal-title":"Minds and Machines"},{"key":"9800_CR220","unstructured":"Weerts, H. J. P., Dud\u00edk, M., Edgar, R., Jalali, A., Lutz, R., & Madaio, M. (2023) Fairlearn: Assessing and improving fairness of AI systems. Journal of Machine Learning Research, 24, 257:1\u2013257:8"},{"key":"9800_CR221","doi-asserted-by":"publisher","unstructured":"Weidinger, L., Uesato, J, Rauh, M., Griffin, C., Huang, P.-S., Mellor, J., Glaese, A., Cheng, M., Balle, B., Kasirzadeh, A., Biles, C., Brown, S., Kenton, Z., Hawkins, W., Stepleton, T., Birhane, A., Hendricks, L. A., Rimell, L., Isaac, W., \u2026 Gabriel, I. (2022) Taxonomy of risks posed by language models. In 2022 ACM conference on fairness, accountability, and transparency. Association for Computing Machinery, New York, NY, USA, FAccT \u201922 (pp. 214\u2013229). https:\/\/doi.org\/10.1145\/3531146.3533088","DOI":"10.1145\/3531146.3533088"},{"key":"9800_CR222","doi-asserted-by":"publisher","first-page":"470","DOI":"10.1162\/jocn.2008.20040","volume":"20","author":"D Weisberg","year":"2008","unstructured":"Weisberg, D., Keil, F., Goodstein, J., Rawson, E., & Gray, J. (2008). The seductive allure of neuroscience explanations. Journal of Cognitive Neuroscience, 20, 470\u2013477. https:\/\/doi.org\/10.1162\/jocn.2008.20040","journal-title":"Journal of Cognitive Neuroscience"},{"issue":"6","key":"9800_CR223","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1145\/1349026.1349043","volume":"51","author":"DJ Weitzner","year":"2008","unstructured":"Weitzner, D. J., Abelson, H., Berners-Lee, T., Feigenbaum, J., Hendler, J. A., & Sussman, G. J. (2008). Information accountability. Communications of the ACM, 51(6), 82\u201387. https:\/\/doi.org\/10.1145\/1349026.1349043","journal-title":"Communications of the ACM"},{"key":"9800_CR224","doi-asserted-by":"publisher","unstructured":"Wicker, M., Heo, J., Costabello, L., & Weller, A. (2022). Robust explanation constraints for neural networks. CoRR abs\/2212.08507. https:\/\/doi.org\/10.48550\/arXiv.2212.08507","DOI":"10.48550\/arXiv.2212.08507"},{"key":"9800_CR225","doi-asserted-by":"publisher","DOI":"10.1017\/dap.2022.39","author":"M Wieringa","year":"2023","unstructured":"Wieringa, M. (2023). \u201chey syri, tell me about algorithmic accountability\u2019\u2019: Lessons from a landmark case. Data & Policy. https:\/\/doi.org\/10.1017\/dap.2022.39","journal-title":"Data & Policy"},{"key":"9800_CR226","unstructured":"Wikipedia. (2023). Ignotum per ignotius. https:\/\/en.wikipedia.org\/wiki\/Ignotum_per_ignotius"},{"key":"9800_CR227","doi-asserted-by":"publisher","DOI":"10.1007\/s11191-015-9784-4","author":"D Wilkenfeld","year":"2015","unstructured":"Wilkenfeld, D., & Lombrozo, T. (2015). Inference to the best explanation (IBE) versus explaining for the best inference (EBI). Science & Education. https:\/\/doi.org\/10.1007\/s11191-015-9784-4","journal-title":"Science & Education"},{"issue":"1","key":"9800_CR228","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1023\/A:1008259020140","volume":"8","author":"RA Wilson","year":"1998","unstructured":"Wilson, R. A., & Keil, F. (1998). The shadows and shallows of explanation. Minds and Machines, 8(1), 137\u2013159. https:\/\/doi.org\/10.1023\/A:1008259020140","journal-title":"Minds and Machines"},{"issue":"11","key":"9800_CR229","doi-asserted-by":"publisher","first-page":"508","DOI":"10.1038\/s42256-019-0104-6","volume":"1","author":"W Woods","year":"2019","unstructured":"Woods, W., Chen, J., & Teuscher, C. (2019). Adversarial explanations for understanding image classification decisions and improved neural network robustness. Nature Machine Intelligence, 1(11), 508\u2013516. https:\/\/doi.org\/10.1038\/s42256-019-0104-6","journal-title":"Nature Machine Intelligence"},{"issue":"2","key":"9800_CR230","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1006\/obhd.1997.2696","volume":"70","author":"J Yates","year":"1997","unstructured":"Yates, J., Lee, J. W., & Bush, J. G. (1997). General knowledge overconfidence: Cross-national variations, response style, and \u201creality\u2019\u2019. Organizational Behavior and Human Decision Processes, 70(2), 87\u201394. https:\/\/doi.org\/10.1006\/obhd.1997.2696","journal-title":"Organizational Behavior and Human Decision Processes"},{"key":"9800_CR231","doi-asserted-by":"crossref","DOI":"10.1093\/acprof:oso\/9780199936472.001.0001","volume-title":"Epistemic authority: A theory of trust, authority, and autonomy in belief","author":"LT Zagzebski","year":"2012","unstructured":"Zagzebski, L. T. (2012). Epistemic authority: A theory of trust, authority, and autonomy in belief. Oxford University Press."},{"key":"9800_CR232","doi-asserted-by":"crossref","unstructured":"Zhang, C., Yang, Z., & Ye, Z. (2018). Detecting adversarial perturbations with saliency. CoRR abs\/1803.08773. http:\/\/arxiv.org\/abs\/1803.08773","DOI":"10.1109\/SIPROCESS.2018.8600516"},{"key":"9800_CR233","doi-asserted-by":"publisher","unstructured":"Zhang, H., Gao, J., & Su, L. (2021). Data poisoning attacks against outcome interpretations of predictive models. In F. Zhu, B. C. Ooi & C. Miao (Eds.), KDD \u201921: The 27th ACM SIGKDD conference on knowledge discovery and data mining, virtual event, Singapore, August 14-18, 2021 (pp. 2165\u20132173). ACM. https:\/\/doi.org\/10.1145\/3447548.3467405","DOI":"10.1145\/3447548.3467405"},{"key":"9800_CR234","unstructured":"Zhang, H., Yu, Y., Jiao, J, Xing, E. P., El Ghaoui, L., & Jordan, M. I. (2019) Theoretically principled trade-off between robustness and accuracy. In K. Chaudhuri & R. Salakhutdinov (Eds.), Proceedings of the 36th international conference on machine learning, ICML 2019, 9-15 June 2019, Long Beach, California, USA, proceedings of machine learning research (Vol.\u00a097, pp. 7472\u20137482). PMLR. http:\/\/proceedings.mlr.press\/v97\/zhang19p.html"},{"key":"9800_CR235","unstructured":"Zhang, X., Wang, N., Shen, H., Ji, S., Luo, X., & Wang, T. (2020) Interpretable deep learning under fire. In S. Capkun & F. Roesner (Eds.), 29th USENIX security symposium, USENIX security 2020, August 12-14, 2020 (pp. 1659\u20131676). USENIX Association. https:\/\/www.usenix.org\/conference\/usenixsecurity20\/presentation\/zhang-xinyang"}],"container-title":["Ethics and Information Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10676-024-09800-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10676-024-09800-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10676-024-09800-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,5]],"date-time":"2025-04-05T18:50:27Z","timestamp":1743879027000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10676-024-09800-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,14]]},"references-count":236,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,3]]}},"alternative-id":["9800"],"URL":"https:\/\/doi.org\/10.1007\/s10676-024-09800-7","relation":{},"ISSN":["1388-1957","1572-8439"],"issn-type":[{"value":"1388-1957","type":"print"},{"value":"1572-8439","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,14]]},"assertion":[{"value":"14 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflict of interest to declare that are relevant to the content of the submitted draft.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"We have also obtained the necessary ethical consent from the responsible authorities (i.e., the University of Santiago de Compostela) where the research has been conducted.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"No experiment was conducted with human participants or animals for this study.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Research involving human participants and\/or animals"}}],"article-number":"5"}}