{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T19:04:06Z","timestamp":1742929446243,"version":"3.40.3"},"publisher-location":"Cham","reference-count":41,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031342035"},{"type":"electronic","value":"9783031342042"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-34204-2_45","type":"book-chapter","created":{"date-parts":[[2023,6,6]],"date-time":"2023-06-06T23:04:18Z","timestamp":1686092658000},"page":"558-569","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Towards Explaining Shortcut Learning Through Attention Visualization and\u00a0Adversarial Attacks"],"prefix":"10.1007","author":[{"given":"Pedro Gon\u00e7alo","family":"Correia","sequence":"first","affiliation":[]},{"given":"Henrique","family":"Lopes Cardoso","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,6,7]]},"reference":[{"key":"45_CR1","unstructured":"Chowdhery, A. et al.: PaLM: Scaling Language Modeling with Pathways. arXiv:2204.02311 (2022)"},{"key":"45_CR2","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural Machine Translation by Jointly Learning to Align and Translate. In: Bengio, Y., LeCun, Y. (eds.) 3rd Int. Conf. on Learning Representations, ICLR 2015, San Diego, CA, USA, May 7\u20139, 2015, Conf. Track Proceedings (2015)"},{"key":"45_CR3","doi-asserted-by":"publisher","unstructured":"Bekoulis, G., Papagiannopoulou, C., Deligiannis, N.: A Review on Fact Extraction and Verification. ACM Comput. Surv. 55(1) (nov 2021). https:\/\/doi.org\/10.1145\/3485127","DOI":"10.1145\/3485127"},{"key":"45_CR4","doi-asserted-by":"publisher","unstructured":"Bowman, S.R., Angeli, G., Potts, C., Manning, C.D.: A large annotated corpus for learning natural language inference. In: Proceedings of 2015 Conference on Empirical Methods in Natural Language Processing, pp. 632\u2013642. ACL, Lisbon, Portugal (Sep 2015). https:\/\/doi.org\/10.18653\/v1\/D15-1075","DOI":"10.18653\/v1\/D15-1075"},{"key":"45_CR5","doi-asserted-by":"publisher","unstructured":"Branco, R., Branco, A., Ant\u00f3nio Rodrigues, J., Silva, J.R.: Shortcutted Commonsense: Data Spuriousness in Deep Learning of Commonsense Reasoning. In: Proceedings of 2021 Conference on Empirical Methods in Natural Language Processing, pp. 1504\u20131521. ACL (Nov 2021). https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.113","DOI":"10.18653\/v1\/2021.emnlp-main.113"},{"issue":"4","key":"45_CR6","doi-asserted-by":"publisher","first-page":"966","DOI":"10.3390\/make3040048","volume":"3","author":"V Buhrmester","year":"2021","unstructured":"Buhrmester, V., M\u00fcnch, D., Arens, M.: Analysis of Explainers of Black Box Deep Neural Networks for Computer Vision: a survey. Mach. Learn. Knowl. Extract. 3(4), 966\u2013989 (2021). https:\/\/doi.org\/10.3390\/make3040048","journal-title":"Mach. Learn. Knowl. Extract."},{"key":"45_CR7","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In: Proc. 2019 Conf. of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 4171\u20134186. ACL, Minneapolis, Minnesota (Jun 2019). https:\/\/doi.org\/10.18653\/v1\/N19-1423","DOI":"10.18653\/v1\/N19-1423"},{"key":"45_CR8","doi-asserted-by":"publisher","unstructured":"Du, M., et al.: owards Interpreting and Mitigating Shortcut Learning Behavior of NLU models. In: Proc. 2021 Conf. of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 915\u2013929. ACL (Jun 2021). https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.71","DOI":"10.18653\/v1\/2021.naacl-main.71"},{"key":"45_CR9","doi-asserted-by":"publisher","unstructured":"Feng, S., Wallace, E., Grissom II, A., Iyyer, M., Rodriguez, P., Boyd-Graber, J.: Pathologies of Neural Models Make Interpretations Difficult. In: Proc. 2018 Conf. on Empirical Methods in Natural Language Processing, pp. 3719\u20133728. ACL, Brussels, Belgium (Oct-Nov 2018). https:\/\/doi.org\/10.18653\/v1\/D18-1407","DOI":"10.18653\/v1\/D18-1407"},{"key":"45_CR10","doi-asserted-by":"publisher","unstructured":"Galassi, A., Lippi, M., Torroni, P.: Attention in Natural Language Processing. IEEE Trans. Neural Netw. Learn. Syst. 32(10), 4291\u20134308 (10 2021). https:\/\/doi.org\/10.1109\/tnnls.2020.3019893","DOI":"10.1109\/tnnls.2020.3019893"},{"key":"45_CR11","doi-asserted-by":"publisher","unstructured":"Garg, S., Ramakrishnan, G.: BAE: BERT-based Adversarial Examples for Text Classification. In: Proc. 2020 Conf. on Empirical Methods in Natural Language Processing (EMNLP), pp. 6174\u20136181. ACL (Nov 2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.498","DOI":"10.18653\/v1\/2020.emnlp-main.498"},{"key":"45_CR12","doi-asserted-by":"publisher","unstructured":"Geirhos, R., et al.: Shortcut learning in deep neural networks. Nature Mach. Intell. 2(11), 665\u2013673 (11 2020). https:\/\/doi.org\/10.1038\/s42256-020-00257-z","DOI":"10.1038\/s42256-020-00257-z"},{"key":"45_CR13","unstructured":"Goodfellow, I.J., Shlens, J., Szegedy, C.: Explaining and Harnessing Adversarial Examples. In: Bengio, Y., LeCun, Y. (eds.) 3rd Int. Conf. on Learning Representations, ICLR 2015, San Diego, CA, USA, May 7\u20139, 2015, Conference Track Proceedings (2015)"},{"key":"45_CR14","doi-asserted-by":"publisher","unstructured":"Gururangan, S., Swayamdipta, S., Levy, O., Schwartz, R., Bowman, S., Smith, N.A.: Annotation Artifacts in Natural Language Inference Data. In: Proc. 2018 Conf. of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 2 (Short Papers), pp. 107\u2013112. ACL, New Orleans, Louisiana (Jun 2018). https:\/\/doi.org\/10.18653\/v1\/N18-2017","DOI":"10.18653\/v1\/N18-2017"},{"key":"45_CR15","doi-asserted-by":"crossref","unstructured":"Han, X., Wallace, B.C., Tsvetkov, Y.: Explaining Black Box Predictions and Unveiling Data Artifacts through Influence Functions. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 5553\u20135563. ACL (Jul 2020). 10.18653\/v1\/2020.acl-main.492","DOI":"10.18653\/v1\/2020.acl-main.492"},{"key":"45_CR16","doi-asserted-by":"publisher","unstructured":"Jain, S., Wallace, B.C.: Attention is not Explanation. In: Proceedings 2019 Conf. of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 3543\u20133556. ACL, Minneapolis, Minnesota (Jun 2019). https:\/\/doi.org\/10.18653\/v1\/N19-1357","DOI":"10.18653\/v1\/N19-1357"},{"key":"45_CR17","doi-asserted-by":"publisher","unstructured":"Jin, D., Jin, Z., Zhou, J.T., Szolovits, P.: Is BERT Really Robust? A Strong Baseline for Natural Language Attack on Text Classification and Entailment. In: Proceedings of the AAAI Conference on Artificial Intelligence. vol. 34, pp. 8018\u20138025 (Apr 2020). https:\/\/doi.org\/10.1609\/aaai.v34i05.6311","DOI":"10.1609\/aaai.v34i05.6311"},{"key":"45_CR18","unstructured":"Koh, P.W., Liang, P.: Understanding Black-Box Predictions via Influence Functions. In: Proceedings of the 34th International Conference on Machine Learning - Volume 70, pp. 1885\u20131894. JMLR.org (2017)"},{"key":"45_CR19","doi-asserted-by":"publisher","unstructured":"Kovaleva, O., Romanov, A., Rogers, A., Rumshisky, A.: Revealing the Dark Secrets of BERT. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th Int. J. Conf. on Natural Language Processing (EMNLP-IJCNLP), pp. 4365\u20134374. ACL, Hong Kong, China (Nov 2019). https:\/\/doi.org\/10.18653\/v1\/D19-1445","DOI":"10.18653\/v1\/D19-1445"},{"key":"45_CR20","unstructured":"Kuleshov, V., Thakoor, S., Lau, T., Ermon, S.: Adversarial Examples for Natural Language Classification Problems (2018). https:\/\/openreview.net\/forum?id=r1QZ3zbAZ"},{"key":"45_CR21","doi-asserted-by":"publisher","unstructured":"Lee, J., Shin, J.H., Kim, J.S.: Interactive Visualization and Manipulation of Attention-based Neural Machine Translation. In: Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing: System Demonstrations, pp. 121\u2013126. ACL, Copenhagen, Denmark (Sep 2017). https:\/\/doi.org\/10.18653\/v1\/D17-2021","DOI":"10.18653\/v1\/D17-2021"},{"key":"45_CR22","unstructured":"Lei, D., Chen, X., Zhao, J.: Opening the black box of deep learning. arXiv:1805.08355 (2018)"},{"key":"45_CR23","doi-asserted-by":"publisher","unstructured":"Li, L., Ma, R., Guo, Q., Xue, X., Qiu, X.: BERT-ATTACK: Adversarial Attack Against BERT Using BERT. In: Proceedings 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 6193\u20136202. ACL (Nov 2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.500","DOI":"10.18653\/v1\/2020.emnlp-main.500"},{"key":"45_CR24","doi-asserted-by":"crossref","unstructured":"MacCartney, B., Manning, C.D.: Modeling Semantic Containment and Exclusion in Natural Language Inference. In: Proceedings of the 22nd International Conference on Computational Linguistics (Coling 2008), pp. 521\u2013528. Coling 2008 Organizing Committee, Manchester, UK (Aug 2008)","DOI":"10.3115\/1599081.1599147"},{"key":"45_CR25","unstructured":"Mnih, V., Heess, N., Graves, A., Kavukcuoglu, K.: Recurrent Models of Visual Attention. In: Proceedings of the 27th International Conference on Neural Information Processing Systems - vol. 2, pp.. 2204\u20132212. NIPS\u201914, MIT Press, Cambridge, MA, USA (2014)"},{"key":"45_CR26","doi-asserted-by":"publisher","unstructured":"Morris, J., Lifland, E., Yoo, J.Y., Grigsby, J., Jin, D., Qi, Y.: TextAttack: A framework for adversarial attacks, data augmentation, and adversarial training in NLP. In: Proceedings 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations, pp. 119\u2013126. ACL (Oct 2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-demos.16","DOI":"10.18653\/v1\/2020.emnlp-demos.16"},{"key":"45_CR27","doi-asserted-by":"publisher","unstructured":"Niven, T., Kao, H.Y.: Probing Neural Network Comprehension of Natural Language Arguments. In: Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 4658\u20134664. ACL, Florence, Italy (Jul 2019). https:\/\/doi.org\/10.18653\/v1\/P19-1459","DOI":"10.18653\/v1\/P19-1459"},{"key":"45_CR28","doi-asserted-by":"publisher","unstructured":"Peldszus, A., Stede, M.: Joint prediction in MST-style discourse parsing for argumentation mining. In: Proceedings of the 2015 Conference. on Empirical Methods in Natural Language Processing, pp. 938\u2013948. ACL, Lisbon, Portugal (Sep 2015). https:\/\/doi.org\/10.18653\/v1\/D15-1110","DOI":"10.18653\/v1\/D15-1110"},{"key":"45_CR29","doi-asserted-by":"publisher","unstructured":"Ren, S., Deng, Y., He, K., Che, W.: Generating Natural Language Adversarial Examples through Probability Weighted Word Saliency. In: Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 1085\u20131097. ACL, Florence, Italy (Jul 2019). https:\/\/doi.org\/10.18653\/v1\/P19-1103","DOI":"10.18653\/v1\/P19-1103"},{"key":"45_CR30","doi-asserted-by":"publisher","unstructured":"Ribeiro, M.T., Wu, T., Guestrin, C., Singh, S.: Beyond accuracy: Behavioral testing of NLP models with CheckList. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 4902\u20134912. ACL (Jul 2020). https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.442","DOI":"10.18653\/v1\/2020.acl-main.442"},{"key":"45_CR31","doi-asserted-by":"publisher","unstructured":"Rocha, G., Stab, C., Lopes Cardoso, H., Gurevych, I.: Cross-lingual argumentative relation identification: from English to Portuguese. In: Proceedings of the 5th Workshop on Argument Mining, pp. 144\u2013154. ACL, Brussels, Belgium (Nov 2018). https:\/\/doi.org\/10.18653\/v1\/W18-5217","DOI":"10.18653\/v1\/W18-5217"},{"key":"45_CR32","unstructured":"Sanh, V., Debut, L., Chaumond, J., Wolf, T.: Distilbert, a distilled version of bert: smaller, faster, cheaper and lighter. ArXiv abs\/1910.01108 (2019)"},{"key":"45_CR33","doi-asserted-by":"publisher","unstructured":"Serrano, S., Smith, N.A.: Is Attention Interpretable? In: Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 2931\u20132951. ACL, Florence, Italy (Jul 2019). https:\/\/doi.org\/10.18653\/v1\/P19-1282","DOI":"10.18653\/v1\/P19-1282"},{"issue":"1","key":"45_CR34","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1109\/TVCG.2018.2865044","volume":"25","author":"H Strobelt","year":"2019","unstructured":"Strobelt, H., Gehrmann, S., Behrisch, M., Perer, A., Pfister, H., Rush, A.M.: Seq2seq-Vis: a visual debugging tool for sequence-to-sequence models. IEEE Trans. Visual Comput. Graph. 25(1), 353\u2013363 (2019). https:\/\/doi.org\/10.1109\/TVCG.2018.2865044","journal-title":"IEEE Trans. Visual Comput. Graph."},{"key":"45_CR35","unstructured":"Brown, T., et al.: Language Models are Few-Shot Learners. In: Larochelle, H., Ranzato, M., Hadsell, R., Balcan, M.F., Lin, H. (eds.) In: Advances in Neural Information Processing Systems. vol. 33, pp. 1877\u20131901. Curran Associates, Inc. (2020)"},{"key":"45_CR36","doi-asserted-by":"publisher","unstructured":"Thorne, J., Vlachos, A., Christodoulopoulos, C., Mittal, A.: FEVER: a Large-scale Dataset for Fact Extraction and VERification. In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers), pp. 809\u2013819. ACL, New Orleans, Louisiana (Jun 2018). https:\/\/doi.org\/10.18653\/v1\/N18-1074","DOI":"10.18653\/v1\/N18-1074"},{"key":"45_CR37","unstructured":"Vaswani, A., et al.: Attention is All You Need. In: Proc. Int. Conf. on Neural Information Processing Systems, pp. 6000\u20136010. NIPS\u201917, Curran Associates Inc., Red Hook, NY, USA (2017)"},{"key":"45_CR38","doi-asserted-by":"publisher","unstructured":"Vig, J.: A Multiscale Visualization of Attention in the Transformer Model. In: Proceedings 57th Annual Meeting of the Association for Computational Linguistics: System Demonstrations, pp. 37\u201342. ACL, Florence, Italy (Jul 2019). https:\/\/doi.org\/10.18653\/v1\/P19-3007","DOI":"10.18653\/v1\/P19-3007"},{"key":"45_CR39","doi-asserted-by":"publisher","unstructured":"Wagner, R.A., Fischer, M.J.: The String-to-String Correction Problem. J. ACM 21(1), 168\u2013173 (1 1974). https:\/\/doi.org\/10.1145\/321796.321811","DOI":"10.1145\/321796.321811"},{"key":"45_CR40","doi-asserted-by":"publisher","unstructured":"Wiegreffe, S., Pinter, Y.: Attention is not not Explanation. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Journal Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 11\u201320. ACL, Hong Kong, China (Nov 2019). https:\/\/doi.org\/10.18653\/v1\/D19-1002","DOI":"10.18653\/v1\/D19-1002"},{"key":"45_CR41","doi-asserted-by":"publisher","unstructured":"Wolf, T., et al.: Transformers: State-of-the-Art Natural Language Processing. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations, pp. 38\u201345. ACL (Oct 2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-demos.6","DOI":"10.18653\/v1\/2020.emnlp-demos.6"}],"container-title":["Communications in Computer and Information Science","Engineering Applications of Neural Networks"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-34204-2_45","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,6]],"date-time":"2023-06-06T23:16:24Z","timestamp":1686093384000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-34204-2_45"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031342035","9783031342042"],"references-count":41,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-34204-2_45","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"7 June 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"EANN","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Engineering Applications of Neural Networks","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Le\u00f3n","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 June 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 June 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eann2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eannconf.org\/2023\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easyacademia","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"125","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"41","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"8","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"33% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.4","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}