{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T15:38:09Z","timestamp":1773329889348,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":38,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,4,14]]},"DOI":"10.1145\/3650105.3652291","type":"proceedings-article","created":{"date-parts":[[2024,6,12]],"date-time":"2024-06-12T16:01:35Z","timestamp":1718208095000},"page":"52-56","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":8,"title":["Assessing the Impact of GPT-4 Turbo in Generating Defeaters for Assurance Cases"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-4066-8966","authenticated-orcid":false,"given":"Kimya","family":"Khakzad Shahandashti","sequence":"first","affiliation":[{"name":"York University, Toronto, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-6463-449X","authenticated-orcid":false,"given":"Mithila","family":"Sivakumar","sequence":"additional","affiliation":[{"name":"York University, Toronto, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-8192-0164","authenticated-orcid":false,"given":"Mohammad Mahdi","family":"Mohajer","sequence":"additional","affiliation":[{"name":"York University, Toronto, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7533-7212","authenticated-orcid":false,"given":"Alvine","family":"Boaye Belle","sequence":"additional","affiliation":[{"name":"York University, Toronto, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0617-2877","authenticated-orcid":false,"given":"Song","family":"Wang","sequence":"additional","affiliation":[{"name":"York University, Toronto, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9410-2056","authenticated-orcid":false,"given":"Timothy","family":"Lethbridge","sequence":"additional","affiliation":[{"name":"University of Ottawa, Ottawa, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,6,12]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","first-page":"119569","DOI":"10.1016\/j.eswa.2023.119569","article-title":"Evidence-based decision-making: On the use of systematicity cases to check the compliance of reviews with reporting guidelines such as PRISMA 2020","volume":"217","author":"Belle A. B.","year":"2023","unstructured":"A. B. Belle and Y. Zhao. 2023. Evidence-based decision-making: On the use of systematicity cases to check the compliance of reviews with reporting guidelines such as PRISMA 2020. Expert Systems with Applications 217 (2023), 119569.","journal-title":"Expert Systems with Applications"},{"key":"e_1_3_2_1_2_1","volume-title":"Safety and Reliability","volume":"20","author":"Bishop P.","unstructured":"P. Bishop and R. Bloomfield. 2000. A methodology for safety case development. In Safety and Reliability, Vol. 20. Taylor & Francis, 34--42."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"M. Chaaben L. Burgue\u00f1o and H. Sahraoui. 2023. Towards using few-shot prompt learning for automating model completion. In ICSE-NIER. IEEE 7--12.","DOI":"10.1109\/ICSE-NIER58687.2023.00008"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ress.2022.108933"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"B. Chen K. Chen S. Hassani Y. Yang D. Amyot L. Lessard G. Mussbacher M. Sabetzadeh and D. Varr\u00f3. 2023. On the use of GPT-4 for creating goal models: an exploratory study. In REW. IEEE 262--271.","DOI":"10.1109\/REW57809.2023.00052"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"crossref","unstructured":"E. Cioroaica B. Buhnova D. Schneider I. Sorokos T. Kuhn and E. Tomur. 2022. Towards the Concept of Trust Assurance Case. In TrustCom. IEEE 1581--1586.","DOI":"10.1109\/TrustCom56396.2022.00227"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2016.2553032"},{"key":"e_1_3_2_1_8_1","volume-title":"ICSE","volume":"2","author":"Denney E.","unstructured":"E. Denney, G. Pai, and I. Habli. 2015. Dynamic safety cases for through-life safety assurance. In ICSE, Vol. 2. IEEE, 587--590."},{"key":"e_1_3_2_1_9_1","volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805","author":"Devlin J.","year":"2018","unstructured":"J. Devlin, M. Chang, K. Lee, and Kristina Toutanova. 2018. Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805 (2018)."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"S. Diemert and J. Joyce. 2020. Eliminative Argumentation for Arguing System Safety-A Practitioner's Experience. In SysCon. IEEE 1--7.","DOI":"10.1109\/SysCon47679.2020.9275852"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00165-021-00537-4"},{"key":"e_1_3_2_1_12_1","volume-title":"Evidence: Using Safety Cases in Industry and Healthcare.","author":"Foundation Health","year":"2012","unstructured":"Health Foundation. 2012. Evidence: Using Safety Cases in Industry and Healthcare."},{"key":"e_1_3_2_1_13_1","volume-title":"Tech. Rep. CMU\/SEI-2015-TR-005","author":"Goodenough J. B.","year":"2015","unstructured":"J. B. Goodenough, C. B. Weinstock, and A. Z. Klein. 2015. Eliminative argumentation: A basis for arguing confidence in system properties. SEI, Carnegie Mellon University, Pittsburgh, PA, Tech. Rep. CMU\/SEI-2015-TR-005 (2015)."},{"key":"e_1_3_2_1_14_1","unstructured":"The Assurance Case Working Group. 2021. Goal Structuring Notation Standard Version 3. https:\/\/scsc.uk\/r141C:1?t=1"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"crossref","unstructured":"A. Groza I. A. Letia A. Goron and S. Zaporojan. 2015. A formal approach for identifying assurance deficits in unmanned aerial vehicle software. In ICSEng. Springer 233--239.","DOI":"10.1007\/978-3-319-08422-0_35"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"crossref","unstructured":"R. Hawkins I. Habli D. Kolovos R. Paige and T. Kelly. 2015. Weaving an assurance case from design: a model-based approach. In HASE. IEEE 110--117.","DOI":"10.1109\/HASE.2015.25"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"crossref","unstructured":"R. Hawkins T. Kelly J. Knight and P. Graydon. 2011. A new approach to creating clear safety arguments. In SSS. Springer 3--23.","DOI":"10.1007\/978-0-85729-133-2_1"},{"key":"e_1_3_2_1_18_1","first-page":"11","article-title":"DO-178B: Software considerations in airborne systems and equipment certification","volume":"199","author":"Johnson L. A.","year":"1998","unstructured":"L. A. Johnson et al. 1998. DO-178B: Software considerations in airborne systems and equipment certification. Crosstalk, October 199 (1998), 11--20.","journal-title":"Crosstalk"},{"key":"e_1_3_2_1_19_1","unstructured":"K. Khakzad S. Alvine B. Belle T. C. Lethbridge O. Odu and M. Sivakumar. 2023. A PRISMA-driven systematic mapping study on system assurance weakeners. arXiv preprint arXiv:2311.08328 (2023)."},{"key":"e_1_3_2_1_20_1","first-page":"22199","article-title":"Large language models are zero-shot reasoners","volume":"35","author":"Kojima T.","year":"2022","unstructured":"T. Kojima, S. S. Gu, M. Reid, Y. Matsuo, and Y. Iwasawa. 2022. Large language models are zero-shot reasoners. NeuRIPS 35 (2022), 22199--22213.","journal-title":"NeuRIPS"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"crossref","unstructured":"Z. Langari and T. Maibaum. 2013. Safety cases: a review of challenges. In ASSURE. IEEE 1--6.","DOI":"10.1109\/ASSURE.2013.6614263"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","first-page":"1297","DOI":"10.1587\/transinf.2019KBP0014","article-title":"Facilitating use of assurance cases in industries by workshops with an agent-based method","volume":"103","author":"Matsuno Yutaka","year":"2020","unstructured":"Yutaka Matsuno, Toshinori Takai, and Shuichiro Yamamoto. 2020. Facilitating use of assurance cases in industries by workshops with an agent-based method. IEICE TRANSACTIONS on Information and Systems 103, 6 (2020), 1297--1308.","journal-title":"IEICE TRANSACTIONS on Information and Systems"},{"key":"e_1_3_2_1_23_1","first-page":"1","article-title":"A culturally sensitive test to evaluate nuanced gpt hallucination","volume":"1","author":"McIntosh T. R.","year":"2023","unstructured":"T. R. McIntosh, T. Liu, T. Susnjak, P. Watters, A. Ng, and M. N. Halgamuge. 2023. A culturally sensitive test to evaluate nuanced gpt hallucination. TAI 1, 01 (2023), 1--13.","journal-title":"TAI"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"C. Menghi T. Viger A. Di Sandro C. Rees J. Joyce and M. Chechik. 2023. Assurance case development as data: A manifesto. In ICSE-NIER. IEEE 135--139.","DOI":"10.1109\/ICSE-NIER58687.2023.00030"},{"key":"e_1_3_2_1_25_1","unstructured":"M. M. Mohajer R. Aleithan N. S. Harzevili M. Wei A. B. Belle H. V. Pham and S. Wang. 2023. SkipAnalyzer: An Embodied Agent for Code Analysis with Large Language Models. arXiv preprint arXiv:2310.18532 (2023)."},{"key":"e_1_3_2_1_26_1","volume-title":"2018 11th International Conference on the Quality of Information and Communications Technology (QUATIC). IEEE, 65--73","author":"Muram Faiz UL","year":"2018","unstructured":"Faiz UL Muram, Barbara Gallina, and Laura G\u00f3mez Rodr\u00edguez. 2018. Preventing omission of key evidence fallacy in process-based argumentations. In 2018 11th International Conference on the Quality of Information and Communications Technology (QUATIC). IEEE, 65--73."},{"key":"e_1_3_2_1_27_1","volume-title":"GDE Workshop in ICLP.","author":"Murugesan A.","unstructured":"A. Murugesan, I. Hong Wong, R. Stroud, J. Arias, E. Salazar, G. Gupta, R. Bloomfield, S. Varadarajan, and J. Rushby. 2023. Semantic Analysis of Assurance Cases using s (CASP). In GDE Workshop in ICLP."},{"key":"e_1_3_2_1_28_1","first-page":"689","article-title":"An extended systematic literature review on provision of evidence for safety certification","volume":"56","author":"Nair S.","year":"2014","unstructured":"S. Nair, J. L. De La Vara, M. Sabetzadeh, and L. Briand. 2014. An extended systematic literature review on provision of evidence for safety certification. IST 56, 7 (2014), 689--717.","journal-title":"IST"},{"key":"e_1_3_2_1_29_1","unstructured":"OpenAI. 2023. GPT 4. https:\/\/openai.com\/research\/gpt-4"},{"key":"e_1_3_2_1_30_1","unstructured":"OpenAI. 2023. New Models and Developer Products Announced at Dev-Day. https:\/\/openai.com\/blog\/new-models-and-developer-products-announced-at-devday. Accessed: 2024-01-14."},{"key":"e_1_3_2_1_31_1","volume-title":"SafeComp","author":"Rushby J.","unstructured":"J. Rushby. 2013. Logic and epistemology in safety cases. In SafeComp. Springer, 1--7."},{"key":"e_1_3_2_1_32_1","volume-title":"New Frontiers in Artificial Intelligence: JSAI-isAI 2013 Workshops. Springer, 304--318","author":"Rushby J.","year":"2014","unstructured":"J. Rushby. 2014. Mechanized support for assurance case argumentation. In New Frontiers in Artificial Intelligence: JSAI-isAI 2013 Workshops. Springer, 304--318."},{"key":"e_1_3_2_1_33_1","unstructured":"SACM 2021. Structured Assurance Case Metamodel. SACM."},{"key":"e_1_3_2_1_34_1","volume-title":"GPT-4 and Safety Case Generation: An Exploratory Analysis. arXiv preprint arXiv:2312.05696","author":"Sivakumar M.","year":"2023","unstructured":"M. Sivakumar, A. B. Belle, J. Shan, and K. Khakzad S. 2023. GPT-4 and Safety Case Generation: An Exploratory Analysis. arXiv preprint arXiv:2312.05696 (2023)."},{"key":"e_1_3_2_1_35_1","volume-title":"Supporting Assurance Case Development Using Generative AI. In SAFECOMP","author":"Viger T.","year":"2023","unstructured":"T. Viger, L. Murphy, S. Diemert, C. Menghi, A. Di, and M. Chechik. 2023. Supporting Assurance Case Development Using Generative AI. In SAFECOMP 2023."},{"key":"e_1_3_2_1_36_1","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume":"35","author":"Wei J.","year":"2022","unstructured":"J. Wei, X. Wang, D. Schuurmans, M. Bosma, F. Xia, E. Chi, Quoc V Le, D. Zhou, et al. 2022. Chain-of-thought prompting elicits reasoning in large language models. NeuRIPS 35 (2022), 24824--24837.","journal-title":"NeuRIPS"},{"key":"e_1_3_2_1_37_1","volume-title":"PRIMA Workshops. Springer, 47--59","author":"Yuan T.","unstructured":"T. Yuan, S. Manandhar, T. Kelly, and S. Wells. 2016. Automatically detecting fallacies in system safety arguments. In PRIMA Workshops. Springer, 47--59."},{"key":"e_1_3_2_1_38_1","unstructured":"Z. Zhu Y. Xue X. Chen D. Zhou J. Tang D. Schuurmans and H. Dai. 2023. Large Language Models can Learn Rules. arXiv preprint arXiv:2310.07064 (2023)."}],"event":{"name":"FORGE '24: 2024 IEEE\/ACM First International Conference on AI Foundation Models and Software Engineering","location":"Lisbon Portugal","acronym":"FORGE '24","sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"]},"container-title":["Proceedings of the 2024 IEEE\/ACM First International Conference on AI Foundation Models and Software Engineering"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3650105.3652291","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3650105.3652291","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:03:43Z","timestamp":1750291423000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3650105.3652291"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,14]]},"references-count":38,"alternative-id":["10.1145\/3650105.3652291","10.1145\/3650105"],"URL":"https:\/\/doi.org\/10.1145\/3650105.3652291","relation":{},"subject":[],"published":{"date-parts":[[2024,4,14]]},"assertion":[{"value":"2024-06-12","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}