{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T17:38:38Z","timestamp":1771522718008,"version":"3.50.1"},"publisher-location":"Singapore","reference-count":19,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819568871","type":"print"},{"value":"9789819568888","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-981-95-6888-8_13","type":"book-chapter","created":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T16:58:05Z","timestamp":1771520285000},"page":"183-196","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["SecEval: A Security Evaluation Dataset for\u00a0Large Language Models"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-7408-8719","authenticated-orcid":false,"given":"Huining","family":"Cui","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3003-1313","authenticated-orcid":false,"given":"Wei","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,20]]},"reference":[{"key":"13_CR1","unstructured":"Bhatt, M., et\u00a0al.: Cyberseceval 2: a wide-ranging cybersecurity evaluation suite for large language models. arXiv preprint arXiv:2404.13161 (2024)"},{"key":"13_CR2","unstructured":"Bhatt, M., et\u00a0al.: Purple llama cyberseceval: a secure coding benchmark for language models. arXiv preprint arXiv:2312.04724 (2023)"},{"key":"13_CR3","unstructured":"Ferrag, M.A., Battah, A., Tihanyi, N., Debbah, M., Lestable, T., Cordeiro, L.C.: Securefalcon: the next cyber reasoning system for cyber security. arXiv preprint arXiv:2307.06616 (2023)"},{"key":"13_CR4","unstructured":"Ferrag, M.A., Ndhlovu, M., Tihanyi, N., Cordeiro, L.C., Debbah, M., Lestable, T.: Revolutionizing cyber threat detection with large language models. arXiv preprint arXiv:2306.14263 (2023)"},{"key":"13_CR5","unstructured":"Hou, X., et al.: Large language models for software engineering: A systematic literature review. arXiv preprint arXiv:2308.10620 (2023)"},{"key":"13_CR6","doi-asserted-by":"crossref","unstructured":"Kavian, A., Kallehbasti, M.M.P., Kazemi, S., Firouzi, E., Ghafari, M.: LLM security guard for code. arXiv preprint arXiv:2405.01103 (2024)","DOI":"10.1145\/3661167.3661263"},{"key":"13_CR7","doi-asserted-by":"crossref","unstructured":"Li, H., et al.: Multi-step jailbreaking privacy attacks on chatgpt. arXiv preprint arXiv:2304.05197 (2023)","DOI":"10.18653\/v1\/2023.findings-emnlp.272"},{"key":"13_CR8","unstructured":"Liu, C., et al.: Goal-oriented prompt attack and safety evaluation for LLMs. arXiv e-prints, pp. arXiv\u20132309 (2023)"},{"key":"13_CR9","unstructured":"Liu, Z., Shi, J., Buford, J.F.: Cyberbench: a multi-task benchmark for evaluating large language models in cybersecurity"},{"key":"13_CR10","unstructured":"Perez, F., Ribeiro, I.: Ignore previous prompt: attack techniques for language models. arXiv preprint arXiv:2211.09527 (2022)"},{"key":"13_CR11","doi-asserted-by":"crossref","unstructured":"Pravasi, A., Das, S.: Assessing chatgpt\u2019s efficacy in interpreting privacy policies. In: ACM CHI 24\u2019Workshop: Generative AI in User-Generated Content (2024)","DOI":"10.2139\/ssrn.4825426"},{"key":"13_CR12","unstructured":"Siddiq, M.L., Santos, J.: Generate and pray: using sallms to evaluate the security of LLM generated code. arXiv preprint arXiv:2311.00889 (2023)"},{"issue":"7972","key":"13_CR13","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1038\/s41586-023-06291-2","volume":"620","author":"K Singhal","year":"2023","unstructured":"Singhal, K., et al.: Large language models encode clinical knowledge. Nature 620(7972), 172\u2013180 (2023)","journal-title":"Nature"},{"key":"13_CR14","unstructured":"Tihanyi, N., Ferrag, M.A., Jain, R., Debbah, M.: Cybermetric: a benchmark dataset for evaluating large language models knowledge in cybersecurity. arXiv preprint arXiv:2402.07688 (2024)"},{"key":"13_CR15","doi-asserted-by":"crossref","unstructured":"Ullah, S., Han, M., Pujar, S., Pearce, H., Coskun, A., Stringhini, G.: LLMs cannot reliably identify and reason about security vulnerabilities (yet?): a comprehensive evaluation, framework, and benchmarks. In: IEEE Symposium on Security and Privacy (2024)","DOI":"10.1109\/SP54263.2024.00210"},{"key":"13_CR16","unstructured":"Wu, S., et al.: Bloomberggpt: a large language model for finance. arXiv preprint arXiv:2303.17564 (2023)"},{"key":"13_CR17","unstructured":"Zellers, R., et al.: Defending against neural fake news. In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"13_CR18","doi-asserted-by":"crossref","unstructured":"Zhang, J., Bu, H., Wen, H., Chen, Y., Li, L., Zhu, H.: When LLMs meet cybersecurity: a systematic literature review. arXiv preprint arXiv:2405.03644 (2024)","DOI":"10.1186\/s42400-025-00361-w"},{"key":"13_CR19","unstructured":"Zhang, M., Pan, X., Yang, M.: Jade: a linguistics-based safety evaluation platform for LLM. arXiv preprint arXiv:2311.00286 (2023)"}],"container-title":["Communications in Computer and Information Science","Data Science and Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-6888-8_13","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,19]],"date-time":"2026-02-19T16:58:09Z","timestamp":1771520289000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-6888-8_13"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9789819568871","9789819568888"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-6888-8_13","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"20 February 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AusDM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Australasian Conference on Data Science and Machine Learning","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Melbourne, VIC","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Australia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ausdm2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ausdm24.ausdm.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}