{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:37:56Z","timestamp":1757619476803,"version":"3.44.0"},"publisher-location":"Singapore","reference-count":39,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819500192"},{"type":"electronic","value":"9789819500208"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-95-0020-8_12","type":"book-chapter","created":{"date-parts":[[2025,7,23]],"date-time":"2025-07-23T09:20:57Z","timestamp":1753262457000},"page":"138-150","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Towards a Concise Benchmark for Security Risk Evaluation in Large Language Models"],"prefix":"10.1007","author":[{"given":"Yu","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Yongbing","family":"Gao","sequence":"additional","affiliation":[]},{"given":"Weihao","family":"Li","sequence":"additional","affiliation":[]},{"given":"Xinguang","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,24]]},"reference":[{"issue":"1","key":"12_CR1","first-page":"1","volume":"38","author":"W Luo","year":"2024","unstructured":"Luo, W., Wang, H.F.: A review of the evaluation of large language model. J. Chin. Inf. Technol. 38(1), 1\u201323 (2024)","journal-title":"J. Chin. Inf. Technol."},{"issue":"9","key":"12_CR2","first-page":"1645","volume":"53","author":"WX Che","year":"2023","unstructured":"Che, W.X., Dou, Z.C., et al.: Challenges, opportunities, and developments in natural language processing in the era of large models. Inf. Sci. China 53(9), 1645\u20131687 (2023)","journal-title":"Inf. Sci. China"},{"key":"12_CR3","unstructured":"Dong, X., Lin, D., Wang, S.: A framework for real-time safeguarding the text generation of large language model. arXiv preprint arXiv:2404.19048 (2024)"},{"key":"12_CR4","doi-asserted-by":"crossref","unstructured":"Kumar, D., Abu Hashem, Y., Durometric, Z.: Watch your language: investigating content moderation with large language models. In: Proceedings of the International AAAI Conference on Web and Social Media, vol. 18, pp. 865\u2013878 (2024)","DOI":"10.1609\/icwsm.v18i1.31358"},{"key":"12_CR5","unstructured":"Zhao, W., Goyal, T., Chiu, Y.Y.: Wild hallucinations: evaluating long-form factuality in LLMs with real-world entity queries. arXiv preprint arXiv:2407.17468 (2024)"},{"issue":"6","key":"12_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3653304","volume":"18","author":"J Yang","year":"2024","unstructured":"Yang, J., Jin, H., Tang, R.: Harnessing the power of LLMs in practice: a survey on ChatGPT and beyond. ACM Trans. Knowl. Discov. Data 18(6), 1\u201332 (2024)","journal-title":"ACM Trans. Knowl. Discov. Data"},{"key":"12_CR7","unstructured":"Chong, C.J., Hou, C., Yao, Z.: Casper: prompt sanitization for protecting user privacy in web-based large language models. arXiv preprint arXiv:2408.07004 (2024)"},{"issue":"3","key":"12_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3641289","volume":"15","author":"Y Chang","year":"2024","unstructured":"Chang, Y., Wang, X., Wang, J.: A survey on evaluation of LLMs. ACM Trans. Intell. Syst. Technol. 15(3), 1\u201345 (2024)","journal-title":"ACM Trans. Intell. Syst. Technol."},{"key":"12_CR9","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Lei, L., Wu, L.: SafetyBench: evaluating the safety of LLMs. In: Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics, pp. 15537\u201315553 (2024)","DOI":"10.18653\/v1\/2024.acl-long.830"},{"key":"12_CR10","unstructured":"Sun, H., Zhang, Z., Deng, J.: Safety assessment of Chinese LLMs. arXiv preprint arXiv:2304.10436 (2023)"},{"key":"12_CR11","unstructured":"Yuan, X., Li, J., Wang, D.: S-Eval: automatic and adaptive test generation for BenchMarking safety evaluation of LLMs. arXiv preprint arXiv:2405.14191 (2024)"},{"key":"12_CR12","doi-asserted-by":"crossref","unstructured":"Liu, Y., Zheng, Y., Xia, S.: SAFETY-J: evaluating safety with critique. arXiv preprint arXiv:2407.17075 (2024)","DOI":"10.18653\/v1\/2024.findings-emnlp.64"},{"key":"12_CR13","unstructured":"Gupta, P., Yau, L.Q., Low, H.H.: WalledEval: a comprehensive safety evaluation toolkit for LLMs. arXiv preprint arXiv:2408.03837 (2024)"},{"key":"12_CR14","unstructured":"Qiu, H., Zhang, S., Li, A.: Latent jailbreak: a benchmark for evaluating text safety and output robustness of LLMs. arXiv preprint arXiv:2307.08487 (2023)"},{"key":"12_CR15","unstructured":"Xu, G., Liu, J., Yan, M.: CVALUES: measuring the values of Chinese LLMs from safety to responsibility. arXiv preprint arXiv:2307.09705 (2023)"},{"key":"12_CR16","unstructured":"Ji, J., Chen, Y., Jin, M.: MoralBench: moral evaluation of LLMs. arXiv preprint arXiv:2406.04428 (2024)"},{"key":"12_CR17","unstructured":"Morales, S., Clarisa, C.R., Cabot, J.: LangBite: a platform for testing bias in LLMs. arXiv preprint arXiv:2404.18558 (2024)"},{"key":"12_CR18","doi-asserted-by":"crossref","unstructured":"Li, L., Dong, B., Wang, R., et al.: SALAD-bench: a hierarchical and comprehensive safety benchmark for large language models. In: Findings of the Association for Computational Linguistics (ACL), pp. 3923\u20133954 (2024)","DOI":"10.18653\/v1\/2024.findings-acl.235"},{"key":"12_CR19","doi-asserted-by":"crossref","unstructured":"Liu, Y., Cai, C., Zhang, X.: Arondight: red teaming large vision language models with auto-generated multi-modal jailbreak prompts. arXiv preprint arXiv:2407.15050 (2024)","DOI":"10.1145\/3664647.3681379"},{"key":"12_CR20","doi-asserted-by":"crossref","unstructured":"Li, M., Chen, M.B., Tang, B.: NewsBench: a systematic evaluation framework for assessing editorial capabilities of LLMs in Chinese journalism. In: Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics, pp. 9993\u201310014 (2024)","DOI":"10.18653\/v1\/2024.acl-long.538"},{"key":"12_CR21","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Gao, Y., Li, W., et al.: Chinese generation and security index evaluation based on large language model. In: 2024 International Conference on Asian Language Processing (IALP), pp. 151\u2013161. IEEE (2024)","DOI":"10.1109\/IALP63756.2024.10661189"},{"key":"12_CR22","doi-asserted-by":"publisher","DOI":"10.1016\/j.jesp.2022.104327","volume":"101","author":"Z Zhang","year":"2022","unstructured":"Zhang, Z., Chen, Z., Xu, L.: Artificial intelligence and moral dilemmas: perception of ethical decision-making in AI. J. Exp. Soc. Psychol. 101, 104327 (2022)","journal-title":"J. Exp. Soc. Psychol."},{"key":"12_CR23","unstructured":"Zhang, Y., Li, Y., Cui, L.: Siren\u2019s song in the AI ocean: a survey on hallucination in large language models. arXiv preprint arXiv:2309.01219 (2023)"},{"key":"12_CR24","doi-asserted-by":"crossref","unstructured":"Garry, M., Chan, W.M., Foster, J., et al.: Large Language Models (LLMs) and the Institutionalization of Misinformation. Trends Cogn. Sci. (2024)","DOI":"10.1016\/j.tics.2024.08.007"},{"key":"12_CR25","unstructured":"Kojima, T., Gu, S.S., Reid, M.: LLMs are zero-shot reasoners. In: Advances in Neural Information Processing Systems, vol. 35, pp. 22199\u201322213 (2022)"},{"key":"12_CR26","doi-asserted-by":"crossref","unstructured":"Warr, M., Oster, N.J., Isaac, R.: Implicit bias in LLMs: experimental proof and implications for education. J. Res. Technol. Educ, 1\u201324 (2024)","DOI":"10.1080\/15391523.2024.2395295"},{"key":"12_CR27","unstructured":"OpenCompass: A Universal Evaluation Platform for Foundation Models. https:\/\/github.com\/open-compass\/open-compass. Accessed 30 Sept 2024"},{"key":"12_CR28","unstructured":"FlagEval: A Fast, Easy-to-use and Extensible Toolkit for Large-scale Model. https:\/\/github.com\/FlagAI-Open\/FlagAI. Accessed 30 Sept 2024"},{"key":"12_CR29","unstructured":"Hurst, A., Lerer, A., Goucher, A.P., et al.: GPT-4o System Card. arXiv preprint arXiv:2410.21276 (2024)"},{"key":"12_CR30","unstructured":"Meta AI: Introducing Meta LLaMA 3: The Most Capable Openly Available LLM to Date. Meta AI (2024)"},{"key":"12_CR31","unstructured":"Anthropic: Claude 3 Opus: Our Fastest Model yet. https:\/\/www.anthropic.com\/news\/claude-3-family. Accessed 8 Nov 2024"},{"key":"12_CR32","unstructured":"Wang, S.H., Sun, Y., Xiang, Y.: ERNIE 3.0 Titan: Exploring Larger-scale Knowledge Enhanced Pre-training for Language Understanding and Generation. arXiv preprint arXiv:2112.12731 (2021)"},{"key":"12_CR33","unstructured":"Minimax Company: Minimax-ABAB6.5 Models. https:\/\/www.minimaxi.com. Accessed 8 Nov 2024"},{"key":"12_CR34","unstructured":"Bai, J.Z., Bai, S.A., Chu, Y.F.: Qwen Technical Report. arXiv preprint arXiv:2309.16609 (2023)"},{"key":"12_CR35","unstructured":"Machel, R., Savinov, N., Teplyashin, D.: Gemini 1.5: Unlocking Multi-modal Understanding Across Millions of Tokens of Context. arXiv preprint arXiv:2403.05530 (2024)"},{"key":"12_CR36","unstructured":"Doubao Team: Doubao Pro Models. https:\/\/team.doubao.com. Accessed 8 Nov 2024"},{"key":"12_CR37","unstructured":"SenseTime Company: SenseChat. https:\/\/platform.sensenova.cn. Accessed 8 Nov 2024"},{"key":"12_CR38","unstructured":"Zeng, T., Xu, A., Xu, B.: ChatGLM: A Family of LLMs from GLM-130B to GLM-4 All Tools. arXiv preprint arXiv:2406.12793 (2024)"},{"key":"12_CR39","unstructured":"Liu, A., Feng, B., Xue, B.: DeepSeek-V3 Technical Report. arXiv preprint arXiv:2412.19437 (2024)"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-0020-8_12","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T19:45:52Z","timestamp":1757274352000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-0020-8_12"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819500192","9789819500208"],"references-count":39,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-0020-8_12","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"24 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}