{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T11:24:57Z","timestamp":1780485897802,"version":"3.54.1"},"reference-count":142,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,4,29]],"date-time":"2024-04-29T00:00:00Z","timestamp":1714348800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,4,29]],"date-time":"2024-04-29T00:00:00Z","timestamp":1714348800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,4,29]]},"DOI":"10.1109\/isdfs60797.2024.10527236","type":"proceedings-article","created":{"date-parts":[[2024,5,15]],"date-time":"2024-05-15T17:33:23Z","timestamp":1715794403000},"page":"1-10","source":"Crossref","is-referenced-by-count":26,"title":["A Review of Advancements and Applications of Pre-Trained Language Models in Cybersecurity"],"prefix":"10.1109","author":[{"given":"Zefang","family":"Liu","sequence":"first","affiliation":[{"name":"School of Computational Science and Engineering, Georgia Institute of Technology,Atlanta,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018","journal-title":"ar Xiv preprint"},{"key":"ref2","author":"Radford","year":"2018","journal-title":"Improving language understanding by generative pre-training"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1907.11692"},{"key":"ref4","article-title":"Distilbert, a distilled version of bert: smaller, faster, cheaper and lighter","author":"Sanh","year":"2019","journal-title":"ar Xiv preprint"},{"key":"ref5","article-title":"Albert: A lite bert for self-supervised learning of language represen-tations","author":"Lan","year":"2019","journal-title":"arXiv preprint"},{"key":"ref6","article-title":"Deberta: Decoding-enhanced bert with disentangled attention","author":"He","year":"2020","journal-title":"arXiv preprint"},{"issue":"8","key":"ref7","first-page":"9","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI blog"},{"key":"ref8","first-page":"1877","article-title":"Language mod-els are few-shot learners","volume":"33","author":"Brown","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref9","first-page":"27730","article-title":"Training language models to follow instructions with human feedback","volume":"35","author":"Ouyang","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref10","article-title":"Gpt-4 technical report","author":"Achiam","year":"2023","journal-title":"arXiv preprint"},{"key":"ref11","article-title":"Bart: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension","author":"Lewis","year":"2019","journal-title":"arXiv preprint"},{"issue":"1","key":"ref12","first-page":"5485","article-title":"Exploring the limits of transfer learning with a unified text-to-text transformer","volume":"21","author":"Raffel","year":"2020","journal-title":"The Journal of Machine Learning Research"},{"key":"ref13","article-title":"Scaling instruction-finetuned language models","author":"Chung","year":"2022","journal-title":"arXiv preprint"},{"key":"ref14","article-title":"Llama: Open and efficient foundation language models","author":"Touvron","year":"2023","journal-title":"ar Xiv preprint"},{"key":"ref15","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023","journal-title":"arXiv p rep rint"},{"key":"ref16","article-title":"The falcon series of open language models","author":"Almazrouei","year":"2023","journal-title":"ar Xiv preprint"},{"key":"ref17","article-title":"Judging llm-as-a-judge with mt-bench and chatbot arena","volume":"36","author":"Zheng","year":"2024","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref18","article-title":"Mistral 7b","author":"Jiang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref19","article-title":"Mixtral of experts","author":"Jiang","year":"2024","journal-title":"arXiv preprint"},{"key":"ref20","article-title":"Zephyr: Direct distillation of lm alignment","author":"Tunstall","year":"2023","journal-title":"arXiv preprint"},{"key":"ref21","article-title":"Textbooks are all you need","author":"Gunasekar","year":"2023","journal-title":"arXiv preprint"},{"key":"ref22","article-title":"Textbooks are all you need ii: phi-1.5 technical report","author":"Li","year":"2023","journal-title":"arXiv preprint"},{"key":"ref23","article-title":"Domain specialization as the key to make large language models disruptive: A comprehensive survey","author":"Zhao","year":"2023","journal-title":"arXiv preprint"},{"key":"ref24","volume-title":"Secbert: A pretrained bert model for cyber security text, learned cybersecurity knowledge"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.3390\/jcp1040031"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/BigData52589.2021.9671824"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-25538-0_3"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3652594"},{"key":"ref29","article-title":"Huggingfaces trans-formers: State-of-the-art natural language processing","author":"Wolf","year":"2019","journal-title":"arXiv preprint"},{"key":"ref30","author":"Liu","year":"2024","journal-title":"Cyberbench: A multi-task benchmark for evaluating large language models in cybersecurity"},{"key":"ref31","article-title":"Purple llama cyberseceval: A secure coding benchmark for language models","author":"Bhatt","year":"2023","journal-title":"arXiv preprint"},{"key":"ref32","article-title":"Secqa: A concise question-answering dataset for evalu-ating large language models in computer security","author":"Liu","year":"2023","journal-title":"ar Xiv preprint"},{"key":"ref33","article-title":"Cybermetric: A benchmark dataset for evaluating large language models knowledge in cybersecurity","author":"Tihanyi","year":"2024","journal-title":"arXiv preprint"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-short.31"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.3390\/app13063701"},{"key":"ref36","article-title":"Maldict: Benchmark datasets on mal ware behaviors, platforms, exploitation, and packers","author":"Joyce","year":"2023","journal-title":"arXiv nrenrint"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-41579-2_13"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/3607199.3607242"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2963724"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3338501.3357374"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ISDFS52919.2021.9486377"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/SMC52423.2021.9659287"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.3390\/bdcc7020060"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2021.102458"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-97087-1_7"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/s11416-022-00424-3"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3179384"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-16815-4_31"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3600160.3605057"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.jisa.2023.103690"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2021.3087402"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOMWKSHPS51825.2021.9484500"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/DSAA53316.2021.9564227"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA52953.2021.00256"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN55064.2022.9892280"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19208-1_23"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/ISSREW55968.2022.00042"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1016\/j.jisa.2023.103423"},{"key":"ref59","article-title":"Finetuning large language models for vulnerability detection","author":"Shestov","year":"2024","journal-title":"arXiv preprint"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/3472753"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3110524"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/SIU55565.2022.9864721"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1145\/3565477.3569152"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/AICCSA56895.2022.10017800"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA55696.2022.00048"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1016\/j.dcan.2023.03.008"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1088\/1742-6596\/2504\/1\/012061"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.122564"},{"key":"ref69","article-title":"Catbert: Context-aware tiny bert for detecting social engineering emails","author":"Lee","year":"2020","journal-title":"arXiv preprint"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1145\/3465481.3469205"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2021.07.040"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/MILCOM52596.2021.9653028"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-91885-9_40"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11223647"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/WI-IAT55865.2022.00028"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3292171"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.3390\/make6010018"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/CCWC60891.2024.10427626"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/UBMK52708.2021.9558993"},{"key":"ref80","article-title":"Leveraging gpt-2 for classifying spam reviews with limited labeled data via adversarial training","author":"Irissappane","year":"2020","journal-title":"arXiv preprint"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM42002.2020.9347970"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3081479"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2021.03.107"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/eIT53891.2022.9813922"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.24251\/HICSS.2022.921"},{"key":"ref86","article-title":"Spam detection using bert","author":"Sahmoud","year":"2022","journal-title":"arXiv preprint"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/COM-IT-CON54601.2022.9850588"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1145\/3538491"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1016\/j.mlwa.2023.100470"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9534113"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/CloudIntelligence52565.2021.00013"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.3390\/e24010069"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/ICSIP55141.2022.9886069"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/ASE51524.2021.9678773"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1080\/08839514.2022.2145642"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.3390\/electronics12173580"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2023.110689"},{"key":"ref98","article-title":"Logprompt: Prompt engineering towards zero-shot and interpretable log analysis","author":"Liu","year":"2023","journal-title":"arXiv preprint"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC-DSS-SmartCity-DependSys60770.2023.00045"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/BigData59044.2023.10386543"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1145\/3597503.3623304"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1145\/3485447.3512217"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.3390\/electronics12030516"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.3390\/e25050821"},{"key":"ref105","article-title":"Netgpt: Gener-ative pretrained transformer for network traffic","author":"Meng","year":"2023","journal-title":"ar Xiv preprint"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3325727"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.23919\/JCIN.2023.10272352"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1145\/3487351.3492723"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.1109\/ICELTICs56128.2022.9932097"},{"key":"ref110","article-title":"Anomaly detection of command shell sessions based on distilbert: Unsupervised and supervised approaches","author":"Liu","year":"2023","journal-title":"arXiv preprint"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1109\/ISSRE59848.2023.00082"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.3390\/app11083383"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/ICCCN52240.2021.9522325"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3123950"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-19-9228-5_54"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2023.103424"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1631\/FITEE.2000286"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1145\/3451471.3451508"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/ICBDA51983.2021.9403180"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/ICCT52962.2021.9657857"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1109\/CSR51186.2021.9527981"},{"key":"ref122","article-title":"Cyner: A python library for cybersecurity named entity recognition","author":"Alam","year":"2022","journal-title":"ar Xiv preprint"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2022.110114"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2023.01.027"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/CSCWD49262.2021.9437858"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1155\/2022\/9875199"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1155\/2022\/7729456"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1186\/s42400-022-00110-3"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.3390\/a15090314"},{"key":"ref130","article-title":"Threatcrawl: A bert-based focused crawler for the cybersecurity domain","author":"Kuehn","year":"2023","journal-title":"arXiv preprint"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9534192"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/ICSP58490.2023.10248596"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.3390\/info14080462"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1109\/eIT57321.2023.10187355"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3300381"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-023-04124-5"},{"key":"ref137","article-title":"Cyber sentinel: Exploring conversational agents in streamlining security tasks with gpt-4","author":"Kaheh","year":"2023","journal-title":"arXiv preprint"},{"issue":"10","key":"ref138","article-title":"Advantages, disadvantages and risks as-sociated with chatgpt and ai on cybersecurity","volume":"10","author":"Kalla","year":"2023","journal-title":"Journal of Emerging Technologies and Innovative Research"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.3390\/info15010027"},{"key":"ref140","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2023.103476"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1016\/j.hcc.2024.100211"},{"key":"ref142","article-title":"Large language models in cybersecurity: State-of-the-art","author":"Motlagh","year":"2024","journal-title":"arXiv preprint"}],"event":{"name":"2024 12th International Symposium on Digital Forensics and Security (ISDFS)","location":"San Antonio, TX, USA","start":{"date-parts":[[2024,4,29]]},"end":{"date-parts":[[2024,4,30]]}},"container-title":["2024 12th International Symposium on Digital Forensics and Security (ISDFS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10526462\/10526466\/10527236.pdf?arnumber=10527236","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,16]],"date-time":"2024-05-16T04:53:57Z","timestamp":1715835237000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10527236\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,29]]},"references-count":142,"URL":"https:\/\/doi.org\/10.1109\/isdfs60797.2024.10527236","relation":{},"subject":[],"published":{"date-parts":[[2024,4,29]]}}}