{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T16:27:30Z","timestamp":1772555250631,"version":"3.50.1"},"reference-count":29,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2021YFB3100500"],"award-info":[{"award-number":["2021YFB3100500"]}]},{"DOI":"10.13039\/501100004543","name":"China Scholarship Council","doi-asserted-by":"publisher","award":["202306110031"],"award-info":[{"award-number":["202306110031"]}],"id":[{"id":"10.13039\/501100004543","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Ind. Inf."],"published-print":{"date-parts":[[2024,7]]},"DOI":"10.1109\/tii.2024.3379633","type":"journal-article","created":{"date-parts":[[2024,4,9]],"date-time":"2024-04-09T19:00:47Z","timestamp":1712689247000},"page":"9109-9119","source":"Crossref","is-referenced-by-count":6,"title":["An Intelligent Penetration Testing Method Using Human Feedback"],"prefix":"10.1109","volume":"20","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7137-999X","authenticated-orcid":false,"given":"Qianyu","family":"Li","sequence":"first","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2370-592X","authenticated-orcid":false,"given":"Ruipeng","family":"Wang","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6654-7610","authenticated-orcid":false,"given":"Min","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4533-2706","authenticated-orcid":false,"given":"Fan","family":"Shi","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yi","family":"Shen","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-9691-4011","authenticated-orcid":false,"given":"Miao","family":"Hu","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1166-2830","authenticated-orcid":false,"given":"Bingyang","family":"Guo","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7405-7710","authenticated-orcid":false,"given":"Chengxi","family":"Xu","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering, National University of Defense Technology, Hefei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","first-page":"114","article-title":"Collaborative paradigm of teaching penetration testing using real-world university applications","volume-title":"Proc. Australas. Comput. Educ. Conf.","author":"Vykopal","year":"2022"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/LISAT.2018.8378035"},{"issue":"4","key":"ref3","first-page":"9","article-title":"Ethical hacking and penetrate testing using Kali and metasploit framework","volume":"2","author":"Tabassum","year":"2021","journal-title":"Int. J. Innov. Comput. Sci. Eng."},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TIV.2022.3185159"},{"key":"ref5","first-page":"27730","article-title":"Training language models to follow instructions with human feedback","volume-title":"Proc. Int. Conf. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Ouyang","year":"2022"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2022.102681"},{"key":"ref7","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"ref8","article-title":"Autonomous penetration testing using reinforcement learning","author":"Schwartz","year":"2019"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/WorldS4.2018.8611595"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1631\/FITEE.1800532"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/EuroSPW51379.2020.00010"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1049\/ise2.12107"},{"key":"ref13","article-title":"Incorporating deception into cyberbattlesim for autonomous defense","author":"Walter","year":"2021"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s10844-022-00738-0"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/STC55697.2022.00015"},{"key":"ref16","first-page":"41","article-title":"Leveraging deep reinforcement learning for automating penetration testing in reconnaissance and exploitation phase","volume-title":"Proc. RIVF Int. Conf. Comput. Commun. Technol.","author":"Nhu","year":"2022"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1049\/ise2.12107"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2022.103055"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2022.03.003"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2021.117775"},{"key":"ref21","first-page":"1259","article-title":"Skill preferences: Learning to extract and execute robotic skills from human feedback","volume-title":"Proc. Conf. Robot Learn.","author":"Wang","year":"2022"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.12360"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1177\/02783649211041652"},{"key":"ref24","first-page":"38176","article-title":"Fine-tuning language models to find agreement among humans with diverse preferences","volume-title":"Proc. Int. Conf. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Bakker","year":"2022"},{"key":"ref25","article-title":"Illustrating reinforcement learning from human feedback (RLHF)","author":"Lambert","year":"2022"},{"key":"ref26","article-title":"Perspectives on the social impacts of reinforcement learning with human feedback","author":"Liu","year":"2023"},{"key":"ref27","article-title":"Cyberbattlesim","author":"Team","year":"2021","journal-title":"Created by Christian Michael Seifert William Betser James Blum Bono, Kate Farris, Emily Goren, Justin Grana, Kristian Holsheimer, Brandon Marken, Joshua Neil, Nicole Nichols, Jugal Parikh, Haoran Wei"},{"key":"ref28","first-page":"3008","article-title":"Learning to summarize with human feedback","volume-title":"Proc. Int. Conf. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Stiennon","year":"2020"},{"key":"ref29","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2014","journal-title":"Comput. Sci."}],"container-title":["IEEE Transactions on Industrial Informatics"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9424\/10582275\/10495724.pdf?arnumber=10495724","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T04:45:35Z","timestamp":1725684335000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10495724\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7]]},"references-count":29,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tii.2024.3379633","relation":{},"ISSN":["1551-3203","1941-0050"],"issn-type":[{"value":"1551-3203","type":"print"},{"value":"1941-0050","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7]]}}}