{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,24]],"date-time":"2026-01-24T19:40:49Z","timestamp":1769283649942,"version":"3.49.0"},"reference-count":21,"publisher":"Elsevier BV","issue":"2","license":[{"start":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T00:00:00Z","timestamp":1717200000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T00:00:00Z","timestamp":1717200000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2023,6,27]],"date-time":"2023-06-27T00:00:00Z","timestamp":1687824000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["High-Confidence Computing"],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1016\/j.hcc.2023.100145","type":"journal-article","created":{"date-parts":[[2023,8,11]],"date-time":"2023-08-11T20:40:19Z","timestamp":1691786419000},"page":"100145","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":5,"title":["Research on active defense decision-making method for cloud boundary networks based on reinforcement learning of intelligent agent"],"prefix":"10.1016","volume":"4","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9688-6242","authenticated-orcid":false,"given":"Huan","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunlong","family":"Tang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5575-1210","authenticated-orcid":false,"given":"Yan","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ning","family":"Wei","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junyi","family":"Deng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhiyan","family":"Bin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Weilong","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.hcc.2023.100145_b1","doi-asserted-by":"crossref","DOI":"10.1016\/j.hcc.2021.100004","article-title":"A model checking-based security analysis framework for IoT systems","volume":"1","author":"Fang","year":"2021","journal-title":"High-Confid. Comput."},{"key":"10.1016\/j.hcc.2023.100145_b2","doi-asserted-by":"crossref","unstructured":"H. Zhang, J. Wang, D. Yu, J. Han, T. Li, Active defense strategy selection based on static Bayesian game, in: Third International Conference on Cyberspace Technology (CCT 2015), 2015, pp. 1\u20137.","DOI":"10.1049\/cp.2015.0806"},{"key":"10.1016\/j.hcc.2023.100145_b3","doi-asserted-by":"crossref","first-page":"50618","DOI":"10.1109\/ACCESS.2018.2880214","article-title":"Attack-defense differential game model for network defense strategy selection","volume":"7","author":"Zhang","year":"2019","journal-title":"IEEE Access"},{"key":"10.1016\/j.hcc.2023.100145_b4","doi-asserted-by":"crossref","first-page":"39621","DOI":"10.1109\/ACCESS.2018.2848242","article-title":"Markov differential game for network defense decision-making method","volume":"6","author":"Huang","year":"2018","journal-title":"IEEE Access"},{"key":"10.1016\/j.hcc.2023.100145_b5","first-page":"2029","article-title":"Shielding collaborative learning: Mitigating poisoning attacks through client-side detection","volume":"18","author":"Zhao","year":"2021","journal-title":"IEEE Trans. Dependable Secur. Comput."},{"key":"10.1016\/j.hcc.2023.100145_b6","first-page":"1","article-title":"Deep reinforcement learning for cyber security","author":"Nguyen","year":"2021","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.hcc.2023.100145_b7","series-title":"2021 17th International Conference on Network and Service Management","first-page":"509","article-title":"Learning intrusion prevention policies through optimal stopping","author":"Hammar","year":"2021"},{"key":"10.1016\/j.hcc.2023.100145_b8","doi-asserted-by":"crossref","first-page":"4060","DOI":"10.3390\/s21124060","article-title":"Deep reinforcement learning for attacking wireless sensor networks","volume":"21","author":"Parras","year":"2021","journal-title":"Sensors"},{"key":"10.1016\/j.hcc.2023.100145_b9","doi-asserted-by":"crossref","DOI":"10.1016\/j.ijepes.2022.108798","article-title":"Multi-layer defense algorithm against deep reinforcement learning-based intruders in smart grids","volume":"146","author":"Rouzbahani","year":"2023","journal-title":"Int. J. Electr. Power Energy Syst."},{"key":"10.1016\/j.hcc.2023.100145_b10","doi-asserted-by":"crossref","DOI":"10.1016\/j.rser.2020.110618","article-title":"Applications of reinforcement learning in energy systems","volume":"137","author":"Perera","year":"2021","journal-title":"Renew. Sustain. Energy Rev."},{"key":"10.1016\/j.hcc.2023.100145_b11","doi-asserted-by":"crossref","first-page":"373","DOI":"10.1016\/j.dcan.2022.01.003","article-title":"Moving target defense of routing randomization with deep reinforcement learning against eavesdropping attack","volume":"8","author":"Xu","year":"2022","journal-title":"Digit. Commun. Netw."},{"key":"10.1016\/j.hcc.2023.100145_b12","doi-asserted-by":"crossref","first-page":"5364","DOI":"10.1109\/JIOT.2022.3222210","article-title":"Deep-reinforcement-learning-based resource allocation for cloud gaming via edge computing","volume":"10","author":"Deng","year":"2023","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.hcc.2023.100145_b13","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2021.114896","article-title":"A deep reinforcement learning-based method applied for solving multi-agent defense and attack problems","volume":"176","author":"Huang","year":"2021","journal-title":"Expert Syst. Appl."},{"key":"10.1016\/j.hcc.2023.100145_b14","doi-asserted-by":"crossref","DOI":"10.1016\/j.cose.2022.102869","article-title":"Reinforcement learning based adversarial malware example generation against black-box detectors","volume":"121","author":"Zhong","year":"2022","journal-title":"Comput. Secur."},{"key":"10.1016\/j.hcc.2023.100145_b15","series-title":"A hidden attack sequences detection method based on dynamic reward deep deterministic policy gradient, (n.d.)","year":"2023"},{"key":"10.1016\/j.hcc.2023.100145_b16","doi-asserted-by":"crossref","first-page":"115","DOI":"10.1108\/DTS-05-2022-0016","article-title":"Enabling intrusion detection systems with dueling double deep Q-learning","volume":"1","author":"Badr","year":"2022","journal-title":"Digit. Transform. Soc."},{"key":"10.1016\/j.hcc.2023.100145_b17","series-title":"Developing optimal causal cyber-defence agents via cyber security simulation","author":"Andrew","year":"2022"},{"key":"10.1016\/j.hcc.2023.100145_b18","article-title":"A survey on cyber situation awareness systems: Framework, techniques, and insights","author":"Alavizadeh","year":"2022","journal-title":"ACM Comput. Surv."},{"key":"10.1016\/j.hcc.2023.100145_b19","doi-asserted-by":"crossref","first-page":"467","DOI":"10.1109\/COMST.2022.3225137","article-title":"A survey of adversarial attack and defense methods for malware classification in cyber security","volume":"25","author":"Yan","year":"2023","journal-title":"IEEE Commun. Surv. Tutor."},{"key":"10.1016\/j.hcc.2023.100145_b20","series-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"10.1016\/j.hcc.2023.100145_b21","series-title":"Playing atari with deep reinforcement learning. - aminer, (n.d.)","year":"2023"}],"container-title":["High-Confidence Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2667295223000430?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2667295223000430?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T02:31:39Z","timestamp":1729909899000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S2667295223000430"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6]]},"references-count":21,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2024,6]]}},"alternative-id":["S2667295223000430"],"URL":"https:\/\/doi.org\/10.1016\/j.hcc.2023.100145","relation":{},"ISSN":["2667-2952"],"issn-type":[{"value":"2667-2952","type":"print"}],"subject":[],"published":{"date-parts":[[2024,6]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Research on active defense decision-making method for cloud boundary networks based on reinforcement learning of intelligent agent","name":"articletitle","label":"Article Title"},{"value":"High-Confidence Computing","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.hcc.2023.100145","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2023 The Author(s). Published by Elsevier B.V. on behalf of Shandong University.","name":"copyright","label":"Copyright"}],"article-number":"100145"}}