{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{-“日期-部件”:[[2024,2,11]],“日期-时间”:“2024-02-11T16:41:22Z”,“时间戳”:1707669682309},“引用-计数”:13,“发布者”:“爱思唯尔BV”,“许可证”:[{“开始”:{-date-parts”:[2022,12,1]],《日期-时间》:“2022-12-01T00:00Z“,”timestamp“:1669852800000},”content-version“:“tdm”,“delay-in-days”:0,“URL”:“https:\/\/www.elsevier.com/tdm\/userlicense\/1.0\/”},{“start”:{“date-parts”:[2022,11,18]],“date-time”:“2022-11-18T00:00:00Z”,“timestamp”:1668729600000},“content-version”:“vor”,“delay-in-ddays”:0-nd \/4.0\/“}],“出资人”:[{“DOI”:“10.13039\/501100001809”,“名称”:“中国国家自然科学基金会”,“doi-asserted-by”:“publisher”,“award”:[“62076251”,“62106281”]}],“content-domain”:{“domain”:[“elsevier.com”,“sciencedirect.com”],“crossmark-restriction”:true},“short-container-title”:[”Array“],“published-print”:{“date-parts”:[2022,12]},”doi“10.1016\/j.Array.2022.00262“,”type“:”日志文章“,“created”:{“date-parts”:[[2022,11,24]],“date-time”:“2022-11-24T16:59:01Z”,“timestamp”:1669309141000},“page”:“100262”,“update-policy”:”http://\/dx.doi.org\/10.1016\/elsevier_cm_policy“,”source“:”Crossref“,“is-referenced-by-count”:2,“title”:[“基于奖励随机强化学习的网络空间攻防游戏”],“prefix”:“10.1016”“,”,“卷”:“16”,“作者”:[{“给定”:“雷”,“家庭”:“张”,“序列”:“第一个”,“从属关系”:[]},{“给出”:“红梅”,“家族”:“李”,“顺序”:“附加”,“附属关系”:[]}:[]},{“ORCID”:“http://\/orcid.org\/00000-0003-1733-7956”,“authenticated-orcid”:false,“given”:“Wei”,“family”:“Li”,“sequence”:“additional”,“affiliation”:[]},{“orcid”:[{“问题”:“3”,“密钥”:“10.1016\/j.array.2022.100262_bib1”,“doi-asserted-by”:“crossref”,“first page”:“397”,“doi”:“10.1093\/logcom\/2.3.397”、“article-title”:“非单调逻辑的复杂性结果”,“volume”:”2“,“author”:“Gottlob”,“year”:“1992”,“journal-title“:”j Logic Compute“}”,{“issue”:“3”,“key”:.2022.100262_bb2“,”首页“:”1“,”文章标题“:“利用博弈论和智能学习进行网络安全防御的最优决策方法”,“作者”:“张”,“年份”:“2019年”,“新闻标题”:“安全通信网络”},{“问题”:“4”,“关键”:“10.1016\/j.array.2022.100262_bib3”,“doi-asserted-by”:“crossref”,“首页”:“399”,“doi”:“101007\/s10776-018-0403-6”,“文章标题”:“基于博弈论的无线传感器网络多层入侵检测框架”,“卷”:“25”,“作者”:“Subba”,“年份”:“2018”,“日志标题”:“Int J wireless Inf Network”},{“密钥”:“10.1016\/J.array.2022.00262_bib4”,“doi-asserted-by”:“crossref”,“doi”:“101016\/J.automatica.2020.10883”,“article-title”:“nash和stackelberg均衡下具有二次标准的动态信号博弈”,“数量”:“115”,“作者”:“Sar\u0131tas”,“年份”:“2020”,“期刊标题”:“Autom”},{“密钥”:“10.1016\/j.array.2022.00262_bib5”,“series-title”:“国际计算、网络和通信会议(ICNC)”,“首页”:“577”,“文章标题”:“使用马尔可夫博弈模型的自适应mtd安全性”,“author”:“Chowdhary”,“year”:“2019”},{“key”:“10.1016\/j.array.2022.100262_bib6”,“doi-asserted-by”:“crossref”,《doi》:“10.106\/j.cosrev.2019.100219”,“article-title”:“网络安全中攻击图和攻击树可视化语法综述”,“volume”::“Compute.Sci.Rev.”},{“key”:“10.1016\/j.array.2022.100262_bb7”,“first page”:”5381 495“,“article-title”:“基于进化网络游戏的最优网络防御策略选择方法”,“author”:“Liu”,“year”:“2020”,“journal-title“:”Secur Commun network“},}“key:”10.1016\/j.aray.2022.00262_bb9“,”series-title“:“现有非线性模型的发展及其对两人非零和博弈中纳什均衡的影响”,“author”:“Punniyamoorthy”,“year”:“2021”},{“key”:“10.1016\/j.array.2022.00262_bib8”,“series-title”:“网络安全软件多样性的博弈理论框架”:“10.1016\/j.array.2022.100262_bb10”,“series-title”:“深度强化学习的连续控制”,“author”:“Lillicrap”,“year”:“2015”},{“key”:“10.106\/j-array.2022.100262_bb11”,“series-title”:”确定性策略梯度算法“,”author“:”Silver“,”年“:”2015:“电化学系统”,“作者”:“Newman”,“年份”:“1991”},{“key”:“10.1016\/j.array.2022.100262_bib13”,“doi-asserted-by”:“crossref”,“首页”:“91”,“doi”:“101016\/0368-1874(84)87091-4”,“article-title”:“Proc.6th Australian electrochem.Conf.,geelong,vic”,“volume”:”168“,”作者:“Miller”,“year”:“1984”,“journ”al-title“:“肛门电化学杂志”}],“container-title”:[“Array”],“original-title“:[],“language”:“en”,“link”:[{“URL”:“https:\/\/api.elsevier.com/content\/article\/PII:S2590005622000959?httpAccept=text\/xml”,“content-type”:“text\/.xml”,“content-version”:“vor”,“intended-application”:“text-mining”},{“URL”:“http://api.elsevier.com/content\/aarticle\/PII:S2590005622000959?httpAccept=text\/plain“,”content-type“:”text\/prain“,“content-version”:“vor”,“intended-application”:“text-mining”}],“deposed”:{“date-parts”:[[2024,2,11]],“date-time”:“2024-02-11T16:25:34Z”,“timestamp”:1707668734000},“score”:1,“resource”:{“primary”:“URL”:“https:\\/linkinghub.elsevier.com/retrieve\/pii\/S259000 5622000959“}},”副标题“:[],”short title“:[],”issued“:{”date-parts“:[2022,12]]},”references-count“:13,”alternative-id“:[”S2590005622000959“],”URL“:”http://\/dx.doi.org\/10.1016\/j.array.2022.100262“,”relation“:{},“ISSN”:[“2590-0056”],“ISSN-type”:[{“value”:“2590-10056”,”type“:”print“}],”subject“:[],“published”:{“date-parts”:[2022,12]]},“assertion”:[{“value”:“Elsevier”,“name”:“publisher”,“label”:“本文由”},{“value”:“基于奖励随机强化学习的网络空间攻防游戏”,“name”:“articletitle”,“标签”:“文章标题”}label“:”CrossRef DOI link to publisher maintained version“},{“value”:“article”,“name”:“content_type”,“label”:“content-type”},}“values”:“\u00a9 2022 The Authors.Published by Elsevier Inc.”,“名称”:“版权”,“标签”:“copyright”}],“文章编号”:“100262”}