{“状态”：“确定”，“消息类型”：“工作”，“信息版本”：“1.0.0”，“邮件”：{“索引”：{-“日期-部件”：[[2024,9,6]]，“日期-时间”：“2024-09-06T22:47:25Z”，“时间戳”：1725662845681}，“引用-计数”：26，“发布者”：“IEEE”，“许可证”：[{“开始”：{“日期-零件”：[[2020,11,1]]，”日期-时间“：“2020-11-01T00:00Z”，“timestamp”：1604188800000}，“content-version”：“vor”，“delay-in-days”：0，“URL”：“https:\/\/ieeexplore.iee.org\/Xplorehelp\/downloads\/license-information\/ieee.html”}，{“start”：{“date-parts”：[[2020,11,1]]，“date-time”：“2020-11-01T00:00:00Z”，“timestamp”：16041888000000}，“content-version”：“stm-asf”，“delay-in-days“：0，”URL“https:\\/doi.org\/10.15223\/policy-029“}，{“start”：{“date-parts”：[[2020,11,1]]，“date-time”：“2020-11-01T00:00:00Z”，“timestamp”：1604188800000}，“content-version”：“stm-asf”，“delay-in-days”：0，“URL”：“https:\/\/doi.org\/10.15223\/policy-037”}]，“funder”：[{“doi”：“10.13039\/1000005637”，“name”：“MDC”，“doi-asserted-by”：“publisher”，“id”：[}“id”:“10.13029\/100005637”，“id-type”：“doi”，“asserted-by”：“publisher”}]}]，“content-domain”：{“domain”：[]，“crossmark-restriction”：false}，“short-container-title”：[]“：”Crossref“，”is-referenced-by-count“：2，”title“：[“基于SARSA的深度强化学习的自主觅食”]，“前缀”：“10.1109”，“卷”：“e101 d”，“作者”：[{“给定”：“Anderson”，“家族”：“Mesquita”，“序列”：“第一”，“从属关系”：[]}，{“已知”：“尤里”，“家庭”：“诺盖拉”}、，{“given”：“Joaquim”，“family”：“Cavalcante-Neto”，“sequence”：“additional”，“affiliation”：[]}，{“fivent”：“Paulo”，”family“：”Serafim“，”sequence“：”additional“，”affiliation:[]}]，“member”：“263”，“reference”：[{“year”：“2018”，“author”：“sutton”，“journal-title”：“Reinforcement Learning An Introduction”，“key”：”ref10“}”，{”doi-asserted-by“publisher”，“key”：“ref11”，“doi”：“10.1109\/MSP.2017.2743240”}，{“doi-asserted-by”：“publisher”，“key”：“ref12”，“doi”：“10.109\/5.726791”}、{“doi-asserted-by”:“publishers”，“key”：”ref13“，“doi:”10.1177\/10597123093419“}，}“doi-asserted-by”：”publisher“，”key“：”ref14“，”doi“：”10.1007\/BF00992698“}”，{年“：“1993”，“作者”：“林”，“新闻标题”：“使用神经网络的机器人强化学习”，“key”：“ref15”}，{“doi-asserted-by”：“publisher”，“key”：”ref16“，”doi“：”10.1109“/SSCI.2016.7849837“}，}“key“：”ref17“，”doi-assert-by“：”crossref“，”first page“：“2315”，“doi”：“10.1587”transinf.2017EDP7278“，”article-title“：”使用sarsa和q-learning的深度强化学习：一种混合方法”，“卷”：“e101 d”，“作者”：“熊旭”，“年份”：“2018”，“期刊标题”：“IEICE信息与系统交易”}，{“密钥”：“参考文献18”，“第一页”：“477”，“文章标题”：“关于使用深度强化学习开发三维第一人称射击游戏的自主代理”，“作者”：“serafim”，“年份”：“2017”，“期刊标题”：“Anais do XII Simpósio Brasileiro de Jogos e Entretenimento Digital”}，{“year”：“1989”，“author”：“watkins”，“journal-title”：“Learning from delayed rewards”，”key“：”ref19“}，}“key”：“ref4”，“first-page:”67“article-title“：”进化机器人：生物学“，”author“：”nolfi“，”“year“：”2000“，”journal-title“：“自组织机器的智能与技术”}，{“doi-asserted-by”：“publisher”，“key”：“ref3”，“doi”：“10.1007\/978-3-540-74913-4_46”}、{“year”：“2016”，“author”：“goodfellow”，“journal-title”：“Deep Learning”，“key”：“ref6”}key“：”ref8“，”首页“：”1097“，“article-title”：“基于深度卷积神经网络的Imagenet分类”，“volume”：“1”，“author”：“krizhevsky”，“year”：“2012”，“journal-title“：“Proceedings of the 25th International Conference on neural Information Processing Systems”}，{“doi-asserted-by”：“publisher”，“key”：《ref7》，“doi”：“10.1145\/3234150”}：“ref2”，“DOI”：“10.1016\/j.neunet.2007.09.016”}，{“year”：“2013”，“author”：“mnih”，“journal-title”：“Playing atari with deep reinforcement learning”，“key”：“ref9”}、{“DOI-asserted-by”：“publisher”，“key”：“ref1”，“DOI”：”10.1016\/j.nucom.2015.09.061“}”，{”key：“ref20”，“首页”：“315”，“文章标题”：“深度稀疏整流器神经网络”，“作者”：“glorot”，“年份”：“2011年”，“新闻标题”：“第十四届国际人工智能与统计会议论文集”}，{“年份”:“2015年”，”作者“：”xu“，”article-title“：”卷积网络中校正激活的实证评估“，”key“：”ref22“}，”{“key”：“ref21”，“首页”：“3”，“article-title”：“矫正非线性改善神经网络声学模型”，“卷”：“30”，“作者”：“maas”，“年份”：“2013”，“期刊标题”：“Proc ICML”}，{“key”：“ref24”，“首页”：“249”，“文章标题”：“理解深度前馈神经网络训练的难度”，“作者”：“glorot”，“年份”：“2010”，“期刊标题”：“第十三届国际人工智能与统计会议论文集”}，{“年份”：“2012年”，“作者”：“hinton”，“期刊标题”：“arXiv预印本arXiv 1207 0580”，“文章标题”：《通过防止特征检测器的共适配来改进神经网络》，“key”：“ref23”}：“无探索的非政策深度强化学习”，“作者”：“藤本”，“年份”：“2019年”，“新闻标题”：“机器学习国际会议”}，{“年份”:“2017年”，”作者“：”高“，”新闻标题“：”arXiv预印本arXiv 1704 00805“，”文章标题“：“关于softmax函数的性质及其在博弈论和强化学习中的应用”，“key”：“ref25”}]，“event”：{“name”：“2020年第22届虚拟和增强现实（SVR）研讨会”，“start”：{-“date-parts”：[[2020,11,7]]}，“location”：“Porto de Galinhas，Brazil”，“end”：{--“date-parts”：[2020,11,10]}}，”container-title“：[“2020年第22届虚拟与增强现实研讨会（SVR）”]，“original-title”：[]，“link”：[{“URL”：“http://\/xplorestaging.ieee.org\/ielx7\/9262455\/9262697.pdf？arnumber=9262697”，“content-type”：“unspecified”，“content-version”：“vor”，“intended-application”：“similarity-checking”}]，“deposed”：{“date-parts”：[2022,6,30]]，“日期-时间”：“2022-06-30T15:18:57Z”，“timestamp”：1656602337000}，“score”：1，“resource”：{“primary”：{“URL”：“https:\/\/ieeexplore.iee.org\/document\/9262697\/”}}，”subtitle“：[]，”shorttitle“：[]，”issued“：{”date-parts“：[2020,11]}，‘references-count’：26，”URL“：”http://\/dx.doi.org\/10.109\/svr51698.2020.00070“，”关系“：{}，”主题“：[]，”发布“：{”日期部分“:[[2020,11]]}}}