{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{“日期-部件”:[[2022,7,17]],“日期-时间”:“2022-07-17T22:16:07Z”,“时间戳”:1658096167970},“引用-计数”:23,“发布者”:“IEEE”,“许可证”:[{“开始”:{'日期-部件“:[2019,8,1]],”日期-时间“:”2019-08-01T00:00:00 Z“,”timestamp“:1564617600000},”content-version“:”vor“,“delay-in-days”:0,“URL”:“https:\/\/ieeexplore.iee.org\/Xplorehelp\/downloads\/license-information\/ieee.html”},{“start”:{“date-parts”:[[2019,8,1]],“date-time”:“2019-08-01T00:00:00Z”,“timestamp”:1564617600000},“content-version”:“stm-asf”,“delay-in-days“:0,”URL“https:\\/doi.org\/10.1 5223\/policy-029“},{“开始”:{“日期部分”:[[2019,8,1]],“日期-时间”:“2019-08-01T00:00:00Z”,“时间戳”:1564617600000},“内容版本”:“stm-asf”,“延迟天数”:0,“URL”:“https:\/\/doi.org/10.15223\/policy-037”}],“内容域”:{“域”:[],“交叉标记限制”:false},“短容器标题”:[],“已发布的印刷品”:{“日期部分”:[[2019,8]]},“doi”:“10.1109\/devlr.2019.8850685”,“类型”:“procesdings-article”,“created”:{“date-parts”:[[2019,10,1]],“date-time”:“2019-10-01T03:40:48Z”,“timestamp”:1569901248000},“source”:“Crossref”,“is-referenced-by-count”:0,“title”:[“促进不同方法组合的强化学习探索技术的分类”],“prefix”:“10.1109”,”author“:[{”given“given”:”Bjorn Ivar“,“family”:“Teigen”,“sequence”:“first”,“affiliation”:[]},{“given”:“Kai Olav”,“faily”:”Ellefsen“,”sequence“:”additional“,”affiliance“:[]neneneep,{”given“:”Jim“,”family“:”Torresen“,“se序列”:“additional”,“从属关系”:[]},“member”:“263”,“reference”:[{“key”:”ref10“,”doi-asserted-by“:“publisher”,“doi”:“”10.1145\/1143844.1143949“},{“键”:“参考11”,“article-title”:“软参与者-关键:非政策性最大熵深度强化学习与随机参与者”,“author”:“haarnoja”,“year”:“0”,“journal-title“:”国际机器学习会议(ICML)“},{“key”:“ref12”,“first page”:”1889“,“artice-title:“2015”,“journal-title”:“ICML'15第三十二届国际机器学习会议论文集”},{“key”:“ref13”,“first page”:”4026“,”article-title“:”Deep Exploration via Bootstrapped DQN“,”volume“:”29“,”author“:”osband“,”year“:”2016“,”journal-stitle“:“Advances in neural information processing systems”}“,{”key“:“ref14”,“首页”:“1928”,“article-title”:“深度强化学习的异步方法”,“author”:“mnih”,“year”:“0”,“journal-title“:“第三十三届国际机器学习会议论文集”},{“key”:“ref15”,“doi-asserted-by”:“publisher”,“doi”:“10.2307\/2332286”}:“Boltzmann Exploration Done Right”,“volume”:“30”,“author”:“cesa-bianchi”,“year”:“2017”,“journal-title”:“Advances in neural information processing systems”},{“key”:”ref17“,“volution”::“12”,“author”:”mnih“,”year“:”2013“,”journal-title“Playing atari with deep reinforcement learning”}“,{”key“:”ref18”,“first page”::“Double Q-learning”,“volume”:“23”,“author”:“hasselt”,“year”:“2010”,“journal-title”:“Advances in neural information processing systems”},{“key”:”ref19“,”doi-asserted-by“:”publisher“,”doi“:”10.1007\/978-3642-32375-1“},”{“密钥”:“ref4”,“doi-assert-by”:“publisher”,“doi”:“10.1109\/CVPRW.2017.70”}“,{”key“:”ref3“,”author:“plappert”,“year”:“0”,“journal-title”:“探索的参数空间噪音”},{“key”:“ref6”,“首页”:“3215”,“文章标题”:“彩虹:结合深度强化学习的改进”,“author”:“hessel”,“year”:“0”,“jornal-title:“第三十二届AAAI人工智能会议论文集”}:“10.1080\/09540090600768658”},{“key”:“ref8”,“author”:“sutton”,“year”:“2017”,“journal-title”:“Recentration Learning An Introduction”}、{“key”:”ref7“,“doi-asserted-by”:“publisher”,“doi”:“10.1023\/A:1007541107674”}自举汤普森采样和深度探索“},{”key“:“ref1”,“first page”:“1109”,“article-title”:“VIME:变分信息最大化探索”,“volume”:”5“,“author”:“houthooft”,“year”:“2016”,“journal-title“:”Advances in Neural Information Processing Systems I(NIPS)“},{“key”::“用深度预测模型激励强化学习中的探索”},{“key”:“ref20”,“volume”:”6“,“author”:“brockman”,“year”:“2016”,“journal-title”:“OpenAI Gym”}、{“key”:,“volume”:“114”,“author”:“kirkpatrick”,“year”:“2016”,“journal-title”:“Proceedings of the National Academy of Sciences”},{“key”:”ref21“,”author“:”moore“,”year“:”1990“,”journal-title“:”Efficient memory-based learning for robot control“},”{“密钥”:“ref23”,“doi-asserted-by”:“publisher”,”doi“:”10.1561\/220000070“}],“event”:{“name”:“2019年IEEE第九届发展、学习和表观遗传机器人联合国际会议(ICDL-EpiRob)”,“地点”:“挪威奥斯陆”,“开始”:{“日期部分”:[[2019,8,19]]},“结束”:{“日期部分“:[2019,8,22]]}},”集装箱标签“:[”2019年第九届IEEE发展、学习与表观遗传Rob联合国际会议“],“original-title”:[],“link”:[{“URL”:“http://\/xplorestaging.ieee.org\/ielx7\/8843356\/8850685.pdf?arnumber=8850685”,“content-type”:“unspecified”,“content-version”:“vor”,“intended-application”:“similarity-checking”},“deposed”:{“date-parts”:[2022,7,17]],“date-time”:”2022-07-17T21:49:40Z“,”时间戳“:1658094580000},”分数“:1,”资源“用法:{“primary”:{“URL”:“https:\/\/ieeexplore.iee.org\/document\/885068\/”}},“subtitle”:[],“shorttitle”:[],“issued”:{日期部分:[[2019,8]]},”references-count“:23,”URL“:”http://\/dx.doi.org\/10.109\/devlrn.2019.8850685“,”关系“:{},rts“:[[2019,8]]}}}