{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{“日期部分”:[[2024,3,2],“日期时间”:“2024-03-02T14:49:30Z”,“时间戳”:1709390970850},“引用-计数”:27,“发布者”:“IEEE”,“内容域”:{“域”:[],“交叉标记-限制”:false},”短容器-时间“:[]”,“发布-打印”:{“日期部分”:[[2018,11]]},“DOI”:“10.1109\/humanoids.2018.8624972”,“type”:“proceedings-article”,“created”:{“date-parts”:[[2019,1,25]],“date-time”:“2019-01-25T02:51:38Z”,“timestamp”:1548384698000},“source”:”Crossref“,”is-referenced-by-count“:6,”title“:[”潜在空间机器人技能学习中的用户反馈“],”前缀“10.1109”,“author”:[{“给定”:“Rok”,“家庭”:“巴希克”,“sequence”:“first”,“affiliation”:[]},{“given”:“Zvezdan”,“family”:“Loncarevic”,“segment”:“additional”,“filiation“:[]{”给定“:“Ales”,“家族”:“Ude”,“序列”:“附加”,“从属”:[]},}“giving”:“Bojan”,”family“:”Nemec“,”sequence“:”additional“,”affiliance“:[]{给定“:”Andrej“,“faily”:”游戏“,”序列“:”附加“,”从属“:[]}],“member”:“263”,“reference”:[{“key”:“ref10”,“article-title”:“带序数奖励和不可靠导师的交互式q学习”,“author”:“weng”,“year”:“2013”,“journal title”:《欧洲机器学习与数据库知识发现原理与实践会议(ECML\/PKDD)》},{“密钥”:“ref11”,“doi-asserted-by”:“publisher”,“doi”:“10.2478\/pjbr-2013-0003”},{“key”:“ref12”,“doi-asserted-by”:“publisher”,“doi”:“10.1162\/NECO_a_00393”},{“key”:“ref15”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/HUMANOIDS.2015.7363570”},{“key”:“ref16”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/HUMANOIDS.2016.7803340”},{”key“:”ref17“,”first page“:“663”,“article-title”:“逆强化学习算法”,“author”:“ng”,“year”:“2000”,“journal-title“:”Proc Seventh Int Conf Machine learning“},”key:“ref18”,“article-tiple”:“通过对抗性反向强化学习学习稳健奖励”,“author”:“justin”,“year”:“0”,“journal-title”:“arXiv 1710 11248 2017”},{“key”:“ref19”,“author”,“laud”,“year”:《2004》,“johnal-tittle”:《强化学习中奖励形成的理论与应用》},}“keys”:“ref4”,“doi-asserted-by”:“publisher”,《doi》:“10.1080\/01691864.2013.814211”},{“key”:“ref3”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/TRO.2008.2006703”}1“},{”key“:”ref5“,”article-title“:“使用alice模仿机制解决不同机器人手臂之间的对应问题”,“作者”:“alissandrakis”,“年份”:“2003年”,“新闻标题”:“第二届动物和人工制品模仿国际研讨会”},{“关键”:“参考8”,“首页”:“388”,《文章标题》:“机器人政策搜索调查”,“作家”:“deisenroth”,“year”:“2013”,“journal-title”:“Robotics的基础和趋势”},{“key”:“ref7”,“doi-asserted-by”:“publisher”,“doi”:“10.1007 \/s10994-010-5223-6”}、{“key”:”ref2“,”doi-assert-by“:”publisher“,”doi“:”10.1016 \/S1364-6613(99)01327-3“},”{“key”:“ref1”,“article-title“Towards robot skill”学习:从简单技能到乒乓球”,“作者”:“peters”,“年份”:“2013”,“期刊标题”:“欧洲机器学习会议(ECML)”},{“key”:“ref9”,“doi断言”:“publisher”,“doi”:“10.3389\/frobt.2018.000077”},{“key”:“ref20”,“doi断言”:“publisher”,“doi”:“10.1016\/j.robot.2015.09.011”},{“key”:“ref22”,“doi断言”:“publisher”,“doi”:“10.1560 7\/RSS.2017.XIII.053“},{”键“:“ref21”,“文章标题”:“从人类偏好中进行深度强化学习”,“作者”:“christiano”,“年份”:“2017”,“期刊标题”:“arXiv预印本arXiv 1706 03741”},{“key”:“ref24”,“首页”:“1”,“文章标题”:“在连续状态和动作空间中与人类反馈相结合的强化学习”,“作者”:“vien”,“年份”:“2012”,“期刊标题”:“IEEE Int Conf on Develop and Learn and Epigen Rob(ICDL)”},{“key”:“ref23”,“doi-asserted-by”:“publisher”,“doi”:“10.1145\/1597735.1597738”}“:”akrour“,”year“:”2014“,“journal-title”:“国际机器学习会议”}],“event”:{“name”:“2018 IEEE-RAS第18届国际仿人机器人会议”,“location”:“Beijing,China”,“start”:{“date-parts”:[[2018,11,6]]},“end”:{-“date-parts”:[[2018,11,9]}},”container-title“:[“2018 IEEE-RAS第18届国际仿人机器人会议(Humanoids)”],“original-title”:[],“link”:[{“URL”:“http://\/xplorestaging.IEEE.org\/ielx7\/8596719\/8624972.pdf?arnumber=8624972”,“content-type”:“unspecified”,“content-version”:“vor”,“intended-application”:“similarity-checking”}],“deposed”:{“date-parts”:[2022,1,26]],“date-time”:“2022-01-26T23:10:20Z”,“timestamp”:164323862000},“score”:1,“resource”:{“primary”:{“URL”:“https:\/\/ieeexplore.iee.org\/document\/8624972\/”}},”subtitle“:[],”shorttitle“:[],”issued“:{”date-parts“:[[2018,11]]},‘references-count’:27,”URL“http://\/dx.doi.org\/10.109 \/类人机器人.2018.8624972“,”关系“:{},”主题“:[],”已发布“:{“日期部分”:[[2018,11]]}}