{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“讯息”:{“索引”:{“日期-部件”:[[2024,5,10]],“日期-时间”:“2024-05-10T00:06:22Z”,“时间戳”:1715299582589},“参考-计数”:101,“出版商”:“电气与电子工程师学会(IEEE)”,“发行”:“2”,“许可证”:[{“开始”:{-“日期-零件”:[2019,6,1]],时间”:“2019-06-01T00:00:00Z”,“timestamp”:1559347200000},“content-version”:“vor”,“delay-in-days”:0,“URL”:“https:\/\/ieeexplore.iee.org\/Xplorehelp\/downloads\/license-information\/OAPA.html”}],“funder”:[{“DOI”:“10.13039\/5010000780”,“name”:“European Commission”,“DOI-asserted-by”:“publisher”,“award”:[“FP7\/2007\u20132013“]},{”名称“:“ICT挑战2\u201cCognitive Systems and Robotics\u201d through the Project \u201cIM-CLeVeR\u2014 Intrinsically Motivated Cumulative Learning Versatile Robots\u201d',“奖项”:[“ICT-IP-231722”]}],“内容域”:{“域”:[],“交叉标记限制”:false},“短容器-时间”:[”IEEE Trans.Cogn.Dev.Syst.“],“published-print”:{“date-parts”:[[2019,6]]},“DOI”:“10.1109\/tcds.2016.2607018”,“type”:“journal-article”,“created”:{“date-parts”:[[2016,10,17]],“date-time”:“2016-10-17T20:38:41Z”,“timestamp”:1476736721000},”page“:”292-317“,”source“:“Crossref”,“is-referenced-by-count”:13,“title”:[“在解决多个任务时在技能之间传递知识的强化学习体系结构”],“前缀”:“10.1109”,“卷”:“11”,“作者”:[{“给定”:“保罗”,“家庭”:“托马西诺”,“序列”:“第一”,“隶属关系”:[[{”名称“:新加坡南洋理工大学机器人研究中心”}]},“sequence”:“additional”,“affiliation”:[{“name”:“计算体现神经科学实验室,意大利罗马国家科学技术研究所”}]},{“given”:“Marco”,“family”:“Mirolli”,“se序列”:“附加”,“从属”:“计算实体神经科学实验室,意大利罗马国家科学研究院,意大利罗马”}]},{“given”:“Gianluca”,“family”:“Baldassarre”,“sequence”:“additional”,“affiliation”:[{“name”:“计算实体神经科学实验室,意大利罗马国家科学委员会,Cognizione科学技术研究所”}]}],“成员”:“263”,“参考”:[{“key”:“ref39”,“doi-asserted-by”:“publisher”,“doi”:“10.1080\/09540091003682553”},{“密钥”:“ref38”,“作者”:“麦克法兰”,“年份”:“1993”,“日记标题”:“动物”行为“},{“key”:“ref33”,“doi-asserted-by”:“publisher”,“doi”:“10.1177\/105971230501300205”},{”key“:”ref32“,”doi-assert-by“:”publisher“,”doi“:”10.1016\/S0893-6080(02)00047-3“},}”key“:30“,“首页”:“215”,“文章标题”:“适应性批评与基底神经节”,“author”:“barto”,“year”:“1995”,“journal-title”:“基底节信息处理模型”},{“key”:“ref37”,“doi-asserted-by”:“publisher”,“doi”:“10.1207\/s15516709cog1502_2”}“,”doi“:”10.1016\/S0896-6273(02)00967-4“},{“key”:“ref34”,“doi-asserted-by”:“publisher”,“doi”:“10.1126\/science.275.5306.1593”}标题“:“Proc Adv Neural Inf Process Syst”},{“key”:“ref29”,“doi asserted by”:“publisher”,“doi”:“10.1109\/TSMC.1983.6313077”},{“key”:“ref20”,“首页”:“27”,“文章标题”:“一种生物启发的分层强化学习架构,用于建模具有连续状态和动作的多种技能的学习”,“volume”:“149”,“author”:“caligiore”,“year”:“2010”,“journal-title”:“Proc 10th Int Conf Epigenetic Robot”},{“key”:“ref22”,“doi-asserted-by”:“publisher”,“doi”:“10.1177\/1059712314539710”}TNN.1998.712192“},{”键“:”参考23“,”首页“:”1038“,“article-title”:“强化学习中的泛化:使用稀疏粗编码的成功示例”,“author”:“sutton”,“year”:“1996”,“journal-title“:“Proc-Adv Neural Inf Process Syst”},{“key”:“ref101”,“doi-asserted-by”:“publisher”,“doi”:“10.1016\/j.neunet.2012.09.015”}:“10.1007\/978-3642-27645-3_7”},{“key”:“ref100”,“doi-asserted-by”:“publisher”,“doi”:“10.1016\/S0301-0082(96)00042-1”}S0896-6273(02)01003-6“},{“key”:“ref51”,“doi-asserted-by”:“publisher”,“doi”:“10.1016\/j.neubiorev.2013.01.012”},{“key”:“ref59”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/DEVLRN.2010.5578840”}、{“密钥”:“ref58”,“doi-asserte-by”:“publisher”,“DII”:”10.1007\/978-1-449-0“},}“keys”:“res57”,“doci-assertd-by”:”publisher“,“doi:”10.1007 \/BF002049-0 593“},{”key“:”ref56“,”doi-asserted-by“:”publisher“,”doi“:“10.1007\/978-3-642-27645-3_1”},{“key”:“ref55”,“doi-asserted-by”:“publisher”,“doi”:“10.1162\/089976600300015961”},{“key”:“ref52”,“doi-asserted-by”:“publisher”,“doi”:“10.1146\/annurev.neuro.24.167”},{“key”:“ref40”,“doi-asserted-by”:“publisher”,“doi”:“10.1093\/acprof:osobl\/9780199552917.001.0001”}、{“key”:”ref4“,“doo-asserted-by”:”publisher“,”doi“:”10.1016\/0003-3472(79)90006-X“},}“key:”ref3“,”doi-assert-by“:”publiser“,“DO”I“:”10.1007\/BF00229422“},{“key”:“ref6”,“first-page”:“1633”,“article-title”:“强化学习领域的迁移学习:调查”,“卷”:“10”,“作者”:“泰勒”,“年份”:“2009”,“期刊标题”:“J Mach Learn Res”},{“key”:“ref5”,“doi断言者”:“publisher”,“doi”:“10.1016\/J.earlhumdev.2003.09.006”},{“key”:“ref8”,“doi断言者”:“publisher”,“doi”:“10.1016\/S1364-6613(99)01294-2”},{“key”:“ref49”、“doi-asserted-by”:“publisher”,“doi”:“10.1016\/S0896-6273(01)00423-8”},{“key”:“ref7”,“doi-sserted-by“:”publisher“,”doi“:”10.1016\/S0079-7421(08)60536-8“},“key“:”ref9“,”doi-assert-by“y“:”publisher“,”doi“:”10.1152\/jn.00795.2010“},{”key“:”ref45“,”doi-asserted-by“:“publisher”,“DOI”:“10.1093\/acprof:oso\/9780195326703.0001”},{“key”:“ref48”,“DOI-asserted-by”:“publicher”,“DI:”10.1006\/nlme.1998.3843“10.1109\/DEVLRN.2011.6037326”},{“key”:“ref41”,“DOI-asserted-by”:“publisher”,“DOI”:“10.3389\/fnins.2010.00020”},{“key”:“ref44”,“DOI-asserted-by”:“publisher”,“DOI:”10.1371\/journal.pone.0003775“},“key“:”ref43“,”DOI-assert-by“:”publisher“,”DOI“:”10.1109\/DevLrn.2012.6400883“}4600568320“},{“key”:“ref72”,“first-page”:“1452”,“article-title”:“Q-error作为模块化强化学习系统中的选择机制”,“volume”:“22”,“author”:“ring”,“year”:“2011”,“journal-title”:“Proc-Int Joint Conf Artif Intell(IJCAI)”},{“key”:”ref71“,“doi-asserted-by”:“publisher”,“doi”:“10.1162\/NECO_a_00246”}753712972“},{”键“:“ref76”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/s10994-008-5061-y”},{“key”:“ref77”,“first-page”:“1679”,“article-title”:“Learning parameterized skills”,“author”:“da silva”,“year”:“2012”,“journal-title“:”Proc 29 Int Conf Mach Learn(ICML \/978-3-642-39802-5_7“},{“键”:“参考75”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3642-39802-5_8”},{“key”:“ref78”,“doi-asserted-by”:”publisher“,”doi“:”10.1109\/ICRA.2014.6907629“},}“key:”ref79“,”doi-assert-by doi“:”10.1037\/a0037016“},{“key”:“ref62”,“doi-asserted-by”:“publisher”,“DOI”:“10.1023\/A:1025696116075”},{“key”:“ref61”,“DOI-asserted-by”:“publisher”,“DOI:”10.1007\/978-3-540-77296-5_32“},“key“:”ref63“,”DOI-assert-by“:”publisher“,”DOI“:”10.1016\/S0004-3702(99)00052-1“}便携式选项:强化学习中的技能转移”,“卷”:“7”,“作者”:“konidaris”,“year”:“2007”,“journal-title”:“Proc 20th Int Joint Conf Artif Intell”},{“key”:“ref65”,“doi-asserted-by”:“publisher”,”doi“:”10.1007\/BF00992698“},”{“密钥”:“ref66”,“首页”:“761”,“文章-标题”:“Horde:一种可扩展的实时架构,用于从无监督的传感器-运动交互中学习知识”,“author”:“sutton”,“year”:”2011“,“journal-title”:“Proc 10th Int Conf Auton Agents Multiagent Syst(AAMAS)”},{“key”:“ref67”,“first page”:”720“,”article-title“:”在强化学习代理中的概率策略重用“,”author“:”fern\u00e1ndez“,”year“:”2006“,”journal-title“,”Proc Int Joint Conf Autonomous Agents and Multiagents Systems“},”{“密钥”:“ref68”,“doi-asserted-by”:“publisher”,“DOI”:“10.1145 \/1390156.1390225”},{“key”:“ref2”,“DOI-asserted-by”:“publicher”,“DOI”:”10.1007 \/s00221-005-0169-9“},}“key:”ref69“,”DOI-assert-by“:”publisher“,”DOI“:”10.1016 \/S0893-6080(98)00066-5“}、{“key”:“ref1”,“author”:“piaget”,“year”:“1953”,“journ”al-title“:“儿童智力的起源”},{“key”:“ref95”,“DOI-asserted-by”:“publisher”,“DOI”:“10.3389\/fpsyg.2014.00124”},{“key”:“ref94”,“DOI-asserted-by”:“publicher”,“DOI”:”10.1016\/j.neunet.2012.012“}”,{”key“:”ref93“,”DOI-assert-by“:”publisher“,”DOI“:”10.1007\/978-3642-39875-9“}007\/978-3642-39875-9_8“},{“key”:“ref91”,“DOI-asserted-by”:“publisher”,“DOI”:“10.7551\/mitpress\/9780262016964.001.0001”},{“key”:“ref90”,“author”:“shadmehr”,“year”:“2005”,“journal-title”:“The Computational Neurobiology of Reaching and Pointing”}、{“密钥”:“ref98”,“doi-asserted-by”:“publisher”,“doi”:“10.1016\/j.cognition.2008.011”}10.1007\/11840541_33“},{“键”:“参考96”,“doi-asserted-by”:“publisher”,“doi”:“10.1146\/annurev.ne.09.030186.002041”},{“key”:“ref97”,“doi-asserted-by”:”publisher“,”doi“:”10.1038\/nrn1919“},”{“key”:“ref10”,“首页”:“112”,“article-title”:“层次技能集合的内在动机学习”,“author”:“barto”,“year”:“2004”,“journal-title“:“Proc Int Conf Development Learn(ICDL’06)”},{“key”:“ref11”,“doi断言者”:“publisher”,“doi”:“10.21236\/ADA440079”},{“key”:“ref12”,“doi断言者”:“publisher”,“doi”:“10.1109\/TEVC.2006.890271”},{“key”:“ref13”,“doi断言者”:“publisher”,“doi”:“10.1016/0921-8890(95)00004-Y”},{“key”:“ref14“,”首页“:”11“,”文章标题“:“理解技能自主累积学习的主要开放挑战是什么?”,“卷”:“7”,“作者”:“baldassarre”,“年份”:“2010年”,“新闻标题”:“Newslett Autonom心理发展技术委员会”},{“key”:“ref15”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3642-27645-3_5”},“journal-title”:“动物行为-进化方法”},{“key”:“ref82”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/TCDS.2016.2538961”}},{“key”:“ref18”,“doi-asserted-by”:“publisher”,“doi”:“10.1016\/S1389-0417(01)00039-0”},{“key”:“ref84”,“article-title”:“使用不同密度自动发现强化学习中的子目标”,“author”:“mcgovern”,“year”:“2001”}、{“key”:”ref19“,“article-title”:“神经网络和强化学习的规划”,“author”:“baldassarre”,“年份”:“2002”}:“publisher”,“DOI”:“10.1007\/978-3642-32375-1”},{“key”:“ref80”,“article-title”:“Mixture models”,“author”:“jacobs”,“year”:“2008”}:“使用技能链在持续强化学习领域中发现技能”,“作者”:“konidaris”,“年份”:“2009年”,“日志标题”:“Proc Adv Neural Inf Process Syst(NIPS)”},{“key”:“ref86”,“doi-asserted-by”:“publisher”,”doi“:”10.1109\/DevLrn.2012.6400835“},”{“key”:”ref87“,”doi-assert-by“:”publisher“,”doi:“10.3389”//fnbot.2013.0022“}”,{“键”:“ref88”,“doi-asserted-by”:“publisher”,“doi”:“10.1037\/0278-7393.5.179”}],“container-title”:[“IEEE认知与发展系统事务”],“原始标题”:[],“链接”:[{“URL”:“http://\/xplorestaging.IEEE.org\/ielx7\/727498947\/07592409.pdf?arnumber=7592409”,“内容类型”:“未指定”,“content-version”:“vor”,“intended-application”:“similarity-checking”}],“deposed”:{“date-parts”:[[2024,5,9]],“date-time”:“2024-05-09T17:41:09Z”,“timestamp”:1715276469000},“score”:1,“resource”:{“primary”:}“URL”:“https:\/\/ieeexplore.iee.org\/document\/7592409\/”}},”subtitle“:[],”shortitle“:[],“issued”:{-“date-ports”“:[[2019,6]]},”引用计数“:101,”日志发布“:{“问题”:“2”},“URL”:“http://\/dx.doi.org\/10.109\/tcds.2016.2607018”,“关系”:{},”ISSN“:[”2379-8920“,”2379-9939“],“问题类型”:[{“值”:“2379-8930”,“类型”:“打印”}、{“数值”:“2.379-8939”,“类别”:“电子”}],“主题”:[],“发布”:{”日期部分:[2019]6]]}}