{“id”:“https://openalex.org/W2401683402“,”doi“:”https://doi.org/10.1007/978-3-319-29339-4_2“,”title“:“从人类交流的纠正建议中交互式学习持续行动”,”display_name“:“通过人类交流的更正建议交互式学习持续动作”,”publication_year“:2015,”publiation_date“:”2015-01-01“,”ids“:{”openalex“:”https://openalex.org/W2401683402“,”doi“:”https://doi.org/10.1007/978-3-319-29339-4_2“,”mag“:”2401683402“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/978-3-319-29339-4_2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/978-3-319-29339-4_2.pdf,“源”:{“id”:https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springr Science+Business Media“],“type”:“book series”},“license”:“cc-by-nc”,“licence_id”:“https://openalex.org/licenses/cc-by-nc“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”book-chapter“,”type_crossref“:“book-chapper”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://link.springer.com/content/pdf/10.1007/978-3-319-29339-4_2.pdf“,”any_repository_has_fulltext“:false},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5028010633“,”display_name“:”Carlos Celemin“,”orcid“:”https://orcid.org/0000-0001-8880-0966},“机构”:[{“id”:https://openalex.org/I69737025“,”display_name“:”智利大学“,”ror“:”https://ror.org/047gc3g35“,”country_code“:”CL“,”type“:“教育”,”世系“:[”https://openalex.org/I69737025“]}],”国家“:[”CL“],”is_corresponding“:false,”raw_author_name“:”Carlos Celemin“,”raw_affiation_string“:[”智利圣地亚哥大学电气工程与先进采矿技术中心系“],”附属机构“:[{”raw_affiation_string“:”智利圣地亚哥智利大学电气工程与先进采矿技术中心系”,“institution_ids”:[“https://openalex.org/I69737025“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A50484484415“,”display_name“:”Javier Ruiz\u2010del\u2010Solar“,”orcid“:”https://orcid.org/0000-0003-2965-633X},“机构”:[{“id”:https://openalex.org/I69737025“,”display_name“:”智利大学“,”ror“:”https://ror.org/047gc3g35“,”country_code“:”CL“,”type“:“教育”,”世系“:[”https://openalex.org/I69737025“]}],”国家“:[”CL“],”is_corresponding“:false,”raw_author_name“:”Javier Ruiz-Del-Solar“,”raw _ afiliation_strings“:[“智利圣地亚哥智利大学电气工程与先进采矿技术中心系”],”affiliations“:”智利圣地亚哥智利大学电气工程与先进采矿技术中心系”,“institution_ids”:[“https://openalex.org/I69737025“]}]}],”countries_distinct_count“:1,”institutions_disting_count”:1,“corresponding_author_ids”:[],”correspounding_institution_ids“:[]、”apc_list“:{“value”:5000,”currency“:”EUR“,”value_usd“:5392,”provenance“:”doaj“},”apc_payed“:{”value“:5000,“currencurrency”:“EUR”,”value_ usd“:5392,“provenance”:“doaj”},“fwci”:1.585,“has_fulltext”:true,“fulltext_origin”:“pdf“,”cited_by_count“:7,”cited_by_percentile_year“:{”min“:85,”max“:86},”biblio“:{”volume“:null,”issue“:nul,”first_page“:”16“,”last_page“:”27“},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9985,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9985,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10653“,”“display_name”:“机器人抓取和示范学习”,“score”:0.9972,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”field“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/human机器人协作“,”display_name“:”Human-Robot Collaboration“,”score“:0.551281},{”id“:”https://openalex.org/keywords/robot-learning“,”display_name“:”机器人学习“,”score“:0.539228},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.53666},{”id“:”https://openalex.org/keywords/safe-human-robot-interaction网站“,”display_name“:”安全人机交互“,”score“:0.522711}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.82256985},{”id“:”https://openalex.org/C2779305910,“wikidata”:https://www.wikidata.org/wiki/Q5172809“,”display_name“:”纠正性反馈“,”level“:2,”score“:0.77394783},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.7609892},{”id“:”https://openalex.org/C2779955035,“wikidata”:https://www.wikidata.org/wiki/Q4686785“,”display_name“:”Advice(programming)“,”level“:2,”score“:0.72995216},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5751784},{”id“:”https://openalex.org/C2780791683,“wikidata”:https://www.wikidata.org/wiki/Q846785“,”display_name“:”Action(physical)“,”level“:2,”score“:0.5308441},{”id“:”https://openalex.org/C36503486,“wikidata”:https://www.wikidata.org/wiki/Q11235244“,”display_name“:”领域(数学分析)“,”级别“:2,”分数“:0.5004599},{”id“:”https://openalex.org/C90509273,“wikidata”:https://www.wikidata.org/wiki/Q11012“,”display_name“:”Robot“,”level“:2,”score“:0.4860125},{”id“:”https://openalex.org/C107457646,“wikidata”:https://www.wikidata.org/wiki/Q207434“,”display_name“:”Human\u2013计算机交互“,”level“:1,”score“:0.44836354},{”id“:”https://openalex.org/C145420912,“wikidata”:https://www.wikidata.org/wiki/Q853077“,”display_name“:”数学教育“,”level“:1,”score“:0.077489585},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944网址“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”Programming language“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1,”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/978-3-319-29339-4_2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/978-3-319-29339-4_2.pdf,“源”:{“id”:https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springr Science+Business Media“],“type”:“book series”},“license”:“cc-by-nc”,“licence_id”:“https://openalex.org/licenses/cc-by-nc“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true}],”best_oa_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/978-3-319-29339-4_2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/978-3-319-29339-4_2.pdf,“源”:{“id”:https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springr Science+Business Media“],“type”:“book series”},“license”:“cc-by-nc”,“licence_id”:“https://openalex.org/licenses/cc-by-nc“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W1536323281","https://openalex.org/W1626155273","https://openalex.org/W1966259872","https://openalex.org/W1979308911","https://openalex.org/W1986014385","https://openalex.org/W1999874108","https://openalex.org/W2062821321","https://openalex.org/W2098584016","https://openalex.org/W2104308387","https://openalex.org/W2120982521","https://openalex.org/W2126861176","https://openalex.org/W2128103053","https://openalex.org/W2129659607","https://openalex.org/W2150818585","https://openalex.org/W2156869222","https://openalex.org/W2162932021","https://openalex.org/W2406235655","https://openalex.org/W4214717370“],”related_works“:[”https://openalex.org/W4390193239","https://openalex.org/W4386265809","https://openalex.org/W4213266652网址","https://openalex.org/W4206735805","https://openalex.org/W3164368351网址","https://openalex.org/W3133706844","https://openalex.org/W2998735842","https://openalex.org/W2899872056","https://openalex.org/W2791575529","https://openalex.org/W1984742304“],”ngrams_url“:”https://api.openalex.org/works/W2401683402/ngrams网站“,”abstract_inverted_index“:{”An“:[0],”interactive“:[1],”learning“:[2,96107],”framework“:[3],”that“:[4,55117],”allows“:[5],”nonpert“:[6],”humans“:[7],”to“:[8121126135],”shape“:[9],”a“:[10,16,45,56132],”policy“:[11],”through“:[12],”corrective“:[13],”advice“:[14],”using“:[15,91],”二进制“:[17],”信号“:[18],”输入“:[19,93109142],”提议的“:[20,24,30,41,50,72105110],“动作”:[21,58144],“域”:[22],“的”:[23,29,34,52,67,74],“机器人/代理”:[25],“是”:[26,44,69119138]。“:[27],”一“:[28],”大多数“:[31],”创新“:[32],”特征“:[33],”教练“:[35,68103118],”(纠正“:[36],”建议“:[37],”沟通“:[38],”通过“:[39],”人类),“:[40],”提议“:[42],”框架“:[43],”机制“:[46],”用于“:[47140],”自适应“:[48],”调整“:[49],“数量”:[51],“人类”:[53124],“反馈”:[54],“给定”:[57],“接收”,“:[59],”将“:[60]”、“into”:[61]、“consideration”:[62]、“past”:[63]、“feedback”。“:[64],”The“:[65],”performance“:[66],”compared“:[70],”with“:[71128],”one“:/73],”TAMER“:[75],”(Teaching“:[76],”an“:[77,87],”Agent“:[78],”Manually“:[79],”via“:[80],”Evaluative“:[81],”Reinforcement“,”:[82],“ACTAMER”:[83],“(Actor-Critic“:[84],”TAMER),”:[85],“and”:[86100],“autonomous”:[88],“Agent”:[89],“trained”:[90],“SARSA(\u03bb)”:[92],“two”:[94],“补强“:[95],”问题:“:[97],”球“:[98],”运球“:【99】,”大车杆“:【101】,”平衡。“:[102],”优于“:[104],”其他“:[106],”框架“:[108],”报告“:[111],”实验。“:[112],“In”:[113],“addition”,“address”:[114],“results”:[115],“show”:[116],“able”:[120],“transfer”:[122],“successfully”:[123],“knowledge”:[125],“agent”:[127],“continuous”:%129],“actions”:[130],“being”:[131],“complementary”:[133],“approach”:%134],“TAMER,”:[136],“which”:[137],“适当”:[139],“teaching”“:[141],”离散“:[143],”域。“:[145]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2401683402“,”counts_by_year“:[{“年份”:2024,”cited_by_count“:1},{“年”:2022,”ciped_by_cunt“:1},”{“年度”:2020,“cited_by_count”:1}.,{”year“:2018,”cited_by_count?:3},“年份”:2016,”citted_by_count“:1}],”updated_date“:”2024-06-29T03:53.767597“,”created_date:“2016-06-24”}