{“id”:“https://openalex.org/W2962244319“,”doi“:”https://doi.org/10.109/devlrn.2018.8761044“,”title“:“通过使用MaxPain架构并行奖惩进行深度强化学习”,”display_name“:”通过使用MaxPain架构并行奖罚进行深度强化教学“,”publication_year“:2018,”publiation_date“:”2018-09-01“,”ids“:{”openalex“:”https://openalex.org/W2962244319“,”doi“:”https://doi.org/10.109/devlrn.2018.8761044“,”mag“:”2962244319“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/devlrn.2018.8761044“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5033611778“,”display_name“:”Jie\u2010Xin Wang“,”orcid“:”https://orcid.org/0000-0002-1854-4095},“机构”:[{“id”:https://openalex.org/I4210104143“,”display_name“:”国际高级电信研究所“,”ror“:”https://ror.org/01pe1d703“,”country_code“:”JP“,”type“:”设施“,”沿袭“:[”https://openalex.org/I4210104143“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Jiexin Wang“,”raw _affiliation_strings“:[“日本京都ATR计算神经科学实验室脑机器人接口部,619-0288”],”affiliations“:”脑-机器人接口部,ATR计算神经科学实验室,日本京都,619-0288”,“institution_ids”:[“https://openalex.org/I4210104143“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5068305732“,”display_name“:”Stefan Elfwing“,”orcid“:”https://orcid.org/0000-0001-6689-1000},“机构”:[{“id”:https://openalex.org/I4210104143“,”display_name“:”国际高级电信研究所“,”ror“:”https://ror.org/01pe1d703“,”country_code“:”JP“,”type“:”设施“,”沿袭“:[”https://openalex.org/I4210104143“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Stefan Elfwing“,”raw _ afiliation_strings“:[“日本京都ATR计算神经科学实验室脑机器人接口部,619-0288”],”affiliations“:”脑-机器人接口部,ATR计算神经科学实验室,日本京都,619-0288”,“institution_ids”:[“https://openalex.org/I4210104143“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5031054137“,”display_name“:”Eiji Uchibe“,”orcid“:”https://orcid.org/0000-0001-7908-0258},“机构”:[{“id”:https://openalex.org/I4210104143“,”display_name“:”国际高级电信研究所“,”ror“:”https://ror.org/01pe1d703“,”country_code“:”JP“,”type“:”设施“,”沿袭“:[”https://openalex.org/I4210104143“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Eiji Uchibe“,”raw _affiliation_strings“:[“日本京都ATR计算神经科学实验室脑机器人接口部,619-0288”],”affiliations“:”ATR计算神经科学实验室脑-机器人接口系,京都,619-0288,日本”,“institute_ids”:[“https://openalex.org/I4210104143“]}]}],”countries_distinct_count“:1,”institutions_disting_count”:1,“corresponding_author_ids”:[],”correspounding_institution_ids“:[]、”apc_list“:null,”apc_payd“:null,”has_fulltext“:true,”fulltext_origin“:”ngrams“,”cited_by_count,“issue”:null,“first_page”:null,“last_page”:null},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9996,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9996,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10581“,”“display_name”:“皮层网络中的神经元振荡”,“score”:0.9911,“subfield”:{“id”:“https://openalex.org/subfields/2805“,”display_name“:”认知神经科学“},”字段“:{”id“:”https://openalex.org/fields/28“,”display_name“:”Neuroscience“},”domain“:{”id“:”https://openalex.org/domains/1“,”display_name“:”生命科学“}},{”id“:”https://openalex.org/T10042“,”“display_name”:“认知控制和决策的神经机制”,“score”:0.9874,“subfield”:{“id”:“https://openalex.org/subfields/2805“,”display_name“:”认知神经科学“},”字段“:{”id“:”https://openalex.org/fields/28“,”display_name“:”Neuroscience“},”domain“:{”id“:”https://openalex.org/domains/1“,”display_name“:”生命科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reward-processing“,”display_name“:”奖励处理“,”score“:0.620861},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.619451},{”id“:”https://openalex.org/keywords/dep-learning网站“,”display_name“:”深度学习“,”score“:0.541164},{”id“:”https://openalex.org/keywords/working-memory网站“,”display_name“:”工作记忆“,”score“:0.511933}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.89769495},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.74996984},{”id“:”https://openalex.org/C123657996,“wikidata”:https://www.wikidata.org/wiki/Q12271“,”display_name“:”Architecture“,”level“:2,”score“:0.7019723},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.64790833},{”id“:”https://openalex.org/C2776654903,“wikidata”:https://www.wikidata.org/wiki/Q2601463“,”display_name“:”SAFER“,”level“:2,”score“:0.56262386},{”id“:”https://openalex.org/C2779295839,“wikidata”:https://www.wikidata.org/wiki/Q3544090“,”display_name“:”惩罚(心理)“,”level“:2,”score“:0.55841756},{”id“:”https://openalex.org/C2780791683,“wikidata”:https://www.wikidata.org/wiki/Q846785“,”display_name“:”Action(physical)“,”level“:2,”score“:0.5494709},{”id“:”https://openalex.org/C188116033,“wikidata”:https://www.wikidata.org/wiki/Q2664563“,”display_name“:”Q-learning“,”level“:3,”score“:0.49434853},{”id“:”https://openalex.org/C14646407,“wikidata”:https://www.wikidata.org/wiki/Q1430750“,”display_name“:”Bellman equation“,”level“:2,”score“:0.4918735},{”id“:”https://openalex.org/C2776291640,“wikidata”:https://www.wikidata.org/wiki/Q2912517“,”display_name“:”Value(mathematics)“,”level“:2,”score“:0.4498696},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.41137204},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.39032832},{”id“:”https://openalex.org/C38652104,“wikidata”:https://www.wikidata.org/wiki/Q3510521“,”display_name“:”计算机安全“,”level“:1,”score“:0.16677237},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.12134275},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418(网址:https://www.wikidata.org/wiki/Q9418)“,”display_name“:”心理学“,”等级“:0,”分数“:0.12008324},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C153349607,“wikidata”:https://www.wikidata.org/wiki/Q36649“,”display_name“:”视觉艺术“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C142362112,“wikidata”:https://www.wikidata.org/wiki/Q735“,”display_name“:”Art“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/devlrn.2018.8761044“,”pdf_url“:null,”source“:null,”license“:null:”license_id“:nuld,”version“:null,”is_accepted“:false,”is_published“:false}],”best_oa_location“:nul,”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/16“,”score“:0.78,”display_name“:”Peace,justice,and strong institutions“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:12,”referrenced_works“:[”https://openalex.org/W1612579644","https://openalex.org/W1828803485","https://openalex.org/W2015051472","https://openalex.org/W2083058253","https://openalex.org/W2145339207","https://openalex.org/W2338986187","https://openalex.org/W2419612459","https://openalex.org/W2795921402","https://openalex.org/W2949475445","https://openalex.org/W2950892788","https://openalex.org/W2963305465","https://openalex.org/W4298342547“],”related_works“:[”https://openalex.org/W4376605461","https://openalex.org/W3099153698","https://openalex.org/W3096874164","https://openalex.org/W3087814763网址","https://openalex.org/W3038962357","https://openalex.org/W2892507673","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W2025663273“],”ngrams_url“:”https://api.openalex.org/works/W296244319/ngrams“,”“abstract_inverted_index”:{“传统上,”:[0],“强化”:[1,66],“学习”:[2,49,53,67],“治疗”:[3],“惩罚”:[4,34],“作为”:[5173],“否定”:[6],“奖励”:[7],“然而,”:[8],“in”:[9116122126174],“生物学”:[10],“决定”:[11],“系统,”:[12],“一些”:[13],“证据”:[14],“显示”:[15],“that”:[16],“animals”:[17],“have”:[18],“分开“:[19],“系统”:[20],“用于”:[21],“奖励”:[22,32],“和”:[23,33,35,41,51107119],“惩罚。“:[24157179],”The“:[25132],”MaxPain“:[26,61102140148161],”architecture“:[27,62103],”parallelizes“:[28],”The“:[29,48,52,60,80,85,89,93101127136143160167175],”predictions“:[30],”of“:[31,54,88138177],”scales“:[36],”them“:[37],”into“:[38,63],”dual-attributes“:[39],”policies“:[40],“has”:[42],“been”:[43],“show”:[44],“to”:[45,73],“both”:[46],“improve”:[47],“speed”:[50],“safe”:[55],“behaviors.”:[56],“This”:[57],“paper”:[58],“extends”:[59]:[76,95],“函数”:[77,96],“To”:[78],“派生”:[79],“行为”:[81],“策略”:[82],“我们”:[83,99],“考虑”:[84],“混合”:[86],“分布”:[87],“策略”:[90],“计算”:[91],“来自”:[92],“对于”:[97],“评估”:[98],“比较”:[100],“与”:[104],“基于计数”:[105144],“探索”:[106],“回报分解”:[109],“结构”:[110],“调用”:[111],“杂交”:[112],“奖励”:[113],“架构”:[114],“(HRA)”:[115],“网格世界”:[117],“导航”:[11812],“基于视觉”:[120],“U形”:[124],“迷宫”:[125],“Gazebo”:[128],“机器人”:[129],“模拟”:[130133],“环境”:[131],“结果”:[134],“显示”:[135],“优势”:[137],“途径”:[141],“超越”:[142],“方法”:[145],“原因”:[146],“代理”:[149162169],“高效”:[150],“避免”:[151],“死机”:[152],“states”:[153],“by”:[154],“predicating”:[155],“future”:[156],“In”:[158],“addition,”:[159],“learn”:[163170],“safe”:[164],“behaviors”,“:[165172],”while“:[166],“HRA”:[168],“similar”:[171],“case”:176],“no”:[178]},“cited_by_api_url”:“状态”https://api.openalex.org/works?filter=cites:W2962244319“,”counts_by_year“:[{”年份“:2024,”cited_by_count“:2},{”年“:2023,”cited_by_count”:2},{“年份”:2020,”citecd_by_count“:1}],”updated_date“:”2024-06-19T17:17:19.861318“,”created_date:“2019-07-23”}