{“id”:“https://openalex.org/W2508424122“,”doi“:”https://doi.org/10.1016/j.neunet.2016.07.013“,”title“:“从自由能到期望能:改进强化学习中基于能量的价值函数逼近”,“display_name”:“从免费能到期望能量:改进强化教学中基于能量值函数逼近”、“publication_year”:2016,“publication_date”:“2016-12-01”,“ids”:{“openalex”:“https://openalex.org/W2508424122“,”doi“:”https://doi.org/10.1016/j.neunet.2016.07.013“,”mag“:”2508424122“,”pmid“:”https://pubmed.ncbi.nlm.nih.gov/27639720“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1016/j.neunet.2016.07.013“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S123019304“,”display_name“:”Neural networks“,”issn_l“:”0893-6080“,”isn“:[”0893-6080“,”1879-2782“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310320990“,”“host_organization_name”:“Elsevier BV”,“host_organization_lineage”:[“https://openalex.org/P4310320990“],”host_organization_lineage_names“:[”Elsevier BV“],”type“:”journal“},”license“:”cc by nc nd“,”license_id“:”https://openalex.org/licenses/cc-by-nc-nd“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“journal-article”,”indexed_in“:[”crossref“,”publimed“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://doi.org/10.1016/j.neunet.2016.07.013“,”any_repository_has_fulltext“:false},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5068305732“,”display_name“:”Stefan Elfwing“,”orcid“:”https://orcid.org/0000-0001-6689-1000},“机构”:[{“id”:https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:true,”raw_author_name“:”Stefan Elfwing“,”raw_affiation_strings“:[”ATR计算神经科学实验室脑机器人接口系,2-2-2 Hikaridai,Seikacho,Soraku gun,Kyoto 619-0288,日本“,”冲绳科学技术研究所研究生大学,1919-1 Tancha,Onna-son,Okinawa 904-0495,Japan“],“affiliations”:[{“raw_affiliation_string”:“冲绳科学与技术研究所大学,1919-1 Tanchahttps://openalex.org/I142637625“]},{”raw_affiliation_string“:”ATR计算神经科学实验室脑机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,京都619-0288,日本“,”institution_ids“:[]}]}“,{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5031054137“,”display_name“:”Eiji Uchibe“,”orcid“:”https://orcid.org/0000-0001-7908-0258},“机构”:[{“id”:https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Eiji Uchibe“,”raw _affiliation_strings“:[“ATR计算神经科学实验室脑机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,Kyoto 619-0288,日本”,“冲绳科学技术研究生院,1919-1 Tancha,Onna son,Okinawa 904-0495,日本“],“附属机构”:[{“raw_affiation_string”:“冲绳科学技术研究生院,1919-1 Tancha,Onna son,Okinawa 904-0495,日本”,“Institute_ids”:[”https://openalex.org/I142637625“]},{”raw_affiliation_string“:”ATR计算神经科学实验室脑-机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,Kyoto 619-0288,日本“,”institution_ids“:[]}]}“,{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5004840638“,”display_name“:”Kenji Doya“,”orcid“:”https://orcid.org/0000-0002-2446-6820},“机构”:[{“id”:https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Kenji Doya“,”raw _ afiliation_strings“:[“冲绳科学技术研究生院,1919-1 Tancha,Onna-son,Okinawa 904-0495,Japan”],“afiliations”:[{“raw _ ffiliation_string”:“冲绳科学技术研究生院,1919-1 Tancha,Onna-son,Okinawa 904-0495,Japan“,”institution_ids“:[”https://openalex.org/I142637625“]}]}],”countries_disticont_count“:1,”institutions_disticent_count”:1,“corresponding_author_ids”:[“https://openalex.org/A5068305732“],”对应的机构ID“:[”https://openalex.org/I142637625“],”apc_list“:{”value“:3350,”currency“:”USD“,”value_USD“:33500,”provenance“:”doaj“},”apc _payed“:”value”:3350“,”curency“:”美元“,”value_USD”:3380,“provenance”:“doaj”},“has_fulltext”:true,“fulltext_origin”:“ngrams”,“cited_by_count”:16,“citted_by_percentile_year”:{“min”:91,“max”:92},“biblio”:{“volume”:“84”,“issue”:null,“first_page”:“17”,“last_page”:”27“},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9981,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9981,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11689“,”display_name“:”深度学习模型中的对抗性稳健性“,”score“:0.9977,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10775“,”“display_name”:“图像处理中的生成对手网络”,“score”:0.9952,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”Physical Sciences“}}],”keywords“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.613133},{”id“:”https://openalex.org/keywords/representation-learning网站“,”display_name“:”表征学习“,”score“:0.552377}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.7376416},{”id“:”https://openalex.org/C192576344,“wikidata”:https://www.wikidata.org/wiki/Q194706“,”display_name“:”Boltzmann machine“,”level“:3,”score“:0.69524795},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.65835124},{”id“:”https://openalex.org/C199354608,“wikidata”:https://www.wikidata.org/wiki/Q7316287“,”display_name“:”受限Boltzmann机器“,”level“:3,”score“:0.63618714},{”id“:”https://openalex.org/C91873725,“wikidata”:https://www.wikidata.org/wiki/Q3445816“,”display_name“:”函数近似“,”level“:3,”score“:0.63581824},{”id“:”https://openalex.org/C63479239,“wikidata”:https://www.wikidata.org/wiki/Q7353546“,”display_name“:”健壮性(进化)“,”level“:3,”score“:0.57690144},{”id“:”https://openalex.org/C50644808,“wikidata”:https://www.wikidata.org/wiki/Q192776“,”display_name“:”人工神经网络“,”level“:2,”score“:0.5398551},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.502558},{”id“:”https://openalex.org/C186370098,“wikidata”:https://www.wikidata.org/wiki/Q442787“,”display_name“:”能量(信号处理)“,”level“:2,”score“:0.4435571},{”id“:”https://openalex.org/C14036430网址,“wikidata”:https://www.wikidata.org/wiki/Q3736076“,”display_name“:”功能(生物学)“,”级别“:2,”分数“:0.42847884},{”id“:”https://openalex.org/C48372109,“wikidata”:https://www.wikidata.org/wiki/Q3913“,”display_name“:”二进制数“,”level“:2,”score“:0.4142156},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.3221104},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.24620333},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.09227902},{”id“:”https://openalex.org/C55493867,“wikidata”:https://www.wikidata.org/wiki/Q7094“,”display_name“:”生物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C94375191,“wikidata”:https://www.wikidata.org/wiki/Q11205“,”display_name“:”算术“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C78458016,“wikidata”:https://www.wikidata.org/wiki/Q840400“,”display_name“:”进化生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”生物学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C104317684,“wikidata”:https://www.wikidata.org/wiki/Q7187“,”display_name“:”Gene“,”level“:2,”score“:0.0}],”mesh“:[{”descriptor_ui“:”D000069550“,”描述符名称“:”机器学习“,”qualifier_ui”:“”,“qualifier _name”:null,”is_major_topic“:true},{”描述符名称{“描述符用户界面”:“D012054“,”描述符名称“:”强化,心理学“,”限定符_ui“:”“,”qualifier_name“:null,”is_major_topic“:true},{”描述符_ ui“:”D006801“,”说明符_name“:”人类“,”qualifier_uiis_major_topic“:false},{“描述符_ui”:“D000069550”,“描述符名称”:“机器学习”,“限定符_ui“:”Q000639“,”限定符名称“:”趋势“,”is_mayor_topical“:false},”描述符名称“:“D008962”,“descriptor_name”:“模型,理论”,“qualifier_ui(限定符_ui):“”,“qualifier_name”(限定符名称):null,“is_major_topic”:false},“描述符_ ui”(描述符名称):“D016571”,“描述符名称”:“”神经网络,计算机“,”限定符_ui“:”,“限定符_名称”:null,“is_major_topic”:false},{“描述符_用户界面”:“D010775”,“描述符名称”:“光刺激”,“qualifier _ui”:“”,“qualifier名称”:null,“is _major _topic],“locations_count”:2,“location”:[{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1016/j.neunet.2016.07.013“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S123019304“,”display_name“:”Neural networks“,”issn_l“:”0893-6080“,”isn“:[”0893-6080“,”1879-2782“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310320990“,”host_organization_name“:”爱思唯尔BV“,”host_organization_lineage“:[”https://openalex.org/P4310320990“],”host_organization_lineage_names“:[”Elsevier BV“],”type“:”journal“},”license“:”cc by nc nd“,”license_id“:”https://openalex.org/licenses/cc-by-nc-nd“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:false,”landing_page_url“:”https://pubmed.ncbi.nlm.nih.gov/27639720“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306525036“,”display_name“:”PubMed“,”issn_l“:null,”issn“:null,”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I1299303238“,”“host_organization_name”:“美国国立卫生研究院”,“host_ordanization_lineage”:[“https://openalex.org/I1299303238“],”host_organization_lineage_names“:[”National Institutes of Health“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1016/j.neunet.2016.07.013“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S123019304“,”display_name“:”Neural networks“,”issn_l“:”0893-6080“,”isn“:[”0893-6080“,”1879-2782“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310320990“,”“host_organization_name”:“Elsevier BV”,“host_organization_lineage”:[“https://openalex.org/P4310320990“],”host_organization_lineage_names“:[”Elsevier BV“],”type“:”journal“},”license“:”cc by nc nd“,”license_id“:”https://openalex.org/licenses/cc-by-nc-nd“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”score“:0.91,”display_name“:”负担得起的清洁能源“,”id“:”https://metadata.un.org/sdg/7“}],”拨款“:[{”资助者“:”https://openalex.org/F4320320912“,”“funder_display_name”:“教育、文化、体育、科学技术部”,“award_id”:null},{“funder”:“https://openalex.org/F4320321034“,”“funder_display_name”:“新能源和工业技术发展组织”,“award_id”:“23120007”},{“funder”:“https://openalex.org/F4320322443“,”funder_display_name“:”冲绳科学技术研究生院“,”award_id“:null}],”数据集“:[],”版本“:[],”referenced_works_count“:12,”referenced_works“:[”https://openalex.org/W2048865854","https://openalex.org/W2064556564","https://openalex.org/W2075323224","https://openalex.org/W2112796928","https://openalex.org/W2116064496","https://openalex.org/W2118933070","https://openalex.org/W2145805610","https://openalex.org/W2150318520","https://openalex.org/W2339916026","https://openalex.org/W3041202696","https://openalex.org/W3207021134","https://openalex.org/W4214717370“],”related_works“:[”https://openalex.org/W4302433642","https://openalex.org/W4283272532","https://openalex.org/W2952018105","https://openalex.org/W2916681395","https://openalex.org/W2556473569","https://openalex.org/W2551541394","https://openalex.org/W2529583158","https://openalex.org/W2193475944","https://openalex.org/W2119341610","https://openalex.org/W2108438604“],”ngrams_url“:”https://api.openalex.org/works/W2508424122/ngrams网站“,”“abstract_inverted_index”:{“Free-energy”:[0],“based”:[1],“reinforction”:[2],“learning”:[3,8188],“(FERL)”:[4],“was”:[5],“proposed”:[6144],“for”:[7163201],“in”:[9180183],“high-dimensional”:[10171],“state”:[11,30139173213],“and”:[12,75159186190195208215],”“action”:[13],”空格。14],“然而,”:[15],““:[16,33,41,47,50,56,73,76,79,87,97116120127],“FERL”:[17,48,80194],“method”:[18,81145],“does”:[19],“only”:[20],“real”:[21],“work”:[22],“well”:[23132154],“with”:[24170206],“binary”,“:[25,29],”or“:[26],“close”:[27],“to”:[28,96136],“input”:[31],“where”:[32],“number”:[34,42218],“of”:[35,43,60,78,99126166219],“active”:[36],“状态“:[37],”是“:[38,53,94],”较少“:[39],”小于“:[40],”非活动“:[44],”状态。“:[45],“In”:[46,66101],“method”,“:[49],“value”:+5117],“function”:[52108118161199],“approximated”:[54],“by”:[55,85,90114119146],“negative”:[57121128],“free”:[58,88129],“energy”:[59,89123],“a”:[61,91167202216],“restrictived”:[62],“Boltzmann”:[63],“machine”:[64],“(RBM)。“:[65],”our“:[67143],”earlier“:[68],”study“:[69103],”we“:[00104],”demoved“:[71],”that“:[72,93106148],”performance“:[74],”robustive“:[77],”can“:[82110],”be“:[83111],”improved“:[84113],”scaling“:[86],”constant“:[92],”related“:95],”size“:[98],”network.“:[100],”this“”:[102],“提议”:[105],“RBM”:[107],“近似值”:[109200],“进一步“:[112],”近似“:[115],”预期“:[122],”(EERL),“:[124],”代替“:[125],”能量“:[130],”作为“:[131133153155212],”存在“:[134],”可“:[135],”句柄“:[137],”连续“:[138],”输入。“:[140],“我们”:[141],“验证”:[142],“演示”:[147],“EERL:”:[149],“(1)”:[150],“优于”:[151193],“FERL,”:[152],“标准”:[156196],“神经”:[157197],“网络”:[158198],“线性”:[160],“近似”:[162],“三”:[164],“版本”:[165],“网格世界”:[168],“任务”:[169]205],“图像”:[172],“输入;“:[174],“(2)”:[175],“实现”:[176],“新”:[177],“最先进”:[178],“结果”:[179],“随机”:[181],“SZ-Tettris”:[182],“两者”:[184],“无模型”:[185],“基于模型”:[1],“设置;“:[189],“(3)”:[191],“显著”:[192],“机器人”:[203],“导航”:[204],“原始”:[207],“噪音”:[209],“RGB”:[210],“图像”:[211],“输入”:[214],“大”:[217],“动作”。“:[220]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2508424122“,”counts_by_year“:[{“年份”:2022,”cited_by_count“:1},{“年”:2021,”ciped_by_cunt“:2},”{“年度”:2020,“cited_by_count”:2}.,{”年“:2019,”cited_by_count“创建日期”:“2016-09-16”}