{“id”:“https://openalex.org/W32035761999“,”doi“:”https://doi.org/10.1007/978-3-031-19907-3_18“,”title“:“信息论驱动下的强化学习”,”display_name“:”信息论驱动的强化学习“,”publication_year“:2023,”publitation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W32035761999“,”doi“:”https://doi.org/10.1007/978-3-031-19907-3_18“,”mag“:”3203576199“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1007/978-3-031-19907-3_18“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“book-series”},“license”:null,“licence_id”:nul,“version”:null,“is_accepted”:false,“is_published”:false},”type“:”book-chapter“,”type_crossref“:“book-chapter”,”indexed_in“:[“crossref”],“open_access”:{“is_oa”:true,“oa_status”:“green”,“oa_url”:https://arxiv.org/pdf/2109.15147“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5020795308“,”display_name“:”Elliot Catt“,”orcid“:”https://orcid.org/0000-0001-9411-927X},“机构”:[{“id”:https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“],”is_corresponding“:true,”raw_author_name“:”Elliot Catt“,”raw _affiliation_strings“:[“Deepmind,London,UK”],“affiliations”:[{“raw _afiliation_string”:“Deepmind,Longon,UG”,“institution_ids”:[”https://openalex.org/I4210090411“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5073944062“,”display_name“:”马库斯·赫特“,”兽人“:”https://orcid.org/0000-0002-3263-4097},“机构”:[{“id”:https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Marcus Hutter“,”raw_affiation_strings“:[”Deepmind,London,UK“],”附属机构“:[{”raw_affiation_string“:”Deepmind,London,UK“,”机构ID“:[”https://openalex.org/I4210090411“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A506070909021“,”display_name“:”Joel Veness“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Joel Veness“,”raw _affiliation_strings“:[“Deepmind,London,UK”],“affiliations”:[{“raw _afiliation_string”:“Deepmind,Longon,UG”,“institution_ids”:[”https://openalex.org/I4210090411“]}]}],”institution_assertions“:[],”countries_distiction_count“:1,”institutions_disticent_count”:1,“corresponding_author_ids”:[“https://openalex.org/A5020795308“],”对应的机构ID“:[”https://openalex.org/I4210090411“],”apc_list“:{”value“:5000,”currency“:”EUR“,”value_usd“:5392,”出处“:”doaj“},”apc_payed“:null,”fwci“:0.0,”has_fulltext“:false,”cited_by_count“:0,”citation_normalized_perminent“:{”value“:0.0,”is_in_top_1_perminent“:false,”is_in_top_1_perminent“:false},”cited_by_percentle_year“:{”min“:0,”max“:71},”biblio“:”{“卷”:null,“问题”:nullfirst_page“:”188“,”last_page“:”198“},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T2002“,”display_name“:”计算复杂性与算法信息理论“,”score“:0.9974,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T2002“,”display_name“:”计算复杂性与算法信息理论“,”score“:0.9974,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9956,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T1975“,”“display_name”:“遗传编程在机器学习中的应用”,“score”:0.9951,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.642733},{”id“:”https://openalex.org/keywords/formalism网站“,”display_name“:”形式主义(音乐)“,”score“:0.52062154},{”id“:”https://openalex.org/keywords/sequence网站“,”display_name“:”Sequence(biology)“,”score“:0.48861963}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.86148417},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.8015405},{”id“:”https://openalex.org/C100609095,“wikidata”:https://www.wikidata.org/wiki/Q1335050“,”display_name“:”具体认知“,”level“:2,”score“:0.6132784},{”id“:”https://openalex.org/C73301696,“wikidata”:https://www.wikidata.org/wiki/Q5469984“,”display_name“:”形式主义(音乐)“,”level“:3,”score“:0.52062154},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5143903},{”id“:”https://openalex.org/C2780791683,“wikidata”:https://www.wikidata.org/wiki/Q846785“,”display_name“:”Action(physics)“,”level“:2,”score“:0.50031066},{”id“:”https://openalex.org/C2778112365,“wikidata”:https://www.wikidata.org/wiki/Q3511065“,”display_name“:”Sequence(biology)“,”level“:2,”score“:0.48861963},{”id“:”https://openalex.org/C107457646,“wikidata”:https://www.wikidata.org/wiki/Q207434“,”display_name“:”Human\u2013计算机交互“,”level“:1,”score“:0.44116017},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.4137642},{”id“:”https://openalex.org/C188147891,“wikidata”:https://www.wikidata.org/wiki/Q147638“,”display_name“:”认知科学“,”level“:1,”score“:0.34562343},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418(网址:https://www.wikidata.org/wiki/Q9418)“,”display_name“:”心理学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”生物学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C153349607,“wikidata”:https://www.wikidata.org/wiki/Q36649“,”display_name“:”视觉艺术“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C54355233,“wikidata”:https://www.wikidata.org/wiki/Q7162“,”display_name“:”Genetics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C142362112,“wikidata”:https://www.wikidata.org/wiki/Q735“,”display_name“:”Art“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C558565934,“wikidata”:https://www.wikidata.org/wiki/Q2743“,”display_name“:”Musical“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:2.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1007/978-3-031-19907-3_18“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“book-series”},“license”:null,“licence_id”:nul,“version”:null,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2109.15147,“pdf_url”:https://arxiv.org/pdf/2109.15147,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2109.15147,“pdf_url”:https://arxiv.org/pdf/2109.15147,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[],“grants”:[]、“datasets”:【】,“versions”:【],“referenced_works_count”:35,“referrenced_works”:[”https://openalex.org/W1212832299","https://openalex.org/W1528086278","https://openalex.org/W1576452626","https://openalex.org/W2057978375","https://openalex.org/W2073384958","https://openalex.org/W2097881906","https://openalex.org/W2099111195","https://openalex.org/W2121863487","https://openalex.org/W2123447947","https://openalex.org/W2129652681","https://openalex.org/W2145339207","https://openalex.org/W2171886309","https://openalex.org/W2553665199","https://openalex.org/W2609374097","https://openalex.org/W2626778328","https://openalex.org/W2772709170","https://openalex.org/W2911940095","https://openalex.org/W2914261249","https://openalex.org/W2944299231","https://openalex.org/W2948380112","https://openalex.org/W2962893049","https://openalex.org/W2963080043","https://openalex.org/W3030163527","https://openalex.org/W3035435378","https://openalex.org/W3037871539网址","https://openalex.org/W3047988254","https://openalex.org/W3085190015","https://openalex.org/W3093621883","https://openalex.org/W3116006999","https://openalex.org/W3140968660","https://openalex.org/W3165994454","https://openalex.org/W3174224867","https://openalex.org/W3176407006","https://openalex.org/W4214717370","https://openalex.org/W4307347247“],”related_works“:[”https://openalex.org/W4283365723","https://openalex.org/W4250820896","https://openalex.org/W2963001125","https://openalex.org/W2380179524","https://openalex.org/W2352366064","https://openalex.org/W2333383158","https://openalex.org/W2124102101","https://openalex.org/W2091233881","https://openalex.org/W1570928019","https://openalex.org/W1484550171“],”abstract_inverted_index“:{”强化“:[0],”学习“:[1],”形式化“:[2],”an“:[3,46,77],”具体化“:[4],”agent \u2019s“:[5],”交互“:[6],”with“:[7,74118],”the“:[8,18,32,66,87114],”environment“:[9],”through“:[10],”observations“:[11],”rewards“:[12],”and“:[13,53128138],“操作”:[14],“但是”:[15],“其中”:[16],“执行”:[17],“动作”:[19,60],“来”:[20],“来自?“:[21],”动作“:[22],”是“:[23,61],”经常“:[24],”考虑“:[25],”to“:[26,76109112132],”代表“:[27],”某物“:[28],”外部,“:[29],”这样的“:[30],”如“:[31,65,94],”运动“:[33],”of“:[34,45,64,68,71122135],”a“:[35,57,69119],”肢体,“:[36],”象棋“:[38],“工件”:[39],“或”:[40],“更多”:[41],“一般”:[42],“输出”:[44,67],“执行器。“:[47],”在“:[48],”这个“:[49106130],”工作“:[50107],”我们“:[51],”探索“:[52],”形式化“:[54],”对比“:[56],”视图“:[57],”即“:[58],”那“:[59129],”最佳“:[62],”思想“:[63],”序列“:[70,92],”内部“:[72123137],”选择“:[73],”尊重“:[75],”行动“:[78124140],“型号。“:[79],”此“:[80],”视图“:[81],”是“:[82108],”特别“:[83],”非常适合“:[84],”用于“:[85,97],”杠杆“:[86],”最近“:[88],”预付款“:[89],”in“:[90105],”大型“:[91],”模型“:[93],”先前“:[95],”知识“:[96],”多任务“:[98],”强化“:[99],”学习“:[100],”问题。“:[101],“我们的”:[102],“主要”:[103],“贡献”:[104],“显示”:[110],“如何”:[111],“增加”:[113],“标准”:[115],“MDP”:[116],“形式主义”:[117],“顺序”:[120],“概念”:[121],“使用”:[125],“信息理论”:[126],“技术”,“:[127],“线索”:[131],“自我维持”:[133],“定义”:[134],“两者”:[136],“外部”:[139],“值”:[141],“功能。“:[142]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W3203576199“,”counts_by_year“:[],”updated_date“:”2024-09-17T08:43:33.272495“,”created_date:“2021-10-11”}“