{“id”:“https://openalex.org/W2966368748“,”doi“:”https://doi.org/10.24963/ijcai.2019/302“,”title“:”一般环境中的强渐近最优Agent“,”display_name“:”通用环境中的弱渐近最优Agent”,“publication_year”:2019,“publitation_date”:“2019-07-28”,“ids”:{“openalex”:“https://openalex.org/W2966368748“,”doi“:”https://doi.org/10.24963/ijcai.2019/302“,”mag“:”2966368748“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.24963/ijcai.2019/302,“pdf_url”:https://www.ijcai.org/proceedings/2019/0302.pdf“,”source“:null,”license“:null,”licence_id“:nul,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“proceedings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”青铜色“,”oa_url“:”https://www.ijcai.org/proceedings/2019/0302.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5027690597“,”display_name“:”Michael K.Cohen“,”orcid“:”https://orcid.org/0000-0003-1749-875X},“机构”:[{“id”:https://openalex.org/I118347636“,”display_name“:”澳大利亚国立大学“,”ror“:”https://ror.org/019wvm592“,”country_code“:”AU“,”type“:“教育”,”世系“:[”https://openalex.org/I118347636“]}],”国家“:[”AU“],”is_corresponding“:false,”raw_author_name“:”Michael K.Cohen“,”raw_affiliation_strings“:[“澳大利亚国立大学”],”affiliations“:[{”raw_affiliation_string“:”澳大利亚国立大学“,”institution_ids“:[https://openalex.org/I118347636“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5020795308“,”display_name“:”Elliot Catt“,”orcid“:”https://orcid.org/0000-0001-9411-927X},“机构”:[{“id”:https://openalex.org/I118347636“,”display_name“:”澳大利亚国立大学“,”ror“:”https://ror.org/019wvm592“,”country_code“:”AU“,”type“:“教育”,”世系“:[”https://openalex.org/I118347636“]}],”国家“:[”AU“],”is_corresponding“:false,”raw_author_name“:”Elliot Catt“,”raw _affiliation_strings“:[“澳大利亚国立大学”],”affiliations“:[{”raw _affiliation_string“:”澳大利亚国立大学“,”institution_ids“:]”https://openalex.org/I118347636“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5073944062“,”display_name“:”马库斯·赫特“,”兽人“:”https://orcid.org/0000-0002-3263-4097},“机构”:[{“id”:https://openalex.org/I118347636“,”display_name“:”澳大利亚国立大学“,”ror“:”https://ror.org/019wvm592“,”country_code“:”AU“,”type“:“教育”,”世系“:[”https://openalex.org/I118347636“]}],”国家“:[”AU“],”is_corresponding“:false,”raw_author_name“:”Marcus Hutter“,”raw _affiliation_strings“:[“澳大利亚国立大学”],”affiliations“:[{”raw _affiliation_string“:”澳大利亚国立大学“,”institution_ids“:]”https://openalex.org/I118347636“]}]}],”institution_assertions“:[],”countries_distiction_count“:1,”institutions_disticent_count”:1,“corresponding_author_ids”:[]、“corresconding_institution_ids“:[].”apc_list“:null,”apc_payed“:null,”fwci“:1.184,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count:5,“citation_normalized_percentile”:{“value”:0.5224 72,“is_in_top_1_percent”:假,“is_in_top_10_percent“:false},”cited_by_percentile_year“:{”min“:80,”max“:81},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},,“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T2002“,”display_name“:”计算复杂性与算法信息理论“,”score“:0.9959,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T2002“,”display_name“:”计算复杂性与算法信息理论“,”score“:0.9959,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12101“,”display_name“:”多臂盗贼问题优化“,”score“:0.9234,”subfield“:{”id“:”https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”字段“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”“display_name”:“社会科学”}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9135,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/sumplically-optimal-algorithm“,”display_name“:”渐近最优算法“,”score“:0.7833319},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.618501},{”id“:”https://openalex.org/keywords/multi-gent-systems网站“,”display_name“:”Multi-Agent Systems“,”score“:0.5079},{”id“:”https://openalex.org/keywords/value“,”display_name“:”Value(mathematics)“,”score“:0.42464685},{”id“:”https://openalex.org/keywords/q-learning(https://openalex.org/keywords/q-learning)“,”display_name“:”Q-learning“,”score“:0.41972646}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.837218},{”id“:”https://openalex.org/C181789720,“wikidata”:https://www.wikidata.org/wiki/Q4812191“,”display_name“:”渐近最优算法“,”level“:2,”score“:0.7833319},{”id“:”https://openalex.org/C49937458,“wikidata”:https://www.wikidata.org/wiki/Q2599292“,”display_name“:”概率逻辑“,”level“:2,”score“:0.74970996},{”id“:”https://openalex.org/C34388435,“wikidata”:https://www.wikidata.org/wiki/Q2267362网址“,”display_name“:”绑定函数“,”level“:2,”score“:0.6325488},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.612947},{”id“:”https://openalex.org/C2777212361,“wikidata”:https://www.wikidata.org/wiki/Q5127848“,”display_name“:”类(哲学)“,”级别“:2,”分数“:0.5678084},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.5121124},{”id“:”https://openalex.org/C187691185,“wikidata”:https://www.wikidata.org/wiki/Q2020720“,”display_name“:”Grid“,”level“:2,”score“:0.43656388},{”id“:”https://openalex.org/C2776291640,“wikidata”:https://www.wikidata.org/wiki/Q2912517“,”display_name“:”Value(mathematics)“,”level“:2,”score“:0.42464685},{”id“:”https://openalex.org/C188116033,“wikidata”:https://www.wikidata.org/wiki/Q2664563“,”display_name“:”Q-learning“,”level“:3,”score“:0.41972646},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.41255698},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.3270054},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.20704994},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.10753575},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C2524010,“wikidata”:https://www.wikidata.org/wiki/Q8087“,”display_name“:”Geometry“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.24963/ijcai.2019/302,“pdf_url”:https://www.jcai.org/proceedings/2019/0302.pdf“,”source“:null,”license“:null,”license_id“:null,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/1903.01021,“pdf_url”:https://arxiv.org/pdf/1903.01021,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.24963/ijcai.2019/302,“pdf_url”:https://www.ijcai.org/proceedings/2019/0302.pdf“,”source“:null,”license“:null,”licence_id“:nul,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true}“,”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W1915057100","https://openalex.org/W2127042005","https://openalex.org/W2145339207","https://openalex.org/W2171438620","https://openalex.org/W2281341692","https://openalex.org/W2514775068","https://openalex.org/W2761873684","https://openalex.org/W2772709170","https://openalex.org/W2964043796","https://openalex.org/W4248423132","https://openalex.org/W4297748582","https://openalex.org/W4299502902","https://openalex.org/W4299797008“],”related_works“:[”https://openalex.org/W4376605461","https://openalex.org/W3096874164","https://openalex.org/W3087814763","https://openalex.org/W2937181779","https://openalex.org/W2892507673","https://openalex.org/W2537866915","https://openalex.org/W2361647908","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W2089415692“],”abstract_inverted_index“:{”强化“:[0,93149],”学习“:[1],”代理“:[2],”是“:[3],”预期“:[4],”to“:[5,77,99108145151],”最终“:[6],”执行“:[7],”well.“:[8],”典型地,“:[9],”this“:[10],”takes“:%11],”the“:[12,18,40,52,83101119147],”form“:[13],”of“:[14,21,85],“a”:[15,35,55,75125],“担保”:[16],“关于”:[17,27112],“渐近“:[19,63],“行为”:[20],“an”:[22,32105],“算法”:[23,33],“给定”:[24],“一些”:[25],“假设”:[26],“环境”。“:[29],”We“:[30140],”present“:[31],”for“:[34,74132],”policy“:[36,76],”which“:[37],”value“:38,42],”approachs“:[39],”optimal“:[41,81155],”with“:[C3],”probability“:[44],”1“:[45],”in“:[46,82143],”all“:[47,86],”computable“:[48,87],”概率“:[49,88],”environments,“:[50],”provided“:[51],”agent“:[53],”has“:[54],”bounded“:[56],”horizon。“:[57],”此“:[58],”是“:[59,96116124138],”已知“:[60],”作为“:[61],”强“:[62],”最优性,“:[64],”和“:[65],”it“:[66,71103115],”was“:[67,72],”previous“:68],”未知“:[69],”是否“:[70],”可能“:[73],”be“:[78129],”strong“:[79],”渐近“:[80154],“类”:[84],“环境。“:[89],“我们的”:[90],“代理”:[91],“探究性”:[92148],“学习者”:[94150],“(查询)”:[95],“更多”:[97102133],“可能”:[98],“探索”:[100],“预期”:[104],“探讨性”:[106],“行动”:[107],“减少”:[109],“其”:[110],“不确定性”:[111],“其中”:[113],“环境”:[114135],“in,“:[117],”因此“:[118],”术语“:[120],”好奇。“:[121],”探索“:[122],”好奇“:[123],”策略“:[126],”那“:[127],”可以“:[128],”应用“:[130],”一般;“:[131],”可管理“:[134],”类“:[136],”好奇“:[137],”易驾驭。“:[139],”执行“:[141],”实验“:[142],”网格世界“:[144],”比较“:[146],”其他“:[152],”弱“:[153],”代理。“:[156]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2966368748“,”counts_by_year“:[{”年份“:2021,”cited_by_count“:4},{”年“:2020,”cited_by_count”:1}],”更新日期“:”2024-09-25T19:06:56.729404“,”创建日期“:“2019-08-13”}