{“id”:“https://openalex.org/W4298330226“,”doi“:”https://doi.org/10.1609/aaai.v29i1.9600“,”title“:”Compress and Control“,”display_name“:”压缩和控制“,”publication_year“:2015,”publiation_date“:”2015-02-21“,”ids“:{”openalex“:”https://openalex.org/W4298330226“,”doi“:”https://doi.org/10.1609/aai.v29i1.9600“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1609/aaai.v29i1.9600,“pdf_url”:https://ojs.aaai.org/index.php/aaai/article/download/9600/9459,“源”:{“id”:https://openalex.org/S4210191458“,”“display_name”“:”“AAAI人工智能会议记录”“,”issn_l“:”2159-5399“,”isn“:[”21595599“,”2374-3468“],”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/P431032058“,”“host_organization_name”:“人工智能发展协会”,“host_ordanization_lineage”:[“https://openalex.org/P431032058“],”host_organization_lineage_names“:[”人工智能发展协会“],“type”:“conference”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”type“:”article“,”type_crossref“:“journal-article”,“indexed_in”:[”crossref“]oaurl“:”https://ojs.aaai.org/index.php/aaai/article/download/9600/9459“,”any_repository_has_fulltext“:false},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A506070909021“,”display_name“:”Joel Veness“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]},{”id“:”https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“,”US“],”is_corresponding“:false,”raw_author_name“:”Joel Veness“,”raw _affiliation_strings“:[“Google DeepMind”],”affiliations“:[{”raw _affiliation_string“:”Google DeepMend“,”institution_ids“:[https://openalex.org/I1291425158","https://openalex.org/I4210090411“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5001087292“,”display_name“:”Marc G.Bellemare“,”orcid“:”https://orcid.org/0000-0002-6096-0105},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]},{”id“:”https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“,”US“],”is_corresponding“:false,”raw_author_name“:”Marc Bellemare“,”raw _ afiliation_strings“:[“Google DeepMind”],”affiliations“:[{”raw_ afiliation _string“:”Google DeepMend“,”institution_ids“:[https://openalex.org/I1291425158","https://openalex.org/I4210090411“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5073944062“,”display_name“:”马库斯·赫特“,”兽人“:”https://orcid.org/0000-0002-3263-4097},“机构”:[{“id”:https://openalex.org/I118347636“,”display_name“:”澳大利亚国立大学“,”ror“:”https://ror.org/019wvm592“,”country_code“:”AU“,”type“:“教育”,”世系“:[”https://openalex.org/I118347636“]}],”国家“:[”AU“],”is_corresponding“:false,”raw_author_name“:”Marcus Hutter“,”raw _affiliation_strings“:[“澳大利亚国立大学”],”affiliations“:[{”raw _affiliation_string“:”澳大利亚国立大学“,”institution_ids“:]”https://openalex.org/I118347636“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5028585856“,”display_name“:”Alvin J.K.Chua“,”orcid“:”https://orcid.org/0000-0001-5242-8269},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]},{”id“:”https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“,”US“],”is_corresponding“:false,”raw_author_name“:”Alvin Chua“,”raw _affiliation_strings“:[“Google DeepMind”],”affiliations“:[{”raw _affiliation_string“:”Google DeepMend“,”institution_ids“:[https://openalex.org/I1291425158","https://openalex.org/I4210090411“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5089648583“,”display_name“:”Guillaume Desjardins“,”orcid“:”https://orcid.org/0000-0002-5669-6671},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]},{”id“:”https://openalex.org/I4210090411“,”display_name“:”DeepMind(英国)“,”ror“:”https://ror.org/00971b260“,”“country_code”“:”GB“,”type“:”company“,”seriance“:[”https://openalex.org/I4210090411","https://openalex.org/I4210128969“]}],”国家“:[”GB“,”US“],”is_corresponding“:false,”raw_author_name“:”Guillaume Desjardins“,”raw _affiliation_strings“:[“Google DeepMind”],”affiliations“:[{”raw _affiliation_string“:”Google DeepMend“,”institution_ids“:[https://openalex.org/I1291425158","https://openalex.org/I4210090411“]}]}],”institution_assertions“:[],”countries_distiction_count“:3,”institutions_disticent_count”:3,“corresponding_author_ids”:[]、“corresconding_institution_ids“:[].”apc_list“:null,”apc_payed“:null,”fwci“:0.17,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count 134,“is_in_top_1_percent”:假,“is_in_top_10_percent“:false},”cited_by_percentile_year“:{”min“:66,”max“:73},“biblio”:{“volume”:“29”,“issue”:“1”,“first_page”:null,“last_page”:null},‘is_retracted’:false,‘is_paratext’:false,‘primary_topic’:{‘id’:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9916,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9916,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.614668},{”id“:”https://openalex.org/keywords/遍历性“,”display_name“:”遍历性“,”score“:0.6044805},{”id“:”https://openalex.org/keywords/policy-gradient网站“,”display_name“:”策略渐变“,”score“:0.512342},{”id“:”https://openalex.org/keywords/dep-learning网站“,”display_name“:”深度学习“,”score“:0.502956},{”id“:”https://openalex.org/keywords/value“,”display_name“:”Value(mathematics)“,”score“:0.48763004}],”concepts“:[{”id“:”https://openalex.org/C185429906,“wikidata”:https://www.wikidata.org/wiki/Q1130160“,”display_name“:”Estimator“,”level“:2,”score“:0.70510215},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.67174107},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.66748834},{”id“:”https://openalex.org/C14646407,“wikidata”:https://www.wikidata.org/wiki/Q1430750“,”display_name“:”Bellman equation“,”level“:2,”score“:0.6193809},{”id“:”https://openalex.org/C201779956,“wikidata”:https://www.wikidata.org/wiki/Q5426803“,”display_name“:”遍历“,”level“:2,”score“:0.6044805},{”id“:”https://openalex.org/C2775924081,“wikidata”:https://www.wikidata.org/wiki/Q55608371“,”display_name“:”Control(management)“,”level“:2,”score“:0.4915944},{”id“:”https://openalex.org/C2776291640,“wikidata”:https://www.wikidata.org/wiki/Q2912517“,”display_name“:”Value(mathematics)“,”level“:2,”score“:0.48763004},{”id“:”https://openalex.org/C14036430网址,“wikidata”:https://www.wikidata.org/wiki/Q3736076网址“,”display_name“:”功能(生物学)“,”级别“:2,”分数“:0.48125312},{”id“:”https://openalex.org/C2778755073,“wikidata”:https://www.wikidata.org/wiki/Q10858537“,”display_name“:”Scale(ratio)“,”level“:2,”score“:0.4374123},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.3747214},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.27412838},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.23384061},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.23019701},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.12760994},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C78458016,“wikidata”:https://www.wikidata.org/wiki/Q840400“,”display_name“:”进化生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”Biology“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1609/aaai.v29i1.9600,“pdf_url”:https://ojs.aaai.org/index.php/aaai/article/download/9600/9459,“源”:{“id”:https://openalex.org/S4210191458“,”“display_name”“:”“AAAI人工智能会议记录”“,”issn_l“:”2159-5399“,”isn“:[”21595599“,”2374-3468“],”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/P431032058“,”“host_organization_name”:“人工智能发展协会”,“host_ordanization_lineage”:[“https://openalex.org/P431032058“],”host_organization_lineage_names“:[”促进人工智能协会“],“type”:“conference”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1609/aaai.v29i1.9600,“pdf_url”:https://ojs.aaai.org/index.php/aaai/article/download/9600/9459,“源”:{“id”:https://openalex.org/S4210191458“,”“display_name”“:”“AAAI人工智能会议记录”“,”issn_l“:”2159-5399“,”isn“:[”21595599“,”2374-3468“],”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/P431032058“,”“host_organization_name”:“人工智能发展协会”,“host_ordanization_lineage”:[“https://openalex.org/P431032058“],”host_organization_lineage_names“:[”人工智能发展协会“],“type”:“conference”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/16“,”score“:0.66,”display_name“:”Peace,justice,and strong institutions“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:40,”referrenced_works“:[”https://openalex.org/W107054272","https://openalex.org/W136985510","https://openalex.org/W1506806321","https://openalex.org/W1515308897","https://openalex.org/W1528086278","https://openalex.org/W2024780670","https://openalex.org/W2028145673","https://openalex.org/W2064175235","https://openalex.org/W2104290684","https://openalex.org/W2107745473","https://openalex.org/W2123372395","https://openalex.org/W2128859735","https://openalex.org/W2129652681","https://openalex.org/W2136065708","https://openalex.org/W2137509429","https://openalex.org/W2148029210","https://openalex.org/W2149418961","https://openalex.org/W2158191646","https://openalex.org/W2163294786","https://openalex.org/W2171886309","https://openalex.org/W2404689820","https://openalex.org/W2408670836","https://openalex.org/W2568832377","https://openalex.org/W285471286","https://openalex.org/W2949931500","https://openalex.org/W2964050205","https://openalex.org/W2998508934","https://openalex.org/W2998993395","https://openalex.org/W3103780890","https://openalex.org/W4211221179","https://openalex.org/W4214717370","https://openalex.org/W4230511558","https://openalex.org/W4230960895","https://openalex.org/W4253181625","https://openalex.org/W4293405734","https://openalex.org/W4294023993","https://openalex.org/W4298130528","https://openalex.org/W4298857966","https://openalex.org/W4301183862","https://openalex.org/W4307347247“],”related_works“:[”https://openalex.org/W3124353475","https://openalex.org/W3099153698","https://openalex.org/W3091331701","https://openalex.org/W3038962357","https://openalex.org/W2392918297","https://openalex.org/W2386410636","https://openalex.org/W2381286475","https://openalex.org/W2313545085","https://openalex.org/W2152685658","https://openalex.org/W2025663273“],”abstract_inverted_index“:{”This“:[0,12],”paper“:[1],”descriptions“:[2],”a“:[3,21,38,45110],”new“:[4],”information-theoretic“:/5],”policy“:[6],”evaluation“:[7],”technique“:[8,13,57,97118],”for“:[9103],”reinforcement“:[10],”learning.“:[11],”converts“:[14],“any”:[15],“compression”:[16],“or”:[17],“density”:[18],“model”:[19,41,86],“into”:[20]相应的“:[22],”估计“:[23],”的“:[24,37,55,69,89116],”值。“:[25],”Under“:[26],”appropriate“:[27],”stationary“:[28],”and“:[29],”遍历性“:[30],”conditions,“:[31],”we“:[32,93],”show“:[33],”that“:[34,95],”the“:[35,53,67,87,90114],”use“:[36,68],”sufficient“:[39,99],”powered“:[40],”gives“:%42],”rise“:[43],”to“:[44,60,84119121],”一致“:[46],”值“:[47101],”函数“:[48],”估计器。“:[49],“我们”:[50,75107],“也”:[51],“研究”:[52112],“行为”:[54],“这个”:[56],“何时”:[58],“应用”:[59],“各种”:[61],“Atari”:[62],“2600”:[63],“视频”:[64],“游戏”:[65],“其中”:[66],“次优”:[70],“建模”:[71],“技术”:[72],“是”:[73],“不可避免。“:[74],”考虑“:[76],”三“:[77],”基本“:[78],”不同“:[79],”模型“:[80],”全部“:[81],”太“:[82],”限制“:[83],”完美“:[85],”动力学“:[88],”系统。“:[91],”显著“:[92],”查找“:[94],”我们的“:[96117],”提供“:[98],”准确“:[100],”估计“:[102],”有效“:[104],”政策上“:[105],”控制。“:[106],”总结“:[108],”有“:[109],”暗示“:[111],”突出显示“:[113],”潜在“:[115],”规模“:[120],”大型“:[122],”问题。“:[123]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4298330226“,”counts_by_year“:[{”年“:2018,”cited_by_count“:1}],”更新日期“:”2024-09-18T06:17:05.099385“,”创建日期“:“2022-10-02”}