{“id”:“https://openalex.org/W4385007921“,”doi“:”https://doi.org/10.48550/arxiv.2307.11046“,”title“:”持续强化学习的定义“,”display_name“:”连续强化学习的含义“,”publication_year“:2023,”publitation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4385007921“,”doi“:”https://doi.org/10.48550/arxiv.2307.11046“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2307.11046“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2307.11046“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5080191195“,”display_name“:”David Abel“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Abel,David“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5008592589“,”display_name“:”Andr\u00e9 Barreto“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Barreto,Andr\u 00e9“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5045543562“,”display_name“:”Benjamin Van Roy“,”orcid“:”https://orcid.org/0000-0001-8364-3746“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Van Roy,Benjamin“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5065836447“,”display_name“:”Doina Precup“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Precup,Doina“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5033135596“,”display_name“:”Hado van Hasselt“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”van Hassert,Hado“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5065366930“,”display_name“:”Satinder Singh“,”orcid“:”https://orcid.org/0000-0002-8215-8295“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”辛格,萨汀德“,”raw_affiliation_strings“:[],“隶属关系”:[]}],“countries_distict_count”:0,“institutions_disticenc_count”:零,“corresponding_author_ids”:[]、“corresconding_institution_ids“:[]],”apc_list“:null,“apc_payed”:null,“fwci”:1.025,“has_fulltext”:假,“cited_by_count“:2,”cited_by_percentile_year“:{“min”:85,“max”:90},“biblio”:{”volume“:null,“issue”:null、“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9644,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9644,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.585717}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.8378726},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.59809947},{”id“:”https://openalex.org/C139807058,“wikidata”:https://www.wikidata.org/wiki/Q352374“,”display_name“:”适应(眼睛)“,”级别“:2,”分数“:0.5461203},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.49848104},{”id“:”https://openalex.org/C77967617,“wikidata”:https://www.wikidata.org/wiki/Q4677561“,”display_name“:”主动学习(机器学习)“,”level“:2,”score“:0.49581847},{”id“:”https://openalex.org/C98045186,“wikidata”:https://www.wikidata.org/wiki/Q205663“,”display_name“:”Process(computing)“,”level“:2,”score“:0.4847226},{”id“:”https://openalex.org/C12713177,“wikidata”:https://www.wikidata.org/wiki/Q1900281“,”display_name“:”透视(图形)“,”level“:2,”score“:0.4766068},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.45634186},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”任务(项目管理)“,”级别“:2,”分数“:0.4225363},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.13863549},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.10591459},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C201995342,“wikidata”:https://www.wikidata.org/wiki/Q682496“,”display_name“:”系统工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C169760540,“wikidata”:https://www.wikidata.org/wiki/Q207011“,”display_name“:”Neuroscience“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C111919701,“wikidata”:https://www.wikidata.org/wiki/Q9135“,”display_name“:”操作系统“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2307.11046“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2307.11046“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2307.11046“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],”type“:”repository“},”license“:”other oa“,”license_id“:”https://openalex.org/licenses/other-oa“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4310083477","https://openalex.org/W2920061524","https://openalex.org/W2328553770","https://openalex.org/W2145821588","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2086122291","https://openalex.org/W2038908348","https://openalex.org/W1987513656","https://openalex.org/W1977959518“],”ngrams_url“:”https://api.openalex.org/works/W4385007921/ngrams“,”“abstract_inverted_index”:{“In”:[0,44],“a”:[1,16,28,35,71115130],“standard”:[2],“view”:[3,30],“of”:[4,31,64,74108174185200],“the”:[5,51,55,62,68,75,99106153157198],“reinforction”:[6,47,66101156],“learning”:[7,32,40,48102151163177181209],“problem”:[8],“an”:[9143],“agent”:[10],“目标”:[11],“是”:[12,25,94],“到“:[13,50,96],”高效“:[14],”识别“:[15],”政策“:[17],”那“:[18,77110136171],”最大化“:[19],”长期“:[20],”奖励。“:[21],”“然而,”:[22],“this”:[23,90,92125],“perspective”:[24],“based”:[26],“on”:[27],“restricted”:[29],“as”:[33,4134140152],“finding”:[34],“solution”,“:[36],“rate”:[37],“than”:[38],“treating”:[39],“enound”:[42],“adaption”。“:[43],”对比“:[45],”连续“:[46,65100131149162179208],”指“:[49],”设置“:[52154],”in“:[53155],”which“:[54156],”best“:[56158],”agents“:[57109159],”never“:[58],”stop“:[59112],”learning。“:[60],“尽管”:[61],“重要性”:[63],“学习”:[67201],“社区”:[69],“缺乏”:[70],“简单”:[72],“定义”:[73],“问题”:[76],“突出”:[78],“其”:[79,83],“承诺”:[80],“和”:[81,87121148178191202],“制造”:[82],“主要”:[84],“概念”:[85196],“精确”:[86],“明确”●●●●。“:[88],”收件人“:[89],”结束“:[91],”纸张“:[93],”专用“:[95],”小心“:[97],”定义“:[98],”问题。“:[103],“我们”:[104165],“形式化”:[105193],“概念”:[107],“从不”:[111],“学习”:[113],“通过”:[114],“新”:[1116126204],“数学”:[117],“语言”:[118],“用于”:[119],“分析”:[120],“编目”:[122],“代理”。“:[123164210],”使用“:[124],”语言“:[127],”我们“:[128],”定义“:[129],”代理“:[133],”一“:[135],”可以“:[137],”是“:[138],”理解“:[139],”携带“:[141],”输出“:[142],”隐含“:[144],”搜索“:[145],”进程“:[146],”无限期“:[147],”are“:[160182],”全部“:[161],”提供“:[166],”二“:[167],”激励“:[168],”示例“:[169],”说明“:[170],”传统“:[172],”视图“:[173],”多任务“:[175],”监督“:[180],”特殊“:[183],”案例“:[184],”我们的“:[186],”定义。“:[187],”“集体”“:[188],”这些“:[189],”定义“:[190],”视角“:[192],”许多“:[194],”直觉“:[195],”在“:[197],”心“:[199],”开放“:[203],”研究“:[205],”路径“:[206],”周围“:[207]},”引用_by_api_url“:”https://api.openalex.org/works?filter=cites:W4385007921“,”counts_by_year“:[{”年“:2024,”引用_by_count“:2}],”更新日期“:”2024-07-10T02:05:1746675“,”创建日期“:“2023-07-22”}