{“id”:“https://openalex.org/W4315487473“,”doi“:”https://doi.org/10.1613/jair.1.14174“,”title“:“深度强化学习中零激发泛化的调查”,“display_name”:“深度增强学习中零触发泛化的研究”,“publication_year”:2023,“publiation_date”:“2023-01-09”,“ids”:{“openalex”:“https://openalex.org/W4315487473“,”doi“:”https://doi.org/10.1613/jair.1.14174“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1613/jair.1.14174“,”pdf_url“:”https://jair.org/index.php/jair/article/download/14174/26890,“源”:{“id”:https://openalex.org/S139930977“,”“display_name”:“人工智能研究杂志/\u0098The \u009c Journal of artificial intelligence research”,“issn_l”:“1076-9757”,“isn”:[“1076-97”,“1943-5037”],“is_oa”:true,“is-in_doaj”:true,“is_core”:真,“host_organization”:“https://openalex.org/P4310315760“,”“host_organization_name”:“AI Access Foundation”,“host_organization_lineage”:[“https://openalex.org/P4310315760“],”host_organization_lineage_names“:[”AI Access Foundation“],“type”:“journal”},“license”:“publisher-specific-oa”,“licence_id”:“https://openalex.org/licenses/publisher-specific-oa“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:”期刊文章“,”indexed_in“:[”arxiv“,”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”gold“,”oa_url“:”https://jair.org/index.php/jair/article/download/14174/26890“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5051243028“,”display_name“:”Robert Kirk“,”orcid“:”https://orcid.org/0000-0002-6541-5915},“机构”:[{“id”:https://openalex.org/I45129253“,”display_name“:”伦敦大学学院“,”ror“:”https://ror.org/02jx3x895“,”country_code“:”GB“,”type“:“教育”,”世系“:[”https://openalex.org/I124357947","https://openalex.org/I45129253“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Robert Kirk“,”raw_affiliation_strings“:[“a:1:{s:5:\”en_US\“”,“s:25:\”伦敦大学学院“,”}“],“从属关系”:[{“raw_affilition_string”:“}”,“institution_ids”:[]},{“ras_affilication_string“:”s:25:“大学伦敦大学\“”,“institution_ids”:[“https://openalex.org/I45129253“]},{”raw_affiliation_string“:”a:1:{s:5:\“en_US\”“,”institution_ids“:[]}]}“作者位置”:“中间”,“作者”:{“id”:“https://openalex.org/A5052068951“,”display_name“:”Amy Zhang“,”orcid“:”https://orcid.org/0000-0002-6536-3609“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Amy Zhang“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5023508792“,”display_name“:”Edward Grefenstette“,”orcid“:”https://orcid.org/0000-0003-1164-8809“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Edward Grefenstette“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5079315903“,”display_name“:”Tim Rockt\u00e4schel“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”Tim Rockt\u00 e4scheL“,”raw _affiliation_strings“:],”affiliations“:【】}】,”contries_distiction_count“:1,”corresponding_author_ids“:【],”correcponding_institution_id ds“:[],”apc_list“:{”value“:0,”currency“:”USD“,”value_USD“:0,”出处“:”doaj“},”apc_payed“:{”value“:0,”currency“:”USD“,”value_USD“:0,”出处“:”doaj“},”fwci“:24.6,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count“:30,”cited_by_percentle_year“:{”min“:99,”max“:100},”biblio“:{”volume“:”76“,”issue“:null,”first_page“:”201“,”last_page“:”264“},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.968,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.968,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.593866}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.85409725},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.69468004},{”id“:”https://openalex.org/C22019652,“wikidata”:https://www.wikidata.org/wiki/Q331309“,”display_name“:”Overfitting“,”level“:3,”score“:0.68034357},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5521947},{”id“:”https://openalex.org/C105339364,“wikidata”:https://www.wikidata.org/wiki/Q2297740“,”display_name“:”软件部署“,”级别“:2,”分数“:0.46448287},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.46407726},{”id“:”https://openalex.org/C185798385,“wikidata”:https://www.wikidata.org/wiki/Q1161707“,”display_name“:”基准(测量)“,”level“:2,”score“:0.4148683},{”id“:”https://openalex.org/C50644808,“wikidata”:https://www.wikidata.org/wiki/Q192776“,”display_name“:”人工神经网络“,”level“:2,”score“:0.2527068},{”id“:”https://openalex.org/C205649164,“wikidata”:https://www.wikidata.org/wiki/Q1071“,”display_name“:”地理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C13280743,“wikidata”:https://www.wikidata.org/wiki/Q131089网址“,”display_name“:”大地测量学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C111919701,“wikidata”:https://www.wikidata.org/wiki/Q9135“,”display_name“:”操作系统“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:3,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1613/jair.1.14174“,”pdf_url“:”https://jair.org/index.php/jair/article/download/1414/26890,“源”:{“id”:https://openalex.org/S139930977“,”“display_name”:“人工智能研究杂志/\u0098The \u009c Journal of artificial intelligence research”,“issn_l”:“1076-9757”,“isn”:[“1076-97”,“1943-5037”],“is_oa”:true,“is-in_doaj”:true,“is_core”:真,“host_organization”:“https://openalex.org/P4310315760“,”“host_organization_name”:“AI Access Foundation”,“host_organization_lineage”:[“https://openalex.org/P4310315760“],”host_organization_lineage_names“:[”AI Access Foundation“],“type”:“journal”},“license”:“publisher-specific-oa”,“licence_id”:“https://openalex.org/licenses/publisher-specific-oa“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2111.09794“,”pdf_url“:”https://arxiv.org/pdf/2111.09794,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://discovery.ucl.ac.uk/id/eprint/10169918/1/14174wPg%23s.pdf“,”pdf_url“:”https://discovery.ucl.ac.uk/id/eprint/10169918/1/14174wPg%23s.pdf,“源”:{“id”:https://openalex.org/S4306400024“,”display_name“:”UCL Discovery(伦敦大学学院)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I45129253“,”“host_organization_name”:“伦敦大学学院”,“host_ordanization_lineage”:[“https://openalex.org/I45129253“],”host_organization_lineage_names“:[”伦敦大学学院“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1613/jair.1.14174“,”pdf_url“:”https://jair.org/index.php/jair/article/download/14174/26890,“源”:{“id”:https://openalex.org/S139930977“,”“display_name”:“人工智能研究杂志/\u0098The \u009c Journal of artificial intelligence research”,“issn_l”:“1076-9757”,“isn”:[“1076-97”,“1943-5037”],“is_oa”:true,“is-in_doaj”:true,“is_core”:真,“host_organization”:“https://openalex.org/P4310315760“,”“host_organization_name”:“AI Access Foundation”,“host_organization_lineage”:[“https://openalex.org/P4310315760“],”host_organization_lineage_names“:[”AI Access Foundation“],“type”:“journal”},“license”:“publisher-specific-oa”,“licence_id”:“https://openalex.org/licenses/publisher-specific-oa“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4387297750","https://openalex.org/W4378510483","https://openalex.org/W4362597605","https://openalex.org/W4297676672","https://openalex.org/W4281702477","https://openalex.org/W2989932438","https://openalex.org/W2922073769","https://openalex.org/W2490526372","https://openalex.org/W2186333919","https://openalex.org/W1574414179“],”ngrams_url“:”https://api.openalex.org/works/W4315487473/ngrams“,”“abstract_inverted_index”:{“The”:[0],“study”:[1],“of”:[2,63108112],“zero-shot”:[3],“generalisation”:[4],“(ZSG)”:[5],“in”:[6,45141167],“deep”:[7],“钢筋”:[8],“Learning”:[9],“RL”:[10],“aims”:[11],“to”:[12,20,29,40,87133139],“product”:[13],“URL”:[14174],“算法”:[15,44],“which”:[16],“policies”:[17],“generalise”:[18],“井”:[19,94],“新颖”:[21],“看不见的”:[22],“情况”:[23],“在”:[24],“部署”:[25],“时间”:[26],“避免”:[27],“过度拟合”:[28],“他们的”:[30],“训练”:[31],“环境”。“:[32],”应对“:[33],”这“:[34,64],”是“:[35,60136],”至关重要“:[36],“如果”:[37],“我们”:[38103123143163],“是”:[39],“部署”:[41],“强化”:[42],“学习”:[43],“真实”:[46],“世界”:[47],“场景,”:[48],“其中”:[49],“the”:[50109113],“环境”:[51],“will”“:[52],”成为“:[53],”多样化“:[54],”动态“:[55],”和“:[56,73148162176],”不可预知的。“:[57],”This“:[58],”survey“:[59],”an“:[61],”overview“:[62],”nascent“:[65],”field。“:[66],“我们”:[67,84],“依赖”:[68],“on”:[69,86158],“a”:[70105127],“统一”:[71],“形式主义”:[72],“术语”:[74],“for”:[75,91,98117155160],“讨论”:[76],“不同”:[77],“ZSG”:[78175],“问题,”:[79],“建筑物”:[80165],“基于”:[81],“以前的”:[82],“作品”。“:[83],“go”:[85],“categorise”:[88],“existing”:[89],“benchmarks”:[00166],“ZSG”,“:[92142161],“as”:[93,95152172],“current”:[96110],“methods”:[97159],“taggling”:[99149],“these”:[100],“problems”。“:[101],“最后,”:[102],“提供”:[104],“关键”:[106],“讨论”:[107],“状态”:[111],“字段”:[114],“包括”:[115],“建议”:[116],“未来”:[1118156],“工作”:[119],“其中”:[120],“其他”:[121],“结论”:[122],“争论”:[124],“那”:[125],“采取”:[126],“纯粹”:[128],“程序性“:[129],”内容“:[130],”生成“:[131],”方法“:[132],”基准“:[134],”设计“:[135],”非“:[137],”有益“:[138],”进度“:[140],”建议“:[144],”快速“:[145],”在线“:[146],”适应“:[147],”特定RL“:[150],”问题“:[151],”部分“:[153],”领域“:[154],”工作“:[157],”推荐“:[164],”未充分开发“:[168],”难题“:[169],”设置“:[170],“such”:[171],“offline”:[173],“奖励函数“:[177],”变化。“:[178]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4315487473“,”counts_by_year“:[{”年份“:2024,”cited_by_count“:16},{”年“:2023,”ciped_by_cunt“:11},”{“年份”:2022,“cited_by_count”:3}],”updated_date“:“2024-07-01T16:30:49.748110”,“创建日期”:“2023-01-11”}