{“id”:“https://openalex.org/W4386794113“,”doi“:”https://doi.org/10.48550/arxiv.2309.07168“,”title“:”通过可达性分析进行分层强化学习中的目标空间抽象“,”display_name“:”基于可达性分析的分层强化学习的目标空间提取“,”publication_year“:2023,”publitation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4386794113“,”doi“:”https://doi.org/10.48550/arxiv.2309.07168“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2309.07168“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:null,”is_accepted“:false,”is_published“:false},”type“:预打印”,”type_crossref“:”journal-article“,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”青铜“,”oa_url“:”https://arxiv.org/abs/2309.07168“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5081747756“,”display_name“:”Mehdi Zadem“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Mehdi-Zadems“,”raw _affiliation_string“:[”LIX,U2IS“],”affiliation“:[{”raw_affiliation_string“:”LIX、U2IS”,“institution_ids”:[]},{”author_position“:”middle“,”author“:{”id“:“”https://openalex.org/A5023894417“,”display_name“:”Sergio Mover“,”orcid“:”https://orcid.org/0000-0003-1029-9547“},”机构“:[{”id“:”https://openalex.org/I4210139461“,”display_name“:”Laboratoire d'Informatique de l'\u00c9cole Polytechnique“,”ror“:”https://ror.org/04afed728“,”“country_code”“:”FR“,”type“:”facility“,”lineage“:[”https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I142476485","https://openalex.org/I4210139461","https://openalex.org/I4210145102","https://openalex.org/I4210159245“]}],”国家“:[”FR“],”is_corresponding“:false,”raw_author_name“:”Sergio Mover“,”raw _ afiliation_strings“:[“LIX”],”从属关系“:[{”raw_ afiliation _string“:”LIX“,”institution_ids“:[https://openalex.org/I4210139461“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5046094611“,”display_name“:”Sao Mai Nguyen“,”orcid“:”https://orcid.org/0000-0003-0929-0019“},”机构“:[{”id“:”https://openalex.org/I79172759“,”display_name“:”Lantiq(德国)“,”ror“:”https://ror.org/01bvfdq42“,”country_code“:”DE“,”type“:“company”,”lineage“:[”https://openalex.org/I79172759“]},{”id“:”https://openalex.org/I4210127572“,”display_name“:”IMT Atlastyly“,”ror“:”https://ror.org/030hj3061“,”country_code“:”FR“,”type“:“教育”,”世系“:[”https://openalex.org/I4210127572“]}],”国家“:[”DE“,”FR“],”is_corresponding“:false,”raw_author_name“:”Sao Mai Nguyen“,”raw _affiliation_strings“:[“U2IS,Flowers,IMT Atlastive-INFO,Lab-STICC_RAMBO”],”affiliations“:[{”raw _affiliation_string“:”U2IS、Flowers、IMT Atlestive-信息,Lab-SPICC_RAMBO“,“institution_ids”:[“https://openalex.org/I79172759","https://openalex.org/I4210127572“]}]}],”institution_assertions“:[],”countries_distinact_count“:2,”institutions_disticant_count”:3,”corresponding_author_ids“:[[],”corresponding_institution_ids”:[],“apc_list”:null,”apc_payed“:null”,“fwci”:null,”has_fulltext“:false,”cited_by_count“is_in_top_10_percent”:错误},“cited_by_percentile_year“:{“min”:0,“max”:71},“biblio”:{卷:null,“问题”:nullhttps://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9975,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9975,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11975“,”“display_name”:“遗传编程在机器学习中的应用”,“score”:0.975,“subfield”:{“id”:“https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9476,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/representation网站“,”display_name“:”Representation(politics)“,”score“:0.76065326},{”id“:”https://openalex.org/keywords/abstraction网站“,”display_name“:”抽象“,”分数“:0.6926485},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.586354},{”id“:”https://openalex.org/keywords/symbolic-regression网站“,”display_name“:”符号回归“,”score“:0.533705},{”id“:”https://openalex.org/keywords/language-understanding“,”display_name“:”语言理解“,”score“:0.514666},{”id“:”https://openalex.org/keywords/feature-learning“,”display_name“:”功能学习“,”score“:0.47363037}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.77164865},{”id“:”https://openalex.org/C2776359362,“wikidata”:https://www.wikidata.org/wiki/Q2145286“,”display_name“:”Representation(politics)“,”level“:3,”score“:0.76065326},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.75058305},{”id“:”https://openalex.org/C124304363,“wikidata”:https://www.wikidata.org/wiki/Q673661“,”display_name“:”抽象“,”级别“:2,”分数“:0.6926485},{”id“:”https://openalex.org/C136643341,“wikidata”:https://www.wikidata.org/wiki/Q1361526“,”display_name“:”可达性“,”级别“:2,”分数“:0.6511718},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.58022755},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”任务(项目管理)“,”级别“:2,”分数“:0.5470494},{”id“:”https://openalex.org/C2778572836,“wikidata”:https://www.wikidata.org/wiki/Q380933“,”display_name“:”空格(标点符号)“,”level“:2,”score“:0.5145023},{”id“:”https://openalex.org/C161301231,“wikidata”:https://www.wikidata.org/wiki/Q3478658“,”display_name“:”知识表示与推理“,”level“:2,”score“:0.48741463},{”id“:”https://openalex.org/C59404180,“wikidata”:https://www.wikidata.org/wiki/Q17013334“,”display_name“:”功能学习“,”level“:2,”score“:0.47363037},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.46675137},{”id“:”https://openalex.org/C107457646,“wikidata”:https://www.wikidata.org/wiki/Q207434“,”display_name“:”Human\u2013计算机交互“,”level“:1,”score“:0.3662156},{”id“:”https://openalex.org/C80444323,“wikidata”:https://www.wikidata.org/wiki/Q2878974“,”display_name“:”理论计算机科学“,”level“:1,”score“:0.34073302},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C187736073,“wikidata”:https://www.wikidata.org/wiki/Q2920921“,”display_name“:”管理“,”级别“:1,”分数“:0.0},{”id“:”https://openalex.org/C111472728,“wikidata”:https://www.wikidata.org/wiki/Q9471“,”display_name“:”认识论“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C94625758,“wikidata”:https://www.wikidata.org/wiki/Q7163“,”display_name“:”政治“,”级别“:2,”分数“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C111919701,“wikidata”:https://www.wikidata.org/wiki/Q9135“,”display_name“:”操作系统“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:3,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2309.07168“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”版本“:null,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”https://hal.science/hal-04201363,“pdf_url”:https://hal.science/hal-04201363/document“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2309.07168“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”host_organization_name“:”DataCite“,”host_organization_lineage“:[”https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2309.07168“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:null,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:【],”versions“:【】,”referenced_works_count“:0,”referrenced_works“:〔〕,”related_work“:[”https://openalex.org/W4321471459","https://openalex.org/W2889071233","https://openalex.org/W2387511021","https://openalex.org/W2380814829","https://openalex.org/W2156446763","https://openalex.org/W2150194458","https://openalex.org/W2143461633","https://openalex.org/W2136512912","https://openalex.org/W2127267268","https://openalex.org/W2067910792“],”abstract_inverted_index“:{”Open-ended“:[0],”learning“:[1],”benefits“:[2],”immensely“:[3],”from“:[4],”the“:[5,26,65,97111121],”use“:[6],”of“:[7,89],”symbol“:[8,35,53],”methods“:[9],”for“:[10,20,76],”goal“:[11,45,54],”representation“:[12,55,82108123],”as“:[13,4]0,64],“他们”:[14,41],“提供”:[15],“方式”:[16],“到”:[17119],“结构”:[18],“知识”:[19],“有效”:[21],“和”:[22113126],“可转移”:[23],“学习。“:[24],”“然而,”:[25],“现有”:[27],“分层”:[28],“强化”:[29],“学习”:[30],“(HRL)”:[31],“方法”:[32],“依赖”:[33],“on”:[34116],“推理”:[36],“are”:[37],“经常”:[38],“有限”:[39],“需要”:[42],“a”:[43,52,73101],“手动”:[44],“表示。“:[46],”The“:[47],”challenge“:[48],”in“:[49,96128],”autonomyly“:[50],”discoverying“:[51],”is“:[56124],”that“:[57,83,92104],”it“:[58115],”must“:[59],”preserve“:[60],”critical“:/61],”information“:[62],”such“:[63],”environment“:[66,90],”dynamics“。“:[67],“In”:[68],“this”:[69107],“work”,:[70],“we”:%71],“propose”:[72],“developmental”:[74],“mechanism”:[75],“subgoal”:[77],“discovery”:【78】,“via”:【79】,“an”:【80】,“emergent”:【81】,“abstracts”:【84】,“(即,“:[85],”groups“:【86】,“together”)”:【87】,“set”:【88】,“状态”:[91],“有”:[93],“类似”:[94],“角色”:[95],“任务”。“:[98],“我们”:[99],“创建”:[100],“HRL”:[102],“算法”:[103],“逐步”:[105],“学习”:[106],“沿着”:[109],“with”:[110],“策略”:[112],“评估”:[114],“导航”:[117],“任务”:[118],“显示”:[120],“学会”:[122],“可解释”:[125],“结果”:[127],“数据”:[129],“效率”。“:[130]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4386794113“,”counts_by_year“:[],”updated_date“:”2024-09-16T09:24:00.634909“,”created_date:“2023-09-16”}“