{“id”:“https://openalex.org/W3034528880“,”doi“:”https://doi.org/10.24963/ijcai.2020/280“,”title“:”IR-VIC:在RL中无监督地发现要转移的子目标“,”display_name“:”IR-VIC:在RL中无监督地发现要转移的子目标“,”publication_year“:2020,”publication_date“:”2020-07-01“,”ids“:{”openalex“:”https://openalex.org/W3034528880“,”doi“:”https://doi.org/10.24963/ijcai.2020/280“,”mag“:”3034528880“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.24963/ijcai.2020/280,“pdf_url”:https://www.ijcai.org/proceedings/2020/0280.pdf“,”“source”“:null,”“license”“:null,”“license_id”“:null,”version“:”publishedVersion“,”is_accepted“:true,”“is_published”“:true},”type“:”preprint“,”type_crossref“:“proceedings-article”“,”indexed_in“:[”arxiv“,”crossref“,”datacite“],”open_access“:{”is_oa“:true,”“oa_status”:”青铜“,”oa_url“:”https://www.ijcai.org/proceedings/2020/0280.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5054644876“,”display_name“:”Nirbhay Modhe“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]}],”国家“:[“美国”],”is_corresponding“:false,”raw_author_name“:”Nirbhay Modhe“,”raw _ afiliation_strings“:[”佐治亚理工学院“],”affiliations“:[{”raw_ afiliation _string“:”佐治雅理工学院”,“institution_ids”:[”https://openalex.org/I130701444“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5029904363“,”display_name“:”Prithvijit Chattopadhyay“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”Prithvijit Chattopadhyay“,”raw _ afiliation_strings“:[“佐治亚理工学院”],”affiliations“:[{”raw_ afiliation _string“:”佐治亚工学院“,”institution_ids“:[https://openalex.org/I130701444“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5102792137“,”display_name“:”Mohit Sharma“,”orcid“:”https://orcid.org/0000-0002-5680-9111},“机构”:[{“id”:https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”Mohit Sharma“,”raw _affiliation_strings“:[“佐治亚理工学院”],”affiliations“:[{”raw _affiliation_string“:”佐治亚工学院“,”institution_ids“:[https://openalex.org/I130701444“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5102972112“,”display_name“:”Abhishek Das“,”orcid“:”https://orcid.org/0000-0002-4718-4316},“机构”:[{“id”:https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”Abhishek Das“,”raw_affiliation_strings“:[“佐治亚理工学院”],”affiliations“:[{”raw_affiliation_string“:”佐治亚工学院“,”institution_ids“:[https://openalex.org/I130701444“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5050342343“,”display_name“:”Devi Parikh“,”orcid“:”https://orcid.org/0000-0002-3779-6706},“机构”:[{“id”:https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]},{”id“:”https://openalex.org/I2252078561“,”display_name“:”Meta(以色列)“,”ror“:”https://ror.org/02388em19“,”country_code“:”IL“,”type“:“company”,”lineage“:[”https://openalex.org/I2252078561","https://openalex.org/I4210114444“]}],”国家“:[”IL“,”US“],”is_corresponding“:false,”raw_author_name“:”Devi Parikh“,”raw _affiliation_strings“:[“Facebook AI Research”,“乔治亚理工学院”],”affiliations“:[{”raw _affiliation_string“:”佐治亚理工大学“,”institution_ids“:[”https://openalex.org/I130701444“]},{”raw_affiliation_string“:”Facebook AI Research“,”institution_ids“:[”https://openalex.org/I2252078561“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5014035752“,”display_name“:”Dhruv Batra“,”orcid“:”https://orcid.org/0000-0002-1358-0011},“机构”:[{“id”:https://openalex.org/I130701444“,”display_name“:”佐治亚理工学院“,”ror“:”网址:https://ror.org/01zkghx44“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I130701444“]},{”id“:”https://openalex.org/I2252078561“,”display_name“:”Meta(以色列)“,”ror“:”https://ror.org/02388em19“,”country_code“:”IL“,”type“:“company”,”lineage“:[”https://openalex.org/I2252078561","https://openalex.org/I4210114444“]}],”国家“:[”IL“,”US“],”is_corresponding“:false,”raw_author_name“:”Dhruv Batra“,”raw _affiliation_strings“:[“Facebook AI Research”,“Georgia Institute of Technology”],“affiliations”:[{“raw _afiliation_string”:“Georgiation institution_ids”:[”https://openalex.org/I130701444“]},{”raw_affiliation_string“:”Facebook AI Research“,”institution_ids“:[”https://openalex.org/I2252078561“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5041797310“,”display_name“:”Ramakrishna Vedantam“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I2252078561“,”display_name“:”Meta(以色列)“,”ror“:”https://ror.org/02388em19“,”country_code“:”IL“,”type“:“company”,”lineage“:[”https://openalex.org/I2252078561","https://openalex.org/I4210114444“]}],”国家“:[”IL“],”is_corresponding“:false,”raw_author_name“:”Ramakrishna Vedantam“,”raw _ afiliation_strings“:[“Facebook AI Research”],”从属关系“:[{”raw _affiliation_string“:”Facebook AI研究“,”institution_ids“:[https://openalex.org/I2252078561“]}]}],”institution_assertions“:[],”countries_distiction_count“:2,”institutions_disticent_count”:2,“corresponding_author_ids”:[]、“corresconding_institution_ids“:[[],”apc_list“:null,”apc _payed“:nul,”fwci“:null,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count:2、“citation_normalized_percentile”:{“value”:0.50103,““is_in_top_1_percent”:假,“is_in_top_10_percent“:false},”cited_by_percentile_year“:{”min“:70,”max“:75},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},,“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9969,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9969,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12761“,”“display_name”:“适应数据流中的概念漂移”,“score”:0.9943,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11303“,”“display_name”:“贝叶斯网络中的学习和推理”,“score”:0.991,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/observability网站“,”display_name“:”Observability“,”score“:0.90430593},{”id“:”https://openalex.org/keywords/sample-complexity网站“,”display_name“:”示例复杂性“,”score“:0.62319905},{”id“:”https://openalex.org/keywords/change-detection网站“,”display_name“:”更改检测“,”score“:0.525609},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.523466},{”id“:”https://openalex.org/keywords/incremental-learning网站“,”display_name“:”增量学习“,”score“:0.519266},{”id“:”https://openalex.org/keywords/adaptive-algorithms网站“,”display_name“:”自适应算法“,”score“:0.515576},{”id“:”https://openalex.org/keywords/structure-learning(https://openalex.org/关键词/结构学习)“,”display_name“:”Structure Learning“,”score“:0.514007}],”concepts“:[{”id“:”https://openalex.org/C36299963,“wikidata”:https://www.wikidata.org/wiki/Q1369844“,”display_name“:”Observability“,”level“:2,”score“:0.90430593},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6830721},{”id“:”https://openalex.org/C2778445095,“wikidata”:https://www.wikidata.org/wiki/Q18354077“,”display_name“:”示例复杂性“,”level“:2,”score“:0.62319905},{”id“:”https://openalex.org/C187691185,“wikidata”:https://www.wikidata.org/wiki/Q2020720“,”display_name“:”Grid“,”level“:2,”score“:0.5469005},{”id“:”https://openalex.org/C177264268,“wikidata”:https://www.wikidata.org/wiki/Q1514741“,”display_name“:”Set(abstract data type)“,”level“:2,”score“:0.53211695},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.45701838},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.42927703},{”id“:”https://openalex.org/C2775924081,“wikidata”:https://www.wikidata.org/wiki/Q55608371“,”display_name“:”Control(management)“,”level“:2,”score“:0.41584814},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395网址“,”display_name“:”数学“,”等级“:0,”分数“:0.16366187},{”id“:”https://openalex.org/C2524010,“wikidata”:https://www.wikidata.org/wiki/Q8087“,”display_name“:”Geometry“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C28826006,“wikidata”:https://www.wikidata.org/wiki/Q33521“,”display_name“:”应用数学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:4,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.24963/ijcai.2020/280,“pdf_url”:https://www.ijcai.org/proceedings/2020/0280.pdf“,”source“:null,”license“:null,”license_id“:null,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”http://arxiv.org/abs/1907.10580,“pdf_url”:http://arxiv.org/pdf/1907.10580,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/1907.10580,“pdf_url”:https://arxiv.org/pdf/1907.10580,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.48550/arxiv.1907.10580“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.24963/ijcai.2020/280,“pdf_url”:https://www.ijcai.org/proceedings/2020/0280.pdf“,”source“:null,”license“:null,”license_id“:null,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/16“,”score“:0.79,”display_name“:”和平、正义和强大的机构“}],”grants“:[],”datasets“:[],”versions“:[”https://openalex.org/W3034528880","https://openalex.org/W3101757010“],”referenced_works_count“:31,”referrenced_works“:[”https://openalex.org/W1686946872","https://openalex.org/W172298727","https://openalex.org/W1786044565","https://openalex.org/W187288179","https://openalex.org/W1970302770","https://openalex.org/W2044442377","https://openalex.org/W2098774185","https://openalex.org/W2099111195","https://openalex.org/W2115807451","https://openalex.org/W2117533361","https://openalex.org/W2143435603","https://openalex.org/W2160589914","https://openalex.org/W2173248099","https://openalex.org/W2398870399","https://openalex.org/W2556477470","https://openalex.org/W2592215206","https://openalex.org/W2735995851","https://openalex.org/W2753738274","https://openalex.org/W28829877577","https://openalex.org/W2883433335","https://openalex.org/W288600153","https://openalex.org/W2913854057","https://openalex.org/W2950152428","https://openalex.org/W2963199420","https://openalex.org/W2963343988","https://openalex.org/W2963438456","https://openalex.org/W2964009285","https://openalex.org/W2964160479","https://openalex.org/W4290994727","https://openalex.org/W4293469690","https://openalex.org/W4294351673“],”related_works“:[”https://openalex.org/W4312300846","https://openalex.org/W4206221578","https://openalex.org/W3157641275","https://openalex.org/W3029572990","https://openalex.org/W2967463586","https://openalex.org/W2765830098","https://openalex.org/W2615757685","https://openalex.org/W2517338020","https://openalex.org/W2046459260","https://openalex.org/W1971989957“],”abstract_inverted_index“:{”We“:[0,19],”propose“:[1],”a“:[2,38],”novel“:[3],”framework“:[4,25],”to“:[5,35,46,82],”identified“:[6,47],”sub-goals“:[7,48,69],”有用“:[8],”for“:[9],“exploration”:[10,72],”in“:[11,85],”sequential“:[12],”decision“:[13],”making“:[14],“tasks”:[15,80],“under”:[16],“partial”:[17],“observability”:[18],“use”:[20],““:[21,33],“变化”:[22],“内在”:[23],“控制”:[24],“(格雷戈”:[26],“et.al.,”:[27],“2016)”:[28],“其中”:[29],“最大化”:[30],“赋权”:[31],“--”:[32],“能力”:[34],“可靠”:[36],“到达”:[37],“多样”:[39],“集合”:[40],“of”:[41],“状态”:[42,50],“and”:[43,73],“show”:[44],“how”:%45],“as”:[49],“with”:[51],“high”:[52],“necessary”:[53],“选项”:[54],“信息”:[55,58],“通过”:[56],“an”:[57],“理论”:[59],“正则化器”:[60],“尽管”:[61],“存在”:[62],“发现”:[63],“没有”:[64],“显式”:[65],“目标”:[66],“监督”:[67],“我们的”:[68],“提供”:[70],“更好”:[71],“样本”:[74],“复杂性”:[75],“on”:[76],“challenge”:[77],“grid-world”:[78],“navigation”:[79],“已比较”:[81],“受监督”:[83],“同行”:[84],“先前”:[86],“工作。”:[87]},“cited_by_api_url”:“https://api.openalex.org/works?filter=引用:W3034528880“,”counts_by_year“:[{”年“:2022,”引用_by_count“:2}],”更新日期“:”2024-09-15T11:49:24.657171“,”创建日期“:“2020-06-19”}