{“id”:“https://openalex.org/W4285429144“,”doi“:”https://doi.org/10.48550/arxiv.2207.05219“,”title“:”无监督环境设计中的基于Aleatory不确定性“,”display_name“:”非监督环境设计的基于Aleotory不确定“,”publication_year“:2022,”publiation_date“:”2022-01-01“,”ids“:{”openalex“:”https://openalex.org/W4285429144“,”doi“:”https://doi.org/10.48550/arxiv.2207.05219“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2207.05219“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2207.05219“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5017949957“,”display_name“:”Minqi Jiang“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Jiang,Minqi“,”raw _affiliation_strings“:],”affiliations“:【】},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5011988886“,”display_name“:”Michael Dennis“,”orcid“:”https://orcid.org/0000-0002-8175-5311“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”Dennis,Michael“,”raw_affiation_strings“:[],”附属机构“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5083828420“,”display_name“:”Jack Parker-Holder“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Parker-Helder,Jack“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5086769710“,”display_name“:”Andrei N.Lupu“,”orcid“:null},”institutions“:[],”countries“:[],”is_correresponsing“:false,”raw_author_name“:”Lupu,Andrei“,”raw_affiation_strings“:[],”affiliations“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5004147468“,”display_name“:”Heinrich K\u00fcttler“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”K\u00 fcttler,Heinrich“,”raw _affiliation_strings“:],”afliations“:【】},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5023508792“,”display_name“:”Edward Grefenstette“,”orcid“:”https://orcid.org/0000-0003-1164-8809“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Grefenstette,Edward“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5079315903“,”display_name“:”Tim Rockt\u00e4schel“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”Rockt\u 00e4schel,Tim“,”raw _affiliation_strings“:],”afliations“:【】},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5059094093“,”display_name“:”Jakob Foerster“,”orcid“:”https://orcid.org/0000-0001-9688-2498“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Foerster,Jakob“,”raw _ afiliation_strings“:[],“隶属关系”:[]}],“countries _ distinct _count”:0,“institutions _ disting _count“:0,”corresponding_author_ids“:[】,“correspounding _ institution_ids”:[].,“apc _ list”:null,“apc_payed”:null.,“fwci”:0.3 36,“has_fulltext”:假,“cited_by_count“:1,”cited_by_percentile_year“:{“min”:66,“max”:76},“biblio”:{”volume“:null,“issue”:null、“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T12101“,”“display_name”:“多臂盗贼问题的优化”,“score”:0.9962,“subfield”:{“id”:“https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”field“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”display_name“:”社会科学“}},”主题“:[{”id“:”https://openalex.org/T12101“,”display_name“:”多武装匪徒问题的优化“,”score“:0.9962,”subfield“:{”id“:”https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”field“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”“display_name”:“社会科学”}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9937,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10603“,”display_name“:”智能电网中的需求响应“,”score“:0.9765,”subfield“:{”id“:”https://openalex.org/subfields/2208“,”display_name“:”电气与电子工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.543254},{”id“:”https://openalex.org/keywords/convex优化“,”display_name“:”凸优化“,”score“:0.521139},{”id“:”https://openalex.org/keywords/regret-analysis网站“,”display_name“:”遗憾分析“,”score“:0.513373}],”concepts“:[{”id“:”https://openalex.org/C50817715,“wikidata”:https://www.wikidata.org/wiki/Q79895177“,”display_name“:”遗憾“,”等级“:2,”分数“:0.711068},{”id“:”https://openalex.org/C63479239,“wikidata”:https://www.wikidata.org/wiki/Q7353546“,”display_name“:”健壮性(进化)“,”level“:3,”score“:0.68990105},{”id“:”https://openalex.org/C146849305,“wikidata”:https://www.wikidata.org/wiki/Q370766“,”display_name“:”基本事实“,”level“:2,”score“:0.6532455},{”id“:”https://openalex.org/C149728462,“wikidata”:https://www.wikidata.org/wiki/Q751319“,”display_name“:”Minimax“,”level“:2,”score“:0.6462206},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6003238},{”id“:”https://openalex.org/C47177190,“wikidata”:https://www.wikidata.org/wiki/Q207137网址“,”display_name“:”课程“,”级别“:2,”分数“:0.5634059},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.53726214},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.483858},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.39224043},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.35058358},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.1999268},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.1625979},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.08946505},{”id“:”https://openalex.org/C55493867,“wikidata”:https://www.wikidata.org/wiki/Q7094“,”display_name“:”生物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C104317684,“wikidata”:https://www.wikidata.org/wiki/Q7187“,”display_name“:”Gene“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:3,”locations“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2207.05219“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”http://arxiv.org/abs/2207.05219,“pdf_url”:http://arxiv.org/pdf/2207.05219,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.48550/arxiv.2207.05219“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2207.05219“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4376155396","https://openalex.org/W4292701710","https://openalex.org/W4200062060","https://openalex.org/W2971351794","https://openalex.org/W2527791220","https://openalex.org/W2174986909","https://openalex.org/W2155070487","https://openalex.org/W2101991911","https://openalex.org/W1947085858","https://openalex.org/W1925875298“],”ngrams_url“:”https://api.openalex.org/works/W4285429144/ngrams网站“,”abstract_inverted_index“:{”适应性“:[0],”课程“:[1,30],”in“:[2,47,66,93],”强化“:[3],”学习“:[4,73],”(RL)“:[5],”have“:[6],”proved“:[7],”effective“:[8],”for“:[9],”生产“:[10],”策略“:[11,53],”robust“:[12,42],”to“:[13,38,98139],”差异“:[14],“协议双方”:[15],“协议方”:[16,22,57,64,67,76106110126132154161],“列车“:[17],”和“:[18,88143],”测试“:[19],”环境。“:[20],”最近,“:[21],”未监督“:[23],”环境“:[24],”设计“:[25],”(UED)“:[26],”框架“:[27],”广义“:[28],”RL“:[29],”生成“:[32],”序列“:[33],”的“:[34,63164],”整体“:[35],”环保“:[36],”领先“:[37],”新“:[39],”方法“:[40],”with“:[41],“minimax”:[43120],“遗憾”:[44121],“属性”。“:[45],”问题,“:[46],”部分可观测“:[48],”或“:[49],”随机“:[50],”设置“,:[51],”最佳“:[52],”可能“:[54],”依赖“:[55],”on“:[56145],”接地“:[58107127155],”分布“:[59108],”超过“:[60],”任意“:[61,94],”参数“:[62,95104],”环境“:[65104]165],“预期”:[68],“部署”:[69],“设置”:[70],“while“:[71157],”课程“:[72114],”必然“:[74],”轮班“:[75],”培训“:[77134],”分配。“:[78],“我们”:[79116141],“形式化”:[80],“这个”:[81],“现象”:[82],“作为”:[83],“课程诱导”:[84],“协变量”:[85],“移位”:[86],“(CICS),”:[87],“描述”:[89],“如何”:[90],“它的”:[91],“发生”:[92],“可以”:[96],“领先”:[97],“次优”:[99],”政策。“:[100],”直接“:[101],”采样“:[102],”这些“:[103],”来自“:[105],”避免“:[109],”问题“:[111],”但是“:[112],”阻碍“:[113],”学习。“:[115],”propose“:[117],”SAMPLR“:[118],”a“:[119],”UED“:[122],”method“:[123],”that“:[124148],”optimizes“:[125],”utility“:[128],”function“:[129],”even“:[130],”when“:[131],”underfund“:[133],”data“:%135],”is“:[136],”bipeded“:[137],”due“:%138],”CICS。“:[140],”证明“:[142],”验证“:[144],”挑战“:[146],”域“:[147],”我们的“:[149],”方法“:[150],”保留“:[151],”优化“:[152],”低于“:[153],”分布“:[156],”提升“:[158],”健壮性“:[159],”跨越“:[160],”完整“:[162],”范围“:[163],”设置。“:[166]},”cited_by_api_url“:”https://api.openalex.org/works?filter=引用:W4285429144“,”counts_by_year“:[{”年“:2023,”cited_by_count“:1}],”更新日期“:”2024-06-25T12:13:50.988562“,”创建日期“:“2022-07-15”}“