{“id”:“https://openalex.org/W4281986404“,”doi“:”https://doi.org/10.48550/arxiv.2205.14205“,”title“:”ALMA:复合多代理任务的分层学习“,”display_name“:”ALMA:复合多重代理任务的层次学习“,“publication_year”:2022,”publication_date“:”2022-01-01“,”ids“:{”openalex“:”https://openalex.org/W4281986404“,”doi“:”https://doi.org/10.48550/arxiv.2205.14205“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2205.14205“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],”type“:”repository“},”license“:”抄送人“,”license_id“:”https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2205.14205“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5036422995“,”display_name“:”Shariq Iqbal“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Iqball,Shariq“,”raw _affiliation_strings“:],”affiliations“:【】},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5049051691“,”display_name“:”Robby Costales“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Costales,Robby“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5021516103“,”display_name“:”飞沙“,”兽人“:”https://orcid.org/0000-0002-5115-2229“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:Sha,Fei”,“raw_affiliation_strings”:[],“从属关系”:[]}],“countries_distict_count”:0,“institutions_disticenc_count”:“0,”corresponding_author_ids“:[]”,“correspounding_institution_ids”:[]、“apc_list”:null,“apc_payed”:nul,“fwci”:0.665,“has”_fulltext“:false,”cited_by_count“:2,”cited_by_percentile_year“:{“min”:76,“max”:81},“biblio”:{”volume“:null,“issue”:null、“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9845,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9845,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12026“,”display_name“:”可解释人工智能“,”score“:0.9178,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.560022},{”id“:”https://openalex.org/keywords/multi-gent-systems网站“,”display_name“:”Multi-Agent Systems“,”score“:0.545884},{”id“:”https://openalex.org/keywords/responsibility-in-ai“,”display_name“:”AI中的责任“,”score“:0.503805}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.74932015},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7192023},{”id“:”https://openalex.org/C2779478453,“wikidata”:https://www.wikidata.org/wiki/Q6889748“,”display_name“:”模块化(生物学)“,”level“:2,”score“:0.59665924},{”id“:”https://openalex.org/C2776760102,“wikidata”:https://www.wikidata.org/wiki/Q5139900“,”“display_name”“:”代码(集合论)“,”级别“:3,”分数“:0.48376775},{”id“:”https://openalex.org/C2780791683,“wikidata”:https://www.wikidata.org/wiki/Q846785“,”display_name“:”Action(physical)“,”level“:2,”score“:0.42738786},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.42722753},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.35955432},{”id“:”https://openalex.org/C120314980,“wikidata”:https://www.wikidata.org/wiki/Q180634“,”display_name“:”分布式计算“,”level“:1,”score“:0.33533257},{”id“:”https://openalex.org/C177264268,“wikidata”:https://www.wikidata.org/wiki/Q1514741“,”display_name“:”Set(abstract data type)“,”level“:2,”score“:0.19957721},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.14655802},{”id“:”https://openalex.org/C54355233,“wikidata”:https://www.wikidata.org/wiki/Q7162“,”display_name“:”Genetics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”Biology“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:3,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2205.14205“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”http://arxiv.org/abs/2205.14205,“pdf_url”:http://arxiv.org/pdf/2205.14205,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.48550/arxiv.2205.14205“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”host_organization_name“:”DataCite“,”host_organization_lineage“:[”https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2205.14205“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],”type“:”repository“},”license“:”抄送人“,”license_id“:”https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”display_name“:”减少不平等“,”id“:”https://metadata.un.org/sdg/10“,”score“:0.51},{”display_name“:”和平、正义和强大的机构“,”id“:”https://metadata.un.org/sdg/16“,”score“:0.5}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:0,”referrenced_works“:[],”related_work“:[”https://openalex.org/W4316651471","https://openalex.org/W4230687177","https://openalex.org/W3120118008网址","https://openalex.org/W3005557527","https://openalex.org/W2367249529","https://openalex.org/W2349859869","https://openalex.org/W2088885441","https://openalex.org/W2051365847","https://openalex.org/W2027187261","https://openalex.org/W1968829728“],”ngrams_url“:”https://api.openalex.org/works/W4281986404/ngrams网站“,”“abstract_inverted_index”:{“尽管”:[0],“重要”:[1],“进步”:[2],“开启”:[3,23,62],“多智能体”:[4],“强化”:[5],“学习”:[6147],“(MARL)”:[7],“in”:[8,12,19,35,71176],“最近”:[9],“年”:[10],“协调”:[1174],“复杂”:[13],“域”:[14],a“:[1610145159177],”挑战。“:[17],”工作“:[18],”MARL“:[20],”经常“:[21,45,81],”焦点“:[22],”解决“:[24],”任务“:[25,43],”其中“:[26],”代理“:[27,32,89],”交互“:[28],”与“:[29],”全部“:[30,69219],“其他”:[31],”和“:[33,56,95120127164208],”实体“:[34],”the“:[36,72211],”环境;“:[37],”然而,“:[38],”我们“:[39198],”观察“:[40],”那“:[41170200],”现实世界“:[42],”是“:[44,90],”组合“:[46128],”的“:[47,51,68,87138152179],”多个“:[48],”隔离“:[49],”实例“:[50],”本地“:[52],”代理“:[53,58,97117166],”交互“:[54],”(子任务),“:[55],“每个”:[57,96135],“可以”:[59,80203],“有意义的”:[60],“focus“:[61],”one“:[63],”subtask“:[64103161],”to“:[65,9124133190193],”exclusion“:[67],”else“:[70],”environment。“:[73],“In”:[74],“these”:[75153],“composite”:[76],“tasks”,:[77],“successful”:[78],“policies”:[79123],“be”:[82125],“decomposed”:[83106],“into”:[84],“two”:【85】,“levels”:【86】,“decision:”:【88】,“allocated”:【91】,“specific”:【93】,“subtask”:[94139],“acts”:[98],“productive”:【99】],“朝向”:[100],“他们的”:[101],“分配的”:%102],“单独。“:[104],”This“:[105],”decision“:[107],”making“:[108],”provides“:[109],”strong“:[111183],”structural“:[112],”inductive“:[113],”bias“:[114],”显着“:[115],”reduced“:[116],”observation“:[118],”spaces“:[119],”鼓励“:[121],”特定子任务“:[122],”重用“:[126],”在“:[129],”培训“:[130],”作为“:[131140],”反对“:[132],”处理”:[134],“新”:[136194],“组成”:[137],“独特”。“:[141],”我们“:[142168],”介绍“:[143],”ALMA,“:[144],”一般“:[146],”方法“:[148],”对于“:[149],”采取“:[150],”优势“:[151],”结构化“:[154],”任务。“:[155],”ALMA“:[156171202],”同时“:[157],”学习“:[158172],”高级“:[160],”分配“:[162207],”策略“:[163],”低级“:[165],”政策。“:[167],”演示“:[169],”复杂“:[173],”行为“:[175],”数字“:[178],”挑战“:[180],”环境“:[181],”超越“:[182],”基线。“:[184],”ALMA’s“:[185],”模块化“:[186],”也“:[187],”启用“:[188],”it“:[189],”更好“:[191],”泛化“:%192],”环境“:[195],”配置。“:[196],”最后,“:[197],”查找“:[199],”while“:[201],”集成“:[204],”分别“:[205],”训练“:[206],”动作“:[209],”策略“:[210],”最佳“:[212],”性能“:[213],”是“:[214224],”获得“:[215],”仅“:[216],”通过“:[217],”培训“:[218],”组件“联合。“:[221],”我们的“:[222],”代码“:[223],”可用“:[225],”在“:[226],”https://github.com/shariqiqbal2810/ALMA网站“:[227]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4281986404“,”counts_by_year“:[{”年份“:2024,”cited_by_count“:1},{”年“:2023,”cited_by_count”:1}],”更新日期“:”2024-06-24T12:19:53.116701“,”创建日期“:“2022-06-13”}