{“id”:“https://openalex.org/W4391988133“,”doi“:”https://doi.org/10.48550/arxiv.2402.12181“,”title“:”在深度强化学习中重温数据增强“,”display_name“:”重温深度强化学习的数据增强“、”publication_year“:2024,”publication_date“:”2024-02-19“,”ids“:{”openalex“:”https://openalex.org/W4391988133“,”doi“:”https://doi.org/10.48550/arxiv.2402.12181“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2402.12181,“pdf_url”:https://arxiv.org/pdf/2402.12181,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”type“:”preprint“,”type_crossref“:“posted-content”,“indexed_in”:[”arxiv“],‘open_access’:{”is_oa“:true,”“oa_status”:“green”,“oa_url”:“https://arxiv.org/pdf/2402.12181“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5051535552“,”display_name“:”Jianshu Hu“,”orcid“:”https://orcid.org/0000-0003-1384-7465“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”胡建树“,”raw _ afiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5031855517“,”display_name“:”Yunpeng Jiang“,”orcid“:”https://orcid.org/0000-0003-4229-0301“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”江,云鹏“,”raw关联字符串“:[],“隶属关系”:[]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5073106112“,”display_name“:”Paul Weng“,”orcid“:”https://orcid.org/0000-0002-2008-4569“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:Weng,Paul”,“raw_affiliation_strings”:[]_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:91},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.389,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.389,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.603492},{”id“:”https://openalex.org/keywords/deep-learning(https://openalex.org/keywords/deep-learning)“,”display_name“:”Deep Learning“,”score“:0.510483}],”concepts“:[{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.6574001},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.6231404},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.3969367},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.38196582},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.3753073},{”id“:”https://openalex.org/C180747234,“wikidata”:https://www.wikidata.org/wiki/Q23373“,”display_name“:”认知心理学“,”level“:1,”score“:0.3666903},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.19872364}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2402.12181,“pdf_url”:https://arxiv.org/pdf/2402.12181,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2402.12181,“pdf_url”:https://arxiv.org/pdf/2402.12181,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[],“grants”:[]https://openalex.org/W4310083477","https://openalex.org/W2920061524","https://openalex.org/W2748952813","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2089013912","https://openalex.org/W2072376847","https://openalex.org/W2038908348","https://openalex.org/W1987513656","https://openalex.org/W1977959518“],”ngrams_url“:”https://api.openalex.org/works/W4391988133/ngrams网站“,”“abstract_inverted_index”:{“各种”:[0],“数据”:[1,21102118],“增强”:[2,22103119],“技术”:[3],“有”:[4],“曾经”:[5],“最近”:[6],“提议”:[7136],“in”:[8105120137176188],“基于图像”:[9],“深度”:[10],“强化”:[11],“学习”:[12],“(DRL)。”:[13],“尽管”:[14],“他们”:[15,54],“经验上”:[16],“演示“:[17170],”the“:[18,60,63,68,78107148],”effectives“:[19],”of“:[20,62,67,72,80150],”for“:[23],”improvement“:[24],”sample“:[25182],”enficiency“:[26183],”or“:[27],”generalization“:[28],”which“:[29],“technology”:[30],“should”:[31],“be”:[32,97],“preferred”:[33],“is”:[34145],“not”:[35],“always”:[36],“clear”。“:[37],”To“:[38],”toll“:[39],”this“:[40],”question“,”[41],“we”:[42,75127169],”analyze“:[43,77],”existing“:[44],”methods“:[45,95],”To“:[46,51116143147165],”better“:[47185],”understand“:[48],”them“:[49],”and“:[50,65,84157179184],”discover“:[52],”how“:[53,93]115],“are”:[55],“connected”。“:[56],“值得注意”:[57],“by”:[58,99],“expressing”:[59],“variance”:[61],“Q-targets”:[64],“that”:[66171],“empirical”:[69],“actor/critic”:[70],“loss”:[71],“these”:[73,94],“methods”:[74],“can”:[76],“effects”:[%9],“thers”:+81],“different”:[82101166],“component”:[83],“比较“:[85]”。“:[86],“我们”:[87153],“此外”:[88],“制定”:[89],“一个”:[90],“解释”:[91],“关于”:[92],“可能”:[96],“受影响”:[98],“选择”:[100],“转换”:[104],“计算”:[106],“目标”:[108],“Q值。“:[109],”This“:[110],”analysis“:[11160],”suggests“:[112],”recommensions“:[113],”on“:[114],”exploit“:[117],”a“:[12129],”more“:[122],”principled“:[123],”way。“:[124],”In“:[125],”addition“:/126],”include“:[128],”regulationation“:[130],”term“:[131],”called“:/132],”tangent“:[133],”prop“:[134],”previous“:[135],”computer“:%138],”vision“:[139],”but“:-140],”which“:[141],”adaptation“[142],”DRL“:[144],”novel“novel”:[146],”best“:[149],”我们的“:[151155159],”知识。“:[152],”评估“:[154],”命题“:[156],”验证“:[158],”多个“:[162],”域。“:[163],”比较“:[164],”相关“:[167],”基线“:[168],”it“:[172],”实现“:[173],”最先进“:[174],”性能“:[175],”大多数“:[177],”环境“:[178],”显示“:[180],”较高“:[181],”概括“:[186],”能力“:[187],”部分“:[189],”复杂“:[190],”环保。“:[191]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4391988133“,”counts_by_year“:[],”updated_date“:”2024-06-24T12:29:14.905863“,”created_date“:”2024-02-21“}