{“id”:“https://openalex.org/W4220779439“,”doi“:”https://doi.org/10.1145/3517207.3526968“,”title“:“时态移位强化学习”,”display_name“:”时态移位加强学习“,”publication_year“:2022,”publiation_date“:”2022-04-05“,”ids“:{”openalex“:”https://openalex.org/W4220779439“,”doi“:”https://doi.org/10.1145/3517207.3526968“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1145/3517207.3526968“,”pdf_url“:null,”source“:nul,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“proceedings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”“oa_url”:“”http://arxiv.org/pdf/2109.02145“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5007430044“,”display_name“:”Deepak George Thomas“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Deepak George-Thomas”,“raw_affiliation_strings”:[“Department of Computer Science”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5017176660“,”display_name“:”Tichakorn Wongpiromsarn“,”orcid“:”https://orcid.org/0000-0002-3977-122X“},”机构“:[],”国家“:[】,”is_corresponding“:false,”raw_author_name“:”Tichakorn Wongpiromsarn“,”raw _ afiliation_strings“:[”计算机科学部“]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5079359777“,”display_name“:”Ali Jannesari“,”orcid“:”https://orcid.org/0000-0001-8672-5317“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Ali Jannesari“,”raw关联字符串“:[”计算机科学部“]}],”countries_distict_count“:0,”institutions_disticent_count“:O,”corresponding_author_ids“:[],“correspounding_institution_ids”:[]“apc_list”:null,“apc_payed”:nul,“has_fulltext”:false“cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:67},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T12794“,”“display_name”:“最优控制的自适应动态规划”,“score”:0.9617,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T12794“,”“display_name”:“最优控制的自适应动态规划”,“score”:0.9617,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T14011“,”“display_name”:“电梯交通控制系统优化”,“score”:0.9418,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9337,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.580127},{”id“:”https://openalex.org/keywords/dep-learning网站“,”display_name“:”深度学习“,”score“:0.50615},{”id“:”https://openalex.org/keywords/adaptive-dynamic-programming(https://openalex.org/keywords/adaptive-dynamic-programming)“,”display_name“:”自适应动态编程“,”score“:0.503796}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.73219067},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6596229},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.41953555}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1145/3517207.3526968“,”pdf_url“:null,”source“:null,”license“:nully,”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url”:“http://arxiv.org/abs/2109.02145,“pdf_url”:http://arxiv.org/pdf/2109.02145,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“http://arxiv.org/abs/2109.02145,“pdf_url”:http://arxiv.org/pdf/2109.02145,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[],“grants”:[]、“datasets”:[],“versions”:[】,“referenced_works_count”:13,“referrenced_works”:https://openalex.org/W1522734439","https://openalex.org/W2016053056","https://openalex.org/W2145339207","https://openalex.org/W2507009361","https://openalex.org/W2529601334","https://openalex.org/W2596585349","https://openalex.org/W2746553466","https://openalex.org/W2770804203","https://openalex.org/W2799176631","https://openalex.org/W2963524571","https://openalex.org/W2968883249","https://openalex.org/W2990152177","https://openalex.org/W3011985620“],”related_works“:[”https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2001405890“],”ngrams_url“:”https://api.openalex.org/works/W4220779439/ngrams网站”,“abstract_inverted_index”:{“The”:[0],“function”:[1],“approximators”:[2],“employed”:[3],“by”:[4],“traditional”:[5],“image-based”:[6],“Deep”:[7],“Reinforcement”:[8,32],“Learning”:[9,33],“(DRL)”:[10],“algorithms”:[11],“normal”:[12],“lack”:[13],“a”:[14,28],“temporal”:[15,5]5],“学习”:[16,22],“组成部分”:[17],“和”:[18],“改为”:[19],“专注”:[20],“on”:[21,68,76],“the”:[23,62,71,79,92],“spatial”:[24,41],“component.”:[25],“We”:[26,57],“propose”:[27],“technology”:[29],“Temporal”:[30],“Shift”:[31],“(TSRL),”:[34],“where”:[35],“both”:[36],“Temporal”,“:[37],”as“:[38,40,94,96],“well”:[39,95],“组件”:[42],“是”:[43],“联合”:[44],“学习”:[45],“此外”:[46],“TSRL”:[47,60],“做”:[48],“not”:[49],“require”:[50],“additional”:[51],“parameters”:[52],“to”:[53],“performance”:[54],“learning.”:[56],“show”:[58],“that”:[59],“excellents”:[61],“commonly”:[63],“used”:[64],“frame”:[65],“stacking”:[66],“启发式”:[67],“all”:[69,82],“of”:[70,85],“Atari”:[72],“环境”:[73],“我们”:[74],“测试”:[75],“while”:[77],“跳动”:[78],“SOTA”:[80],“for”:[81],“除”:[83],“一”:[84],“他们。”:[86],“此”:[87],“调查”:[88],“有”:[89],“暗示”:[90],“in”:[91],“机器人”:[93],“顺序”:[97],“决策”:[98],“域。”:99],“我们的”:[100],“代码”:[101],“是”:[102],“可用”:[103],“在”:[104],“-”:[105],“https://github.com/Deepakgthomas/TSM_RL“:[106]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4220779439“,”counts_by_year“:[],”updated_date“:”2024-05-22T22:37:37.589806“,”created_date“:”2022-04-03“}