{“id”:“https://openalex.org/W2788842776“,”doi“:”https://doi.org/10.3389/frobt.2018.00079“,”title“:“异步环境中的反应强化学习”,“display_name”:“异步条件下的反应强化教学”,“publication_year”:2018,“publiation_date”:“2018-06-26”,“ids”:{“openalex”:“https://openalex.org/W2788842776“,”doi“:”https://doi.org/10.3389/frobt.2018.00079“,”mag“:”2788842776“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.3389/frobt.2018.00079,“pdf_url”:https://www.frontiersin.org/articles/10.3389/frobt.2018.00079/pdf,“源”:{“id”:https://openalex.org/S2595095599“,”“display_name”:“机器人与人工智能的前沿”,“issn_l”:“2296-9144”,“isn”:[“2296-6144”],“is_oa”:true,“is.in_doaj”:true,“host_organization”:“https://openalex.org/P4310320527“,”“host_organization_name”:“Frontiers Media”,“host_organization_lineage”:[“https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“journal-article”,”indexed_in“:[”arxiv“,”crossref“,”datacite“,”doaj“],”open_access“:{”is_oa“:true,”oa_status“:”gold“,”oa_url“:”https://www.frontiersin.org/articles/10.3389/frobt.2018.00079/pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5059024724“,”display_name“:”Jaden B.Travnik“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I154425047“,”display_name“:”阿尔伯塔大学“,”ror“:”https://ror.org/0160cpw27“,”country_code“:”CA“,”type“:“教育”,”世系“:[”https://openalex.org/I154425047“]}],”国家“:[”CA“],”is_corresponding“:false,”raw_author_name“:”Jaden B.Travnik“,”raw _affiliation_strings“:[“加拿大爱德蒙顿阿尔伯塔大学医学系改良自然控制实验室的仿生肢体”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5068452444“,”display_name“:”Kory W.Mathewson“,”orcid“:”https://orcid.org/0000-0002-5688-6221},“机构”:[{“id”:https://openalex.org/I154425047“,”display_name“:”阿尔伯塔大学“,”ror“:”https://ror.org/0160cpw27“,”country_code“:”CA“,”type“:“教育”,”世系“:[”https://openalex.org/I154425047“]}],”国家“:[”CA“],”is_corresponding“:false,”raw_author_name“:”Kory W.Mathewson“,”raw_affiliation_strings“:[“加拿大亚伯达州埃德蒙顿阿尔伯塔大学医学系改良自然控制实验室的仿生肢体”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5004923102“,”display_name“:”Richard S.Sutton“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I154425047“,”display_name“:”阿尔伯塔大学“,”ror“:”https://ror.org/0160cpw27“,”country_code“:”CA“,”type“:“教育”,”世系“:[”https://openalex.org/I154425047“]}],”国家“:[”CA“],”is_corresponding“:false,”raw_author_name“:”Richard S.Sutton“,”raw _affiliation_strings“:[“加拿大爱德蒙顿阿尔伯塔大学计算科学系强化学习与人工智能实验室”]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5010596280“,”display_name“:”Patrick M.Pilarski“,”orcid“:”https://orcid.org/0000-0003-1686-2978},“机构”:[{“id”:https://openalex.org/I154425047“,”display_name“:”阿尔伯塔大学“,”ror“:”https://ror.org/0160cpw27“,”country_code“:”CA“,”type“:“教育”,”世系“:[”https://openalex.org/I154425047“]}],”国家“:[”CA“],”is_corressinding“:true,”raw_author_name“:”Patrick M.Pilarski“,”raw_affiation_strings“:[”加拿大阿尔伯塔大学埃德蒙顿医学系改善自然控制实验室仿生肢体“]}],”国家_目标_计数“:1,”机构_区别_计数“:1,”对应_作者_ ID“:[”https://openalex.org/A5010596280“],”对应的机构ID“:[”https://openalex.org/I154425047“],”apc_list“:{“value”:1900,”currency“:”USD“,”value_USD“:1900“:{”卷“:”5“,”问题“:null,”第一页“:null,”最后一页“:null},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9994,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9994,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12288“,”“display_name”:“在线机器人研究中的分布式协调”,“score”:0.9957,“subfield”:{“id”:“https://openalex.org/subfields/1705“,”display_name“:”计算机网络和通信“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10876“,”“display_name”:“工业过程故障检测与诊断”,“score”:0.98,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.586024},{”id“:”https://openalex.org/keywords/simmulations网站“,”display_name“:”Simulations“,”score“:0.503351}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.8432138},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.83877087},{”id“:”https://openalex.org/C151319957,“wikidata”:https://www.wikidata.org/wiki/Q752739“,”display_name“:”异步通信“,”level“:2,”score“:0.79753876},{”id“:”https://openalex.org/C106189395,“wikidata”:https://www.wikidata.org/wiki/Q176789网址“,”display_name“:”Markov决策过程“,”level“:3,”score“:0.7264199},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.43343267},{”id“:”https://openalex.org/C120314980,“wikidata”:https://www.wikidata.org/wiki/Q180634“,”display_name“:”分布式计算“,”level“:1,”score“:0.41774508},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.34575176},{”id“:”https://openalex.org/C159886148,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov过程“,”level“:2,”score“:0.29645574},{”id“:”https://openalex.org/C31258907,“wikidata”:https://www.wikidata.org/wiki/Q1301371“,”display_name“:”计算机网络“,”level“:1,”score“:0.08626008},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”Mathematics“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:7,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.3389/frobt.2018.00079,“pdf_url”:https://www.frontiersin.org/articles/10.3389/frobt.2018.00079/pdf,“源”:{“id”:https://openalex.org/S2595095599“,”“display_name”:“机器人与人工智能的前沿”,“issn_l”:“2296-9144”,“isn”:[“2296-6144”],“is_oa”:true,“is.in_doaj”:true,“host_organization”:“https://openalex.org/P4310320527“,”host_organization_name“:”Frontiers Media“,”host_organization_lineage“:[”https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:false,”landing_page_url“:”https://doaj.org/article/2b1b274c790d4ab1be3c2de9333b687a“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306401280“,”display_name“:”DOAJ(DOAJ:开放存取期刊目录)“,”issn_l“:null,”issn“:null:”is_oa“:true,”is_in_DOAJ“:false,”host_organization“:null,”host_organization_name“:null,“host_orgganization_lineage”:[],“host_orgganization _lineage_names”:[[],“type”:“repository”},“license”:null、“license_id”:null、“version”:null.、“is_accepted”:false、“is_published“:false},{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/1802.06139,“pdf_url”:https://arxiv.org/pdf/1802.06139,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://europepmc.org/articles/pmc7805616,“pdf_url”:https://europepmc.org/articles/pmc7805616?pdf=render,“源”:{“id”:https://openalex.org/S4306400806“,”display_name“:”Europe PMC(PubMed Central)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I1303153112“,”“host_organization_name”:“欧洲生物信息学研究所”,“host_organization_lineage”:[“https://openalex.org/I1303153112“],”host_organization_lineage_names“:[”欧洲生物信息学研究所“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7805616“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S2764455111“,”display_name“:”PubMed Central“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I1299303238“,”“host_organization_name”:“美国国立卫生研究院”,“host_ordanization_lineage”:[“https://openalex.org/I1299303238“],”host_organization_lineage_names“:[”National Institutes of Health“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},{“is_oa”:true,“landing_page_url”:“http://arxiv.org/abs/1802.06139,“pdf_url”:网址:http://arxiv.org/pdf/1802.06319,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.48550/arxiv.1802.06139“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.3389/frobt.2018.00079,“pdf_url”:https://www.frontiersin.org/articles/10.3389/frobt.2018.00079/pdf,“源”:{“id”:https://openalex.org/S2595095599“,”“display_name”:“机器人与人工智能的前沿”,“issn_l”:“2296-9144”,“isn”:[“2296-6144”],“is_oa”:true,“is.in_doaj”:true,“host_organization”:“https://openalex.org/P4310320527“,”host_organization_name“:”Frontiers Media“,”host_organization_lineage“:[”https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的制度“,”score“:0.68}],”grants“:[{”funder“:”https://openalex.org/F4320319952“,”“funder_display_name”:“加拿大创新基金会”,“award_id”:null},{“funder”:“https://openalex.org/F4320320994“,”funder_display_name“:”Canada Research Chairs“,”award_id“:null},{”funder“:”https://openalex.org/F4320325651“,”funder_display_name“:”Alberta Innovates“,”award_id“:null},{”funder“:”https://openalex.org/F4320334593“,”“funder_display_name”:“加拿大自然科学与工程研究委员会”,“award_id”:null}],“数据集”:[],“版本”:[“https://openalex.org/W2788842776","https://openalex.org/W3104173699“],”referenced_works_count“:17,”referrenced_works“:[”https://openalex.org/W1525280637","https://openalex.org/W1711093554","https://openalex.org/W1977655452","https://openalex.org/W2009533501","https://openalex.org/W2041367235","https://openalex.org/W2091565802","https://openalex.org/W2150339816","https://openalex.org/W2257979135","https://openalex.org/W2408978589","https://openalex.org/W2619103847","https://openalex.org/W2623293810","https://openalex.org/W2766207971","https://openalex.org/W2792812366","https://openalex.org/W3139377883","https://openalex.org/W317521241","https://openalex.org/W32403112","https://openalex.org/W4214717370“],”related_works“:[”https://openalex.org/W3168977894","https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2341346307","https://openalex.org/W2145363145","https://openalex.org/W2116677773","https://openalex.org/W1985560493","https://openalex.org/W1626977535“],”ngrams_url“:”https://api.openalex.org/works/W2788842776/ngrams网站“,”“abstract_inverted_index”:{“The”:[0],“relationship”:[1],“between”:[2,21],“a”:[3119130154],“reference”:[4134],“learning”:[5135157163196217],“(RL)”:[6],“agent”:[7,23,73101188],“and”:[8,24172175208],“an”:[9,22,62,72,77100114],“asynchronous”:[10,46,63142167],“environment”:[11,52,88109],“是”:[12126],“经常”:[13],“忽略。“:[14],”频繁“:[15],”使用“:[16],”模型“:[17],”的“:[18,50,86,99132141186193201],”the“:[19,41,48,51,59,80,84,87,96108123160183187191194],”interaction“:[20],”its“:[25],“environment,”:[26,64],“such”:[27],“as”:[28],“Markov”:[29],“Decision”:[30,35],“Processes”:[318,36],“(MDP)”:[32],“或”:[33118],“Semi-Markov”:[34],”(SMDP),“:[37],”do“:[38],“not”:[39],“capture”:[40],“fact”:[42],“that”:[43],“in”:[44,82],“state”:[P9,85117120150],“may”:[53,89204],“change”:[54,90214],“during”:[55],“computeration”:[56],“performed”:[57],“by”:[58106144189],“agent”。“:[60],”In“:[61,93],”最小化“:[65],”反应“:[66,97184],”time\u2014the“:[67],”时间“:[68,81,98185],”it“:[69],”takes“:[70],”for“:[71],”to“:[74,76110215],”react“:[75],”observation\u2014also“:78],”minimization“:[79],”which“:[83],”following“:[91],”观察。“:[92],“许多”:[94],“环境”,:[95],“直接”:[102],“影响”:[103],“任务”:[104],“性能”:[105],“允许”:[107],“过渡”:[111],“到”:[112],“任其一”:[113],“不需要”:[115],“终端”:[116],“其中”:[121],“执行”:[122],“选择”:[124],“操作”:[125],“不当。“:[127],“我们”:[128152],“提议”:[129],“类”:[1310200],“反应”:[133155179202],“算法”:[136203],“那个”:[137177],“地址”:[138],“这个”:[139],“问题”:[140],“环境”:[143],“立即”:[145],“行动”:[146],“之后”:[147],“观察”:[148],“新”:[149199],“信息。“:[151],”比较“:[153],”SARSA“:[156162],”算法“:[158164181],”与“:[159],”常规“:[161],”on“:[165],”两个“:[166],”机器人“:[168],”任务“:[169],”(紧急“:[170],”停止“:[171],”影响“173],”预防“,”:[174],”显示“:[176],”RL“:[180],”减少“:[182],”近似“:[190],“持续时间”:[192],“算法”:[195],“更新。“:[197],”此“:[198],”便利“:[205],”更安全“:[206],”控制“:[207],”更快“:[209],”决策“:[210],”制定“:[211],”没有“:[212],”任何“:[213],”标准“:[216],”保证。“:[218]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2788842776“,”counts_by_year“:[{”年“:2023,”cited_by_count“:3},{”年份“:2022,”cited_by_count”:4},“{”年度“:2021,”citecd_by_count“:4}.,{“年份”:2020,“cited_by_count):3}.,“年份”:2018,“citecd_by_counts”:1}],”updated_date“:”2024-05-14T23:21:05.051722“,”created_date:“2018-03-06”}