{“id”:“https://openalex.org/W2015051472“,”doi“:”https://doi.org/10.109/adprl.2013.6615000“,”title“:“探究强化学习中的奖惩关系”,”display_name“:“探索强化学习中奖惩的关系”,“publication_year”:2013,“publitation_date”:“2013-04-01”,“ids”:{“openalex”:“https://openalex.org/W2015051472“,”doi“:”https://doi.org/10.109/adprl.2013.6615000“,”mag“:”2015051472“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/adprl.2013.6615000“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5080721542“,”display_name“:”Robert Lowe“,”orcid“:”https://orcid.org/0000-0002-0307-3171},“机构”:[{“id”:https://openalex.org/I205158640“,”display_name“:”苏格兰大学\u00f6vde“,”ror“:”https://ror.org/051mrsz47“,”country_code“:”SE“,”type“:“教育”,”世系“:[”https://openalex.org/I205158640“]}],”国家“:[”SE“],”is_corresponding“:false,”raw_author_name“:”Robert Lowe“,”raw _ afiliation_strings“:[“瑞典Sk\u00f6vde大学互动实验室”],”affiliations“:[{”raw _affiliation_string“:”瑞典Sk\ u00f6 vde大学交互实验室”,“institution_ids”:[“https://openalex.org/I205158640“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5001467069“,”display_name“:”Tom Ziemke“,”orcid“:”https://orcid.org/0000-0001-6883-2450},“机构”:[{“id”:https://openalex.org/I205158640“,”display_name“:”苏格兰大学\u00f6vde“,”ror“:”https://ror.org/051mrsz47“,”country_code“:”SE“,”type“:“教育”,”世系“:[”https://openalex.org/I205158640“]}],”国家“:[”SE“],”is_corresponding“:false,”raw_author_name“:”Tom Ziemke“,”raw _affiliation_strings“:[“瑞典Sk\u00f6vde大学互动实验室”,“affiliations”:[{“raw_affilition_string”:“瑞典Sk大学互动实验室https://openalex.org/I205158640“]}]}],”countries_distinct_count“:1,”institutions_disting_count”:1,“corresponding_author_ids”:[],”correspounding_institution_ids“:[]、”apc_list“:null,”apc_payed“:null,”has_fulltext“:true,”fulltext_origin“:”ngrams“,”cited_by_count,“issue”:空,“first_page”:空last_page“:null},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9859,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”Physical Sciences“}},”topics“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9859,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12761“,”“display_name”:“适应数据流中的概念漂移”,“score”:0.9623,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T13283“,”“display_name”:“精神病理学和精神障碍的网络分析”,“score”:0.9475,“subfield”:{“id”:“https://openalex.org/subfields/3205“,”display_name“:”实验与认知心理学“},”field“:{”id“:”https://openalex.org/fields/32“,”display_name“:”心理学“},”域“:{”id“:”https://openalex.org/domains/2“,”display_name“:”社会科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.598317}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.929923},{”id“:”https://openalex.org/C166109690,“wikidata”:https://www.wikidata.org/wiki/Q4677422“,”display_name“:”Action selection“,”level“:3,”score“:0.82632446},{”id“:”https://openalex.org/C27799295839,“wikidata”:https://www.wikidata.org/wiki/Q3544090“,”display_name“:”惩罚(心理)“,”level“:2,”score“:0.70215464},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6697917},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.6108788},{”id“:”https://openalex.org/C2779343474,“wikidata”:https://www.wikidata.org/wiki/Q3109175“,”display_name“:”Context(考古学)“,”level“:2,”score“:0.60510445},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.5797866},{”id“:”https://openalex.org/C2780791683,“wikidata”:https://www.wikidata.org/wiki/Q846785“,”display_name“:”Action(physical)“,”level“:2,”score“:0.5776396},{”id“:”https://openalex.org/C81917197,“wikidata”:https://www.wikidata.org/wiki/Q628760“,”display_name“:”Selection(genetic algorithm)“,”level“:2,”score“:0.52363396},{”id“:”https://openalex.org/C188116033,“wikidata”:https://www.wikidata.org/wiki/Q2664563“,”display_name“:”Q-learning“,”level“:3,”score“:0.5189135},{”id“:”https://openalex.org/C8880873,“wikidata”:https://www.wikidata.org/wiki/Q187787“,”display_name“:”遗传算法“,”level“:2,”score“:0.4605204},{”id“:”https://openalex.org/C199190896,“wikidata”:https://www.wikidata.org/wiki/Q3509276“,”display_name“:”学习分类器系统“,”level“:3,”score“:0.44927442},{”id“:”https://openalex.org/C2776291640,“wikidata”:https://www.wikidata.org/wiki/Q2912517“,”display_name“:”Value(mathematics)“,”level“:2,”score“:0.43907055},{”id“:”https://openalex.org/C106189395,“wikidata”:https://www.wikidata.org/wiki/Q176789“,”display_name“:”Markov决策过程“,”level“:3,”score“:0.43133622},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.41826826},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.41196865},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.22080252},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.14876443},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.1233744},{”id“:”https://openalex.org/C159886148,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov过程“,”level“:2,”score“:0.08983976},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.08662036},{”id“:”https://openalex.org/C151730666,“wikidata”:https://www.wikidata.org/wiki/Q7205“,”display_name“:”古生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C201995342,“wikidata”:https://www.wikidata.org/wiki/Q682496“,”display_name“:”系统工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C169760540,“wikidata”:https://www.wikidata.org/wiki/Q207011“,”display_name“:”Neuroscience“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C26760741,“wikidata”:https://www.wikidata.org/wiki/Q160402“,”display_name“:”Perception“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”生物学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/adprl.2013.6615000“,”pdf_url“:null,”source“:nul,”license“:null:”license_id“:nulse,”version“:null,”is_accepted“:false,”is_published“:false}],”best_oa_location“:nuld,”sustainable_development_goals“:[{”display_name“:”和平、正义和强大的机构“,”score“:0.76,”id“:”https://metadata.un.org/sdg/16“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:20,”referrenced_works“:]”https://openalex.org/W1516301787","https://openalex.org/W1538815457","https://openalex.org/W1965692465","https://openalex.org/W2005078497","https://openalex.org/W2007028190","https://openalex.org/W2037121244","https://openalex.org/W2073654928","https://openalex.org/W2108804935","https://openalex.org/W2116085129","https://openalex.org/W2117564498","https://openalex.org/W2156952192","https://openalex.org/W2161563886","https://openalex.org/W2165527701","https://openalex.org/W2499825296","https://openalex.org/W2773677792","https://openalex.org/W2963302368","https://openalex.org/W4214717370","https://openalex.org/W4238720562","https://openalex.org/W622828751","https://openalex.org/W67729719“],”related_works“:[”https://openalex.org/W4380550992","https://openalex.org/W4322760752","https://openalex.org/W3167472281","https://openalex.org/W3096874164","https://openalex.org/W2970347269","https://openalex.org/W2937181779","https://openalex.org/W2808418668","https://openalex.org/W2357975469","https://openalex.org/W2146763310","https://openalex.org/W2101748387“],”ngrams_url“:”https://api.openalex.org/works/W2015051472/ngrams“,”“abstract_inverted_index”:{“We”:[0],“present”:[1],“a”:[2,32,43,49,63],“reinforction”:[3,73],“learning”:[4,21,74],“algorithm”:[5,34,65],“based”:[6],“on”:[7],“Dyna-Sarsa”:[8],“that”:[9],“useds”:[10],“separated”:[11],“representation”:[12],“of”:[13,27,42,71],“redward”:[14],“和”:[15,22,37],“惩罚”:[16],“何时”:[17],“引导”:[18],“状态-动作“:[19],”值“:[20],”动作“:[23],”选择。“:[24],“The”:[25,55],“adoption”:[26],“policy”:[28],“meta-learning”:[29],“optimized”:[30],“by”:[31],“genetic”:[33,64],“is”:[35],“explored”:[36],“results”:[38],“in”:[39,48],“The”:[40,69],“context”:[41],“two-armed”:[44],“batter”:[45],“goal-navigation”:[46],”任务“:[47],”简单“:[50],”网格“:[51],”世界“:[52],”are“:[53],”presented。“:[54],“发现”:[56],“争论”:[57],“for”:[58,62,67],“an”:[59],“important”:[60],“role”:[61],“approach”:66],“constructing”:[68],“foundations”:[70],“autonomous”:[72],“agents”。“:[75]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2015051472“,”“counts_by_year”:[{“年份”:2023,”“cited_by_count”:1},{“年度”:2022,”“cited_by_cunt”:1',{(年份):2021,年份“:2016,”cited_by_count“:3},{“年份”:2014,”ciped_by_cunt“:1}],”updated_date“:”2024-06-18T12:22:19.410883“,”创建日期“:”2016-06-24“}