{“id”:“https://openalex.org/W2578350735“,”doi“:”https://doi.org/10.1017/s026988891500017x网址“,”title“:”克服基于计划的奖励塑造中的错误知识“,”display_name“:”消除基于计划的奖金塑造中的不正确知识“,“publication_year”:2016,“publiation_date”:“2016-01-01”,“ids”:{“openalex”:“https://openalex.org/W2578350735“,”doi“:”https://doi.org/10.1017/s026988891500017x网址“,”mag“:”2578350735“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1017/s026988891500017x网址“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S137506714“,”display_name“:”The Knowledge Engineering Review“,”issn_l“:”0269-8889“,”isn“:[”02698-8889“,”1469-8005“],”is_oa“:false,”is-in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310311721“,”“host_organization_name”:“剑桥大学出版社”,“host_ordanization_lineage”:[“https://openalex.org/P4310311721","https://openalex.org/P4310311702“],”host_organization_lineage_names“:[”剑桥大学出版社“,”剑桥大学“],“type”:“journal”},“license”:null,“licence_id”:null,“version”:nully,“is_accepted”:false,“is_published”:false},”type“:”article“,”type_crossref“:“jornal-article”,“indexed_in”:[”crossref“],‘open_access’:{”is_oa“:false,”“oa_status”:“closed”,“oa_url”:空,“any_repository_has_fulltext“:false},”作者身份“:[{”作者位置“:”第一个“,”作者“:{”id“:”https://openalex.org/A5056510473“,”display_name“:”Kyriakos Efthymiadis“,”orcid“:”https://orcid.org/0000-0002-2235-5115},“机构”:[{“id”:https://openalex.org/I52099693“,”display_name“:”约克大学“,”ror“:”https://ror.org/04m01e293“,”country_code“:”GB“,”type“:“教育”,”世系“:[”https://openalex.org/I52099693“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Kyriakos Efthymiadis“,”raw _ afiliation_strings“:[“约克大学”],”从属关系“:[{”raw _affiliation_string“:”约克大学“,”institution_ids“:[https://openalex.org/I52099693“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5048451922“,”display_name“:”Sam Devlin“,”orcid“:”https://orcid.org/0000-0002-7769-3090},“机构”:[{“id”:https://openalex.org/I52099693“,”display_name“:”约克大学“,”ror“:”https://ror.org/04m01e293“,”country_code“:”GB“,”type“:“教育”,”世系“:[”https://openalex.org/I52099693“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Sam Devlin“,”raw _affiliation_strings“:[“约克大学”],”affiliations“:[{”raw_affiliation_string“:”约克大学“,”institution_ids“:[”https://openalex.org/I52099693“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5009587907“,”display_name“:”Daniel Kudenko“,”orcid“:”https://orcid.org/0000-0003-3359-3255},“机构”:[{“id”:https://openalex.org/I52099693“,”display_name“:”约克大学“,”ror“:”https://ror.org/04m01e293“,”country_code“:”GB“,”type“:“教育”,”世系“:[”https://openalex.org/I52099693“]}],”国家“:[”GB“],”is_corresponding“:false,”raw_author_name“:”Daniel Kudenko“,”raw _affiliation_strings“:[“约克大学”],”affiliations“:[{”raw _affiliation_string“:”约克大学“,”institution_ids“:[https://openalex.org/I52099693“]}]}],”institution_assertions“:[],”countries_distiction_count“:1,”institutions_disticent_count”:1,“corresponding_author_ids”:[]、“corresconding_institution_ids“:[].”apc_list“:null,”apc_payed“:null,”fwci“:0.267,”has_fulltext“:true,”fulltext_origin“:”ngrams“,”cited_by_count,“:5,”citation_normalized_percentile“:{”value“:0.7”40125,“is_in_top_1_percent“:false,”is_in_top_10_percennt“:false},”cited_by_percentile_year“:{”min“:81,”max“:83},“biblio”:{“volume”:“31”,”issue“:”1“,”first_page“:”31“,”last_page“:”43“}https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10653“,”“display_name”:“机器人抓取和示范学习”,“score”:0.9861,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T1975“,”“display_name”:“遗传编程在机器学习中的应用”,“score”:0.9855,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.562119},{”id“:”https://openalex.org/keywords/symbolic-regression网站“,”display_name“:”符号回归“,”score“:0.512555}],”concepts“:[{”id“:”https://openalex.org/C2776505523,“wikidata”:https://www.wikidata.org/wiki/Q4785468“,”display_name“:”Plan(考古学)“,”level“:2,”score“:0.7761764},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.7310531},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6578433},{”id“:”https://openalex.org/C207685749,“wikidata”:https://www.wikidata.org/wiki/Q2088941“,”display_name“:”领域知识“,”level“:2,”score“:0.5774209},{”id“:”https://openalex.org/C36503486,“wikidata”:https://www.wikidata.org/wiki/Q11235244“,”display_name“:”域(数学分析)“,”level“:2,”score“:0.46547812},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.4616581},{”id“:”https://openalex.org/C182306322,“wikidata”:https://www.wikidata.org/wiki/Q1779371“,”display_name“:”Order(exchange)“,”level“:2,”score“:0.44874167},{”id“:”https://openalex.org/C56739046,“wikidata”:https://www.wikidata.org/wiki/Q192060“,”display_name“:”知识管理“,”level“:1,”score“:0.35052645},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.3392551},{”id“:”https://openalex.org/C144133560,“wikidata”:https://www.wikidata.org/wiki/Q4830453网址“,”display_name“:”Business“,”level“:0,”score“:0.11923626},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.071219},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C166957645,“wikidata”:https://www.wikidata.org/wiki/Q23498“,”display_name“:”考古学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C10138342,“wikidata”:https://www.wikidata.org/wiki/Q43015“,”display_name“:”Finance“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C95457728,“wikidata”:https://www.wikidata.org/wiki/Q309“,”display_name“:”History“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1017/s026988891500017x网址“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S137506714“,”display_name“:”The Knowledge Engineering Review“,”issn_l“:”0269-8889“,”isn“:[”02698-8889“,”1469-8005“],”is_oa“:false,”is-in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310311721“,”“host_organization_name”:“剑桥大学出版社”,“host_ordanization_lineage”:[“https://openalex.org/P4310311721","https://openalex.org/P4310311702“],”host_organization_lineage_names“:[”剑桥大学出版社“,”剑桥大学“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:null,“sustainable_development_goals”:[],“grants”:[],“datasets”:〔〕,“versions”:[〕,“referenced_works_count”:18,“referenced_works“:[”https://openalex.org/W119236796","https://openalex.org/W1499408472","https://openalex.org/W1553476745","https://openalex.org/W1777239053","https://openalex.org/W2081944499","https://openalex.org/W2095564494","https://openalex.org/W2098432798","https://openalex.org/W2111316871","https://openalex.org/W2119567691","https://openalex.org/W2121863487","https://openalex.org/W2151382427","https://openalex.org/W2158969944","https://openalex.org/W2159600763","https://openalex.org/W2305373430","https://openalex.org/W233478222","https://openalex.org/W2337392266","https://openalex.org/W2989739191","https://openalex.org/W4214717370“],”related_works“:[”https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3213252596","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W1649619740","https://openalex.org/W1583422155","https://openalex.org/W1534006406“],”abstract_inverted_index“:{”abstract“:[0],”Reward“:[1],”shaping“:[2,17118],”has“:[3,47],”been“:[4,48],”show“:[5,49],”to“:[6,31,35,55,67,87,94],”显着“:[7],”improve“:[8],”an“:[9,95105],”agent\u2019s“:[10],”performance“:[11],”in“:[12,29,61],”reinforcement“:[13],“学习”:[14],“基于计划”:[15],“奖励”:[16,99117],“是”:[18,27,44],“a“:[19,24,81],“成功”:[20],“方法”:[21],“其中”:[23],“字符串”:[25],“计划”:[26],“使用”:[28],“顺序”:[30],“指南”:[32],“the”:[33,36,41,50,57112],“agent”:[34,51,96106114],“最优”:[37,58],“行为”。“:[38],”“然而,”:[39],“if”:[40],“provided”:[42,93],“knowledge”:[43,71,85,91120],“wrong”,“:[45],“it”:[46,64,73],“will”:[52],“take”:[53],“longer”:[54],“learn”:[56],“policy”。“:[59],”Previous,“:[60],”some“:[62],”cases,“:/63],”was“:[65],”better“:[66],”ignore“:[68],”all“:[69],”previous“:%70],”whiled“:[72],”only“:[74],”be“:[75],”partial“:[76],”incorrect“。“:[77],“This”:[78],“paper”:[79],“investings”:[80],“novel”:[82],“use”:[83],“of”:[84],“revision”:[86],“overview”:[88],“correct”:[89],“domain”:[00],“when”:[92],“receiving”:[97115],“plan-based”:[98116],“shaping”。“:[100],“实证”:[101],“结果”:[102],“显示”:[103],“那”:[104],“使用”:[107],“这个”:[108],“方法”:[109],“可以”:[110],“跑赢大市”:[111],“之前”:[113],“没有”:[119],“修订。“:[121]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2578350735“,”counts_by_year“:[{年:2023,”cited_by_count“:2},{年“:2022,”cited_by_count”:1},“年”:2018