{“id”:“https://openalex.org/W2766180905“,”doi“:”https://doi.org/10.1007/s10015-017-0401-2“,”title“:“采用不精确动力学模型的线性可解马尔可夫对策的稳健性”,”display_name“:“使用不精确动力学模式的线性可求解马尔可夫博弈的稳健度”,”publication_year“:2017,”publitation_date“:”2017-10-31“,”ids“:{”openalex“:”https://openalex.org/W2766180905“,”doi“:”https://doi.org/10.1007/s10015-017-0401-2“,”mag“:”2766180905“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/s10015-017-0401-2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/s10015-017-0401-2.pdf,“源”:{“id”:https://openalex.org/S104439334“,”display_name“:”人造生命与机器人“,”issn_l“:”1433-5298“,”isn“:[”1433-52“,”1614-7456“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310319900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”type“:“article”,“type_crossref”:”journal-article“,”indexed_in“:[“crossref”],“open_access”:{“is_oa”:true,“oa_status”:“青铜色,“oa_url”:https://link.springer.com/content/pdf/10.1007/s10015-017-0401-2.pdf“,”any_repository_has_fulltext“:false},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5085840994“,”display_name“:”Ken Kinjo“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Ken Kinjo“,”raw _affiliation_strings“:[“日本冲绳冲绳科技研究生院”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5031054137“,”display_name“:”Eiji Uchibe“,”orcid“:”https://orcid.org/0000-0001-7908-0258“},”机构“:[{”id“:”https://openalex.org/I4210104143“,”display_name“:”Advanced Telecommunications Research Institute International“,”ror“:”https://ror.org/01pe1d703“,”“country_code”“:”JP“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210104143“]}],”国家“:[”JP“],”is_corresponding“:true,”raw_author_name“:”Eiji Uchibe“,”raw_affiliation_strings“:[“日本京都ATR计算神经科学实验室”]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5004840638“,”display_name“:”Kenji Doya“,”orcid“:”https://orcid.org/0000-0002-2446-6820“},”机构“:[{”id“:”https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Kenji Doya“,”raw _ afiliation_strings“:[“日本冲绳冲绳科学技术研究生院”]}],”countries _ distinct_count“:1,”institutions _ disting_count”:2,“corresponding_author_ids”:[“https://openalex.org/A5031054137“],”对应的机构ID“:[”https://openalex.org/I4210104143“],”apc_list“:{”value“:2390,”currency“:”EUR“,”value_usd“:2990,”provenance“:”doaj“},”apc _payed“:”{“value”:2390、”current“:”欧元“,”value_usd”:2990、“provenance”:“doaj”}、“has_fulltext”:true、“fulltext_origin”:“pdf”、“cited_by_count”:0、“citecd_by_percentile_year”:{“min”:0,“max”:68},“biblio”:{“volume”:“23”,“issue”:“1”,“first_page”:“0”,“last_page”::“9”},“is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9994,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9994,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10848“,”“display_name”:“进化算法中的多目标优化”,“score”:0.9617,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12794“,”display_name“:”最优控制的自适应动态规划“,”score“:0.9613,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.537481},{”id“:”https://openalex.org/keywords/adaptive-dynamic编程“,”display_name“:”自适应动态编程“,”score“:0.518419}],”concepts“:[{”id“:”https://openalex.org/C63479239,“wikidata”:https://www.wikidata.org/wiki/Q7353546“,”display_name“:”健壮性(进化)“,”level“:3,”score“:0.784539},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.7775449},{”id“:”https://openalex.org/C106189395,“wikidata”:https://www.wikidata.org/wiki/Q176789“,”display_name“:”Markov决策过程“,”level“:3,”score“:0.6909437},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.68689966},{”id“:”https://openalex.org/C98763669,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov链“,”level“:2,”score“:0.5688883},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.5640581},{”id“:”https://openalex.org/C159886148,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov过程“,”level“:2,”score“:0.48177},{”id“:”https://openalex.org/C2778029271,“wikidata”:https://www.wikidata.org/wiki/Q5421931“,”display_name“:”扩展(谓词逻辑)“,”level“:2,”score“:0.4643104},{”id“:”https://openalex.org/C21200559,“wikidata”:https://www.wikidata.org/wiki/Q7451068“,”display_name“:”灵敏度(控制系统)“,”级别“:2,”分数“:0.45314512},{”id“:”https://openalex.org/C77405623,“wikidata”:https://www.wikidata.org/wiki/Q598451“,”display_name“:”System dynamics“,”level“:2,”score“:0.4333039},{”id“:”https://openalex.org/C47446073,“wikidata”:https://www.wikidata.org/wiki/Q5165890“,”display_name“:”控制理论(社会学)“,”level“:3,”score“:0.41995782},{”id“:”https://openalex.org/C2775924081,“wikidata”:https://www.wikidata.org/wiki/Q55608371“,”display_name“:”Control(management)“,”level“:2,”score“:0.32357588},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.29817754},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.28447193},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.23313248},{”id“:”https://openalex.org/C55493867,“wikidata”:https://www.wikidata.org/wiki/Q7094“,”display_name“:”生物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C24326235,“wikidata”:https://www.wikidata.org/wiki/Q126095“,”display_name“:”电子工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C104317684,“wikidata”:https://www.wikidata.org/wiki/Q7187“,”display_name“:”Gene“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/s10015-017-0401-2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/s10015-017-0401-2.pdf,“源”:{“id”:https://openalex.org/S104439334“,”display_name“:”人造生命与机器人“,”issn_l“:”1433-5298“,”isn“:[”1433-52“,”1614-7456“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310319900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1007/s10015-017-0401-2,“pdf_url”:https://link.springer.com/content/pdf/10.1007/s10015-017-0401-2.pdf,“源”:{“id”:https://openalex.org/S104439334“,”display_name“:”人造生命与机器人“,”issn_l“:”1433-5298“,”isn“:[”1433-52“,”1614-7456“],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”sustainable_development_goals“:[],”grants“:【】,”datasets“:〔】,”versions“:【〕,”referenced_works_count“:9,”https://openalex.org/W2008920573","https://openalex.org/W2029722408","https://openalex.org/W2066920868","https://openalex.org/W2078639473","https://openalex.org/W2093524643","https://openalex.org/W2105078254","https://openalex.org/W2128152413","https://openalex.org/W2155919457","https://openalex.org/W4214717370“],”related_works“:[”https://openalex.org/W4284974072","https://openalex.org/W4225269853","https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2341346307","https://openalex.org/W2145363145","https://openalex.org/W1985560493","https://openalex.org/W1626977535“],”ngrams_url“:”https://api.openalex.org/works/W2766180905/ngrams“,”“abstract_inverted_index”:{“As”:[0],“a”:[1100],“基于模型”:[2,35],“强化”:[3,36],“学习”:[4],“技术”:[5],“线性”:[6,58],“可解”:[7,59],“马尔可夫”:[8,60],“决策”:[9],“过程”:[10],“(LMDP)”:[11],“给出”:[12],“an”:[13,18,68143],“有效”:[14],“方式”:[15],“到”:[16,44],“查找”:[17],“最优”:[19],“策略”:[2010120130],“通过“:[21],“制造”:[22],“the”:[23,38,45,48,53,56,74,80103108114117127136147],“Bellman”:[24],“equation”:[25],“linear”:[26],“under”:[27],“some”:[28],“substitutions”。“:[29],”自“:[30],”LMDP“:[31,41,71],”是“:[32,42,67,99149],”被视为“:[33],”作为“:[34],”学习,“:[37],”性能“:[39123],”的“:[40,47,55,70,82113126138146],”敏感“:[43],”准确度“:[46],”环境“:[49],”模型。“:[50],“收件人”:[51],“克服”:[52],“问题”:[54],“敏感度”:[57],“游戏”:[61,75],“(LMG)”:[62],“已”:[63],“被”:[64],“提议”:[65],“其中”:[66],“扩展”:[69],“基于”:[72],“依据”:[73],“理论”。“:[76],“This”:[77],“paper”:[78],“investments”:[79],“robustivity”:[81],“LMDP-”:[83],“and”:[84,93111],“基于LMG-”:[85118],“controllers”:[86],“against”:[87],“modeling”:[88],“errors”:+89],“in”:[90],“both”:[91],“discrete”:[92],“consistent”:[94],“state-action”:[95],“problems”。“:[96],”When“:[97],”there“:[98],”difference“:[101],”between“:[102],”model“:[104145],”used“:[105],”for“:[106],”building“:[107],”control“:%109119129],”dynamics“:[112],”tested“:%11],”environment“:[116],”maintained“:121],”good“:[122],”while“:/124],”that“:[125],”LMDP-based“:[128],”严重恶化“:[131],”。“:[132],“实验”:[133],“结果”:[134],“支持”:[135],“有用性”:[137],“LMG”:[139],“框架”:[140],“何时”:[141],“获取”:[142],“准确”:[144],“环境”:[148],“困难”。“:[150]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2766180905“,”counts_by_year“:[],”updated_date“:”2024-05-22T14:12:16.941689“,”创建日期“:”2017-11-10“}