{“id”:“https://openalex.org/W2657184275“,”doi“:”https://doi.org/10.1142/s0218213017600144“,”title“:”功能性奖励马尔可夫决策过程:理论与应用“,”display_name“:”功能性奖励马尔可夫决策过程:理论与应用“,”publication_year“:2017,”publication_date“:”2017-06-01“,”ids“:{”openalex“:”https://openalex.org/W2657184275“,”doi“:”https://doi.org/10.1142/s0218213017600144“,”mag“:”2657184275“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1142/s0218213017600144“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S178780388“,”display_name“:”国际人工智能工具杂志“,”issn_l“:”0218-2130“,”isn“:[”0218-2330“,”1793-6349“],”is_oa“:false,”is_ in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310318815“,”host_organization_name“:”World Scientific“,”host_organization _lineage“:[”https://openalex.org/P4310318815“],”host_organization_lineage_names“:[”World Scientific“],“type”:“journal”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false},”type“:”article“,”type_crossref“:“jornal-article”,“indexed_in”:[”crossref“],_has_fulltext“:false},”authorships“:[{”author_position“:”first“,”author“:{”id“:”https://openalex.org/A5073106112“,”display_name“:”Paul Weng“,”orcid“:”https://orcid.org/0000-0002-2008-4569},“机构”:[{“id”:https://openalex.org/I4210129003“,”display_name“:”SYSU-CMU国际联合研究院“,”ror“:”https://ror.org/02w30ae27“,”“country_code”“:”CN“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210129003“]},{”id“:”https://openalex.org/I157773358“,”display_name“:”中山大学“,”ror“:”https://ror.org/0064kty71“,”country_code“:”CN“,”type“:“教育”,”世系“:[”https://openalex.org/I157773358“]}],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”Paul Weng“,”rau_affiliation_strings“:[“中大联合工程学院,中国广州”,“中大顺德国际联合研究院(中国)”,“中国广州高等教育中心外环东路132号SYSU电子与信息技术学院,510006“],“附属机构”:[{“raw_affiliation_string”:“SYSU-CMU联合工程学院,中国广州”,“institution_ids”:[“https://openalex.org/I4210129003","https://openalex.org/I157773358“]},{”raw_affiliation_string“:”SYSU-CMU顺德国际联合研究院(中国)“,”institution_ids“:[”https://openalex.org/I4210129003","https://openalex.org/I157773358“]},{”raw_affiliation_string“:”广州高等教育中心外环东路132号南洋理工大学电子信息技术学院,中国广州,510006”,“institution_ids”:[]}]}、{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5012670875“,”display_name“:”Olivier Spanjaard“,”orcid“:”https://orcid.org/0000-0002-9948-090X},“机构”:[{“id”:https://openalex.org/I3017942884“,”display_name“:”数学研究所\u00e9matiques de Jussieu-Paris Rive Gauche“,”ror“:”https://ror.org/03fk87k11“,”“country_code”“:”FR“,”type“:”facility“,”lineage“:[”https://openalex.org/I1294671590","https://openalex.org/I204730241","https://openalex.org/I3017942884","https://openalex.org/I39804081","https://openalex.org/I4210141950“]},{”id“:”https://openalex.org/I204730241“,”display_name“:”Universit\u00e9 Paris Cit\u00e8“,”ror“:”https://ror.org/05f82e368“,”country_code“:”FR“,”type“:“教育”,”世系“:[”https://openalex.org/I204730241“]},{”id“:”https://openalex.org/I39804081“,”display_name“:”索邦大学\u00e9“,”ror“:”https://ror.org/02en5vm52“,”country_code“:”FR“,”type“:“教育”,”世系“:[”https://openalex.org/I39804081“]},{”id“:”https://openalex.org/I4210159731“,”display_name“:”巴黎信息实验室6“,”ror“:”https://ror.org/05krcen59“,”“country_code”“:”FR“,”type“:”facility“,”lineage“:[”https://openalex.org/I1294671590","https://openalex.org/I39804081","https://openalex.org/I4210159245","https://openalex.org/I4210159731“]},{”id“:”https://openalex.org/I1294671590“,”display_name“:”国家科学中心“,”ror“:”https://ror.org/02feahw73“,”country_code“:”FR“,”type“:“政府”,”世系“:[”https://openalex.org/I1294671590“]}],”国家“:[”FR“],”is_corresponding“:false,”raw_author_name“:”Olivier Spanjaard“,”raw _ afiliation_strings“:[“4 Place Jussieu,75005,Paris,France”,“CNRS,UMR 7606,LIP6,F-75005,巴黎,法国”,“索邦大学\u00e9s,UPMC Univ Paris 06,UMR 7906,LIP 6,F-7505,Parisis,Frances”],“afiliations”:[{“raw_affiliation_string”:“4 Place Jussieu,75005,法国巴黎”,“institute_ids”:[“https://openalex.org/I3017942884“]},{”raw_affiliation_string“:”索邦大学\u00e9s,巴黎UPMC大学06,UMR 7606,LIP6,F-75005,法国巴黎“,”institution_ids“:[”https://openalex.org/I204730241","https://openalex.org/I39804081“]},{”raw_affiliation_string“:”CNRS,UMR 7606,LIP6,F-75005,法国巴黎“,”institution_ids“:[”https://openalex.org/I4210159731","https://openalex.org/I1294671590“]}]}],”institution_assertions“:[],”countries_distinct_count“:2,”institutions_disting_count”:7,”corresponding_author_ids“:[[],”coresponding_institution_ids”:[]、“apc_list”:null,“apc_payed”:nul,“fwci”:null,“has_fulltext”:“true,”fulltext_origin“:”ngrams“,”“cited_by-count”“:1,”citation_normalized_percentile“:{”“value”:0.4878 573,“is_in_to_1_percent“:false,”is_in_to_10_percent“:false},”cited_by_percentle_year“:{”min“:64,”max“:71},”biblio“:{”volume“:”26“,”issue“:”03“,”first_page“:”1760014“,”last_page“:”1760014“},”is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T11303“,”“display_name”:“贝叶斯网络中的学习和推理”,“score”:0.9755,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T11303“,”“display_name”:“贝叶斯网络中的学习和推理”,“score”:0.9755,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10328“,”display_name“:”供应链中的协调与信息共享“,”score“:0.9702,”subfield“:{”id“:”https://openalex.org/subfields/1404“,”display_name“:”管理信息系统“},”字段“:{”id“:”https://openalex.org/fields/14“,”display_name“:”商业、管理和会计“},”域“:{”id“:”https://openalex.org/domains/2“,”“display_name”:“社会科学”}},{”id“:”https://openalex.org/T10142“,”“display_name”:“软件验证和控制中的形式方法”,“score”:0.9693,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/operator网站“,”display_name“:”运算符(生物学)“,”score“:0.56474864},{”id“:”https://openalex.org/keywords/dynamic-pricing“,”display_name“:”动态定价“,”score“:0.532693},{”id“:”https://openalex.org/keywords/decision-theory网站“,”display_name“:”决策理论“,”score“:0.4259811},{”id“:”https://openalex.org/keywords/value“,”display_name“:”Value(mathematics)“,”score“:0.42336747}],”concepts“:[{”id“:”https://openalex.org/C106189395,“wikidata”:https://www.wikidata.org/wiki/Q176789“,”display_name“:”Markov决策过程“,”level“:3,”score“:0.87952507},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.85309094},{”id“:”https://openalex.org/C177148314,“wikidata”:https://www.wikidata.org/wiki/Q170084“,”display_name“:”Generalization“,”level“:2,”score“:0.72880274},{”id“:”https://openalex.org/C37404715,“wikidata”:https://www.wikidata.org/wiki/Q380679“,”display_name“:”动态编程“,”level“:2,”score“:0.58806807},{”id“:”https://openalex.org/C17020691,“wikidata”:https://www.wikidata.org/wiki/Q139677“,”display_name“:”运算符(生物学)“,”level“:5,”score“:0.56474864},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.5429033},{”id“:”https://openalex.org/C98763669,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov链“,”level“:2,”score“:0.5091669},{”id“:”https://openalex.org/C14646407,“wikidata”:https://www.wikidata.org/wiki/Q1430750“,”display_name“:”Bellman方程“,”level“:2,”score“:0.49619943},{”id“:”https://openalex.org/C159886148,“wikidata”:https://www.wikidata.org/wiki/Q176645“,”display_name“:”Markov过程“,”level“:2,”score“:0.44382593},{”id“:”https://openalex.org/C28901747,“wikidata”:https://www.wikidata.org/wiki/Q177571“,”display_name“:”决策理论“,”level“:2,”score“:0.4259811},{”id“:”https://openalex.org/C2776291640,“wikidata”:https://www.wikidata.org/wiki/Q2912517“,”display_name“:”Value(mathematics)“,”level“:2,”score“:0.42336747},{”id“:”https://openalex.org/C163836022,“wikidata”:https://www.wikidata.org/wiki/Q6771326“,”display_name“:”Markov模型“,”level“:3,”score“:0.42291656},{”id“:”https://openalex.org/C80444323,“wikidata”:https://www.wikidata.org/wiki/Q2878974“,”display_name“:”理论计算机科学“,”level“:1,”score“:0.32976747},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.25902498},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.22335821},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.12406844},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C55493867,“wikidata”:https://www.wikidata.org/wiki/Q7094“,”display_name“:”生物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C158448853,“wikidata”:https://www.wikidata.org/wiki/Q425218“,”display_name“:”Repressor“,”level“:4,”score“:0.0},{”id“:”https://openalex.org/C86339819,“wikidata”:https://www.wikidata.org/wiki/Q407384“,”display_name“:”转录因子“,”level“:3,”score“:0.0},{”id“:”https://openalex.org/C104317684,“wikidata”:https://www.wikidata.org/wiki/Q7187“,”display_name“:”Gene“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:2.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1142/s0218213017600144“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S178780388“,”display_name“:”国际人工智能工具杂志“,”issn_l“:”0218-2130“,”issn“:[”0218-2130“,”1793-6349“],”is_oa“:false,”is_in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310318815“,”host_organization_name“:”World Scientific“,”host_organization _lineage“:[”https://openalex.org/P4310318815“],”host_organization_lineage_names“:[”World Scientific“],“type”:“journal”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://hal.archives-ouvertes.fr/hal-01560264“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306402512“,”display_name“:”HAL(通信科学指导中心)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is-in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I1294671590“,”“host_organization_name”:“国家科学研究中心”,“host_ordanization_lineage”:[“https://openalex.org/I1294671590“],”host_organization_lineage_names“:[”Centre National de la Recherche Scientifique“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:nul,“sustainable_development_goals”:[{“id”:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的机构“,”score“:0.57}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:8,”referrenced_works“:]”https://openalex.org/W1965941457","https://openalex.org/W1997477668","https://openalex.org/W2011592542","https://openalex.org/W2016049811","https://openalex.org/W2043858175","https://openalex.org/W2069918405","https://openalex.org/W2132807882","https://openalex.org/W3165743976“],”related_works“:[”https://openalex.org/W4389475841","https://openalex.org/W4385342861","https://openalex.org/W4285537323","https://openalex.org/W4281791088","https://openalex.org/W4255265352","https://openalex.org/W4239477580","https://openalex.org/W2952594763","https://openalex.org/W2903299703","https://openalex.org/W2117282672","https://openalex.org/W1574958246“],”abstract_inverted_index“:{”Markov“:[0],”decision“:[1],”processs“:[2],”(MDP)“:[3],”have“:[4],”begine“:[5],”one“:[6],”of“:[7,36,46,62112],”the“:[8,54,66,92,97110110117],”standard“:[9,19],”models“:[10],”for“:[11,83],”decisiontheory“:[12],”planning“:[13],”problems““:[14],”under“:[15],”不确定性“:[16],”In“:[17,29106],”its“:[18],”form“:[20],”奖励“:[21,40],”are“:[22],”assumed“:[23],”to“:[24,41,86108],”be“:[25,42,69,87],”numerical“:[26],”additive“:[27],”scalars。“:[28],”this“:[30,37,72],”paper“:[31],”we“:[32115],”propose“:[33],”a“:[34,47100],”generalization“:[35],”model“:[38],”allowing“:[39],”functional。“:[43],”The“:[44],”value“:[45],”history“:[48],”is“:[49],”recursively“:[50],”computed“:[51],”by“:[52119],”combining“:[53],”reward“:55,81],”functions“。“:[56],”We“:[57,74,89],”show“:[58109],”that“:[59],”severy“:[60121],”variants“:[61],”MDP“:[63],”presented“:/64],”in“:[65,71],”literial“:[67],”can“:[68],”installated“:[70],”setting。“:[73],”then“:[75],”identify“:[76],”sufficient“:[77],”conditions“:[78],”on“:[79],”thise“:[80],”functions“:+82],”dynamic“:[84],”programming“:[85],”valid。“:[88],”也“:[90],”讨论“:[91],”无限“:[93],”地平线“:[94],”案例“:[95,98],”和“:[96],”其中“:[99],”最大值“:[101],”运算符“:[102],”does“:[103],”not“:[104],”存在。“:[105],“顺序”:[107],“潜力”:[111],“我们的”:[113],“框架”:[114],“结论”:[116],“论文”:[118],“呈现”:[120],“说明性”:[122],“示例”。“:[123]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2657184275“,”counts_by_year“:[{”年“:2017,”cited_by_count“:1}],”更新日期“:”2024-09-23T18:56:13.373423“,”创建日期“:“2017-06-30”}“