{“id”:“https://openalex.org/W4372233826“,”doi“:”https://doi.org/10.1016/j.neucom.2023.126291“,”title“:“非线性动态系统的在线强化学习控制:基于状态-动作值函数的解决方案”,”display_name“:”非线性动力学系统的在线增强学习控制:一种基于状态-行动值函数的解决方案“,”publication_year“:2023,”publitation_date“:”2023-05-05“,”ids“:{”openalex“:”https://openalex.org/W4372233826“,”doi“:”https://doi.org/10.1016/j.neucom.2023.126291“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1016/j.neucom.2023.126291“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S45693802“,”display_name“:”Neurocomputing“,”issn_l“:”0925-2312“,”isn“:[”0925-2312“,”1872-8286“],”is_oa“:false,”is_ in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310320990“,”host_organization_name“:”爱思唯尔BV“,”host_organization_lineage“:[”https://openalex.org/P4310320990“],”host_organization_lineage_names“:[”Elsevier BV“],“type”:“journal”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false},”type“:”article“,”type_crossref“:“jornal-article”,“indexed_in”:[”crossref“],pository_has_fulltext“:false},”authorships“:[{”author_position“:”first“,”author“:{”id“:”https://openalex.org/A5083543090“,”display_name“:”Hamed Jabbari Asl“,”orcid“:”https://orcid.org/0000-0002-3040-8539},“机构”:[{“id”:https://openalex.org/I128277893“,”display_name“:”Bah\u00e7e\u015fehir University“,”ror“:”https://ror.org/00yze4d93“,”country_code“:”TR“,”type“:“教育”,”世系“:[”https://openalex.org/I128277893“]}],”国家“:[”TR“],”is_corresponding“:true,”raw_author_name“:”Hamed Jabbari Asl“,”raw _affiliation_strings“:[“ATR计算神经科学实验室脑机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,Kyoto 619-0288,日本”,“土耳其伊斯坦布尔Bahcesehir大学机电工程系工程与自然科学学院“],“affiliations”:[{“raw_affiliation_string”:“土耳其伊斯坦堡Bahcese hir大学机械电子工程系工程和自然科学学院”,“institution_ids”:[“https://openalex.org/I128277893“]},{”raw_affiliation_string“:”ATR计算神经科学实验室脑-机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,Kyoto 619-0288,日本“,”institution_ids“:[]}]}“,{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5031054137“,”display_name“:”Eiji Uchibe“,”orcid“:”https://orcid.org/0000-0001-7908-0258“},”机构“:[],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”内知英二“,”raw _ afiliation_strings“:[“ATR计算神经科学实验室脑-机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,Kyoto 619-0288,Japan”],“afliations”:[{“raw_affiliation_strong”:“”ATR计算神经科学实验室脑机器人接口部,2-2-2 Hikaridai,Seikacho,Soraku-gun,京都619-0288,日本https://openalex.org/A5083543900“],”对应的机构ID“:[”https://openalex.org/I128277893“],”apc_list“:{”value“:2470,”currency“:”USD“,”value_USD“:2480,”provenance“:”doaj“},”apc _pay“:null,”fwci“:1.12,”has_fulltext“:false,”cited_by_count“:2,”citation_normalized_percentile“:{”value:0.999884,”is_in_top_1_percent“:true,”is_ in_top_ 10_percennt“:true},“cited_by_percentile_year”:{“min”:82,“max”:87},“biblio”:{“volume”:“544”,“issue”:nullfirst_page“:”126291“,”last_page“:”26291“},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T12794“,”display_name“:”最优控制的自适应动态规划“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T12794“,”display_name“:”最优控制的自适应动态规划“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10040“,”“display_name”:“机器人控制与稳定技术”,“score”:0.9798,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T14083“,”“display_name”:“动态系统中的极值搜索控制”,“score”:0.9721,“subfield”:{“id”:“https://openalex.org/subfields/2207“,”display_name“:”控制与系统工程“},”字段“:{”id“:”https://openalex.org/fields/22“,”display_name“:”Engineering“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.592664},{”id“:”https://openalex.org/keywords/非线性控制“,”display_name“:”非线性控制“,”score“:0.578398},{”id“:”https://openalex.org/keywords/optimal-control(https://openalex.org/关键词/最优控制)“,”display_name“:”最优控制“,”score“:0.5651},{”id“:”https://openalex.org/keywords/adaptive-control网站“,”display_name“:”自适应控制“,”score“:0.54679},{”id“:”https://openalex.org/keywords/real-time-optimization(https://openalex.org/keywords/real-time-optimization)“,”display_name“:”实时优化“,”score“:0.546599}],”concepts“:[{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.77982444},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6586847},{”id“:”https://openalex.org/C47446073,“wikidata”:https://www.wikidata.org/wiki/Q5165890“,”display_name“:”控制理论(社会学)“,”level“:3,”score“:0.63762283},{”id“:”https://openalex.org/C154504017,“wikidata”:https://www.wikidata.org/wiki/Q853614“,”display_name“:”标识符“,”级别“:2,”分数“:0.606136},{”id“:”https://openalex.org/C158622935,“wikidata”:https://www.wikidata.org/wiki/Q660848“,”display_name“:”非线性系统“,”level“:2,”score“:0.5553104},{”id“:”https://openalex.org/C14646407,“wikidata”:https://www.wikidata.org/wiki/Q1430750“,”display_name“:”Bellman equation“,”level“:2,”score“:0.5509247},{”id“:”https://openalex.org/C2777303404,“wikidata”:https://www.wikidata.org/wiki/Q759757“,”display_name“:”Convergence(economics)“,”level“:2,”score“:0.53491837},{”id“:”https://openalex.org/C91575142,“wikidata”:https://www.wikidata.org/wiki/Q1971426“,”display_name“:”最优控制“,”level“:2,”score“:0.5275357},{”id“:”https://openalex.org/C60640748,“wikidata”:https://www.wikidata.org/wiki/Q2337858“,”display_name“:”Lyapunov函数“,”level“:3,”score“:0.52217174},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.48287943},{”id“:”https://openalex.org/C203479927,“wikidata”:https://www.wikidata.org/wiki/Q5165939“,”display_name“:”控制器(灌溉)“,”level“:2,”score“:0.48129},{”id“:”https://openalex.org/C13662910,“wikidata”:https://www.wikidata.org/wiki/Q193139“,”display_name“:”Trajectory“,”level“:2,”score“:0.4722668},{”id“:”https://openalex.org/C14036430网址,“wikidata”:https://www.wikidata.org/wiki/Q3736076“,”display_name“:”功能(生物学)“,”级别“:2,”分数“:0.42883408},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.2944497},{”id“:”https://openalex.org/C2775924081,“wikidata”:https://www.wikidata.org/wiki/Q55608371“,”display_name“:”Control(management)“,”level“:2,”score“:0.2593661},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.117409945},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”生物学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C78458016,“wikidata”:https://www.wikidata.org/wiki/Q840400“,”display_name“:”进化生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C1276947,“wikidata”:https://www.wikidata.org/wiki/Q333“,”display_name“:”天文学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C6557445,“wikidata”:https://www.wikidata.org/wiki/Q173113“,”display_name“:”农学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C50522688,“wikidata”:https://www.wikidata.org/wiki/Q189833“,”display_name“:”经济增长“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1016/j.neucom.2023.126291“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S45693802“,”display_name“:”Neurocomputing“,”issn_l“:”0925-2312“,”isn“:[”0925-2312“,”1872-8286“],”is_oa“:false,”is_ in_doaj“:false,”is_core“:true,”host_organization“:”https://openalex.org/P4310320990“,”host_organization_name“:”爱思唯尔BV“,”host_organization_lineage“:[”https://openalex.org/P4310320990“],”host_organization_lineage_names“:[”Elsevier BV“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:null,“sustainable_development_goals”:[{“score”:0.55,“display_name”:“和平、正义和强大的制度”,“id”:“https://metadata.un.org/sdg/16“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:31,”referrenced_works“:【”https://openalex.org/W1542432808","https://openalex.org/W1606119439","https://openalex.org/W1854776945","https://openalex.org/W1968908471","https://openalex.org/W1977671496","https://openalex.org/W1981174120","https://openalex.org/W1983523797","https://openalex.org/W1998173386","https://openalex.org/W2010152647","https://openalex.org/W2011694027","https://openalex.org/W2013184330","https://openalex.org/W2085194340","https://openalex.org/W2104843094","https://openalex.org/W2131030156","https://openalex.org/W2136064843","https://openalex.org/W2146014298","https://openalex.org/W2152161277","https://openalex.org/W2184126965","https://openalex.org/W2478039428","https://openalex.org/W2528940545","https://openalex.org/W2564717627","https://openalex.org/W2777247237","https://openalex.org/W2943141190","https://openalex.org/W3215095098","https://openalex.org/W4210935577","https://openalex.org/W4214691950","https://openalex.org/W4238093859","https://openalex.org/W4239705272","https://openalex.org/W4285175029","https://openalex.org/W4285505520","https://openalex.org/W644929910“],”related_works“:[”https://openalex.org/W4384825839","https://openalex.org/W4372294702","https://openalex.org/W4313123734","https://openalex.org/W4239477580","https://openalex.org/W2907195160","https://openalex.org/W2787184676","https://openalex.org/W2507513082","https://openalex.org/W2156232164","https://openalex.org/W1990582753","https://openalex.org/W1971360108“],”abstract_inverted_index“:{”In“:[0109],”this“:[1],”paper“:[2],”we“:[3],”present“:[4],”an“:[5],”online“:[6],”reinforction“:[7],”learning-based“:[8],”solution“:[9],”to“:[10,44,69,79,98135],”the“:[11,34,62,65,71,81,92102111116142145],”optimal“:[12,83106],”control“:[13147],“问题”:[14],“的”:[15,31,33,64119144],“连续时间”:[16],“非线性“:[17],”输入仿射“:[18],”系统。“:[19129],”The“:[20,40,54,85],”proposed“:[21],”approach“:[22,87],”contains“:[23],”a“:[24,46],”concurrent“:[25],”identifier“:[26,41],”that“:[27],”estimaties“:[28],”time“:[2],”derivatives“:[30],”states“:[32],”system“:35,66],”in“:[36,50105127],”some“:[37,51],”任意“:[38],“点。“:[39,53],”is“:[42,76,96123],”used“:[43],”simulate“:[45],”所谓的“:[47],”Bellman“:[48113],”error“:[49],”unvisited“:[52],”simulated“:[55112],”errors“:[56,59114],”together“:[57],”with“:[58],”获得“:[60],”along“:[61],”trajection“:[63],”are“:[67],”used“:[68],”估计“:[70],”状态操作“:[72],”值“:[73],”函数“:[74],”其中“:[75,95122],”则“:[77],”采用“:[78],”推导“:[80136],”估计“:[82],”控制器。“:[84],“设计”:[86],“做”:[88],“不”:[89],“明确”:[90],“要求”:[91],“输入”:[93],“动态”:[94],“硬”:[97],“隔离”:[99],“它”:[100],“来自”:[101],“漂移”:[103],“动力学”:[104],“监管”:[107],“问题”。“:[108],”addition,“:[110],”relax“:[115],”confining“:[117],”persistence“:[118],”excision“:[120],”条件,“:121],”needed“:[124],”for“:[125],”收敛“:[126137],”确定性“:[128],”A“:[130],”Lyapunov-based“:[131],”分析“:[132],”was“:[133],”执行“:[134],”个条件。“:[138],”模拟“:[139],”研究“:[140],”演示“:[141],”有效性“:[143],”开发“:[146],”方案。“:[148]},”cited_by_api_url“:”https://api.openalex.org/works?filter=引用:W4372233826“,”counts_by_year“:[{”年份“:2024,”cited_by_count“:1},{”年“:2023,”cited_by_count”:1}],”更新日期“:”2024-09-24T18:06:13.117497“,”创建日期“:“2023-05-07”}