{“id”:“https://openalex.org/W4296963693“,”doi“:”https://doi.org/10.1007/978-3-031-17108-6_12“,”title“:”Training Agents to Satisfy Timed and Untimed Signal Temporal Logic Specifications with Reinforcement Learning“训练代理通过强化学习满足定时和非定时信号时序逻辑规范”,“display_name”:“训练代理使用强化学习满足时间和非时间信号时序逻辑规范”,“publication_year”:2022,“publiction_date”:“2022-01-01”,“ids”:{“openalex”:“https://openalex.org/W4296963693“,”doi“:”https://doi.org/10.1007/978-3-031-17108-6_12“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1007/978-3-031-17108-6_12“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“book-series”},“license”:null,“licence_id”:nul,“version”:null,“is_accepted”:false,“is_published”:false},”type“:”book-chapter“,”type_crossref“:“book-chapter”,”indexed_in“:[“crossref”],”open_access“:{”is_oa“:false”“,”oa_url“:空,”any_repository_has_fulltext“:false},”作者身份“:[{”作者位置“:”第一个“,”作者“:{”id“:”https://openalex.org/A5062691664“,”display_name“:”Nathaniel Hamilton“,”orcid“:”https://orcid.org/0000-0002-7147-1964},“机构”:[{“id”:https://openalex.org/I200719446“,”display_name“:”范德比尔特大学“,”ror“:”https://ror.org/02vm5rt34“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I200719446“]}],”国家“:[”美国“],”is_corresponding“:true,”raw_author_name“:”纳撒尼尔·汉密尔顿“,”raw_affiation_strings“:[”范德比尔特大学,田纳西州纳什维尔,37212,美国“],”附属机构“:[{”raw_affiation_string“:”范德比尔特大学,田纳西州纳什维尔,37212,美国“,”institution_ids“:[”https://openalex.org/I200719446“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5028566361“,”display_name“:”Preston K.Robinette“,”orcid“:”https://orcid.org/0000-0002-4906-2179},“机构”:[{“id”:https://openalex.org/I200719446“,”display_name“:”范德比尔特大学“,”ror“:”https://ror.org/02vm5rt34“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I200719446“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”Preston K Robinette“,”raw _ afiliation_strings“:[“范德比尔特大学,田纳西州纳什维尔,37212,美国”],”affiliations“:[{”raw _affiliation_string“:”范德比特大学,田纳州纳什维尔,37211,美国“,”institution_ids“:[https://openalex.org/I200719446“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5067901159“,”display_name“:”Taylor T.Johnson“,”orcid“:”https://orcid.org/0000-0001-8021-9923},“机构”:[{“id”:https://openalex.org/I200719446“,”display_name“:”范德比尔特大学“,”ror“:”https://ror.org/02vm5rt34“,”country_code“:”US“,”type“:“教育”,”世系“:[”https://openalex.org/I200719446“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”Taylor T Johnson“,”raw _affiliation_strings“:[“范德比尔特大学,田纳西州纳什维尔,37212,美国”],”affiliations“:[{”raw _affiliation_string“:”范德比特大学,田纳州纳什威尔,37212,美国“,”institution_ids“:[https://openalex.org/I200719446“]}]}],”countries_disticont_count“:1,”institutions_disticent_count”:1,“corresponding_author_ids”:[“https://openalex.org/A5062691664“],”对应的机构ID“:[”https://openalex.org/I200719446“],”apc_list“:{”value“:5000,”currency“:”EUR“,”value_usd“:5392,”provenance“:”doaj“},”apc _payed“:null,”fwci“:1.4,”has_fulltext“:false,”cited_by_count“:1,”cited_by_percentile_year“:{”min“:66,”max“:76},“biblio”:{“volume”:null、“issue”:null,“first_page”:“190”,“last_page”:“206”},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:https://openalex.org/T10142“,”“display_name”:“软件验证和控制中的形式方法”,“score”:0.998,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10142“,”“display_name”:“软件验证和控制中的形式方法”,“score”:0.998,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9922,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12072“,”“display_name”:“机器学习研究中的主动学习”,“score”:0.9823,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.604134},{”id“:”https://openalex.org/keywords/temoral-logic网站“,”display_name“:”时态逻辑“,”score“:0.557968},{”id“:”https://openalex.org/keywords/active-learning网站“,”display_name“:”主动学习“,”score“:0.527951},{”id“:”https://openalex.org/keywords/runtime验证“,”display_name“:”Runtime Verification“,”score“:0.518934},{”id“:”https://openalex.org/keywords/semi-supervised-learning网站“,”display_name“:”半监督学习“,”score“:0.515565}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.889702},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.8723682},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.6883741},{”id“:”https://openalex.org/C14036430网址,“wikidata”:https://www.wikidata.org/wiki/Q3736076“,”display_name“:”功能(生物学)“,”级别“:2,”分数“:0.6026331},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.54879534},{”id“:”https://openalex.org/C2779662365,“wikidata”:https://www.wikidata.org/wiki/Q5416694“,”display_name“:”Event(particle physics)“,”level“:2,”score“:0.51959014},{”id“:”https://openalex.org/C2779843651,“wikidata”:https://www.wikidata.org/wiki/Q7390335“,”display_name“:”SIGNAL(编程语言)“,”level“:2,”score“:0.42138672},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.38404053},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.17319217},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C187736073,“wikidata”:https://www.wikidata.org/wiki/Q2920921“,”display_name“:”Management“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C78458016,“wikidata”:https://www.wikidata.org/wiki/Q840400“,”display_name“:”进化生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”Biology“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1007/978-3-031-17108-6_12“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S106296714“,”display_name“:”计算机科学讲义“,”issn_l“:”0302-9743“,”isn“:[”0302-7743“、”1611-3349“],”is_oa“:false、”is_in_doaj“:false、”is_core“:true、”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“book-series”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:nul,“sustainable_development_goals”:[],“grants”:[],“dataset”:[]],“versions”:[】,“referenced_works_count”:17,“referenced_works“:[”https://openalex.org/W1499669280","https://openalex.org/W1547304883","https://openalex.org/W166862392","https://openalex.org/W2091565802","https://openalex.org/W2145339207","https://openalex.org/W2257979135","https://openalex.org/W2524638160","https://openalex.org/W2567705466","https://openalex.org/W2966537673","https://openalex.org/W2982316857","https://openalex.org/W3004091789","https://openalex.org/W3017464978","https://openalex.org/W3096990961","https://openalex.org/W3164005523","https://openalex.org/W32403112","https://openalex.org/W4210870706","https://openalex.org/W4281757468“],”related_works“:[”https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W2586732548","https://openalex.org/W2138720691","https://openalex.org/W20361778","https://openalex.org/W2031695474","https://openalex.org/W2024136090“],”ngrams_url“:”https://api.openalex.org/works/W4296963693/ngrams“,”“abstract_inverted_index”:{“强化”:[0],“学习”:[1],“(RL)”:[2],“依赖”:[3],“批判性”:[4],“on”:[5],“如何”:[6126],“奖励”:[7,42,60,83111],“函数”:[8,43],“是”:[9,18,44],“设计”:[10],“到”:[11,20,57,64,85,90131135143147],“捕获”:[12],“预期”:[13],“行为”:[14,68,93],“然而”:[15],“传统”:[16140],“方法“:[17141],”无法“:[19],”表示“:[21,38],”暂时“:[22,39],”行为“:[23,40],”这样“:[24],”作为“:[25117],”做“:[26],”任务“:[27,31],”1“:[28],”之前“:[29],“正在做”:[30],”2.“:[32],”In“:[33,69121],”the“:[34,59,66,72,78,87118150],“事件”:[35],“他们”:[36],“可以”:[37128],“这些”:[41,70],“手工制作”:[45],“作者”:[46],“研究人员”:[47],“和”:[48,5106142],“经常”:[49],“需要”:[50],“长”:[51],“小时”:[52],“的”:[53],“试验”:[54],“错误”:[56],“形状”:[58],“功能”:[61,84],“只是”:[62],“正确”:[63],“得到”:[65],“所需”:[67,73],“案例”:[71],“行为”:[74146],“是”:[75,80],“已经”:[76],“已知”:[77],“问题”:[79],“生成”:[81],“a”:[82110],“列车”:[86132],“RL”:[88133],“代理”:[89],“满足”:[91136],“that”:[92],“To”:[94],“address”:[95],“this”:[96122],“issue”,:[97],“we”:[C8124],“present”:[99],“our”:[100],“approach”:%101],“for”:[102],“automatically”:[103],“converting”:/104],“timed”:[105],“untimeed”:[107],“specifications”:[108137],“into”:[109],“函数”:[112],“其中”:[113],“有”:[114],“曾经”:[115],“实现”:[116],“工具”:[119],“STLGym.”:[120],“工作”,:[123],“显示”:[125],“ST LGym”:[127],“被”:[129],“使用”:[130],“代理”:[134],“更好”:[138148],“比”:[139],“精炼”:[144],“学习”:[145],“匹配”:[149],“规范。”:[151]},“引用_by_api_url”:“https://api.openalex.org/works?filter=cites:W4296963693“,”counts_by_year“:[{”年“:2023,”引用_by_count“:1}],”更新日期“:”2024-06-28T02:50:27.007945“,”创建日期“:“2022-09-25”}