{“id”:“https://openalex.org/W2032950725“,”doi“:”https://doi.org/10.1007/st0994-014-5458-8“,”title“:“基于偏好的强化学习:使用基于偏好的竞赛算法进行进化性直接策略搜索”,”display_name“:”基于偏好的加强学习:使用以偏好为基础的竞赛算法的进化性直接政策搜索“,”publication_year“:2014,”publiation_date“:”2014-07-02“,”ids“:{”openalex“:”https://openalex.org/W2032950725“,”doi“:”https://doi.org/10.1007/st0994-014-5458-8“,”mag“:”2032950725“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/s10994-014-5458-8,“pdf_url”:https://link.springer.com/content/pdf/10.1007%2Fs10994-014-5458-8.pdf“,”源“:{”id“:”https://openalex.org/S62148650“,”display_name“:”机器学习“,”issn_l“:”0885-6125“,”isn“:[”0885-6 125“,“1573-0565”],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”type“:“article”,“type_crossref”:”journal-article“,”indexed_in“:[“crossref”],“open_access”:{“is_oa”:true,“oa_status”:“青铜色,“oa_url”:https://link.springer.com/content/pdf/10.1007%2Fs10994-014-5458-8.pdf“,”any_repository_has_fulltext“:true},”作者身份“:[{”作者位置“:”第一个“,”作者“:{”id“:”https://openalex.org/A5047520070“,”display_name“:”R\u00f3bert Busa\u2010Fekete“,”orcid“:”https://orcid.org/0000-0002-3691-650X},“机构”:[{“id”:https://openalex.org/I161103922“,”display_name“:”马尔堡菲利普斯大学“,”ror“:”https://ror.org/01rdrb571“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I161103922“]}],”国家“:[”DE“],”is_corresponding“:true,”raw_author_name“:”R\u00f3bert Busa-Fekete“,”raw _ afiliation_strings“:[“计算智能小组,德国马尔堡大学数学与计算机科学系”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5048258912“,”display_name“:”Bal\u00e1zs Sz\u00f6r\u00e9nyi“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I4210152167“,”display_name“:”MTA-SZTE人工智能研究小组“,”ror“:”https://ror.org/0507fk326“,”“country_code”“:”HU“,”type“:”facility“,”lineage“:[”https://openalex.org/I227486990","https://openalex.org/I4210152167","https://openalex.org/I7597260“]}],”国家“:[”HU“],”is_corresponding“:false,”raw_author_name“:”Bal\u00e1zs Sz\u00f6r\u00e9nyi“,”raw _affiliation_strings“:[“MTA-SZTE人工智能研究组,Tisza Lajos Krt.103,6720\u00a0,Szeged,Hungary”]},{“author_position”:“middle”,“author”:{“id”https://openalex.org/A5073106112“,”display_name“:”Paul Weng“,”orcid“:”https://orcid.org/0000-0002-2008-4569},“机构”:[{“id”:https://openalex.org/I204730241“,”display_name“:”Universit\u00e9 Paris Cit\u00e8“,”ror“:”https://ror.org/05f82e368“,”country_code“:”FR“,”type“:“教育”,”世系“:[”https://openalex.org/I204730241“]},{”id“:”https://openalex.org/I39804081“,”display_name“:”索邦大学\u00e9“,”ror“:”https://ror.org/02en5vm52“,”country_code“:”FR“,”type“:“教育”,”世系“:[”https://openalex.org/I39804081“]}],”国家“:[”FR“],”is_corresponding“:false,”raw_author_name“:”Paul Weng“,”raw _affiliation_strings“:[“索邦大学\u00e9/s,UPMC巴黎大学06,UMR 7606,LIP6,4 Place Jussieu,75005,\u00a0Paris,France”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5043737358“,”display_name“:”Weiwei Cheng“,”orcid“:”https://orcid.org/0000-0002-3381-4188},“机构”:[{“id”:https://openalex.org/I161103922“,”display_name“:”马尔堡菲利普斯大学“,”ror“:”https://ror.org/01rdrb571“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I161103922“]}],”国家“:[”DE“],”is_corresponding“:false,”raw_author_name“:”Weiwei Cheng“,”raw _affiliation_strings“:[“计算智能小组,德国马尔堡大学数学与计算机科学系”]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5059439673“,”display_name“:”Eyke H\u00fcllermier“,”orcid“:”https://orcid.org/0000-0002-9944-4108},“机构”:[{“id”:https://openalex.org/I161103922“,”display_name“:”马尔堡菲利普斯大学“,”ror“:”https://ror.org/01rdrb571“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I161103922“]}],”国家“:[”DE“],”is_corresponding“:false,”raw_author_name“:”Eyke H\u00fcllermier“,”raw_affiliation_strings“:[“计算智能小组,德国马尔堡大学数学与计算机科学系”]}]“countries_distiction_count”:3,“institutions_disticent_count“:4,”corresponding_author_ids“:]”https://openalex.org/A5047520070“],”对应的机构ID“:[”https://openalex.org/I161103922“],”apc_list“:{”value“:2390,”currency“:”EUR“,”value_usd“:2990,”provenance“:”doaj“},”apc _payed“:”{“value”:2390、”current“:”欧元“,”value_usd”:2990、“provenance”:“doaj”}、“has_fulltext”:true、“fulltext_origin”:“pdf”、“cited_by_count”:27、“citecd_by_percentile_year”:{“min”:93、“max”:94},“biblio”:{“volume”:“97”,“issue”:“3”,“first_page”:“327”,“last_page”:”351“},“is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T1975“,”“display_name”:“遗传编程在机器学习中的应用”,“score”:0.9996,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T1975“,”“display_name”:“遗传编程在机器学习中的应用”,“score”:0.9996,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10848“,”“display_name”:“进化算法中的多目标优化”,“score”:0.9986,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.597688},{”id“:”https://openalex.org/keywords/dep-learning网站“,”display_name“:”深度学习“,”score“:0.529622},{”id“:”https://openalex.org/keywords/symbolic-regression网站“,”display_name“:”符号回归“,”score“:0.519929},{”id“:”https://openalex.org/keywords/semantic-genetic-programming“,”display_name“:”语义遗传编程“,”score“:0.516456},{”id“:”https://openalex.org/keywords/feature-selection(https://openalex.org/keywords/feature-selection)“,”display_name“:”功能选择“,”score“:0.516078}],”concepts“:[{”id“:”https://openalex.org/C184898388,“wikidata”:https://www.wikidata.org/wiki/Q1435712“,”display_name“:”成对比较“,”level“:2,”score“:0.7807478},{”id“:”https://openalex.org/C2781249084,“wikidata”:https://www.wikidata.org/wiki/Q908656“,”display_name“:”首选项“,”级别“:2,”分数“:0.7516581},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.693906},{”id“:”https://openalex.org/C181204326,“wikidata”:https://www.wikidata.org/wiki/Q7239820“,”display_name“:”偏好学习“,”level“:3,”score“:0.5979493},{”id“:”https://openalex.org/C2164484,“wikidata”:https://www.wikidata.org/wiki/Q5170150“,”display_name“:”芯(光纤)“,”level“:2,”score“:0.57554793},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.56009966},{”id“:”https://openalex.org/C159149176,“wikidata”:https://www.wikidata.org/wiki/Q14489129“,”display_name“:”进化算法“,”level“:2,”score“:0.5272022},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.51597387},{”id“:”https://openalex.org/C177264268,“wikidata”:https://www.wikidata.org/wiki/Q1514741“,”display_name“:”Set(abstract data type)“,”level“:2,”score“:0.5082425},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.4671034},{”id“:”https://openalex.org/C41608201,“wikidata”:https://www.wikidata.org/wiki/Q980509“,”display_name“:”Embedding“,”level“:2,”score“:0.4627879},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.39740664},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.37935504},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.2923271},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.093312114},{”id“:”https://openalex.org/C76155785,“wikidata”:https://www.wikidata.org/wiki/Q418“,”display_name“:”Telecommunications“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”Programming language“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:6,”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1007/s10994-014-5458-8,“pdf_url”:https://link.springer.com/content/pdf/10.1007%2Fs10994-014-5458-8.pdf“,”源“:{”id“:”https://openalex.org/S62148650“,”display_name“:”机器学习“,”issn_l“:”0885-6125“,”isn“:[”0885-6 125“,“1573-0565”],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},{“is_oa”:true,“landing_page_url”:“https://hal.inia.fr/hal-01079370,“pdf_url”:https://inria.hal.science/hal-01079370/document(英文),“源”:{“id”:https://openalex.org/S4306402512“,”display_name“:”HAL(通信科学指导中心)“,”issn_l“:null,”issn“:nul,”is_oa“:true,”is-in_doaj“:false,”host_organization“:”https://openalex.org/I1294671590“,”“host_organization_name”:“法国国家科学研究中心”,“host_ordanization_lineage”:[“https://openalex.org/I1294671590“],”host_organization_lineage_names“:[”法国国家科学研究中心“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”https://hal.inia.fr/hal-01079370/document,“pdf_url”:https://hal.inia.fr/hal-01079370/document,“源”:{“id”:https://openalex.org/S4306402512“,”display_name“:”HAL(通信科学指导中心)“,”issn_l“:null,”issn“:nul,”is_oa“:true,”is-in_doaj“:false,”host_organization“:”https://openalex.org/I1294671590“,”“host_organization_name”:“法国国家科学研究中心”,“host_ordanization_lineage”:[“https://openalex.org/I1294671590“],”host_organization_lineage_names“:[”法国国家科学研究中心“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://publicatio.bibl.u-szeged.hu/4795/1/revised_1_5.pdf,“pdf_url”:https://publicatio.bibl.u-szeged.hu/4795/1/revised_1_5.pdf,“源”:{“id”:https://openalex.org/S430640436“,”display_name“:”SZTE Publicatio Repozit\u00f3rium(瑞典大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I227486990“,”“host_organization_name”:“塞格德大学”,“host_organization_lineage”:[“https://openalex.org/I227486990“],”host_organization_lineage_names“:[”塞格德大学“],”type“:”repository“},”license“:null,”license_id“:null,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”https://inria.hal.science/hal-01079370/file/revised_1_1.pdf,“pdf_url”:https://inria.hal.science/hal-01079370/file/revised_1_1.pdf,“源”:{“id”:https://openalex.org/S4306402512“,”display_name“:”HAL(通信科学指导中心)“,”issn_l“:null,”issn“:nul,”is_oa“:true,”is-in_doaj“:false,”host_organization“:”https://openalex.org/I1294671590“,”“host_organization_name”:“法国国家科学研究中心”,“host_ordanization_lineage”:[“https://openalex.org/I1294671590“],”host_organization_lineage_names“:[”法国国家科学研究中心“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:true,“landing_page_url”:“https://hal.inia.fr/hal-01079370/file/revised_1_1.pdf,“pdf_url”:https://hal.inia.fr/hal-01079370/file/revised_1_1.pdf,“源”:{“id”:https://openalex.org/S4306402512“,”display_name“:”HAL(通信科学指导中心)“,”issn_l“:null,”issn“:nul,”is_oa“:true,”is-in_doaj“:false,”host_organization“:”https://openalex.org/I1294671590“,”“host_organization_name”:“法国国家科学研究中心”,“host_ordanization_lineage”:[“https://openalex.org/I1294671590“],”host_organization_lineage_names“:[”法国国家科学研究中心“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.1007/s10994-014-5458-8,“pdf_url”:https://link.springer.com/content/pdf/10.1007%2Fs10994-014-5458-8.pdf“,”源“:{”id“:”https://openalex.org/S62148650“,”display_name“:”机器学习“,”issn_l“:”0885-6125“,”isn“:[”0885-6 125“,“1573-0565”],”is_oa“:false,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/P4310318900“,”“host_organization_name”:“Springer Science+Business Media”,“host_organization_lineage”:[“https://openalex.org/P431031965","https://openalex.org/P4310318900“],”host_organization_lineage_names“:[”Springer Nature“,”Springer-Science+Business Media“],“type”:“journal”},“license”:null,“licence_id”:nul,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},”sustainable_development_goals“:[{”score“:0.51,”id“:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的机构“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:27,”refernced_works“:[”https://openalex.org/W122021961","https://openalex.org/W1484675474","https://openalex.org/W1576660662","https://openalex.org/W1583155004","https://openalex.org/W1583953806","https://openalex.org/W1585839838","https://openalex.org/W1605438009","https://openalex.org/W1861050369","https://openalex.org/W1965281372","https://openalex.org/W1977326596网址","https://openalex.org/W1999874108","https://openalex.org/W2012367441","https://openalex.org/W2027907186","https://openalex.org/W2044493620","https://openalex.org/W2057785395","https://openalex.org/W2059654640","https://openalex.org/W2066251678","https://openalex.org/W2097452095","https://openalex.org/W2129297552","https://openalex.org/W2154023516","https://openalex.org/W2156682402","https://openalex.org/W2168405694","https://openalex.org/W2315464424","https://openalex.org/W233478222","https://openalex.org/W2797333853","https://openalex.org/W4211221179","https://openalex.org/W4233413206“],”related_works“:[”https://openalex.org/W4389072749","https://openalex.org/W4324116389","https://openalex.org/W4206238124","https://openalex.org/W3126212998","https://openalex.org/W3105737538","https://openalex.org/W2516425091","https://openalex.org/W2161073979","https://openalex.org/W2060303324","https://openalex.org/W1968265719","https://openalex.org/W1515481220“],”ngrams_url“:”https://api.openalex.org/works/W2032950725/ngrams“,”“abstract_inverted_index”:{“We”:[0],“introduce”:[1],“a”:[2,10,14,29,38,54,75101],“novel”:[3],“approach”:[4,27115],“to”:[5],“preference-based”:[6,11,30],“reinforction”:[7],“learning”:[8],“即”:[9],“variant”:[12],“of”:[13,25,41,67,84,89],“direct”:[15],“policy”:[16],“搜索”:[17,78],“方法”:[18],“基于”:[19],“on”:[20,53],“进化“:[21,77],”优化。“:[22],”The“:[23],”core“:[24],”our“:[26114],”is“:[28],”racing“:[31,72],”algorithm“:[32,51,73],”that“:[33,82113],”selects“:[34],”The“:[35,50,68,71,85],”best“:[36],”from“:[37],”givent“:[39],”set“:[40,88],”candidated“:[42],”policies“:[43,91],”with“:[44,95],“高”:[45],“概率。“:[46],“收件人”:[47],“此”:[48],“结束”:[49],“操作”:[52],“合适”:[55],“序号”:[56],“首选项”:[57],“结构”:[58],“和”:[59104],“仅”:[60],“使用”:[61],“成对”:[62],“比较”:[63],“介于”:[64],“示例”:[65],“卷展栏”:[66],“策略”。“:[69],“嵌入”:[70],“in”:[74118],“基于等级”:[76],“过程”,:[79],“我们”:[80107],“显示”:[81],“近似值”:[83],“所谓的”:[86],“史密斯”:[87],“最佳”:[90],“可以”:[92],“是”:[93],“生产”:[94],“确定”:[96],“理论”:[97],“保证”。“:[98],“分开”:[99],“来自”:[100],“正式”:[102],“表现”:[103],“复杂性”:[105],“分析”:[106],“现在”:[108],“第一”:[109],“实验”:[110],“研究”:[111],“显示”:[112],“执行”:[116],“好”:[117],“实践”。“:[119]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2032950725“,”counts_by_year“:[{”year“:2024,”cited_by_count“:1},{”year“:2023,”cited_by_count”:3},”{“year”:2022,”citecd_by_count“:3{,”年“:2021,”citesd_by_count“:4},“year“:2020,”citted_by-count“:5},“年份”:2017,“引用_by_count”:2},{“年份”:2016,“引用_ by_counts”:1},}“年份“:2015,“引用的by_count:1},{“年份”:2014,“引用_ by_count”:1},{”年份“:2013,”引用_ by-count“:1}],”更新日期“:“2024-05-25T20:38:52.475647”,“创建日期”:“2016-06-24”}