{“id”:“https://openalex.org/W2580338731“,”doi“:”https://doi.org/10.3389/fnbot.2017.00001“,”title“:“自适应基线增强了基于EM的策略搜索:在智能手机平衡器的基于视图的定位任务中进行验证”,“display_name”:“自适应基准增强了基于EM的策略检索:在智能电话平衡器的以视图为基础的定位任务上进行验证”、“publication_year”:2017,“publication_date”:“2017-01-23”,“ids”:{“openalex”:“https://openalex.org/W2580338731“,”doi“:”https://doi.org/10.3389/fnbot.2017.00001“,”mag“:”2580338731“,”pmid“:”https://pubmed.ncbi.nlm.nih.gov/28167910“,”pmcid“:”https://www.ncbi.nlm.nih.gov/pmc/articles/5256123网址“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.3389/fnbot.2017.00001,“pdf_url”:https://www.frontiersin.org/articles/10.3389/fnbot.2017.00001/pdf,“源”:{“id”:https://openalex.org/S115606517“,”“display_name”“:”神经机器人学的前沿“,”issn_l“:”1662-5218“,”isn“:[”1662-51218“],”is_oa“:true,”is_in_doaj“:true,”host_organization“:”https://openalex.org/P4310320527“,”host_organization_name“:”Frontiers Media“,”host_organization_lineage“:[”https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“journal-article”,”indexed_in“:[”crossref“,”publimed“],”open_access“:{”is_oa“:true,”oa_status“:”gold“,”oa_url“:”https://www.frontiersin.org/articles/10.3389/fnbot.2017.00001/pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5002996776“,”display_name“:”王洁欣“,”orcid“:null},”机构“:[{”id“:”https://openalex.org/I22299242“,”display_name“:”京都大学“,”ror“:”https://ror.org/02kpeqv85“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I22299242“]},{”id“:”https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:true,”raw_author_name“:”Jiexin Wang“,”raw _affiliation_strings“:[“日本京都京都大学信息学研究生院系统科学系综合系统生物学实验室”,“冲绳科学技术研究生院神经计算室,日本冲绳县Onna-son“]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5031054137“,”display_name“:”Eiji Uchibe“,”orcid“:”https://orcid.org/0000-0001-7908-0258“},”机构“:[{”id“:”https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]},{”id“:”https://openalex.org/I4210104143“,”display_name“:”Advanced Telecommunications Research Institute International“,”ror“:”https://ror.org/01pe1d703“,”“country_code”“:”JP“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210104143“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Eiji Uchibe“,”raw _affiliation_strings“:[“日本京都Soraku-gun ATR计算神经科学实验室脑-机器人接口系”,“日本冲绳岛Onna-son冲绳科技研究生院神经计算室”]},{“author_position“:”last“,”author“:{”id“:”https://openalex.org/A5004840638“,”display_name“:”Kenji Doya“,”orcid“:”https://orcid.org/0000-0002-2446-6820“},”机构“:[{”id“:”https://openalex.org/I142637625“,”display_name“:”冲绳理工大学研究生院“,”ror“:”https://ror.org/02qg15b79“,”country_code“:”JP“,”type“:“教育”,”世系“:[”https://openalex.org/I142637625“]}],”国家“:[”JP“],”is_corresponding“:false,”raw_author_name“:”Kenji Doya“,”raw _affiliation_strings“:[“日本冲绳岛Onna-son冲绳科学技术研究生院神经计算部”]}],”countries_disticont_count“:1,”institutions_disticent_count”:3,“corresponding_author_ids”:[“”https://openalex.org/A5002996776“],”对应的机构ID“:[”https://openalex.org/I22299242","https://openalex.org/I142637625“],”apc_list“:{”value“:2950,”currency“:”USD“,”value_USD“:2960,”provenance“:”doaj“},”apc _payed“:”{“value”:2950、”currentary“:”美元“,”value_USD”:2960、“provenance”:“doaj”}、“has_fulltext”:true、“fulltext_origin”:“pdf”、“cited_by_count”:4、“citecd_by_percentile_year”:{“min”:81、“max”:82},“biblio”:{“volume”:“11”,“issue”:null,“first_page”:null,“last_page”:null},“is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9942,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10462“,”display_name“:”强化学习算法“,”score“:0.9942,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12072“,”“display_name”:“机器学习研究中的主动学习”,“score”:0.9844,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9613,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/policy-gradient网站“,”display_name“:”策略渐变“,”score“:0.535271},{”id“:”https://openalex.org/keywords/reinforcement-learning网站“,”display_name“:”强化学习“,”score“:0.525145},{”id“:”https://openalex.org/keywords/semi-supervised-learning网站“,”display_name“:”半监督学习“,”score“:0.505029},{”id“:”https://openalex.org/keywords/named-entity-recognition网站“,”display_name“:”命名实体识别“,”score“:0.502836}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.80165017},{”id“:”https://openalex.org/C12725497,“wikidata”:https://www.wikidata.org/wiki/Q810247“,”display_name“:”基线(sea)“,”级别“:2,”分数“:0.7591865},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.57423574},{”id“:”https://openalex.org/C185798385,“wikidata”:https://www.wikidata.org/wiki/Q1161707“,”display_name“:”基准(测量)“,”level“:2,”score“:0.56475425},{”id“:”https://openalex.org/C2776330181,“wikidata”:https://www.wikidata.org/wiki/Q18358244“,”display_name“:”Maximization“,”level“:2,”score“:0.52863634},{”id“:”https://openalex.org/C90509273,“wikidata”:https://www.wikidata.org/wiki/Q11012“,”display_name“:”Robot“,”level“:2,”score“:0.46712926},{”id“:”https://openalex.org/C183115368,“wikidata”:https://www.wikidata.org/wiki/Q856577“,”display_name“:”Weighting“,”level“:2,”score“:0.45738026},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.42776787},{”id“:”https://openalex.org/C192921069,“wikidata”:https://www.wikidata.org/wiki/Q550134“,”display_name“:”倒立摆“,”level“:3,”score“:0.42560196},{”id“:”https://openalex.org/C8642999,“wikidata”:https://www.wikidata.org/wiki/Q417168“,”display_name“:”Hyperparameter“,”level“:2,”score“:0.42055985},{”id“:”https://openalex.org/C126255220,“wikidata”:https://www.wikidata.org/wiki/Q141495“,”display_name“:”数学优化“,”level“:1,”score“:0.20065647},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.09389159},{”id“:”https://openalex.org/C11368507,“wikidata”:https://www.wikidata.org/wiki/Q43518“,”display_name“:”Oceanography“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C187736073,“wikidata”:https://www.wikidata.org/wiki/Q2920921“,”display_name“:”管理“,”级别“:1,”分数“:0.0},{”id“:”https://openalex.org/C13280743,“wikidata”:https://www.wikidata.org/wiki/Q131089网址“,”display_name“:”大地测量“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C158622935,“wikidata”:https://www.wikidata.org/wiki/Q660848“,”display_name“:”非线性系统“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C205649164,“wikidata”:https://www.wikidata.org/wiki/Q1071“,”display_name“:”地理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C127313418,“wikidata”:https://www.wikidata.org/wiki/Q1069“,”display_name“:”地质“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C71924100,“wikidata”:https://www.wikidata.org/wiki/Q11190“,”display_name“:”Medicine“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C126838900,“wikidata”:https://www.wikidata.org/wiki/Q77604“,”display_name“:”放射学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:6,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.3389/fnbot.2017.00001,“pdf_url”:https://www.frontiersin.org/articles/10.3389/fnbot.2017.00001/pdf,“源”:{“id”:https://openalex.org/S115606517“,”“display_name”“:”神经机器人学的前沿“,”issn_l“:”1662-5218“,”isn“:[”1662-51218“],”is_oa“:true,”is_in_doaj“:true,”host_organization“:”https://openalex.org/P4310320527“,”“host_organization_name”:“Frontiers Media”,“host_organization_lineage”:[“https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://europepmc.org/articles/pmc5256123,“pdf_url”:https://europepmc.org/articles/pmc5256123?pdf=render,“源”:{“id”:https://openalex.org/S4306400806“,”display_name“:”Europe PMC(PubMed Central)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I1303153112“,”“host_organization_name”:“欧洲生物信息学研究所”,“host_organization_lineage”:[“https://openalex.org/I1303153112“],”host_organization_lineage_names“:[”欧洲生物信息学研究所“],”type“:”repository“},”license“:”抄送人“,”license_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://oist.repo.nii.ac.jp/?action=repository_action_common_download&item_id=210&item_no=1&attribute_id=22&file_no=1,“pdf_url”:https://oist.repo.nii.ac.jp/?action=repository_action_common_download&item_id=210&item_no=1&attribute_id=22&file_no=1,“源”:{“id”:https://openalex.org/S4306402452“,”“display_name”:“冲绳科学技术研究生院(冲绳理工研究生院)”,“issn_l”:null,“issn”:nul,“is_oa”:true,“is_ in_doaj”:false,“host_organization”:“https://openalex.org/I142637625“,”“host_organization_name”:“冲绳理工大学研究生院”,“host_ordanization_lineage”:[“https://openalex.org/I142637625“],”host_organization_lineage_names“:[”冲绳理工大学研究生院“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”http://hdl.handle.net/2433/218530,“pdf_url”:https://repository.kulib.kyoto-u.ac.jp/dspace/bitstream/2433/218530/1/fnbot.2017.00001.pdf,“源”:{“id”:https://openalex.org/S4306401454“,”display_name“:”京都大学研究信息库(京都大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I22299242“,”“host_organization_name”:“京都大学”,“host_ordanization_lineage”:[“https://openalex.org/I22299242“],”host_organization_lineage_names“:[”京都大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5256123“,”pdf_url“:null,”source“:{”id“:”https://openalex.org/S2764455111“,”display_name“:”PubMed Central“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I1299303238“,”“host_organization_name”:“美国国立卫生研究院”,“host_ordanization_lineage”:[“https://openalex.org/I1299303238“],”host_organization_lineage_names“:[”National Institutes of Health“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“publishedVersion”,“is_accepted”:true,“is_published”:true},{“is_oa”:false,“landing_page_url”:“https://pubmed.ncbi.nlm.nih.gov/28167910“,”pdf_url“:null,”source“:{”id“:”https://openalex.org/S4306525036“,”display_name“:”PubMed“,”issn_l“:null,”issn“:null,”is_oa“:false,”is_in_doaj“:false,”host_organization“:”https://openalex.org/I1299303238“,”“host_organization_name”:“美国国立卫生研究院”,“host_ordanization_lineage”:[“https://openalex.org/I1299303238“],”host_organization_lineage_names“:[”National Institutes of Health“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:null,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.3389/fnbot.2017.00001,“pdf_url”:https://www.frontiersin.org/articles/10.3389/fnbot.2017.00001/pdf,“源”:{“id”:https://openalex.org/S115606517“,”display_name“:”神经机器人前沿“,”issn_l“:”1662-5218“,”issn“:[”1662-5218“],”is_oa“:true,”is_in_doaj“:true,”host_organization“:”https://openalex.org/P4310320527“,”“host_organization_name”:“Frontiers Media”,“host_organization_lineage”:[“https://openalex.org/P4310320527“],”host_organization_lineage_names“:[”Frontiers Media“],“type”:“journal”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[],”grants“:{”funder“:”https://openalex.org/F4320334764“,”funder_display_name“:”日本科学促进会“,”award_id“:”16K12504“}],”datasets“:[],”versions“:[],”referenced_works_count“:22,”referrenced_works“:[”https://openalex.org/W1499669280","https://openalex.org/W1929309940","https://openalex.org/W1971492381","https://openalex.org/W2012392077","https://openalex.org/W2075323224","https://openalex.org/W2098524868","https://openalex.org/W2105934010","https://openalex.org/W2109169869","https://openalex.org/W2112036188","https://openalex.org/W2113501460","https://openalex.org/W2133224499","https://openalex.org/W2137104525","https://openalex.org/W2146737184","https://openalex.org/W2148053762","https://openalex.org/W2163302320","https://openalex.org/W2220533764","https://openalex.org/W2271318666","https://openalex.org/W3005581722","https://openalex.org/W3007384386","https://openalex.org/W4205513846","https://openalex.org/W4241811150","https://openalex.org/W4302570325“],”related_works“:[”https://openalex.org/W4385436674","https://openalex.org/W4319453497","https://openalex.org/W4312411443","https://openalex.org/W4304777330","https://openalex.org/W4294661698","https://openalex.org/W4286982322","https://openalex.org/W2946668189","https://openalex.org/W2758480492","https://openalex.org/W2498017833","https://openalex.org/W1485630101“],”ngrams_url“:”https://api.openalex.org/works/W2580338731/ngrams网站“,”“abstract_inverted_index”:{“EM-based”:[0,57],“policy”:[1,21],“search”:[2],“methods”:[3],“estimate”:[4],“a”:[5,27,73130163188],“lower”:[6,28],“bound”:%7,29],“of”:[8,15,26,3016114117129],”“the”:[9,13,20,24,51,62,78,94102109140156174177],“expected”:[10,31],“return”摘自:[12,93108],“历史”:[14],“剧集”:[16,68],“和“:[17,37,56,97104121124127159162180183],“迭代”:[18],“更新”:[19],“参数”:[22],“使用”:[23,72],“最大值”:[25],“返回”:[32],“其中”:[33],“生成”:[34],“梯度”:[35],“计算”:[36],“学习”:[38,46],“速率”:[39],“调整”:[40],“不必要”。“:[41],”上一个“:[42],”算法“:[43179],”like“:[44],”Policy“:[45,58],”by“:[47,77],”Weighting“:[48],”Exploration“:[49,60],”with“:[00143171],”Returns“:[52],”Fitness“:[53],”Expectation“:[54],”Maximization“,”Hyperparameter“:[59],”implemented“:[61139],”mechanisures“:[63],”to“:[64,89151],“丢弃”:[65,90],“无用”:[66],“低回报”:[67],““:[69],”隐式“:[70],”或“:[71],”固定“:[74],”基线“:[75,87142],”确定“:[76],”实验者。“:[79],”In“:[80],”this“:[81],”paper“:[82],”we“:+83],”propose“:[84],”an“:[85],”适应性“:[86141172],”method“:[88175],”better“:[91],”samples“:[92],”reward“:95],”history“:[96],”examine“:[98],”different“:99],”baselines“:[100],”including“:[101],”mean“:[103],“倍数”:[105],“SDs”:[107],“平均值”。“:[110],“The”:[111],“simulation”:[112],“results”:[113168],“benchmark”:[115],“tasks”:116],“sween”:[118],“swing”:[119],“up”:[1212158],“cart-pole”:[122],“balancing”:[123],“standing”:[125157],“barging”:[128160],“tweels”:[131147],“smartphonel”:[132148],“robot”:[133149],“show”:[134169],“improved”“:[135],”表演。“:[136],“我们”:[137],“进一步”:[138],“意思”:[144],“in”:[145155],“our”:[146],“硬件”:[150],“测试”:[152],“its”:[153],“性能”:[154],“任务”:[161],“基于视图”:[164],“接近”:[165],“task”。“:[166],“我们的”:[167],“那”:[170],“基线”,:[173],“跑赢大市”:[176],“前一个”:[178],“实现”:[181],“更快”:[182],“更多”:[184],“精确”:[185],“行为”:[186],“在”:[187],“更高”:[189],“成功”:[190],“速率”。“:[191]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2580338731“,”counts_by_year“:[{”year“:2020,”cited_by_count“:2},{”year“:2019,”cited_by_count”:1},“年份”:2018,”citecd_by_count“:1}],”updated_date“:”2024-06-03T01:51:23.858427“,”created_dates“:”2017-02-03“}