{“id”:“https://openalex.org/W4388584595“,”doi“:”https://doi.org/10.48550/arxiv.2311.04919“,”title“:“偏好协议在人类反馈强化学习中的影响:总结中的案例研究”,”display_name“:”偏好协议在人的反馈强化学习的影响:摘要中的案例分析“,”publication_year“:2023,”publitation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4388584595“,”doi“:”https://doi.org/10.48550/arxiv.2311.04919“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2311.04919“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2311.04919“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5079229866“,”display_name“:”Sian Gooding“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Gooding,Sian“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5089795752“,”display_name“:”Hassan Mansoor“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Mansoor,Hassan“,”raw _affiliation_strings“:],”affiliations“:【】}】,“countries_distiction_count”:0,“institutions_distition_count“:0,”corresponding_author_ids“:【],”coresponding_institution_ids list“:null,”apc_payed“:null,”fwci“:null,”has_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”max“:77},”biblio“:{”volume“:null,”issue“:nul,”first_page“:null,”last_page“:null},“is_retracted”:false、“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T13083“,”“display_name”:“从文本数据中自动提取关键字”,“score”:0.9986,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T13083“,”“display_name”:“从文本数据中自动提取关键字”,“score”:0.9986,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9954,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.9917,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/neural-machine-translation网站“,”display_name“:”神经机器翻译“,”score“:0.486409}],”concepts“:[{”id“:”https://openalex.org/C170858558,“wikidata”:https://www.wikidata.org/wiki/Q1394144“,”display_name“:”自动摘要“,”level“:2,”score“:0.968399},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.7201582},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.65328443},{”id“:”https://openalex.org/C2781249084,“wikidata”:https://www.wikidata.org/wiki/Q908656“,”display_name“:”首选项“,”级别“:2,”分数“:0.6378623},{”id“:”https://openalex.org/C2779530757,“wikidata”:https://www.wikidata.org/wiki/Q1207505“,”display_name“:”质量(理念)“,”级别“:2,”分数“:0.6040153},{”id“:”https://openalex.org/C2776818064,“wikidata”:https://www.wikidata.org/wiki/Q829903“,”display_name“:”协议“,”级别“:2,”分数“:0.5558167},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.54439765},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.51078105},{”id“:”https://openalex.org/C67203356,“wikidata”:https://www.wikidata.org/wiki/Q1321905“,”display_name“:”钢筋“,”level“:2,”score“:0.4980452},{”id“:”https://openalex.org/C204323151,“wikidata”:https://www.wikidata.org/wiki/Q905424“,”“display_name”“:”范围(航空)“,”级别“:2,”分数“:0.48480955},{”id“:”https://openalex.org/C140779682,“wikidata”:https://www.wikidata.org/wiki/Q210868“,”display_name“:”采样(信号处理)“,”level“:3,”score“:0.46305013},{”id“:”https://openalex.org/C98045186,“wikidata”:https://www.wikidata.org/wiki/Q205663“,”display_name“:”Process(computing)“,”level“:2,”score“:0.42637223},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.40519956},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.21248072},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.16410884},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.13030076},{”id“:”https://openalex.org/C77805123,“wikidata”:https://www.wikidata.org/wiki/Q161272“,”display_name“:”社会心理学“,”level“:1,”score“:0.1145404},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.10821095},{”id“:”https://openalex.org/C41895202,“wikidata”:https://www.wikidata.org/wiki/Q8162“,”display_name“:”语言学“,”level“:1,”score“:0.06241402},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”Philosophy“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C201995342,“wikidata”:https://www.wikidata.org/wiki/Q682496“,”display_name“:”系统工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C111472728,“wikidata”:https://www.wikidata.org/wiki/Q9471“,”display_name“:”认识论“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C106131492,“wikidata”:https://www.wikidata.org/wiki/Q3072260“,”display_name“:”筛选器(信号处理)“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C31972630,“wikidata”:https://www.wikidata.org/wiki/Q844240“,”display_name“:”计算机视觉“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C146978453,“wikidata”:https://www.wikidata.org/wiki/Q3798668“,”display_name“:”航空航天工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C111919701,“wikidata”:https://www.wikidata.org/wiki/Q9135“,”display_name“:”操作系统“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2311.04919“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2311.04919“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2311.04919“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4389760904","https://openalex.org/W4323520239","https://openalex.org/W4306886878","https://openalex.org/W424223894","https://openalex.org/W3148229873","https://openalex.org/W2366403280","https://openalex.org/W2150160875","https://openalex.org/W2091301346","https://openalex.org/W1517524280","https://openalex.org/W1495108544“],”ngrams_url“:”https://api.openalex.org/works/W4388584595/ngrams网站“,”abstract_inverted_index“:{”强化“:[0],”学习“:[1],”来自“:[2],”人类“:[3],”反馈“:[4],”(RLHF)“:[5],”可以“:[6],”是“:[7],”使用“:[8],”to“:[9,58],”捕获“:[10],”复杂“:[11],”和“:[12,72],”细微差别“:[13],”属性“:[14],“of”:[15,24,48,6]2,77,96106114],“文本”:[16,25],“生成”:[17,86],“质量”:[18],“作为”:[19],“a”:[20,31,60,89,94],“结果”:[21],“the”:[22,46,75104112],“task”:[23],“summary”:[26],“has”:[27],“been”:[28],“identified”:[29],“as”:[309111],“good”:[32],“candidate”:[33],“for”:[34,51003],“this”:[35,38],“process”:[36],“In”:[37],“paper”:[39],“we”:[40],“explore”:[41],“如何”:[42],“偏好”:[43,97],“协议”:[44,64],“影响”:[45],“疗效”:[47],“RLHF”:[49],“摘要。”:[51],“我们”:[52,80],“显示”:[53,82],“那个”:[54],“采样”:[55],“人类”:[56],“偏好”:[57],“包括”:[59],“范围”:[61,95],“注释器”:[63],“结果”:[65],“在”:[66,81418],“(1)”:[67],“更高”:[68],“准确性”:[69],“奖励”:[70,90],“模型”:[71],“(2)”:[73],“改变”:[74],“特性”:[76],“质量”:[7816],“捕获”:[79],“另外”:[81],“改进”:[83],“下游”:[85],“何时”:[87],“使用”:[88],“模型”:[91],“训练”:[92],“与”:[93],“协议。”:[98],“我们的”:[99],“贡献”:[100],“有”:[101],“含义”:[102],“设计”:[105],“合成”:[107],“数据集”:[108],“井”:[110],“重要性”:[113]],“考虑”:[115],“差异”:[117],“基于比较”:[119],“数据”:[120]},“引用_by_api_url”:“https://api.openalex.org/works?filter=cites:W4388584595“,”counts_by_year“:[],”updated_date“:”2024-06-23T01:32:05.230996“,”created_date:“2023-11-11”}“