{“id”:“https://openalex.org/W4389911544“,”doi“:”https://doi.org/10.48550/arxiv.2312.09390“,”title“:”弱到强概括:在弱监督下激发强大能力“,”display_name“:”弱到强概括:在弱监督下激发强大能力“,”publication_year“:2023,”publication_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4389911544“,”doi“:”https://doi.org/10.48550/arxiv.2312.09390“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2312.09390“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2312.09390“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5022381014“,”display_name“:”Collin Burns“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Burns,Collin“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5069234607“,”display_name“:”Pavel Izmailov“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”Izmaillov,Pavel“,”raw _affiliation_strings“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5018518179“,”display_name“:”Jan H.Kirchner“,”orcid“:”https://orcid.org/0000-0002-9126-0558“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”Kirchner,Jan Hendrik“,”raw_affiation_strings“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5048522044“,”display_name“:”Bowen Baker“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Baker,Bowen“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5057062066“,”display_name“:”Leo Gao“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Gao,Leo“,“raw_affiliation_strings”:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5093524861“,”display_name“:”Leopold Aschenbrenner“,”orcid“:null}“,”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Aschenblenner,Leopld“,”raw _affiliation_string“:[]},{“author_position”:“middle”,”author“:{”id“:”https://openalex.org/A5066483084“,”display_name“:”陈一宁“,”兽人“:”https://orcid.org/0000-0002-9501-5293“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”陈,伊宁“,”raw关联字符串“:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5033112877“,”display_name“:”Adrien Ecoffet“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Ecoffet,Adrien“,”raw _affiliation_strings“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5050060224“,”display_name“:”Manas Joglekar“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Joglekar-Manas“,”raw _affiliation_strings“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5090592321“,”display_name“:”Jan Leike“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Leike,Jan“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5006446297“,”display_name“:”Ilya Sutskever“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Sutskeve,Ilya“,”raw _affiliation_string“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5007570707“,”display_name“:”Jeff Wu“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Wu,Jeff“,”raw _affiliation_string“:[]}],“countries_distict_count”:0,“institutions_disticenc_count”:零,“corresponding_author_ids”:[]has_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:78},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9986,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9986,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.9841,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12026“,”display_name“:”可解释人工智能“,”score“:0.9659,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-modeling“,”display_name“:”语言建模“,”score“:0.537325},{”id“:”https://openalex.org/keywords/preained-models“,”display_name“:”预训练模型“,”score“:0.523753},{”id“:”https://openalex.org/keywords/cinterpretable-models“,”display_name“:”可解释模型“,”score“:0.515783},{”id“:”https://openalex.org/keywords/model-in-enterprisetability网站“,”display_name“:”模型可解释性“,”score“:0.509447},{”id“:”https://openalex.org/keywords/machine-learning可解释性“,”display_name“:”机器学习可解释性“,”score“:0.505508}],”concepts“:[{”id“:”https://openalex.org/C177148314,“wikidata”:https://www.wikidata.org/wiki/Q170084“,”display_name“:”泛化“,”level“:2,”score“:0.83687747},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.69842565},{”id“:”https://openalex.org/C2779110517,“wikidata”:https://www.wikidata.org/wiki/Q1240788“,”display_name“:”Supervisor“,”level“:2,”score“:0.65811694},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5592355},{”id“:”https://openalex.org/C97541855,“wikidata”:https://www.wikidata.org/wiki/Q830687“,”display_name“:”强化学习“,”level“:2,”score“:0.551836},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.4716063},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.43325493},{”id“:”https://openalex.org/C2780586882,“wikidata”:https://www.wikidata.org/wiki/Q7520643(网址:https://www.wikidata.org/wiki/Q7520643)“,”display_name“:”Simple(哲学)“,”level“:2,”score“:0.42763925},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.10663068},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C111472728,“wikidata”:https://www.wikidata.org/wiki/Q9471“,”display_name“:”认识论“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2312.09390“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2312.09390“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2312.09390“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4387731985","https://openalex.org/W4379086698","https://openalex.org/W4377009725","https://openalex.org/W4320164562","https://openalex.org/W2941808082","https://openalex.org/W2755149878","https://openalex.org/W2528721242网址","https://openalex.org/W2468425257","https://openalex.org/W2372069567","https://openalex.org/W2356364326“],”ngrams_url“:”https://api.openalex.org/works/W4389911544/ngrams“,”abstract_inverted_index“:{”广泛“:[0],”使用“:[1],”对齐“:[2],”技术“:[3],”例如“:[4],”作为“:[5],”强化“:[6],”学习“:[7],”来自“:[8143],”人类“:[9],”反馈“:[10],”(RLHF),“:[11],”依赖“:[12],”依赖“:[13,97117201216],”the“:[14,7,5,94145],”能力“:[15],”of“:[16,78,89148220],”人类“:[17,49,53],”to“:[18,25,58,67163198211],“supervise”:[19,60],“model”:[20,29,72],“behavior”:[21],“-”:[22],“for”:[23,48180],“example”,“:[24181],“evaluate”:[26],“ift”:[27],“a”:[28,79,87121132186217],,“fally”:[30],“following”:[31],“instructions”:[32],“or”:[33],“generated”:[34119],“safe”:[35],“outputs”:[36],“然而”:[37138],“未来”:[38],“超人”:[39,6116422],“模型”:[40,92116150165],“将”:[41,54],“行为”:[42],“in”:[43,93],“复杂”:[44],“方式”:[45],“太”:[46],“困难”:[47],“可靠”:[51],“评估”:[52],“仅”:[55],“是”:[56],“能”:[57],“弱”:[59],“模型。”:[62223],“我们”:[63,83107169],“研究”:[64],“an”:[65190],“analogy”:[66],“this”:[68,85],“problem:”:[69],“can”:[70174195],“weak”:[71122130],“监管”:[73],“引出”:[74],“完整”:[76146],“能力”:[77147],“很多”:[80],“更强”:[81],“模型?”:[82],“测试”:[84],“使用”:[86],“范围”:[88],“预处理”:[90115],“语言”:[91,99],“GPT-4”:[95184],“家族”:[96],“自然”:[98],“处理”:[100],“(NLP),”:[101],“象棋”,:[102],“和”:[103189],“奖励”:[104],“建模”:[105],“任务”:[106203],“发现”:[108170],“那”:[109156171207],“当”:[110182],“我们”:[1111134139194],“天真”:[112],“微调”:[113],“强”:[111449],“标签”:[118],“by”:[120],“模型”:[123],“他们”:[124],“始终如一”:[125],“表现”:[126],“更好”:[127],“比”:[128],“其”:[129],“主管,“:[131],”现象“:[133],”调用“:[135],”弱到强“:[136178],“泛化”:[137],“are”:[140],“still”:[141],“far”:[142],“recovering”:[144],“with”:151185],“naive”:%152],“finetooning”:[153183],“alone”:[154],“suggesting”:[155],“techniques”:[157],“like”:[158],“RLHF”:[P59],“may”:[160],“scale”:[161],“lookly”:[162],“without”:[266],“进一步”:[167],“工作”:[168],“简单”:[172],“方法”:[173],“经常”:[175],“显著”:[176],“改善”:[177],“概括:”:[179],“GPT-2级”:[187],“主管”:[188],“辅助”:[191],“信心”:[192],“损失”:[193],“恢复”:[196],“关闭”:[197],“GPT-3.5级”:%199],“性能”:[200],“NLP”:[202],“我们的”:[204],“结果”:[205],“建议”:[206],it“:[208],”is“:[209],”可行“:[210],”make“:[212],”经验主义“:[213],“进度”:[214],“今天”:[215],“基础”:[218],“挑战”:[219],“对齐”:[221]},“引用_by_api_url”:“https://api.openalex.org/works?filter=cites:W4389911544“,”counts_by_year“:[],”updated_date“:”2024-05-25T13:34:17.301712“,”created_date:“2023-12-19”}“