{“id”:“https://openalex.org/W4386081016“,”doi“:”https://doi.org/10.48550/arxiv.2308.10032“,”title“:”GameEval:评估对话游戏上的LLM“,”display_name“:”GameEval:Evaling LLM on Conversational Games“,”publication_year“:2023,”publiation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4386081016“,”doi“:”https://doi.org/10.48550/arxiv.2308.10032“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2308.10032“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”预印本“,”type_crossref“:”发布的内容“,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2308.10032“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5049349334“,”display_name“:”Dan Qiao“,”orcid“:”https://orcid.org/0000-0003-2375-1512“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”乔,丹“,”raw关联字符串“:[],“附属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5025407608“,”display_name“:”吴成东“,”兽人“:”https://orcid.org/0000-0003-2025-2646“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”吴,陈飞“,”raw关联字符串“:[],“隶属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5038539867“,”display_name“:”Yilong Liang“,”orcid“:”https://orcid.org/0000-0002-1914-6769“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”梁耀波“,”raw_affiation_strings“:[],”附属“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5028766349“,”display_name“:”李俊涛“,”兽人“:”https://orcid.org/0000-0002-3288-4395“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”李俊涛“,”raw _ afiliation_strings“:[],“隶属关系”:[]},{“author_position”:“last”,“author”:{“id”:“”https://openalex.org/A5042018181“,”display_name“:”南端“,”兽人“:”https://orcid.org/0000-0002-3387-4674“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”段,南“,”raw关联字符串“:[],“隶属关系”:[]}],“国家区分计数”:0,”机构区分计数“:0,“对应作者id”:[]、“对应机构id”:[]、“apc_list”:null,“apc_payed”:nul,“fwci”:null,“hasi”_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:77},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9989,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9989,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.9947,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T13629“,”display_name“:”自动文本简化和可读性评估“,”score“:0.9536,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-modeling“,”display_name“:”语言建模“,”score“:0.53202},{”id“:”https://openalex.org/keywords/topic-modeling网站“,”display_name“:”Topic Modeling“,”score“:0.517296}],”concepts“:[{”id“:”https://openalex.org/C37736160,“wikidata”:https://www.wikidata.org/wiki/Q1801315“,”display_name“:”对抗体系“,”level“:2,”score“:0.65360814},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.61972797},{”id“:”https://openalex.org/C520049643,“wikidata”:https://www.wikidata.org/wiki/Q189760“,”display_name“:”Voting“,”level“:3,”score“:0.5028965},{”id“:”https://openalex.org/C2781249084,“wikidata”:https://www.wikidata.org/wiki/Q908656“,”display_name“:”首选项“,”级别“:2,”分数“:0.50252986},{”id“:”https://openalex.org/C2776760102,“wikidata”:https://www.wikidata.org/wiki/Q5139900“,”“display_name”“:”代码(集合论)“,”级别“:3,”分数“:0.49542654},{”id“:”https://openalex.org/C2777267654,“wikidata”:https://www.wikidata.org/wiki/Q3519023网址“,”display_name“:”Test(biology)“,”level“:2,”score“:0.46746162},{”id“:”https://openalex.org/C2780665704,“wikidata”:https://www.wikidata.org/wiki/Q959298“,”display_name“:”干预(咨询)“,”level“:2,”score“:0.4159517},{”id“:”https://openalex.org/C539667460网址,“wikidata”:https://www.wikidata.org/wiki/Q2414942“,”display_name“:”Management science“,”level“:1,”score“:0.33474958},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.3155452},{”id“:”https://openalex.org/C15744967,“wikidata”:https://www.wikidata.org/wiki/Q9418“,”display_name“:”心理学“,”等级“:0,”分数“:0.24780053},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.21074587},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.100854665},{”id“:”https://openalex.org/C175444787,“wikidata”:https://www.wikidata.org/wiki/Q39072“,”display_name“:”微观经济学“,”level“:1,”score“:0.09139937},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.09092739},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.07556233},{”id“:”https://openalex.org/C151730666,“wikidata”:https://www.wikidata.org/wiki/Q7205“,”display_name“:”古生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C177264268,“wikidata”:https://www.wikidata.org/wiki/Q1514741“,”display_name“:”Set(abstract data type)“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C94625758,“wikidata”:https://www.wikidata.org/wiki/Q7163“,”display_name“:”政治“,”级别“:2,”分数“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C118552586,“wikidata”:https://www.wikidata.org/wiki/Q7867“,”display_name“:”精神病学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”Biology“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2308.10032“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2308.10032“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2308.10032(网址:https://arxiv.org/abs/2308.10032)“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/4“,”score“:0.63,”display_name“:”Quality education“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:0,”referrenced_works“:[],”related_work斯“:[”https://openalex.org/W4310988119","https://openalex.org/W4297672492","https://openalex.org/W4288019534","https://openalex.org/W4285226279","https://openalex.org/W4246396837","https://openalex.org/W3191453585","https://openalex.org/W3126451824","https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W1561927205“],”ngrams_url“:”https://api.openalex.org/works/W4386081016/ngrams网站“,”“abstract_inverted_index”:{“The”:[0],“rapid”:[1],“advancements”:[2],“in”:[3,11],“large”:[4],“language”:[5],“models”:[6],“(LLM)”:[7],“have”:[8],“presented”:[9],“challenges”:[10],“evaluation”:[12,47],“these”:[13],“models.”:[14,36],“Existing”:[15],],“方法”:[17],“是”:[18],“任一”:[19],“基于引用”:[20],“或”:[21,29,93],“偏好:[22],“基于”,:[23],“其中”:[24],“不可避免”:[25],“需要”:[26],“人类”:[27],“干预”:[28],“介绍”:[30],“测试”:[31],“偏见”:[32],“引起”:[33],“由”:[34,74,97],“评估者”:[35],“入”:[37],“此”:[38104],“论文”:[39],“我们”:[40113],“提议”:[41],“游戏评估”,:[42],“a”:[43126],“小说”:[44],“方法”:[45],“to”:[46101133],“LLM“:[48,61],“通过”:[49],“目标驱动”:[50],“对话”:[51],“游戏”:[52],“克服”:[53],“the”:[54120],“limitions”:[55],“of”:[56,77122129],“previous”:[57],“methods”。“:[58],”GameEval“:[59116],”treates“:[60],”as“:[62],”game“:[63],”players“:/64],”and“:[65,84],”assigners“:[66],”them“:[67],”distinct“:[68],”roles“:[69],”with“:[70,91],”specific“:[71],”goals“:[72],”reached“:[73],”launching“:[75],”conversation“:[76],”variable“:[78123],“表格”:[79],“包括”:[80],“讨论”:[81],“问题”:[82],“回答”:[83],“投票。“:[85],”我们“:[86],”设计“:[87],”三“:[88],”独特“:[89],”游戏“:[90],”合作“:[92],”对抗“:[94],”目标“:[95],”伴随“:[96],”对应“:[98],”度量“:[100],”展示“:[102114],”如何“:[103],”新“:[105],”范式“:[106],”综合“:[107],”评估“:[108],”模型“:[109],“性能。通过“:[110],”广泛“:[111],”实验“:[112],”那“:[115],”可以“:[117],”有效“:[118],”区分“:[119],”能力“:[121],”LLM,“:[124],”提供“:[125],”综合“:[127],”评估“:[128],”他们的“:[130],”集成“:[131],”技能“:[132],”解决“:[134],”复杂“:[135],”问题。“:[136],”我们的“:[137],”公共“:[138],”匿名“:[139],”代码“:[140],”是“:[141],”可用“:[142],”在“:[143],”https://github.com/GameEval/GameEval。“:[144]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4386081016“,”counts_by_year“:[],”updated_date“:”2024-06-26T01:44:45.310771“,”created_date:“2023-08-23”}“