{“id”:“https://openalex.org/W2903357770“,”doi“:”https://doi.org/10.18653/v1/w18-6310“,”title“:”使用权重范数初始化和正则化改进神经语言模型“,”display_name“:”用权重范数初始和正则化改善神经语言模型”,“publication_year”:2018,“publiation_date”:“2018-01-01”,“ids”:{“openalex”:“https://openalex.org/W2903357770“,”doi“:”https://doi.org/10.18653/v1/w18-6310“,”mag“:”2903357770“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6310,“pdf_url”:https://www.aclweb.org/antology/W18-6310.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://www.aclweb.org/antology/W18-6310.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5010730319“,”display_name“:”Christian Herold“,”orcid“:”https://orcid.org/0000-0001-7097-2057},“机构”:[{“id”:https://openalex.org/I887968799“,”display_name“:”亚琛理工大学“,”ror“:”https://ror.org/04xfq0f34“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I887968799“]}],”国家“:[”DE“],”is_corresponding“:false,”raw_author_name“:”Christian Herold“,”raw _ afiliation_strings“:[“人类语言技术和模式识别集团计算机科学系RWTH Aachen University D-52056,Germany Aachen”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5046577673“,”display_name“:”Yingbo Gao“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I887968799“,”display_name“:”亚琛理工大学“,”ror“:”https://ror.org/04xfq0f34“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I887968799“]}],”国家“:[”DE“],”is_corresponding“:false,”raw_author_name“:”Yingbo Gao“,”raw _affiliation_strings“:[“人类语言技术与模式识别集团计算机科学系RWTH Aachen University D-52056,Germany Aachen”]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5087367411“,”display_name“:”Hermann Ney“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I887968799“,”display_name“:”亚琛理工大学“,”ror“:”https://ror.org/04xfq0f34“,”country_code“:”DE“,”type“:“教育”,”世系“:[”https://openalex.org/I887968799“]}],”国家“:[”DE“],”is_corresponding“:false,”raw_author_name“:”Hermann Ney“,”raw _affiliation_strings“:[“人类语言技术和模式识别集团计算机科学部RWTH Aachen University D-52056 Aachen,Germany”]}]“countries_distict_count”:1,“institutions_distic _count”:2,“corresponding_author_ids”:[],“corresponding_institution_ids“:[],”apc_list“:null,”apc _ paid“:null,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count“:3,”citecd_by_percentile_year“:{”min“:78,”max“:80},”biblio“:{volume”:null、“issue”:null、“first_page”:nully、“last_page”:null}、“is_retracted”:false、“is_paratext”:false、“primary_topic”:{“id”:“https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译和自然语言处理“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9903,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-modeling“,”display_name“:”语言建模“,”score“:0.608187},{”id“:”https://openalex.org/keywords/neural机器翻译“,”display_name“:”神经机器翻译“,”score“:0.585879},{”id“:”https://openalex.org/keywords/统计语言建模“,”display_name“:”统计语言建模“,”score“:0.567735},{”id“:”https://openalex.org/keywords/topic-modeling网站“,”display_name“:”主题建模“,”score“:0.566984},{”id“:”https://openalex.org/keywords/多语言-神经-机器翻译“,”display_name“:”多语言神经机器翻译“,”score“:0.531759}],”concepts“:[{”id“:”https://openalex.org/C206134035,“wikidata”:https://www.wikidata.org/wiki/Q811525“,”display_name“:”Treebank“,”level“:3,”score“:0.8965664},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.70459324},{”id“:”https://openalex.org/C114466953,“wikidata”:https://www.wikidata.org/wiki/Q6034165“,”display_name“:”初始化“,”级别“:2,”分数“:0.69564503},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.6398723},{”id“:”https://openalex.org/C2776135515,“wikidata”:https://www.wikidata.org/wiki/Q17143721“,”display_name“:”正则化(语言学)“,”level“:2,”score“:0.5515216},{”id“:”https://openalex.org/C8642999,“wikidata”:https://www.wikidata.org/wiki/Q4171168“,”display_name“:”Hyperparameter“,”level“:2,”score“:0.51971245},{”id“:”https://openalex.org/C50644808,“wikidata”:https://www.wikidata.org/wiki/Q192776“,”display_name“:”人工神经网络“,”level“:2,”score“:0.49798918},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.48801437},{”id“:”https://openalex.org/C90805587,“wikidata”:https://www.wikidata.org/wiki/Q10944557“,”display_name“:”Word(群论)“,”level“:2,”score“:0.47132543},{”id“:”https://openalex.org/C191795146,“wikidata”:https://www.wikidata.org/wiki/Q3878446“,”display_name“:”Norm(哲学)“,”level“:2,”score“:0.4618982},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.41655397},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.39188176},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.37126797},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.21739283},{”id“:”https://openalex.org/C2524010,“wikidata”:https://www.wikidata.org/wiki/Q8087“,”display_name“:”Geometry“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C19768560,“wikidata”:https://www.wikidata.org/wiki/Q320727“,”display_name“:”依赖(UML)“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6310,“pdf_url”:https://www.aclweb.org/antology/W18-6310.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true}],”best_oa_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6310,“pdf_url”:https://www.aclweb.org/antology/W18-6310.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by(https://openalex.org/licenses/cc-by)“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/4“,”score“:0.85,”display_name“:”Quality education“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:27,”referrenced_works“:[”https://openalex.org/W1591801644“,”https://openalex.org/W179875071“,”https://openalex.org/W1934041388“,”https://openalex.org/W1938755728“,”https://openalex.org/W1970689298“,”https://openalex.org/W1999965501“,”https://openalex.org/W2064675550“,”https://openalex.org/W2086161653“,”https://openalex.org/W2132339004“,”https://openalex.org/W2134237567“,”https://openalex.org/W2144513243“,”https://openalex.org/W2265902746“,”https://openalex.org/W2408727897网址“,”https://openalex.org/W2525332836“,”https://openalex.org/W2571859396“,”https://openalex.org/W2742448943“,”https://openalex.org/W2743945814“,”https://openalex.org/W2962964385“,”https://openalex.org/W2963266340“,”https://openalex.org/W2963347649“,”https://openalex.org/W2963374479“,”https://openalex.org/W2963403868“,”https://openalex.org/W2963537482“,”https://openalex.org/W2963685250“,”https://openalex.org/W2963748792“,”https://openalex.org/W2963938518“,”https://openalex.org/W2963983719“],”related_works“:[”https://openalex.org/W589103562“,”https://openalex.org/W3142119062“,”https://openalex.org/W2964047924“,”https://openalex.org/W2962832505“,”https://openalex.org/W2743945814“,”https://openalex.org/W2740662036“,”https://openalex.org/W2251234095“,”https://openalex.org/W1991220724“,”https://openalex.org/W159209093“,”https://openalex.org/W131522978“],”ngrams_url“:”https://api.openalex.org/works/W2903357770/ngrams网站“,”“abstract_inverted_index”:{“嵌入”:[0],“和”:[1,32116],“投影”:[2],“矩阵”:[3,27],“是”:[4,42,84,93],“常用”:[5],“使用”:[6],“in”:[7,15,28,69],“神经”:[8],“语言”:[9,3012],“模型”:[10,31],“(NLM)”:[11],“as”:[12,14],“well”:[13],“其他“:[16,62],”序列“:[17],”处理“:[18],”网络“:[19],”那“:[20,34,49],”操作“:[21],”关于“:[22,99112121],“大型”:[23],“词汇表”。我们”:[24],“检查”:[25],“这样”:[26],“微调”:[29],“观察”:[33],“a”:[35,76,87],“NLM”:[36],“学习”:[37],“单词”:[38,46,58],“向量”:[39],“其”:[40,82],“范数”:[41,54],“相关”:[43],“to”:[44,9510110119],“:[45,52],”频率。We“:[47],“show”:[48],“by”:[50],“initializing”:[51],“weight”:[53,77],“with”:[55,61],“scaled”:[56],“log”:[P7],“counts”:[59],“together”:60],“technologies”:[63],“lower”:【64】,“fuzzities”:[65,98],“can”:[66],“be”:[67],“get”:[68],“early”:[70],“epochs”:[71],“of”:[72],“training”(训练)。我们“:[73],”也“:[74],”引入“:[75],”规范“:[78],”正则化“:[79],”损失“:[80],”术语“:[81],”超参数“:[83],”调谐“:[85],”via“:[86],”网格“:[88],”搜索。使用“:[89],”this“:[90],”method“,”we“:[92],”able“:[94],”significally“:[96],”improve“:[97],”two“:[100],”wordlevel“:[101],”modeling“:[103],”tasks“:[104],”(without“:[105],”dynamic“:[106],”evaluation):“:[107],”from“:[108117],”54.44“:[109],”53.16“:[111],”Penn“:[113],“树库”:[114],“(PTB)”:[115],“61.45”:[118],“60.13”:[120],“WikiText-2”:[122],“(工作任务2)。“:[123]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2903357770“,”counts_by_year“:[{”年份“:2020,”cited_by_count“:2},{”年“:2019,”cited_by_count”:1}],”更新日期“:”2024-06-05T18:25:36.123926“,”created_date“:”2018-12-11“}”