{“id”:“https://openalex.org/W2963281280“,”doi“:”https://doi.org/10.18653/v1/w18-6478“,”title“:”带噪并行语料库的双条件交叉熵过滤“,”display_name“:”含噪并行语料的双条件交互熵过滤“;”publication_year“:2018,”publication_date“:”2018-01-01“,”ids“:{”openalex“:”https://openalex.org/W2963281280“,”doi“:”https://doi.org/10.18653/v1/w18-6478“,”mag“:”2963281280“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6478,“pdf_url”:https://www.aclweb.org/antology/W18-6478.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://www.aclweb.org/antology/W18-6478.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5065193578“,”display_name“:”Marcin Junczys-Dowmunt“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I1290206253“,”display_name“:”Microsoft(美国)“,”ror“:”https://ror.org/00d0nc645“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1290206253“]}],”国家“:[”美国“],”is_corresponding“:true,”raw_author_name“:”Marcin Junczys-Dowmunt“,”raw _ afiliation_strings“:[“Microsoft 1 Microsoft Way Redmond,WA 98121,USA”]}],”countries _ distinct_count“:1,”institutions _ disting_count”:1,“corresponding_author_ids”:[”https://openalex.org/A5065193578“],”对应的机构ID“:[”https://openalex.org/I1290206253“],”apc_list“:null,”apc _ paid“:nul,”has_fulltext“:false,”cited_by_count“:91,”ciped_by_percentile_year“:{”min“:98,”max“:99},”biblio“:{volume“:null,”issue“:null,”first_page“:null}https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9988,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/statistical-machine-translation网站“,”display_name“:”统计机器翻译“,”score“:0.498911}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.76137966},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5948669},{”id“:”https://openalex.org/C203005215,“wikidata”:https://www.wikidata.org/wiki/Q79798“,”display_name“:”机器翻译“,”level“:2,”score“:0.517142},{”id“:”https://openalex.org/C106301342,“wikidata”:https://www.wikidata.org/wiki/Q4117933“,”display_name“:”熵(时间箭头)“,”level“:2,”score“:0.4960092},{”id“:”https://openalex.org/C167981619,“wikidata”:https://www.wikidata.org/wiki/Q1685498“,”display_name“:”交叉熵“,”level“:3,”score“:0.47429612},{”id“:”https://openalex.org/C189430467,“wikidata”:https://www.wikidata.org/wiki/Q7293293“,”display_name“:”排名(信息检索)“,”级别“:2,”分数“:0.47232527},{”id“:”https://openalex.org/C191178318,“wikidata”:https://www.wikidata.org/wiki/Q2256906“,”display_name“:”阈值“,”level“:3,”score“:0.46968347},{”id“:”https://openalex.org/C101721835,“wikidata”:https://www.wikidata.org/wiki/Q813908“,”display_name“:”条件熵“,”level“:3,”score“:0.44948184},{”id“:”https://openalex.org/C2777530160,“wikidata”:https://www.wikidata.org/wiki/Q41796“,”display_name“:”句子“,”级别“:2,”分数“:0.42963174},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.40894234},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.37271726},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.36946303},{”id“:”https://openalex.org/C9679016,“wikidata”:https://www.wikidata.org/wiki/Q1417473“,”display_name“:”最大熵原理“,”level“:2,”score“:0.27898002},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”Physics“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C115961682,“wikidata”:https://www.wikidata.org/wiki/Q860623“,”display_name“:”图像(数学)“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:2,”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6478,“pdf_url”:https://www.aclweb.org/antology/W18-6478.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/1809.00197,“pdf_url”:https://arxiv.org/pdf/1809.00197,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://doi.org/10.18653/v1/w18-6478,“pdf_url”:https://www.aclweb.org/antology/W18-6478.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[],”grants“:[],”datasets“:〔],”versions“:[〕,”referenced_works_count“:11,”reforenced_works“:[”https://openalex.org/W1905522558","https://openalex.org/W2117278770","https://openalex.org/W2124807415","https://openalex.org/W2546938941","https://openalex.org/W2794365787","https://openalex.org/W2798389157","https://openalex.org/W2902918014","https://openalex.org/W2963266340","https://openalex.org/W2963403868","https://openalex.org/W2963661177","https://openalex.org/W2963919854“],”related_works“:[”https://openalex.org/W4312766348","https://openalex.org/W4297899318","https://openalex.org/W2953058328","https://openalex.org/W2750730210","https://openalex.org/W2371188576","https://openalex.org/W2236974868","https://openalex.org/W2116854923","https://openalex.org/W1661087619","https://openalex.org/W1542224353","https://openalex.org/W1509573209“],”ngrams_url“:”https://api.openalex.org/works/W2963281280/ngrams网站“,”“abstract_inverted_index”:{“In”:[0],“this”:[1],“work”:[2],“we”:[3,21],“introduce”:[4],“dual”:[5],“conditional”:[6],“交叉熵”:[7,23],“filtering”:[8,99],“for”:[9],“noise”:[10,18],“parallel”:[11,9,60,70,97],“data.for”:[12],“each”:[13],“sentence”:[14],”pair“:[15],”of“:[16,46,59,91107116],”the“:[17,40,43,89,92102108],”语料库“:[20,98],”计算“:[22],”分数“:[24,54,65106],”根据“:[25,51],”到“:[26,52],”两个“:[27],”逆“:[28],”翻译“:[29],”模型“:[30,67,78],”训练“:[31,68,79],”打开“:[32,69,80,96],”干净“:[33,81],”数据。We“:[34,61,83],“惩罚”:[35],“发散”:[36],“交叉熵”:[37],“和”:[38100],“权重”:[39],“处罚”:[41],“by”:[42],“交互熵”:44],“平均”:[45],“两者”:[47],“模型”。排序:[48],“或”:[49],“阈值”:[50],“这些”:[53],“结果”:[55],“in”:[56,88113],“better”:[57],“子集”:[58],“实现”:[62101],“更高”:[63],“BLEU”:[64],“有”:[66,77],“数据”:[71],“过滤”:[72],“仅”:[73],“来自”:[74],“Paracroble”:[75],“than”:[76],“WMT”:[82],“进一步”:[84],“评估”:[85],“我们的”:[86],“方法”:[87],“上下文”:[90],“WMT2018“:[93],”共享“:[94109],”任务“:[95],”总体“:[103],”最高“:[104],”排名“:[105],”工作“:[110],”得分“:[111],”顶级“:[112],”三“:[114],”淘汰“:[115],”四“:[117],”子任务。“:[118]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2963281280“,”counts_by_year“:[{“年”:2023,”cited_by_count“:5},{“年份”:2022,”ciped_by_cunt“:11},”{“年度”:2021,“cited_by_count”:16},“年份”:2020,”cited_by_count:41},,{”year“2019,”citted_by_count“:16}“,”创建日期“:”2019-07-30“}