{“id”:“https://openalex.org/W2902831278“,”doi“:”https://doi.org/10.18653/v1/w18-6473“,”title“:“STACC,OOV Density and N-gram Saturation:Vicomtech\u2019s Participation in the WMT 2018 Shared Task on Parallel Corpus Filtering”,“display_name”:“STACC,OOV Depensity and N-gram Saturation:Vicomtech \u2019%Particiption in WMT 2018共享Task on Parallel Corpus Filtering“,publication_year”:2018,“publication_date”:“2018-01-01”,“ids“:{”openalex“:”https://openalex.org/W2902831278“,”doi“:”https://doi.org/10.18653/v1/w18-6473“,”mag“:”2902831278“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6473,“pdf_url”:https://www.aclweb.org/antology/W18-6473.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://www.aclweb.org/antology/W18-6473.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5085424842“,”display_name“:”Andoni Azpeitia“,”orcid“:null},”institutions“:[],”countries“:[”ES“],”is_corresponding“:false,”raw_author_name“:”Andoni-Azpeitia”,“raw_affiliation_strings”:[”Donostia/San Sebasti\u00e1n,Gipuzkoa,Spain“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5087412588“,”display_name“:”Thierry Etchegoyhen“,”orcid“:”https://orcid.org/0000-0001-7253-1693“},”机构“:[],”国家“:[”ES“],”is_corresponding“:false,”raw_author_name“:”Thierry Etchegoyhen“,”raw_affiation_strings“:[”Donostia/San Sebasti\u00e1n,Gipuzkoa,Spain“]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5055241434“,”display_name“:”Eva Mart\u00ednez Garc\u00eda“,”orcid“:”https://orcid.org/0000-0002-3693-1734“},”机构“:[],”国家“:[”ES“],”is_corresponding“:false,”raw_author_name“:”Eva Mart\u00ednez Garcia“,”raw _affiliation_strings“:[“Donostia/San Sebasti\u00e1n,Gipuzkoa,Spain”]}],”countries_distict_count“:1,”机构_distiction_count“:0,”corresponding_author_ids“:[],c_list“:null,”apc_payed“:null,”has_fulltext“:true,”fulltext_origin“:”pdf“,”cited_by_count“:2,”cited_by_percentile_year“:{”min“:74,”max“:78},”biblio“:{“volume”:null,”issue“:null”,“first_page”:null,“last_page”:null},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9978,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/统计语言建模“,”display_name“:”统计语言建模“,”score“:0.518359},{”id“:”https://openalex.org/keywords/semantic-similarity网站“,”display_name“:”语义相似度“,”score“:0.513543},{”id“:”https://openalex.org/keywords/statistical-machine-translation网站“,”display_name“:”统计机器翻译“,”score“:0.507817},{”id“:”https://openalex.org/keywords/part-of-speech-tagging“,”display_name“:”词性标记“,”score“:0.501345}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.8344347},{”id“:”https://openalex.org/C2777530160,“wikidata”:https://www.wikidata.org/wiki/Q41796“,”display_name“:”句子“,”级别“:2,”分数“:0.7922102},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.6926302},{”id“:”https://openalex.org/C117884012,“wikidata”:https://www.wikidata.org/wiki/Q94489“,”display_name“:”n-gram“,”level“:3,”score“:0.61780024},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.6127356},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.58263624},{”id“:”https://openalex.org/C189430467,“wikidata”:https://www.wikidata.org/wiki/Q7293293“,”display_name“:”排名(信息检索)“,”级别“:2,”分数“:0.5706566},{”id“:”https://openalex.org/C2780586882,“wikidata”:https://www.wikidata.org/wiki/Q7520643(网址:https://www.wikidata.org/wiki/Q7520643)“,”display_name“:”Simple(哲学)“,”level“:2,”score“:0.5100099},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.43583283},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.33489293},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C187736073,“wikidata”:https://www.wikidata.org/wiki/Q2920921“,”display_name“:”管理“,”级别“:1,”分数“:0.0},{”id“:”https://openalex.org/C111472728,“wikidata”:https://www.wikidata.org/wiki/Q9471“,”display_name“:”认识论“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”Economics“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6473,“pdf_url”:https://www.aclweb.org/antology/W18-6473.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true}],”best_oa_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6473,“pdf_url”:https://www.aclweb.org/antology/W18-6473.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的机构“,”score“:0.41}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:17,”referrenced_works“:]”https://openalex.org/W1560797130","https://openalex.org/W1586104099","https://openalex.org/W2097333193","https://openalex.org/W2107695330","https://openalex.org/W2123318312","https://openalex.org/W2129734311","https://openalex.org/W2135873687","https://openalex.org/W2148708890","https://openalex.org/W2155512447","https://openalex.org/W2186890008","https://openalex.org/W2591659448","https://openalex.org/W2741788241","https://openalex.org/W2773493195","https://openalex.org/W2807130468","https://openalex.org/W2963919854","https://openalex.org/W2964308564","https://openalex.org/W3201817155“],”related_works“:[”https://openalex.org/W4307474317","https://openalex.org/W2787311093","https://openalex.org/W2624072012","https://openalex.org/W2532616038","https://openalex.org/W2250909759","https://openalex.org/W2147879411","https://openalex.org/W2132221452","https://openalex.org/W2081295016","https://openalex.org/W2057384730","https://openalex.org/W2008468404“],”ngrams_url“:”https://api.openalex.org/works/W290283278/ngrams“,”abstract_inverted_index“:{”We“:[0],”describe“:[1],”Vicomtech“:[2],”参与“:[3],”in“:[4,39,59,92142157],”the“:[5,21,63,66,77,87109136143158],”WMT“:[6],”2018“:[7],”Shared“:[8],”Task“:[9],”on“:[10,48,86104135],”parallel“:[11,56113],”语料库“:[12,67144],“筛选.We”:[13],“目标”:[14],“到”:[15,20],“评估”:[16],“a”:[17,83,98],“简单“:[18152],”方法“:[19,47126],”任务“:[22,69],”其中“:[23,70],”可以“:[24,32],”高效“:[25],”过程“:[26],”大型“:[27139],”卷“:[28,73],”的“:[29,65,74,89111122138],”数据“:[30100],”和“:[31,43,52131153],”是“:[33],”容易“:[34],”部署“:[35],”用于“:[36,55],”新“:[37],”数据集“:[38140],”不同“:[40],”语言“:[41],”对“:[42115],”域。我们“:[44],”基于“:[45,85103],”我们的“:[46],”STACC“:[49],”an“:[50],”高效“:[51134],”可移植“:[53154],”方法“:[54,79102],”句子“:[57,93106114],”标识“:[58],”比较“:[60],”语料库。To“:[61],”address“:[62],”specifics“:[64],”filtering“:[68145],”features“:[71],”significant“:[72120],”noisic“:[75],”data“,”:[76],”core“:[78],”was“:[00],”expanded“:[81],”with“:+82,97108150],”pension“:[84],”amount“[88],”unknown“:[90],”words“:[91],”pairs。此外,“:[94],”我们“:[95],”试验“:[96],”补充“:[99],”饱和“:[101],”来源“:[105],”n克,“:[107],”目标“:[110],”降级“:[112],”that“:[116],”do“:[117],”not“:+118],”contribute“:/119],”amounts“:[121],”yet“:[123],”unobserved“:[124],”n-grams。我们的“:[125],”需要“:[127],”否“:[128],”优先“:[129],”训练“:[130],”是“:[132],”高度“:[133],”类型“:[137],”特色“:[141],”任务。我们“:[146],“实现”:[147],“竞争”:[148],“结果”:[149],“本”:[151],“方法”:[155],“排名”:[156],“顶端”:[159],“一半”:[160],“中间”:[161],“竞争力”:[162],“系统”:[163],“总体”。“:[164]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2902831278“,”counts_by_year“:[{”年份“:2019,”cited_by_count“:1},{”年“:2018,”cited_by_count”:1}],”更新日期“:”2024-06-01T04:02:02.970627“,”创建日期“:“2018-12-11”}