{“id”:“https://openalex.org/W2902689991“,”doi“:”https://doi.org/10.18653/v1/w18-6323“,”title“:“使用数据选择方法提取神经机器翻译的域内训练语料库”,”display_name“:”使用数据选择法提取神经机器转换的域内培训语料库“,”publication_year“:2018,”publiation_date“:”2018-01-01“,”ids“:{”openalex“:”https://openalex.org/W2902689991“,”doi“:”https://doi.org/10.18653/v1/w18-6323“,”mag“:”2902689991“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6323,“pdf_url”:https://www.aclweb.org/antology/W18-6323.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”hybrid“,”oa_url“:”https://www.aclweb.org/antology/W18-6323.pdf“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5086498716“,”display_name“:”Catarina Cruz Silva“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I4210114793“,”display_name“:”Instituto Polit\u00e9cnico de Santar\u00e9m“,”ror“:”https://ror.org/02bbx2g30“,”country_code“:”PT“,”type“:“教育”,”世系“:[”https://openalex.org/I4210114793“]}],”国家“:[”PT“],”is_corresponding“:false,”raw_author_name“:”Catarina Cruz Silva“,”raw _affiliation_strings“:[“de Santar\u00e9m 67B,1000-286 Lisboa,Portugal”]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5063016307“,”display_name“:”Chao-Hong Liu“,”orcid“:”https://orcid.org/0000-0001-9048-4552},“机构”:[{“id”:https://openalex.org/I42934936“,”display_name“:”都柏林城市大学“,”ror“:”https://ror.org/04a1a1e81“,”country_code“:”IE“,”type“:“教育”,”世系“:[”https://openalex.org/I42934936“]}],”countries“:[”IE“],”is_corresponding“:false,”raw_author_name“:”Chao Hong Liu“,”raw_affiation_strings“:[”ADAPT Centre,School of Computing,Dublin City University Dublin 9,Ireland“]},{”author_position“:”middle“,”author“:”https://openalex.org/A5049646586“,”display_name“:”Alberto Poncelas“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I42934936“,”display_name“:”都柏林城市大学“,”ror“:”https://ror.org/04a1a1e81“,”country_code“:”IE“,”type“:“教育”,”世系“:[”https://openalex.org/I42934936“]}],”国家“:[”IE“],”is_corresponding“:false,”raw_author_name“:”Alberto Poncelas“,”raw _ afiliation_strings“:[“爱尔兰都柏林城市大学计算学院ADAPT中心”]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5055864641“,”display_name“:”Andy Way“,”orcid“:”https://orcid.org/0000-0001-5736-5930},“机构”:[{“id”:https://openalex.org/I42934936“,”display_name“:”都柏林城市大学“,”ror“:”https://ror.org/04a1a1e81“,”country_code“:”IE“,”type“:“教育”,”世系“:[”https://openalex.org/I42934936“]}],”国家“:[”IE“],”is_corresponding“:false,”raw_author_name“:”Andy Way“,”raw _affiliation_strings“:[“爱尔兰都柏林城市大学计算学院ADAPT中心”]}]“countries_distict_count”:2,”institutions_disticent_count“:2,“corresponding_author_ids”:[],”correspounding_institution_ids“:[]、”apc_list“:null,”apc_payed“:nul,”has_fulltext“:false,”cited_by_count“:21,”cited_by_percentile_year“:{”min“:92,”max“:93},”biblio“:{”volume“:null,”issue“:nul,”first_page“:null},“last_page”:null{,“is_retracted”:false、“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10181“,”display_name“:”统计机器翻译和自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译和自然语言处理“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9996,”subfield“:{”id“:”https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10601“,”display_name“:”手写识别和文本检测“,”score“:0.9481,”subfield“:{”id“:”https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/neural-machine-translation网站“,”display_name“:”神经机器翻译“,”score“:0.619448},{”id“:”https://openalex.org/keywords/machine翻译“,”display_name“:”机器翻译“,”score“:0.568832},{”id“:”https://openalex.org/keywords/statistical-machine-translation网站“,”display_name“:”统计机器翻译“,”score“:0.560306},{”id“:”https://openalex.org/keywords/多语言-神经-机器翻译“,”display_name“:”多语言神经机器翻译“,”score“:0.552963},{”id“:”https://openalex.org/keywords/document-image-analysis网站“,”display_name“:”文档图像分析“,”score“:0.525304}],”concepts“:[{”id“:”https://openalex.org/C203005215,“wikidata”:https://www.wikidata.org/wiki/Q79798“,”display_name“:”机器翻译“,”level“:2,”score“:0.8548715},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198(网址:https://www.wikidata.org/wiki/Q21198)“,”display_name“:”计算机科学“,”level“:0,”score“:0.8170901},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.6890063},{”id“:”https://openalex.org/C81917197,“wikidata”:https://www.wikidata.org/wiki/Q628760“,”display_name“:”Selection(genetic algorithm)“,”level“:2,”score“:0.55025077},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.54174787},{”id“:”https://openalex.org/C51632099,“wikidata”:https://www.wikidata.org/wiki/Q3985153“,”display_name“:”训练集“,”level“:2,”score“:0.53132695},{”id“:”https://openalex.org/C106301342,“wikidata”:https://www.wikidata.org/wiki/Q4117933“,”display_name“:”熵(时间箭头)“,”level“:2,”score“:0.52670985},{”id“:”https://openalex.org/C149364088,“wikidata”:https://www.wikidata.org/wiki/Q185917“,”display_name“:”Translation(biology)“,”level“:4,”score“:0.476779},{”id“:”https://openalex.org/C9679016,“wikidata”:https://www.wikidata.org/wiki/Q1417473“,”display_name“:”最大熵原理“,”level“:2,”score“:0.46801054},{”id“:”https://openalex.org/C148483581,“wikidata”:https://www.wikidata.org/wiki/Q446488“,”“display_name”“:”功能选择“,”级别“:2,”分数“:0.45424378},{”id“:”https://openalex.org/C67186912,“wikidata”:https://www.wikidata.org/wiki/Q367664“,”display_name“:”数据建模“,”level“:2,”score“:0.44350132},{”id“:”https://openalex.org/C50644808,“wikidata”:https://www.wikidata.org/wiki/Q192776“,”display_name“:”人工神经网络“,”level“:2,”score“:0.4127079},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.3978646},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.33763978},{”id“:”https://openalex.org/C124101348,“wikidata”:https://www.wikidata.org/wiki/Q172491“,”display_name“:”数据挖掘“,”level“:1,”score“:0.33373877},{”id“:”https://openalex.org/C55493867,“wikidata”:https://www.wikidata.org/wiki/Q7094“,”display_name“:”生物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C77088390,“wikidata”:https://www.wikidata.org/wiki/Q8513“,”display_name“:”数据库“,”级别“:1,”分数“:0.0},{”id“:”https://openalex.org/C105580179,“wikidata”:https://www.wikidata.org/wiki/Q188928“,”display_name“:”Messenger RNA“,”level“:3,”score“:0.0},{”id“:”https://openalex.org/C104317684,“wikidata”:https://www.wikidata.org/wiki/Q7187“,”display_name“:”Gene“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:2.”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6323,“pdf_url”:https://www.aclweb.org/antology/W18-6323.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},{”is_oa“:true,”landing_page_url“:”http://doras.dcu.ie/23338/,“pdf_url”:http://doras.dcu.ie/23338/1/Extrating_In-domain_Training_Data_for_Neural_Machine_Translation_Using_Data_Selection_Methods%5B1%5D.pdf,“源”:{“id”:https://openalex.org/S4306401512“,”“display_name”“:”都柏林城市大学开放存取机构知识库(都柏林城市学院)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”host_organization“:”https://openalex.org/I42934936“,”host_organization_name“:”都柏林城市大学“,”host_organization_lineage“:[”https://openalex.org/I42934936“],”host_organization_lineage_names“:[”都柏林城市大学“],“type”:“repository”},“license”:“cc-by-nc-sa”,“licence_id”:“https://openalex.org/licenses/cc-by-nc-sa“,”version“:”acceptedVersion“,”is_accepted“:true,”is_published“:false}],”best_oa_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.18653/v1/w18-6323,“pdf_url”:https://www.aclweb.org/antology/W18-6323.pdf“,”source“:null,”license“:”cc-by“,”licence_id“:”https://openalex.org/licenses/cc-by“,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[],”grants“:[],”datasets“:〔],”versions“:[〕,”referenced_works_count“:22,”reforenced_works“:[”https://openalex.org/W1905522558","https://openalex.org/W2075006521","https://openalex.org/W2101105183","https://openalex.org/W2101816610","https://openalex.org/W2117278770","https://openalex.org/W2123318312","https://openalex.org/W2134800885","https://openalex.org/W2147262247","https://openalex.org/W2149327368","https://openalex.org/W2218630638","https://openalex.org/W2470585229","https://openalex.org/W2572474373","https://openalex.org/W2594229957","https://openalex.org/W2623769564","https://openalex.org/W2741900445","https://openalex.org/W2766733559","https://openalex.org/W2962784628","https://openalex.org/W2963366389","https://openalex.org/W2963816901","https://openalex.org/W3084827186","https://openalex.org/W3208011254","https://openalex.org/W635530177“],”related_works“:[”https://openalex.org/W783305165","https://openalex.org/W4362495644","https://openalex.org/W4292794239","https://openalex.org/W4285877427","https://openalex.org/W4285322112","https://openalex.org/W3151736118","https://openalex.org/W3011059803","https://openalex.org/W2972060578","https://openalex.org/W2154124206","https://openalex.org/W1595744771“],”ngrams_url“:”https://api.openalex.org/works/W2902689991/ngrams“,”“abstract_inverted_index”:{“Data”:[0],“selection”:[1,65,78117],“is”:[2125],“a”:[3,8],“process”:[4],“used”:[5],“in”:[6],“selecting”:[7],“subset”:[9],“of”:[10,16,63],“parallel”:[11],“Data”:[12,64,77104116],“for”:[13,25,57,80112130],“the”6120123],“培训”:[15,26],“机器”:[17],“翻译”:[18],“(MT)”:[19],“系统,“:[20114],”so“:[21],”that“:[22,56111],”1)“:[23],”resources“:/24],”may“:[27],”be“:[28],”reduced“,”:[29],”2)“:[30],”trained“:[31,38,45],”models“:[32,46],”can“:[33],”performance“:[34],”better“:[35],”to“:[36],”these“:[37],”with“:[39101],“整体”:[41],“语料库”:[42],“和/或”:[43],“3)”:[44],“是”:[47],“更多”:[48],“定制”:[49],“到”:[50],“特定的“:[51],”域。它“:[52],”has“:[53],”been“:[54],”shown“:[55],”statistical“:[58],”MT“:[59,69],”(SMT),“:[60],”use“:[62],”helps“:[66],”improve“:[67],”performance“:[70],”significally“。在“:[71],“this”:[72],“study”:[73],“we”:[74],“reviewed”:[75],“three”:【76107】,“approachs”:【79】,“MT,”:【81】,“即:【82】,“Term”:【83】,“Frequency-Inverse”:【84】,“Document”:〔85〕,“Freequency”:【86】,“Cross-Entropy”:〔87〕,“Difference”:【88】,“and”:【89,93】,“Feature”:【90】,“衰退”:[91],“算法”:[92],“执行”:[94],“实验”:[95],“开启”:[96],“神经”:[97],“机器”:[98],“翻译”:[99],“(NMT)”:[100],“选定”:[103],“使用”:[105115],“方法。”:[108],“结果”:[109],“显示”:[110],“NMT”:[113],“也”:[118],“改进”:[119],“性能”:[121],“尽管”:[122],“增益”:[124],“不是”:[126],“如”:[127129],“很多”:[128],“SMT”:[131],“系统。”:[132]},“cited_by_api_url”:“https://api.openalex.org/works?filter=cites:W2902689991“,”counts_by_year“:[{“年”:2024,”cited_by_count“:1},{“年份”:2023,”ciped_by_cunt“:2},”{“年度”:2022,“cited_by_count”:3},“年份”:2021,”cited_by_count“,”创建日期“:”2018-12-11“}