{“id”:“https://openalex.org/W4292957667“,”doi“:”https://doi.org/10.48550/arxiv.2208.09596“,”title“:”Vision-Language Matching for Text-to-Image Synthesis via Generative Adversarial Networks“,”display_name“:”通过生成对手网络进行文本到图像合成的视觉语言匹配“,”publication_year“:2022,”publiction_date“:”2022-01-01“,”ids“:{”openalex“:”https://openalex.org/W4292957667“,”doi“:”https://doi.org/10.48550/arxiv.2208.09596“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2208.09596“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2208.09596“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5101178676“,”display_name“:”Qingrong Cheng“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Cheng,Qingron“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5004061050“,”display_name“:”Keyu Wen“,”orcid“:”https://orcid.org/0000-0002-5048-9014“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”温,科尤“,”raw _ afiliation_strings“:[],“从属关系”:[]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5101294804“,”display_name“:”Xiaodong Gu“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Gu,Xiaoding“,”raw _affiliation_strings“:[/],”affiliations“:【】}】,“countries_distiction_count”:0,“institutions_distition_count“:0,”corresponding_author_ids,“apc_payd”:空,“fwci“:0.0,”has_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”max“:65},”biblio“:{“volume”:null,”issue“:null”,“first_page”:null,“last_page”:null},“is_retracted”:false、“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9835,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9835,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10775“,”“display_name”:“图像处理中的生成对手网络”,“score”:0.9822,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10627“,”“display_name”:“图像特征检索与识别技术”,“score”:0.9761,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/feature-matching“,”display_name“:”功能匹配“,”score“:0.607643},{”id“:”https://openalex.org/keywords/texture-synthesis网站“,”display_name“:”纹理合成“,”score“:0.603297},{”id“:”https://openalex.org/keywords/image-synthesis网站“,”display_name“:”图像合成“,”score“:0.600768},{”id“:”https://openalex.org/keywords/visual-question-answering“,”display_name“:”可视问答“,”score“:0.589719},{”id“:”https://openalex.org/keywords/language-understanding“,”display_name“:”语言理解“,”score“:0.563981}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7517381},{”id“:”https://openalex.org/C2776436953,“wikidata”:https://www.wikidata.org/wiki/Q5163215(网址:https://www.wikidata.org/wiki/Q5163215)“,”display_name“:”一致性(知识库)“,”level“:2,”score“:0.73311216},{”id“:”https://openalex.org/C115961682,“wikidata”:https://www.wikidata.org/wiki/Q860623“,”display_name“:”Image(mathematics)“,”level“:2,”score“:0.61062014},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.601043},{”id“:”https://openalex.org/C165064840,“wikidata”:https://www.wikidata.org/wiki/Q1321061“,”display_name“:”Matching(statistics)“,”level“:2,”score“:0.5813676},{”id“:”https://openalex.org/C39890363,“wikidata”:https://www.wikidata.org/wiki/Q36108“,”display_name“:”生成语法“,”level“:2,”score“:0.50975484},{”id“:”https://openalex.org/C2989087649,“wikidata”:https://www.wikidata.org/wiki/Q176953“,”display_name“:”图像合成“,”level“:3,”score“:0.4313194},{”id“:”https://openalex.org/C2780980858,“wikidata”:https://www.wikidata.org/wiki/Q110022“,”display_name“:”Dual(语法数字)“,”level“:2,”score“:0.4243647},{”id“:”https://openalex.org/C184337299,“wikidata”:https://www.wikidata.org/wiki/Q1437428“,”display_name“:”语义(计算机科学)“,”level“:2,”score“:0.42163137},{”id“:”https://openalex.org/C176217482,“wikidata”:https://www.wikidata.org/wiki/Q860554“,”display_name“:”公制(单位)“,”级别“:2,”分数“:0.41704172},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.39913264},{”id“:”https://openalex.org/C31972630,“wikidata”:https://www.wikidata.org/wiki/Q844240“,”display_name“:”计算机视觉“,”level“:1,”score“:0.35917228},{”id“:”https://openalex.org/C23123220,“wikidata”:https://www.wikidata.org/wiki/Q816826“,”display_name“:”信息检索“,”level“:1,”score“:0.33971897},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.32047832},{”id“:”https://openalex.org/C41895202,“wikidata”:https://www.wikidata.org/wiki/Q8162“,”display_name“:”语言学“,”level“:1,”score“:0.110563785},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”Mathematics“,”level“:0,”score“:0.109847605},{”id“:”https://openalex.org/C105795698,“wikidata”:https://www.wikidata.org/wiki/Q12483“,”display_name“:”Statistics“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C21547014,“wikidata”:https://www.wikidata.org/wiki/Q1423657“,”display_name“:”操作管理“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C162324750,“wikidata”:https://www.wikidata.org/wiki/Q8134“,”display_name“:”经济学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2208.09596“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2208.09596“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2208.09596“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],”type“:”repository“},”license“:”other oa“,”license_id“:”https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W4390718435","https://openalex.org/W4390549206","https://openalex.org/W4383031710","https://openalex.org/W4366834432","https://openalex.org/W4297411772","https://openalex.org/W4237784285","https://openalex.org/W3165231707","https://openalex.org/W3137171911","https://openalex.org/W2380075625","https://openalex.org/W2374712251“],”ngrams_url“:”https://api.openalex.org/works/W4292957667/ngrams网站“,”abstract_inverted_index“:{”文本到图像“:[0],”合成“:[11412176207],”目标“:[2],”到“:[3,661126170204],”生成“:[4],”a“:[5,12,49,611041020128163],”照片逼真“:[6129],”和“:[7,31,39,71,86,99115130154191284122],”语义“:[8,772132186],”一致“:[9,993133],”图像“:[10,30,37,69,85,98147182190],“来自”:[11145],“具体”:[13105],“文本”:[14,32,89106],“描述。“:[15193],”The“:[16,74194224],”images“:[17],”synthed“:[18,97158189],”by“:[19],”off-The-shelf“:[20],”models“:[21],”commurly“:[22],”contain“:[23],”limited“:[24],“components”:[25],“compared”:[26],“with”:[27220],“The”:[28,36,40,68,83,87,96100136152157181185192233],“对应“:[29,88],”描述“,:[33,90107],”其中“:[34,59149177217],”减少“:[35],”质量“:[38,70183],”文本-视觉“:[41,80],”一致性。“:[42,73],“收件人”:[43],“地址”:[44],“此”:[45211],“问题”:[46],“我们”:[47161],“提议”:[48],“新颖”:[50],“视觉语言”:[51166],“匹配”:[52167],“策略”:[53200212],“用于”:[54140],“文本到图像”:[55141175206],“合成”:[56],“命名”:[57165],“VLMGAN*,”:[58],“介绍”:[60],“双重”:[62,75121196],“视觉语言“:[63,76122198],“匹配”:[64,77,81199],“机制”:[65,78],“强化”:[67],“考虑”:[79],“介于”:[82,95188],“生成”:[84],“视觉视觉”:[92],“约束”:[94],“真实”:[101],“图像”。“:[102134],“给定”:[103],“VLMGAN*”:[108],“第一”:[109],“编码”:[110],“它”:[111],“到”:[112],“文本”:[1131],“特征”:[114],“然后”:[116],“馈送”:[117],“它们”:[118],“基于匹配”:[123],“生成”:[124],“模型”:[125234],“综合”:[127],“此外”:[135],“流行”:[137215],“评估”:[138],“指标”:[139],“是”:[143218],“借用“:[144],”简单“:[146],”生成“:[148],”主要“:[150],”评估“:[151],”现实“:[153],”多样性“:[155],”of“:[156174],”图像。“:[159],”因此,“:[160],”引入“:[162],”度量“:[164],”分数“:[168],”(VLMS)“:[169],”评估“:[171],”性能“:[173],”可以“:[178201],”考虑“:[179],”两者“:[180],”一致性“:[187],”建议“:[195],”多级“:[197],”被“:[202],”应用“:[203],”其他“:[205239],”方法。“:[208241],”We“:[209],”implement“:[210],”on“:[213227],”two“:[214228],”baselines,“:[216],”marked“:[219],”${\\text{VLMGAN}(VLMGAN)_{+\\text{AttnGAN}}$“:[221],”${\\text{VLMGAN}(VLMGAN)_{+\\text{DFGAN}}$。“:[223],”实验“:[225],”结果“:[226],”广泛使用“:[229],”数据集“:[230],”显示“:[231],”该“:[232],”实现“:[235],”显著“:[236],”改进“:[237],”超过“:[238],”最新“:[240]},”引用_by_api_url“:”https://api.openalex.org/works?filter=cites:W4292957667“,”counts_by_year“:[],”updated_date“:”2024-07-13T14:44:20.054116“,”created_date:“2022-08-24”}“