{“id”:“https://openalex.org/W4386076103“,”doi“:”https://doi.org/10.109/cvpr52729.2023.01016“,”title“:”音频驱动协同语言手势生成的缓和扩散模型“,”display_name“:”语音驱动协同语言姿势生成的缓和传播模型“,“publication_year”:2023,“publitation_date”:“2023-06-01”,“ids”:{“openalex”:“https://openalex.org/W4386076103“,”doi“:”https://doi.org/10.109/cvpr52729.2023.01016“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/cvpr52729.2023.01016“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5036062525“,”display_name“:”Ling Zhu“,”orcid“:”https://orcid.org/0000-0002-6678-8289},“机构”:[{“id”:https://openalex.org/I889458895“,”display_name“:”香港大学“,”ror“:”https://ror.org/02zhqgq86“,”country_code“:”HK“,”type“:“教育”,”世系“:[”https://openalex.org/I889458895“]}],”国家“:[”HK“],”is_corresponding“:false,”raw_author_name“:”Lingting Zhu“,”raw _affiliation_strings“:[“香港大学”],”affiliations“:[{”raw _affiliation_string“:”The University of Hong Kong“,”institution_ids“:]”https://openalex.org/I889458895“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5020051427“,”display_name“:”仙柳“,”兽人“:”https://orcid.org/0000-0001-7337-591X“},”机构“:[],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”Xian Liu“,”raw_affiliation_strings“:[“香港中文大学”],”affiliations“:[{”raw_affiliation_string“:”香港中文大学“,”institution_ids“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5078523903“,”display_name“:”刘轩宇“,”兽人“:”https://orcid.org/0000-0001-8916-9942},“机构”:[{“id”:https://openalex.org/I889458895“,”display_name“:”香港大学“,”ror“:”https://ror.org/02zhqgq86“,”country_code“:”HK“,”type“:“教育”,”世系“:[”https://openalex.org/I889458895“]}],”国家“:[”香港“],”is_corresponding“:false,”raw_author_name“:”刘轩宇“,”raw _ afiliation_strings“:[“香港大学”],”affiliations“:[{”raw_ afiliation _string“:”香港大学“,”institution_ids“:[https://openalex.org/I889458895“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5013171074“,”display_name“:”瑞曲“,”兽人“:”https://orcid.org/0000-0002-2716-6401“},”机构“:[],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”芮倩“,”raw _ afiliation_strings“:[“香港中文大学”],”附属机构“:[{”raw_ afiliation _string“:”香港中文大学“,”机构id“:[]}]},{”author_position“:”中间“,”author“:{”id“:”https://openalex.org/A5071432355“,”display_name“:”Ziwei Liu“,”orcid“:”https://orcid.org/0000-0002-4220-5958},“机构”:[{“id”:https://openalex.org/I172675005“,”display_name“:”南洋理工大学“,”ror“:”https://ror.org/02e7b5302“,”country_code“:”SG“,”type“:“教育”,”世系“:[”https://openalex.org/I172675005“]}],”国家“:[”SG“],”is_corresponding“:false,”raw_author_name“:”刘紫薇“,”raw _ afiliation_strings“:[“南洋理工大学S-Lab”],”affiliations“:[{”raw_ afiliation _string“:”南洋理工大S-Lab“,”institution_ids“:[”https://openalex.org/I172675005“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5012581106“,”display_name“:”乐泉鱼“,”兽人“:”https://orcid.org/0000-0002-9315-6527},“机构”:[{“id”:https://openalex.org/I889458895“,”display_name“:”香港大学“,”ror“:”https://ror.org/02zhqgq86“,”country_code“:”HK“,”type“:“教育”,”世系“:[”https://openalex.org/I889458895“]}],”国家“:[”香港“],”is_corresponding“:false,”raw_author_name“:”俞乐泉“,”raw _ afiliation_strings“:[“香港大学”],”affiliations“:[{”raw _affiliation_string“:”香港大学“,”institution_ids“:[https://openalex.org/I889458895“]}]}],”countries_distinct_count“:3,”institutions_disting_count”:2,”corresponding_author_ids“:[],”corresponding_institution_ids”:[]、“apc_list”:null,”apc_payed“:null、”fwci“:5.16,”has_fulltext“:false,”cited_by_count:7,“cited_by_percentile_year”:{“min”:96,”max“:97},”biblio“:{”volume“:nul,”issue“:null,“first_page”:空,“last_page”:空},“is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9978,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9978,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11349“,”display_name“:”交互式进化音乐系统和乐器“,”score“:0.9966,”subfield“:{”id“:”https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.9959,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/gesture-recognization网站“,”display_name“:”手势识别“,”score“:0.593115},{”id“:”https://openalex.org/keywords/audi-visual-speech-re认知“,”display_name“:”视听语音识别“,”score“:0.531092},{”id“:”https://openalex.org/keywords/audio-event-detection(https://openalex.org/关键词/音频事件检测)“,”display_name“:”音频事件检测“,”score“:0.525057}],”concepts“:[{”id“:”https://openalex.org/C207347870,“wikidata”:https://www.wikidata.org/wiki/Q371174“,”display_name“:”手势“,”等级“:2,”分数“:0.88501596},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.8313395},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.56739384},{”id“:”https://openalex.org/C159437735,“wikidata”:https://www.wikidata.org/wiki/Q1519524“,”display_name“:”手势识别“,”level“:3,”score“:0.43569565},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.41157043}],”mesh“:[],”locations_count“:1,”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/cvpr52729.2023.01016“,”pdf_url“:null,”source“:null,”license“:null,”license_id“:null,”version“:null,”is_accepted“:false,”is_published“:false}],”best_oa_location“:null,”sustainable_development_goals“:[{”score“:0.48,”id“:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的机构“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:40,”refernced_works“:[”https://openalex.org/W1915786104","https://openalex.org/W1969784320","https://openalex.org/W1974604838","https://openalex.org/W2007337857","https://openalex.org/W2008208299","https://openalex.org/W2008496867","https://openalex.org/W2023890289","https://openalex.org/W2024536104","https://openalex.org/W2052872069","https://openalex.org/W2962730651","https://openalex.org/W2962795401","https://openalex.org/W2967443589","https://openalex.org/W2982625143","https://openalex.org/W3009042479","https://openalex.org/W3036167779","https://openalex.org/W3083173864","https://openalex.org/W3098994456","https://openalex.org/W3110095664","https://openalex.org/W3110257065","https://openalex.org/W3115266783","https://openalex.org/W3162926177","https://openalex.org/W3181695292","https://openalex.org/W3194872882","https://openalex.org/W3198131199","https://openalex.org/W3204221554","https://openalex.org/W3210580323","https://openalex.org/W4206861281","https://openalex.org/W4221142137","https://openalex.org/W4224035735","https://openalex.org/W4226125322","https://openalex.org/W4226360073","https://openalex.org/W4230429791","https://openalex.org/W4281485151","https://openalex.org/W4288099666","https://openalex.org/W4301206121","https://openalex.org/W4303448003","https://openalex.org/W4310831393网址","https://openalex.org/W4312437946","https://openalex.org/W4312674262","https://openalex.org/W4319300158“],”related_works“:[”https://openalex.org/W4316659390","https://openalex.org/W4281626041","https://openalex.org/W2984615118","https://openalex.org/W2945648453","https://openalex.org/W2520877275","https://openalex.org/W2132774916","https://openalex.org/W2111894689","https://openalex.org/W2005997082","https://openalex.org/W1999635775","https://openalex.org/W1974379374“],”ngrams_url“:”https://api.openalex.org/works/W4386076103/ngrams“,”“abstract_inverted_index”:{“动画”:[0],“虚拟”:[1],“化身”:[2],“to”:[3,37,57,89102105118149],“make”:[4],“同声”:[5,71],“手势”:[6168],“便利”:[7],“各种”:[8],“应用程序”:[9],“in”:[10],“人机”:[11],“交互。”:[12],“The”:[13],“现有”:[14],”方法“:[15],”主要“:[16],”依赖“:[17],”依靠“:[18,82],”生成“:[19],”对抗“:[20],”网络“:[21],”(GAN)“:[22],”其中“:[23165],”通常“:[24],”遭受“:[25],“来自”:[26108136],“臭名昭著”:[27],“模式”:[28171],“崩溃”:[29],“和”:[30,64,87111154173],“不稳定”:[31],“训练”:[32],“因此”:[33],“制造”:[34],“it”:[35],“困难”:[36],“学习”:[38],“准确”:[39],“音频评估”:[40],“联合“:[41],”分配。“:[42],“In”:[43],“this”:[44],“work”,:[45],“we”:%46,75122143],“propose”:[47123],“a”:[48,95],“novel”:+49,96],“diffusion-based”:[50],“framework,”:[51],“named”:[22],“diffusion”:[53,97126],“Co-Speech”:[54],“Gesture”:[55127],“Diff Gesture),”:“[56],“effectively”:[58],“捕获”:[59],“the”:[60,78,91106113137],“cross-modal”:[61],“音频到手势“:[62],“关联”:[63],“保留”:[65],“时间”:[66115120],“一致性”:[67],“用于”:[68],“高保真”:[69],“音频驱动”:[70],“手势”:[72155],“生成”。“:[73],”具体来说,“:[74],”第一个“:[76],”建立“:[77],”扩散条件“:[79],”生成“:[80],”过程“:[81],”剪辑“:[83],”的“:[84140],”骨架“:[85],”序列“:[86],”音频“:[88175],”启用“:[90],”整体“:[92],”框架。99],“is”:[100178],“designed”:[101],“better”:[103170],“attent“:[104],”information“:[107],”multiple“:[109],”models“:[110],”模型“:[112],”长期“:[114],”依赖性。“:[116],”“此外,”:[117],“消除”:[119],“不一致”,:[121],“an”:[124130],“有效”:[125],“稳定器”:[128],“with”:[129169],“退火”:[131],“噪声”:[132],“采样”:[133],“策略”。“:[134],“受益”:[135],“建筑”:[138],“优势”:[139],“扩散”:[141],“模型”:[142],“进一步”:[144],“合并”:[145],“隐含”:[146],“无分类器”:[147],“指导”:[148],“贸易”:[150],“关”:[151],“中间”:[152],“多样性”:[153],“质量”。“:[156],“广泛”:[157],“实验”:[158],“演示”:[159],“那”:[160],“DiffGesture”:[161],“实现”:[162],“最先进”:[163],“性能”:[164],“呈现”:[166],“连贯”:[167],“覆盖”:[172],“更强”:[174],“相关性”。“:[176],”代码“:[177],”可用“:[179],”位于“:[180],”https://github.com/Advocate99/DiffGesture。“:[181]},”cited_by_api_url“:”https://api.openalex.org/works?filter=引用:W4386076103”,“counts_by_year”:[{“year”:2024,“cited_by_count”:3},{“year”:2023,“cited_by_count”:2}],“updated_date”:“2024-06-27T21:24:5539326”,“created_date”:“2023-08-23”}