{“id”:“https://openalex.org/W4385439492“,”doi“:”https://doi.org/10.48550/arxiv.2307.15484“,”title“:”带条件扩散模型和语言模型的最小监督语音合成:语义编码的比较研究“,”display_name“:”带有条件扩散模型的最小监管语音合成和语言模型:语义编码对比研究“,“publication_year”:2023,“publiction_date”:“2023-01-01”,“ids“:{”openalex“:”https://openalex.org/W4385439492“,”doi“:”https://doi.org/10.48550/arxiv.2307.15484“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2307.15484“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2307.15484“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5028353824“,”display_name“:”Chunyu Qiang“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Qiang,Chunyue“,”raw _affiliation_strings“:],”afliations“:【】},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5019560977“,”display_name“:”郝丽“,”兽人“:”https://orcid.org/0000-0002-6294-6761“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”李,郝“,”raw_affiliation_strings“:[],“隶属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5029516423“,”display_name“:”郝妮“,”兽人“:”https://orcid.org/0000-0001-5485-4376“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Ni,Hao“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5007386098“,”display_name“:”弘毅区“,”兽人“:”https://orcid.org/0000-0003-3915-507X“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”曲,何“,”raw_affiliation_strings“:[],“隶属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5073918837“,”display_name“:”傅瑞波“,”orcid“:”https://orcid.org/0000-0001-9598--1881“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”傅瑞波“,”raw _ afiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5085142676“,”display_name“:”Tao Wang“,”orcid“:”https://orcid.org/0000-0003-0951-5476“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:Wang,Tao”,“raw_affiliation_strings”:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5050763764“,”display_name“:”龙标王“,”兽人“:”https://orcid.org/0000-0002-4005-5036“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”王,龙标“,”raw_affiation_strings“:[],”附属“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5017251198“,”display_name“:”健武党“,”兽人“:”https://orcid.org/0000-0002-9237-4821“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”党,建武“,”raw _ afiliation_strings“:[],“隶属关系”:[]}],“countries _ distinct _count”:0,“institutions _ disting _count“:0,”corresponding_author_ids“:[].,”correcponding_institution_ids:[]“apc_list”:null,“apc_payed”:null,“fwci”:null,“has_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:77},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9983,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9983,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.986,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.9726,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/end-to-end-speech-recognition(https://openalex.org/keywords/end-to-end-speech-recognition)“,”display_name“:”端到端语音识别“,”score“:0.547383},{”id“:”https://openalex.org/keywords/speech-enhancement网站“,”display_name“:”语音增强“,”score“:0.542146},{”id“:”https://openalex.org/keywords/audi-visual-speech-re认知“,”display_name“:”视听语音识别“,”score“:0.541975},{”id“:”https://openalex.org/keywords/统计语言建模“,”display_name“:”统计语言建模“,”score“:0.535166},{”id“:”https://openalex.org/keywords/speaker日记“,”display_name“:”Speaker Dialization“,”score“:0.529336}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198(网址:https://www.wikidata.org/wiki/Q21198)“,”display_name“:”计算机科学“,”level“:0,”score“:0.7778915},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.6040224},{”id“:”https://openalex.org/C159877910,“wikidata”:https://www.wikidata.org/wiki/Q2202883“,”display_name“:”自回归模型“,”level“:2,”score“:0.6007187},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.5905145},{”id“:”https://openalex.org/C101738243,“wikidata”:https://www.wikidata.org/wiki/Q786435“,”display_name“:”自动编码器“,”level“:3,”score“:0.5181593},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.462222},{”id“:”https://openalex.org/C174348530,“wikidata”:https://www.wikidata.org/wiki/Q188635“,”display_name“:”桥接(联网)“,”level“:2,”score“:0.41746885},{”id“:”https://openalex.org/C108583219,“wikidata”:https://www.wikidata.org/wiki/Q197536“,”display_name“:”深度学习“,”level“:2,”score“:0.19130203},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.11592159},{”id“:”https://openalex.org/C31258907,“wikidata”:https://www.wikidata.org/wiki/Q1301371网址“,”display_name“:”计算机网络“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C149782125,“wikidata”:https://www.wikidata.org/wiki/Q160039“,”display_name“:”Econometrics“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2307.15484“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2307.15484“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2307.15484“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”display_name“:”素质教育“,”score“:0.45,”id“:”https://metadata.un.org/sdg/4“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:0,”referrenced_works“:],”related_work斯“:[”https://openalex.org/W4297051394","https://openalex.org/W3131327266","https://openalex.org/W3013693939","https://openalex.org/W2909431601","https://openalex.org/W2803255133","https://openalex.org/W2752972570","https://openalex.org/W2734887215","https://openalex.org/W2566616303","https://openalex.org/W2159052453","https://openalex.org/W2145836866“],”ngrams_url“:”https://api.openalex.org/works/W4385439492/ngrams网站“,”“abstract_inverted_index”:{“最近,”:[0],“那里”:[1],“已经”:[2],“曾经”:[3],“a”:[4,95111122128132144155168203],“正在增长”:[5],“兴趣”:[6],“in”:[7,61],“文本到语音”:[8],“(TTS)”:[9],“方法”:[10,36,83197],“that”:[11153177194],“can”:[12],“be”:[13],“培训”:[14],“有”:[15205],“最低”:[16],“监督”:[17],“由”:[18,56],“组合“:[19],”两个“:[20,28],”类型“:[21],”of“:[22,47,72,9148172181],”离散“:[23,48],”语音“:[24,49],”表示“:[25],”和“:[26,44,64,68,98131186],”使用“:[27],”序列到序列“:[29],”任务“:[30],”到“:[311413559],”解耦“:[32],”TTS。“:[33],”“然而,”:[34],“现有”:[35,73182],“遭受”:[37],“来自”:[38],“三”:[39,81173],“问题:”:[40],“the”:[41,51,57,65107179188],“high”:[42],“dimensionality”:[43],“波形”:[45],“失真”:[46],“representations”:[50],“韵律”:[52162],“averaging”:[53],“problem”:[54],“导致”:[55],“持续时间”:[58156],“预测”:[59],“模型“:[60,97113158],“非自回归”:[62145169],“框架”,:[63],“信息”:[66],“冗余”:[67],“维度”:[69],“爆炸”:[70],“问题”:[71],“语义”:[74104183],“编码”:[75184],“方法”。“:[76200],”收件人“:[77],”地址“:[78],”这些“:[79],”问题“:[80],”渐进“:[82],”是“:[84],”建议的。“:[85],“第一,”:[86],“我们”:[87141165],“提议”:[88142166],“差异语言”:[89],“an”:[90],“自回归”:[91],“结构”:[92125146170],“组成”:[93147171],“语言”:[06],“扩散”:[99112150157174],“模型”:[100],“其中”:[101],“模式”:[102185],“嵌入”:[105],“到”:[106],“梅尔谱图”:[108],“基于”:[109126],“关于“:[110127],”实现“:[115160187],”更高“:[116],”音频“:[117206],”质量。“:[118],“我们”:[119201],“也”:[120],“介绍”:[121],“提示”:[123137],“编码器”:[124],“变分”:[129],“自动编码器”:%130],“韵律”:[133],“瓶颈”:[134],“改进”:[136],“表征”:[138],“能力”。“:[139],“Second,”:[140],“Tetra-Diff-Speech”:[143],“four”:[149],“model-based”:[151175],“modules”:[152176],“design”:%154],“diversity”:[161],“expressions”。“:[163],”最后,“:[164],”三种不同语言“:[167],”验证“:[178],”非必要性“:[180],”最佳“:[189],”结果。“:[190],”实验“:[191],”结果“:[192],”显示“:[193],”我们的“:[195],”建议“:[196],”跑赢大市“:[198],”基线“:[199],”提供“:[202],”网站“:[204],”样本。“:[207]},”引用_by_api_url“:”https://api.openalex.org/works?filter=cites:W4385439492“,”counts_by_year“:[],”updated_date“:”2024-06-21T03:43:33.017001“,”created_date:“2023-08-01”}“