{“id”:“https://openalex.org/W2608377413“,”doi“:”https://doi.org/10.109/icpr.2016.7900072“,”title“:“使用基于深度神经网络的语音层次特征进行文本依赖性语音转换”,”display_name“:”使用基于深度神经元网络的语音层级特征进行文本依存性语音转换“,”publication_year“:2016,”publiation_date“:”2016-12-01“,”ids“:{”openalex“:”https://openalex.org/W2608377413“,”doi“:”https://doi.org/10.109/icpr.2016.7900072“,”mag“:”2608377413“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/icpr.2016.7900072“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5007825677“,”display_name“:”华帝正“,”兽人“:”https://orcid.org/0000-0003-1224-9885},“机构”:[{“id”:https://openalex.org/I14243506“,”display_name“:”香港理工大学“,”ror“:”https://ror.org/0030zas98“,”country_code“:”HK“,”type“:“教育”,”世系“:[”https://openalex.org/I14243506“]}],”国家“:[”香港“],”is_corresponding“:false,”raw_author_name“:”None Huadi Zheng“,”raw _affiliation_strings“:[“香港理工大学EIE系”],”affiliations“:[{”raw _affiliation_string“:”香港理工学院EIE系“,”institution_ids“:]”https://openalex.org/I14243506“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5025195497“,”display_name“:”魏成才“,”兽人“:”https://orcid.org/0000-0002-2195-0203},“机构”:[{“id”:https://openalex.org/I4210129003“,”display_name“:”SYSU-CMU国际联合研究所“,”ror“:”https://ror.org/02w30ae27“,”“country_code”“:”CN“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210129003“]},{”id“:”https://openalex.org/I157773358“,”display_name“:”中山大学“,”ror“:”https://ror.org/0064kty71“,”country_code“:”CN“,”type“:“教育”,”世系“:[”https://openalex.org/I157773358“]}],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”魏城蔡“,”raw _ afiliation_strings“:[“中山大学中大联合工程学院”],”affiliations“:[{”raw_ afiliation _string“:”中山大学中小联合工程学院“,”institution_ids“:[https://openalex.org/I4210129003","https://openalex.org/I157773358“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5081293290“,”display_name“:”周天炎“,”兽人“:”https://orcid.org/0000-0003-3238-2982},“机构”:[{“id”:https://openalex.org/I4210129003“,”display_name“:”SYSU-CMU国际联合研究院“,”ror“:”https://ror.org/02w30ae27“,”“country_code”“:”CN“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210129003“]},{”id“:”https://openalex.org/I157773358“,”display_name“:”中山大学“,”ror“:”https://ror.org/0064kty71“,”country_code“:”CN“,”type“:“教育”,”世系“:[”https://openalex.org/I157773358“]}],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”None Tianyan Zhou“,”raw _affiliation_strings“:[“中山大学中大联合工程学院”],”affiliations“:[{”raw _affiliation_string“:”中山大学中小联合工程学院“,”institution_ids“:[https://openalex.org/I4210129003","https://openalex.org/I157773358“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5023863527“,”display_name“:”张石磊“,”orcid“:”https://orcid.org/0009-0008-6755-7926},“机构”:[{“id”:https://openalex.org/I4210126794“,”display_name“:”IBM Research-中国“,”ror“:”https://ror.org/02yg1pf55“,”“country_code”“:”CN“,”type“:”facility“,”lineage“:[”https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126794“]}],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”None Shilei Zhang“,”raw _affiliation_strings“:[“IBM China Research语音技术与解决方案组”],”affiliations“:[{”raw _affiliation_string“:”IBM China Research语音科技与解决方案小组”,“institution_ids”:[“https://openalex.org/I4210126794“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5021384155“,”display_name“:”Ming Li“,”orcid“:”https://orcid.org/0000-0003-4527-4542},“机构”:[{“id”:https://openalex.org/I4210129003“,”display_name“:”SYSU-CMU国际联合研究院“,”ror“:”https://ror.org/02w30ae27“,”“country_code”“:”CN“,”type“:”facility“,”lineage“:[”https://openalex.org/I4210129003“]},{”id“:”https://openalex.org/I157773358“,”display_name“:”中山大学“,”ror“:”https://ror.org/0064kty71“,”country_code“:”CN“,”type“:“教育”,”世系“:[”https://openalex.org/I157773358“]}],”国家“:[”CN“],”is_corresponding“:false,”raw_author_name“:”Ming Li“,”raw _affiliation_strings“:[“中山大学中大联合工程学院”,“中大顺德国际联合研究院”],“affiliations”:[{“raw_affilition_string”:“中大顺德国际联合科研院”,“institution_ids”:[”https://openalex.org/I4210129003","https://openalex.org/I157773358“]},{”raw_affiliation_string“:”中山大学SYSU-CMU联合工程学院“,”institution_ids“:[]}]}],”countries_distiction_count“:2,”instistations_disticent_count”:4,”corresponding_author_ids”:[],“correspounding_institution_ids”:[],“apc_list”:null,“apc_payed”:null,“has_fulltext”:true,“fulltext_origin”:“ngrams”,“cited_by_”计数“:9,”cited_by_percentile_year“:{“min”:87,“max”:88},“biblio”:{卷:null,“问题”:nullhttps://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9949,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.9933,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/end-to-end-speech-recognition(https://openalex.org/关键词/端到端语音识别)“,”display_name“:”端到端语音识别“,”score“:0.527305},{”id“:”https://openalex.org/keywords/speaker验证“,”display_name“:”说话人验证“,”score“:0.526958},{”id“:”https://openalex.org/keywords/aoustic-modeling“,”display_name“:”声学建模“,”score“:0.525805},{”id“:”https://openalex.org/keywords/audi-visual-speech-re认知“,”display_name“:”视听语音识别“,”score“:0.515541},{”id“:”https://openalex.org/keywords/audio-event-detection(https://openalex.org/关键词/音频事件检测)“,”display_name“:”音频事件检测“,”score“:0.51342}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198(网址:https://www.wikidata.org/wiki/Q21198)“,”display_name“:”计算机科学“,”level“:0,”score“:0.8043139},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.73547417},{”id“:”https://openalex.org/C61224824,“wikidata”:https://www.wikidata.org/wiki/Q2260434“,”display_name“:”混合模型“,”level“:2,”score“:0.70361173},{”id“:”https://openalex.org/C2776401178,“wikidata”:https://www.wikidata.org/wiki/Q12050496“,”display_name“:”功能(语言学)“,”级别“:2,”分数“:0.57399136},{”id“:”https://openalex.org/C50644808,“wikidata”:https://www.wikidata.org/wiki/Q192776“,”display_name“:”人工神经网络“,”level“:2,”score“:0.55989665},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5486801},{”id“:”https://openalex.org/C133892786,“wikidata”:https://www.wikidata.org/wiki/Q1145189网址“,”display_name“:”说话人识别“,”level“:2,”score“:0.54663914},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.4770702},{”id“:”https://openalex.org/C69738355,“wikidata”:https://www.wikidata.org/wiki/Q1228929“,”display_name“:”线性判别分析“,”level“:2,”score“:0.47416058},{”id“:”https://openalex.org/C78397625,“wikidata”:https://www.wikidata.org/wiki/Q192487“,”display_name“:”Discriminant“,”level“:2,”score“:0.42828804},{”id“:”https://openalex.org/C61328038,“wikidata”:https://www.wikidata.org/wiki/Q3358061“,”display_name“:”语音处理“,”level“:2,”score“:0.4248011},{”id“:”https://openalex.org/C52622490,“wikidata”:https://www.wikidata.org/wiki/Q102626“,”display_name“:”特征提取“,”level“:2,”score“:0.41118962},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C41895202,“wikidata”:https://www.wikidata.org/wiki/Q8162“,”display_name“:”语言学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/icpr.2016.7900072“,”pdf_url“:null,”source“:nul,”license“:null:”license_id“:nulse,”version“:null,”is_accepted“:false,”is_published“:false}],”best_oa_location“:nuld,”sustainable_development_goals“:[{”display_name“:”减少不平等“,”score“:0.67,”id“:”https://metadata.un.org/sdg/10“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:22,”referrenced_works“:【”https://openalex.org/W1519698338","https://openalex.org/W1977362459","https://openalex.org/W2009674825","https://openalex.org/W2022125261","https://openalex.org/W2026704977","https://openalex.org/W2039057510","https://openalex.org/W2049686551","https://openalex.org/W2105160541","https://openalex.org/W2111550316","https://openalex.org/W2114543868","https://openalex.org/W2114659828","https://openalex.org/W2118850452","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2147768505","https://openalex.org/W2152974894","https://openalex.org/W2158069733","https://openalex.org/W2165712214","https://openalex.org/W2175575774","https://openalex.org/W2290689761","https://openalex.org/W330298975","https://openalex.org/W996208672“],”related_works“:[”https://openalex.org/W3147024994","https://openalex.org/W3021047493","https://openalex.org/W3008559849","https://openalex.org/W2374055396","https://openalex.org/W2362114017","https://openalex.org/W2350751952","https://openalex.org/W2063246903","https://openalex.org/W2021817983","https://openalex.org/W1999647744","https://openalex.org/W1978302214“],”ngrams_url“:”https://api.openalex.org/works/W260837413/ngrams“,”“abstract_inverted_index”:{“This”:[0],“paper”:[1],“presents”:[2],“a”:[3,47,67110127],“phonetically-ware”:[4139160],“joint”:[5],“density”:[6],“Gaussian”:[7],“mixed”:[8],“model”:[9],“(JD-GMM)”:[10],“framework”:[11],“for”:[12],“voice”:[13],“conversion”:[14,43,95],“that”:[15,29,49157],“no”:[16],“longer”:[17],“requires”:[18],“parallel”:[19]data“:[20],”from“:[21,59,85105],”source“:[22,86],”speaker“:[23,87118],”at“:[24,94],”the“:[25,30,42,60,70106132137146169173],”training“:[26151181],”stage。“:[27,96],”考虑“:[28],”语音“:[31,52,82,98],”级别“:[32],”特征“:[33,54,57,76,84,93100],”包含“:[34],”文本“:[35],”信息“:[36],”其中“:[37],”应该“:[38],”是“:[39124],”保留“:[40],”在“:[41115172],”任务“:[44],”我们“:[45,79],”提议“:[46],“方法”:[48140144162],“仅”:[50177],“连接”:[51],“discriminant“:[53,83,99],”and“:[55],”spectric“:[56,92],”extracted“:[58102],”same“:[61],”target“:[62,90178],”扬声器“:[63],”语音“:[64179],”to“:[65,88168],”train“:[66],”JD-GMM。“:[68],”After“:[69],”mapping“:[71],”relationship“:[72],”of“:[73109131175],”these“:[74],”two“:[75],”is“:[77],”trained“,”:[78],”can“:[80123163],”use“:[81],”estimate“:[89],”speaker's“:[91],”The“:[97153],”are“:[101],”using“:[103176],”PCA“:[104],”output“:[107],“层”:[108],“深”:[111],“神经”:[112],“网络”:[113],“(DNN)”:[114],“an”:[116],“自动“:[117],”识别“:[119],”(ASR)“:[120],”系统。“:[121],“It”:[122],“seen”:[125],“as”:[126180],“low”:[128],“dimensional”:[129],“representation”:[130],“senone”:%133],“posteriors”。“:[134],“我们”:[135],“比较”:[136],“提议”:[138159],“与”:[141],“常规”:[142170],“JD-GMM”:[143171],“on”:[145],“声音”:[147],“转换”:[148],“挑战”:[149],“2016”:[150],“数据库”。“:[152],”实验“:[154],”结果“:[155],”显示“:[156],”我们的“:[158],”特征“:[161],”获得“:[164],”相似“:[165],”性能“:[166],”比较“:[167],”案例“:[174],”数据。“:[182]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2608377413“,”counts_by_year“:[{年:2023,”cited_by_count“:2},{年“:2022,”cited_by_count”:1},“年”:2021,”citecd_by_count“:2%n,{”年“:2020,”citesd_by_count“:4}],”updated_date“:”2024-06-16T19:58:59.093195“,”created_dated“:”2017-05-05“}”