{“id”:“https://openalex.org/W4389814425“,”doi“:”https://doi.org/10.48550/arxiv.2312.08553“,”title“:”USM-Lite:“Universal Speech Models语音识别的量化和稀疏感知微调”,“display_name”:“USM-Lite:Universal语音模型语音识别的定量和稀疏感知细化”,“publication_year”:2023,“publiation_date”:“2023-01-01”,“ids”:{“openalex”:“https://openalex.org/W4389814425“,”doi“:”https://doi.org/10.48550/arxiv.2312.08553“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2312.08553“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/312.08853“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5058886181“,”display_name“:”邵金鼎“,”兽人“:”https://orcid.org/00000-0002-2108-3111“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”丁,邵津“,”raw关联字符串“:[],“隶属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5105940239“,”display_name“:”Qiu David“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”David,Qiu“,“raw_affiliation_strings”:[]“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5092046744“,”display_name“:”David Rim“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Rim,David“,”raw _affiliation_strings“:],”affiliations“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5101319167“,”display_name“:”Yanzhang He“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”He,Yanzhong“,“raw_affiliation_strings”:[]“afliations”:[]},{“author_position”:“middle”,“author”:{“id”:“”https://openalex.org/A5070398306“,”display_name“:”Oleg Rybakov\u200e“,”orcid“:”https://orcid.org/0000-0003-4805-3083“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Rybakov,Oleg“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5100374360“,”display_name“:”Bo Li“,”orcid“:”https://orcid.org/0000-0001-6709-0942“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”李,波“,”raw_affiliation_strings“:[],“附属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5032640894“,”display_name“:”Rohit Prabhavalkar“,”orcid“:”https://orcid.org/0000-0001-5331-6058“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”Prabhavalkar,Rohit“,”raw_affiation_strings“:[],”附属“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5101432591“,”display_name“:”Weiran Wang“,”orcid“:”https://orcid.org/0009-0000-0843-707X“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Wang,Weiran“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5070513394“,”display_name“:”Tara N.Sainath“,”orcid“:”https://orcid.org/0000-0002-4126-6556“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Sainath,Tara N.“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5033596864“,”display_name“:”Shivani Agrawal“,”orcid“:null},”institutions“:[],”countries“:[],”is_correresponsing“:false,”raw_author_name“:”Agrawal,Shivani“,”raw_affiation_strings“:[],”affiliations“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5043621779“,”display_name“:”仲林汉“,”兽人“:”https://orcid.org/0000-0001-8795-7953“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”汉族,中林“,”raw _ afiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5100402391“,”display_name“:”李健“,”orcid“:”https://orcid.org/0000-0001-5335-9832“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”李,健“,”raw _ afiliation_strings“:[],“从属关系”:[]},{“author_position”:“last”,“author”:{“id”:“”https://openalex.org/A5070172290“,”display_name“:”Amir Yazdanbakhsh“,”orcid“:”https://orcid.org/0000-0001-8199-7671“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Yazdanbakhsh,Amir“,”raw_affiliation_strings“:[],“隶属关系”:[]}],“机构评估”:[]apc_payd“:null,”fwci“:null,”has_fulltext“:false,”cited_by_count“:0,”citation_normalized_percentile“:{”value“:0.0,”is_in_top_1_percent“:false},”cited_by_percentile_year“:{“min”:0,“max”:71},“biblio”:{“volume”:null,“issue”:null,“first_page”:nully,“last_page”:null},‘is_retracted’:false _主题“:{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9998,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9998,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9988,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.9957,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/aoustic-modeling“,”display_name“:”声学建模“,”score“:0.572365},{”id“:”https://openalex.org/keywords/end-to-end-speech-recognition(https://openalex.org/关键词/端到端语音识别)“,”display_name“:”端到端语音识别“,”score“:0.566285},{”id“:”https://openalex.org/keywords/automatic-speech-re认知“,”display_name“:”自动语音识别“,”score“:0.560496},{”id“:”https://openalex.org/keywords/audio-visual-speech-recognition(https://openalex.org/keywords/audio-visual-speech-recognition)“,”display_name“:”视听语音识别“,”score“:0.556175},{”id“:”https://openalex.org/keywords/speech-enhancement网站“,”display_name“:”语音增强“,”score“:0.532722},{”id“:”https://openalex.org/keywords/word-error-rate网站“,”display_name“:”字错误率“,”score“:0.42404187}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7394237},{”id“:”https://openalex.org/C28855332,“wikidata”:https://www.wikidata.org/wiki/Q198099“,”display_name“:”量化(信号处理)“,”level“:2,”score“:0.7057565},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.508887},{”id“:”https://openalex.org/C40969351,“wikidata”:https://www.wikidata.org/wiki/Q3516228“,”display_name“:”字错误率“,”level“:2,”score“:0.42404187},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.4123367}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2312.08553“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2312.08553“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2312.08553“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”score“:0.64,”id“:”https://metadata.un.org/sdg/16“,”display_name“:”和平、正义和强大的机构“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:0,”referrenced_works“:],”related_work斯“:[”https://openalex.org/W2547793174","https://openalex.org/W2544241817","https://openalex.org/W2309273277","https://openalex.org/W2132885390","https://openalex.org/W2132658536","https://openalex.org/W2070212102","https://openalex.org/W2061937230","https://openalex.org/W1769849273","https://openalex.org/W1574295218","https://openalex.org/W113247760“],”abstract_inverted_index“:{”端到端“:[0],”自动“:[1],”语音“:[2,18],”识别“:[3],”(ASR)“:[4],”模型“:[5,19],”have“:[6157],”seen“:[7],”革命性“:[8],“质量”:[9],“收益”:[10],”with“:[11,66,95],”the“:[12,3177,81117135160163180185],”recent“:[13],”开发”:[14],“of”:[15113119159165],“大规模”:[16102],“通用“:[17],”(USM)。“:[20],”“然而,”“:[21127],”部署“:[22],”这些“:[23],”大规模“:[24],”USM“:[25],”是“:[26,41],”极端“:[27],“昂贵”:[28],”到期“:[29],”到“:[30,46101113156],”巨大“:[32],”内存“:[33],”使用“:[34],”和“:[35,70,87124144182187],”计算“:[36],”成本。“:[37],”因此,“:[38],”模型“:[39,78,82155],”压缩“:[40130],”an“:[42],”重要“:[43],”研究“:[44],”主题“:[45],”适合“:[47],”基于USM“:[48],”ASR“:[49],”根据“:[50138],“预算”:[51],“in”:[52],“真实世界”:[53],“场景。“:[54],”In“:[55],”this“:[56],”study“:[57],”we“:58],”propose“:[59],”a“:[60,67,96101128],”USM“:[61,99],”微调“:[62],”approach“:/63],”for“:[64194],”ASR“:[65],”low bit“:[68],”量化“:[69123143],”N:M“:[11],”结构化“:[72],”spars城市:[73],“意识”:[74],“范式”:[75],“on”:[76100179184],“权重”,:[79],“减少”:[80],“复杂性“:[83],”来自“:[84],”参数“:[85,98],”精度“:[86],”矩阵“:[88],”拓扑“:[89],”透视图。“:[90],“我们”:[91174],“执行”:[92],“广泛”:[93],“实验”:[94],“20亿”:[97],“语音”:[103],“搜索”:[104],“数据集”:[105],“评估”:[107],“我方”:[108149],“建议”:[109150],“方法”。“:[110],“A”:[111],“系列”:[112],“消融”:[114],“研究”:[115],“验证”:[116],“有效性”:[118],“向上”:[120],“int4”:[122],“2:4”:%125],“稀疏性”。“:[126146],”single“:[129],”technology“:[131],”fails“:[132],”recover“:[134],”performance“:[136],”well“:[137],”extreme“:[139],”setup“:[140],”including“:[141],”int2“:[142],”1:4“:[145],”By“:%147],”contrast“:[148],”method“:[151],”can“:[152],”compress“:[153],”9.4%“:[158],”大小,“:[161],”at“:[162],”cost“:[164],”only“:[166],”7.3%“:[167],”relative“:[168],”单词“:[169],”错误“:[170],”速率“:[171],”(WER)“:[172],”回归。“:[173],”也“:[175],”提供“:[176],”深入“:[177],”分析“:[178],”结果“:[181],”讨论“:[183],”限制“:[186],”潜在“:[188],”解决方案“:[189],”其中“:[190],”将“:[191],”成为“:[192],”有价值“:[193],”未来“:[195],”研究。“:[196]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4389814425“,”counts_by_year“:[],”updated_date“:”2024-09-20T01:29:35.620436“,”created_date:“2023-12-16”}“