{“id”:“https://openalex.org/W3096104971“,”doi“:”https://doi.org/10.21437/interseech.2020-2840“,”title“:”Scaling Up Online Speech Recognition Using ConvNets“,”display_name“:”使用ConvNet放大联机语音识别“,”publication_year“:2020,”publiation_date“:”2020-10-25“,”ids“:{”openalex“:”https://openalex.org/W3096104971“,”doi“:”https://doi.org/10.21437/interseech.2020-2840“,”mag“:”3096104971“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.21437/interseech.2020-2840“,”pdf_url“:null,”source“:nul,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“proceedings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”“oa_url”:“”https://arxiv.org/pdf/2001.09727“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5028944337网址“,”display_name“:”Vineel Pratap“,”orcid“:”https://orcid.org/00000-0003-3333-910X“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Vineel Pratap“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5012045783“,”display_name“:”Qiantong Xu“,”orcid“:”https://orcid.org/0000-0002-3998-4209“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Qiantong Xu“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5027275703“,”display_name“:”Jacob Kahn“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Jacob-Kahnhttps://openalex.org/A5087617906“,”display_name“:”Gilad Avidov“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Gilad-Avidovhttps://openalex.org/A5061907595“,”display_name“:”T.Likhomanenko“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Tatiana Likhoman nko“,”raw _affiliation_strings“:【】,”affiliations“:〔〕},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5087325198“,”display_name“:”Awni Hannun“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Awni-Hannunhttps://openalex.org/A5025751434“,”display_name“:”Vitaliy Liptchinsky“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Vitali Liptchinky“,“raw_affiliation_strings”:[]、“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“”https://openalex.org/A5041907084“,”display_name“:”Gabriel Synnaeve“,”orcid“:”https://orcid.org/0000-0003-1715-3356“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”Gabriel Synnaeve“,”raw_affiation_strings“:[],”附属“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5053915453“,”display_name“:”Ronan Collobert“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“;”Ronam Collobert”,“raw_affiliation_strings”:[]、“affiliations”:[]}]、“countries_distiction_count”:0,“institutions_distitionc_count“:0,”corresponding_author_ids“:[】,”coresponding_institution_ids“:null,”apc_payd“:null,”fwci“:2.173,”has_fulltext“:false,”cited_by_count“:21,”cited_by_percentile_year“:{”min“:94,”max“:95},”biblio“:{volume”:null、“issue”:null、“first_page”:null}、“last_page”:null},“is_retracted”:false、“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9992,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9992,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9982,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.998,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/end-to-end-speech-recognition(https://openalex.org/关键词/端到端语音识别)“,”display_name“:”端到端语音识别“,”score“:0.609178},{”id“:”https://openalex.org/keywords/audi-visual-speech-re认知“,”display_name“:”视听语音识别“,”score“:0.592489},{”id“:”https://openalex.org/keywords/automatic-speech-re认知“,”display_name“:”自动语音识别“,”score“:0.573357},{”id“:”https://openalex.org/keywords/environmental-sound-recognization网址“,”display_name“:”环境声音识别“,”score“:0.554978},{”id“:”https://openalex.org/keywords/speech-enhancement网站“,”display_name“:”语音增强“,”score“:0.537214}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7531237},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.65075624},{”id“:”https://openalex.org/C99844830,“wikidata”:https://www.wikidata.org/wiki/Q102441924“,”display_name“:”Scaling“,”level“:2,”score“:0.60152406},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.43700963},{”id“:”https://openalex.org/C91682802,“wikidata”:https://www.wikidata.org/wiki/Q620538“,”display_name“:”多维缩放“,”level“:2,”score“:0.43420964},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.36871862},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.3452219},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.19170499},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.06826252},{”id“:”https://openalex.org/C2524010,“wikidata”:https://www.wikidata.org/wiki/Q8087“,”display_name“:”Geometry“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.21437/interseech.2020-2840“,”pdf_url“:null,”source“:null,”license“:nully,”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url”:“https://arxiv.org/abs/2001.09727,“pdf_url”:https://arxiv.org/pdf/2001.09727,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2001.09727,“pdf_url”:https://arxiv.org/pdf/2001.09727,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[{”score“:0.47,”id“:”https://metadata.un.org/sdg/4“,”display_name“:”素质教育“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:0,”referrenced_works“:[],”related_work斯“:[”https://openalex.org/W4378770497","https://openalex.org/W4245539973","https://openalex.org/W4238212629","https://openalex.org/W4200285273","https://openalex.org/W305894733","https://openalex.org/W2374778813","https://openalex.org/W2314854132","https://openalex.org/W2049584446","https://openalex.org/W2012281976","https://openalex.org/W2003051771“],”ngrams_url“:”https://api.openalex.org/works/W3096104971/ngrams“,”abstract_inverted_index“:{”We“:[0,19],”design“:[1,86],”an“:[2],”online“:[3],”端到端“:[4],”语音“:[5],”识别“:[6],”system“:[7,40],”based“:[8101],”on“:[9102],”Time-Depth“:[10],”Separable“:[11],”(TDS)“:[12],”卷积“:[13],”and“:[14,32,59,93],“连接”:[15],“暂时”:[16],“分类”:[17],“(CTC)。”:[18],“改进”:[20],““:[21,29,45,68,71,82103],”核心“:[22],”TDS“:[23],”体系结构“:[24],”in“:[25],”order“:[26],”to“:[27,67],”limit“:[28],”future“:[30],”context“:[31],”因此“:[33],”reduce“:[3],”latency“:[35,58],”while“:[36,54],”维护“:[37],”准确性。“:[38],“The”:[39],“has”:[41],“almost”:[42],“three”:[43],“times”:44],“吞吐量”:[46],“of”:[47,70,84],“a”:[48,60],“well”:[49],“tunes”:[50100],“hybrid”:[51],“ASR”:[52],“baseline”:[53],“word”:[62],“error”:[63],“rate”。“:[64],”也是“:[65],”重要“:[66],”效率“:[69],”识别器“:[72],”是“:[73],”我们的“:[74,85],”高度“:[75],”优化“:[76],”波束“:[77],”搜索“:[78],”解码器。“:[79],”To“:[80],”show“:[81],”impact“:[83],”choices“,:[87],”we“:88],”analyze“:[89],”吞吐量“:[90],”延迟“:[91],”准确性“:[92],”discussion“:[94],”how“:95],”these“:[96],”metrics“:[97],”can“:[98],”be“:[99],”user“:[104],”requirements。“:[105]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W3096104971“,”counts_by_year“:[{“年”:2024,”cited_by_count“:1},{“年份”:2023,”ciped_by_cunt“:3},”{“年度”:2022,“cited_by_count”:2},“年份”:2021,”cited_by_count