{“id”:“https://openalex.org/W4223984749“,”doi“:”https://doi.org/10.48550/arxiv.2204.05738“,”title“:”Text-Driven Separation of Arbitrary Sounds“,”display_name“:”文本驱动的任意发音分离“,”publication_year“:2022,”publitation_date“:”2022-01-01“,”ids“:{”openalex“:”https://openalex.org/W4223984749“,”doi“:”https://doi.org/10.48550/arxiv.2204.05738“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2204.05738“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2204.05738“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5034910585“,”display_name“:”Kevin Kilgour“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Kilgor,Kevin“,“raw_affiliation_strings”:[]“,”affiliations“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5002559095“,”display_name“:”Beat Gfeller“,”orcid“:”https://orcid.org/0000-0002-1321-9015“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Gfeller,Beat“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5054290005“,”display_name“:”青青黄“,”兽人“:”https://orcid.org/0000-0002-0635-7479“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Huang,Qingqing“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5006451413“,”display_name“:”Aren Jansen“,”orcid“:”https://orcid.org/0009-0005-0800-8677“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:Jansen,Aren”,“raw_affiliation_strings”:[]、“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5053447215“,”display_name“:”Scott Wisdom“,”orcid“:”https://orcid.org/0000-0001-6671-1428“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Wisdom,Scott“,”raw _ afiliation_strings“:[],“affiliations”:[]},{“author_position”:“last”,“author”:{“id”:“https://openalex.org/A5033341878“,”display_name“:”Marco Tagliasacchi“,”orcid“:”https://orcid.org/0000-0002-7682-6795“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Tagliasacchi,Marco“,”raw _ afiliation_strings“:[],“隶属关系”:[]}],“countries _ distinct_count”:0,“institutions _ disting_count“:0,”corresponding_author_ids“:[】,”correcponding_institution_ids,“has_fulltext”:假,“cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:66},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10860“,”display_name“:”语音增强技术“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11309“,”display_name“:”音频信号分类与分析“,”score“:0.9994,”subfield“:{”id“:”https://openalex.org/subfields/1711“,”display_name“:”信号处理“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.997,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”Physical Sciences“}}],”keywords“:[{”id“:”https://openalex.org/keywords/source-separtition“,”display_name“:”源分离“,”score“:0.623289},{”id“:”https://openalex.org/keywords/audio-event-detection(https://openalex.org/关键词/音频事件检测)“,”display_name“:”音频事件检测“,”score“:0.594388},{”id“:”https://openalex.org/keywords/environmental-sound-recognization网址“,”display_name“:”环境声音识别“,”score“:0.584056},{”id“:”https://openalex.org/keywords/aoustic-modeling“,”display_name“:”声学建模“,”score“:0.572636},{”id“:”https://openalex.org/keywords/audio-visual-speech-recognition(https://openalex.org/keywords/audio-visual-speech-recognition)“,”display_name“:”视听语音识别“,”score“:0.563331}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7558602},{”id“:”https://openalex.org/C41608201,“wikidata”:https://www.wikidata.org/wiki/Q980509“,”display_name“:”Embedding“,”level“:2,”score“:0.7440517},{”id“:”https://openalex.org/C2776359362,“wikidata”:https://www.wikidata.org/wiki/Q2145286“,”display_name“:”Representation(politics)“,”level“:3,”score“:0.7142545},{”id“:”https://openalex.org/C2780226545,“wikidata”:https://www.wikidata.org/wiki/Q6888030“,”display_name“:”Modality(human\u2013 computer interaction)“,”level“:2,”score“:0.58989793},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.5848476},{”id“:”https://openalex.org/C2776864781,“wikidata”:https://www.wikidata.org/wiki/Q52617913“,”display_name“:”源分离“,”level“:2,”score“:0.5449381},{”id“:”https://openalex.org/C71139939,“wikidata”:https://www.wikidata.org/wiki/Q910194“,”display_name“:”Modal“,”level“:2,”score“:0.48841757},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.372289},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.33870852},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C94625758,“wikidata”:https://www.wikidata.org/wiki/Q7163“,”display_name“:”Politics“,”level“:2,”score“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C188027245,“wikidata”:https://www.wikidata.org/wiki/Q750446“,”display_name“:”聚合物化学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:3,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2204.05738“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”http://arxiv.org/abs/2204.05738“,”pdf_url“:”http://arxiv.org/pdf/2204.05738,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.48550/arxiv.2204.05738“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”is_core“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2204.05738“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is.in_doaj“:false,”is_core“:fase,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“other-oa”,“licence_id”:“https://openalex.org/licenses/other-oa网站“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[https://openalex.org/W73545470","https://openalex.org/W627697492","https://openalex.org/W2530972254","https://openalex.org/W2385859805","https://openalex.org/W2374430585","https://openalex.org/W2374013449","https://openalex.org/W2364381299","https://openalex.org/W2345479200","https://openalex.org/W2183306018网址","https://openalex.org/W2081900870“],”ngrams_url“:”https://api.openalex.org/works/W4223984749/ngrams网站“,”“abstract_inverted_index”:{“We”:[0132],“propose”:[1],“a”:[2,6,11,17,21,59,67,80],“method”:[3],“of”:[4,2511217151],“separing”:[5],“desired”:[7],“sound”:[8],“源”:[9,69],“from”:[10,83],“single channel”:[12],“mixture”:[13],“based”:[14,78],“on”:[15,79100123]130],“任意”:[16],“文本”:[18,52],“描述”:[19,53],“或”:[20],“简短”:[22],“audio”:[23,48,70],“sample”:[24],“the”:[26,55,84,92,96149],“target”:[27],“source.”:[28],“This”:[29],“is”:[30,41137],“reactived”:[31],“by”:[32,89],“combining”:[33],“two”:[34118],“distinct”:[35],“model.”:[36],“the”:[37,62],“first”:[38],“model”:[39,64],“发音词”:[40,90],“训练过的”:[42],“to”:[43,54,95],“联合”:[44],“嵌入”:[45],“两者”:[46],“an”:[47,73110],“clip”:[49,71],“and”:[50,75125142],“its”:[51],“same”:[56],“embedding”:[57],“in”:[58],“shared”:[60,85],“representation.”:[61],“second”:[C3],“SoundFilter”,“:[65],”takes“:[66],“mixed”:[68],“as”:[72],“input”:[74],“separtices”:[76],“it”:[77],“conditioning”:[81,97],“vector”:[82],“text-audio”:[86],“representation”:[87],“defined”:[88],“制造”:[91],“模型”:[93],“不可知论”:[94],“模态”:[98],“评估”:[99],“多重”:[101],“数据集”:[102],“我们”:[103],“显示”:[104134],“那”:[105135143],“我方”:[106144],“方法”:[107147],“可以”:[108],“实现”:[109],“SI-SDR”:[111],“9.1”:[113],“dB”:[1114127],“for”:[115],“mixture”:[116],“arbitral”:[119],“sounds”:[120],“when”:[12128],“条件”:[122129],“文本”:[124],“10.1”:[126],“音频”:[131],“同时”:[133],“声音词”:[136],“有效”:[138],“在”:[139],“学习”:[140],“共同嵌入”:[141],“多模态”:[145],“训练”:[146],“提高”:[148],“性能”:[150],“SoundFilter.”:[152]},“cited_by_api_url”:“https://api.openalex.org/works?filter=cites:W4223984749“,”counts_by_year“:[],”updated_date“:”2024-07-02T22:10:55.980817“,”created_date:“2022-04-19”}“