{“id”:“https://openalex.org/W4386908184“,”doi“:”https://doi.org/10.48550/arxiv.2309.10668“,”title“:”语言建模是压缩“,”display_name“:”语言建模是压缩“,”publication_year“:2023,”publication_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4386908184“,”doi“:”https://doi.org/10.48550/arxiv.2309.10668“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2309.10668“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2309.10668“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5059962909“,”display_name“:”Gr\u00e9goire Del\u00e 9tang“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Del\u00 e9tang,Gr\u00 e 9goires“,”raw _affiliation_strings“:【】},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5077124139“,”display_name“:”Anian Ruoss“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Ruoss,Anian“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5059582849“,”display_name“:”Paul-Ambroise Duquenne“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false“,”raw_author_name“:”Duquene,Paul-Amberoise“,”raw_affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5020795308“,”display_name“:”Elliot Catt“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Catt,Elliot“,”raw _affiliation_string“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5013602545“,”display_name“:”Tim Genewein“,”orcid“:null},”institutions“:[],”countries“:[],”is_correresponsing“:false,”raw_author_name“:”Genewein,Tim“,”raw_affiation_strings“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5088656569“,”display_name“:”Christopher Mattern“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Mattern,Christophers“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5026686188“,”display_name“:”Jordi Grau-Moya“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Grau-Moa,Jordi“,”raw _affiliation_strings“:[/]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5017305728“,”display_name“:”Li Kevin Wenliang“,”orcid“:null}“,”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Wenlian,Li Keven“,“raw_affiliation_strings”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5005322233“,”display_name“:”Matthew Aitchison“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”Aitchison,Matthew“,”raw _affiliation_string“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5081226725“,”display_name“:”Laurent Orseau“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”oraw_affiliation_string“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5073944062“,”display_name“:”Marcus Hutter“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Hutter,Marcus“,”raw _affiliation_string“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A506070909021“,”display_name“:”Joel Veness“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Veness,Joel“,”raw _affiliation_string“:[]}],”countries _distict_count“:0,”instistictions_distiction_count“:零,”corresponding_author_ids“:[】,”correcponding_institution_ids:null,“has_fulltext”:false,“cited_by_count“:4,”cited_by_percentile_year“:{“min”:94,“max”:96},“biblio”:{”volume“:null,“issue”:null、“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.9965,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.9965,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9948,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10201“,”display_name“:”语音识别技术“,”score“:0.9781,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-modeling“,”display_name“:”语言建模“,”score“:0.598589},{”id“:”https://openalex.org/keywords/topic-modeling网站“,”display_name“:”Topic Modeling“,”score“:0.561565},{”id“:”https://openalex.org/keywords/统计语言建模“,”display_name“:”统计语言建模“,”score“:0.548174},{”id“:”https://openalex.org/keywords/word-representation网站“,”display_name“:”单词表示“,”score“:0.524552},{”id“:”https://openalex.org/keywords/aoustic-modeling“,”display_name“:”声学建模“,”score“:0.523843}],”concepts“:[{”id“:”https://openalex.org/C81081738,“wikidata”:https://www.wikidata.org/wiki/Q55542“,”display_name“:”无损压缩“,”level“:3,”score“:0.8020729},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.7609828},{”id“:”https://openalex.org/C165021410,“wikidata”:https://www.wikidata.org/wiki/Q55564“,”display_name“:”Lossy compression“,”level“:2,”score“:0.6327643},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.6162696},{”id“:”https://openalex.org/C131097465,“wikidata”:https://www.wikidata.org/wiki/Q178898“,”display_name“:”气体压缩机“,”level“:2,”score“:0.57322073},{”id“:”https://openalex.org/C180016635,“wikidata”:https://www.wikidata.org/wiki/Q2712821网址“,”display_name“:”压缩(物理)“,”level“:2,”score“:0.52188617},{”id“:”https://openalex.org/C2779343474,“wikidata”:https://www.wikidata.org/wiki/Q3109175“,”display_name“:”Context(考古学)“,”level“:2,”score“:0.49215835},{”id“:”https://openalex.org/C78548338,“wikidata”:https://www.wikidata.org/wiki/Q2493“,”display_name“:”数据压缩“,”level“:2,”score“:0.44330952},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.41613057},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.41087863},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.3992056},{”id“:”https://openalex.org/C28490314,“wikidata”:https://www.wikidata.org/wiki/Q189436“,”display_name“:”语音识别“,”level“:1,”score“:0.3451943},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.11381531},{”id“:”https://openalex.org/C78519656,“wikidata”:https://www.wikidata.org/wiki/Q101333“,”display_name“:”机械工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C151730666,“wikidata”:https://www.wikidata.org/wiki/Q7205“,”display_name“:”古生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C192562407,“wikidata”:https://www.wikidata.org/wiki/Q228736“,”display_name“:”材料科学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C159985019,“wikidata”:https://www.wikidata.org/wiki/Q181790“,”display_name“:”复合材料“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”Biology“,”level“:0,”score“:0.0}],”mesh“:[],”locations_count“:2,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2309.10668“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by(https://openalex.org/licenses/cc-by)“,”版本“:”提交版本“,”is_accepted“:false,”is_published“:false},{”is_oa“:false,”landing_page_url“:”https://api.datacite.org/dois/10.48550/arxiv.2309.10668“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2309.10668“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”display_name“:”素质教育“,”score“:0.82,”id“:”https://metadata.un.org/sdg/4“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:0,”referrenced_works“:],”related_work斯“:[”https://openalex.org/W755971114","https://openalex.org/W4313046148","https://openalex.org/W4247601675","https://openalex.org/W3180760233","https://openalex.org/W3035703949","https://openalex.org/W2547124190","https://openalex.org/W2385628723","https://openalex.org/W2118338613","https://openalex.org/W1982468865","https://openalex.org/W1970394887“],”ngrams_url“:”https://api.openalex.org/works/W4386908184/ngrams网站“,”“abstract_inverted_index”:{“It”:[0],“has”:[1,25],“long”:[2],“been”:[3],“established”:[4],“that”:[5,78,87137],“predictive”:[6,43],“models”:[7,40,81],“can”:[8],“be”:[9,49],“transformed”:[10],“into”:[11,94],“lossless”:%12],“compressors”:[13126],“and”:[14,31,67,67,86,98115],“vice”:[15],“reverse.”:[16],“顺便提一下”:[17],“in”:[18],“recent”:[19],“年,“:[20],”the“:[21,59,63,69,88138],”machine“:[22],”learning“:[23],”community“:[24],”focused“:[26],”on“:[27108],”training“:[28],”increased“:[29],”large“:[30,38,73,79],”powered“:[32,83],”self-pervised“:[3],”(language)“:[34],”models。“:[35,75],”自“:[36],”这些“:[37],”语言“:[39,80],”展览“:[41],”令人印象深刻“:[42],”能力“:[44],”他们“:[45],”是“:[46,82],”位置良好“:[47],”到“:[48113118143149],”强大“:[50],”压缩机。“:[51],“In”:[52],“this”:[53],“work”,:[54],“we”:55135],“advoriter”:[56],“for”:[57],“viewing”:[58],“predication”:[60],“problem”:[61],“through”:[62],“lens”:[64],“of”:[65,72120],“compression”:[66,70,89],“evaluation”:[68],“capabilities”:[71],“(foundation)”:[74],“we”:[76],“显示”:[77136],“通用”:[84],“预测值”:[85],“视点”:[90],“提供“:[91],“novel”:[92],“insights”:[93],“scaling”:[95],“laws”,“:[96],“tokenization”,“:[97],“in-context”:[99],“learning”。“:[100],”For“:[101],”example,“:[102],”Chinchilla“:/103],”70B“,”:[104],“while”:[105],“trained”:[106],“primary”:[107],“text,”:/109],“compresses”:[110],“ImageNet”:%11],“patches”:[112],“43.4%”:[114],“LibriSpeech”:[116],“samples”:[117],“16.4%”:[119],“their”:[121],“原始”:[122],“大小”:[123],“跳动”:[124],“特定域”:[125],“类似”:[127]巴布亚新几内亚“:[128],”(58.5%)“:[129],”或“:[130],”FLAC“:[131],“(30.3%),”:[132],“。“:[133],”最后,“:[134],”预测压缩“:[139],”等价“:[140],”允许“:[141],”我们“:[142],”使用“:[144],”任意“:[145],”压缩机“:[146],”(如“:[147],”gzip)“:[148],”构建“:[150],”a“:[151],”条件“:[152],”生成“:[153],”模型。“:[154]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4386908184“,”counts_by_year“:[{”年“:2024,”引用_by_count“:4}],”更新日期“:”2024-05-10T01:56:24.968311“,”创建日期“:“2023-09-21”}