{“id”:“https://openalex.org/W4379539789“,”doi“:”https://doi.org/10.48550/arxiv.2306.02697“,”title“:”Efficient GPT Model Pre-training using Tensor Train Matrix Representation“,”display_name“:”高效GPT模型预训练使用Tensor训练矩阵表示“,”publication_year“:2023,”publitation_date“:”2023-01-01“,”ids“:{”openalex“:”https://openalex.org/W4379539789“,”doi“:”https://doi.org/10.48550/arxiv.2306.02697“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2306.02697“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”type“:”preprint“,”type_crossref“:“posted-content”,”indexed_in“:[”arxiv“,”datacite“],”open_access“:{”is_oa“:true,”oa_status“:”green“,”oa_url“:”https://arxiv.org/abs/2306.02697“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5003655345“,”display_name“:”Viktoria Chekalina“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Chekalina,Viktoriia“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5009627524“,”display_name“:”G.E.Novikov“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Novikof,Georgii“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5034056852“,”display_name“:”Julia Gusak“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Gusak,Julia“,”raw _affiliation_strings“:]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5004111307“,”display_name“:”Ivan Oseledets“,”orcid“:”https://orcid.org/0000-0003-2071-2163“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Oseledets,Ivan“,”raw_affiliation_strings“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5026157285“,”display_name“:”Alexander Panchenko“,”orcid“:”https://orcid.org/0000-0001-6097-6118“},”机构“:[],”国家“:[',”is_corresponding“:false,”raw_author_name“:”Panchenko,Alexander“,”raw关联字符串“:[]}],”countries_distict_count“:0,”institutions_disticent_count“:0',”corresponding_author_ids“:[[],”correcponding_institution_ids 0,“cited_by_percentile_year“:{“min”:0,“max”:78},“biblio”:{卷:null,“问题”:nullhttps://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9874,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9874,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T13650“,”“display_name”:“使用Python进行科学计算和数据分析”,“score”:0.9715,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T13702“,”“display_name”:“医疗保健中的深度学习应用程序”,“score”:0.9326,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/topic-modeling网站“,”display_name“:”主题建模“,”score“:0.550723},{”id“:”https://openalex.org/keywords/prefective-modeling“,”display_name“:”预测建模“,”score“:0.515563},{”id“:”https://openalex.org/关键字/机器翻译“,”display_name“:”机器翻译“,”score“:0.512645},{”id“:”https://openalex.org/keywords/统计建模“,”display_name“:”统计建模“,”score“:0.511378},{”id“:”https://openalex.org/keywords/preained-models“,”display_name“:”预训练模型“,”score“:0.504882}],”concepts“:[{”id“:”https://openalex.org/C100279451,“wikidata”:https://www.wikidata.org/wiki/Q372193“,”display_name“:”困惑“,”level“:3,”score“:0.8937222},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.72984856},{”id“:”https://openalex.org/C66322947,“wikidata”:https://www.wikidata.org/wiki/Q11658“,”display_name“:”Transformer“,”level“:3,”score“:0.70293987},{”id“:”https://openalex.org/C170858558,“wikidata”:https://www.wikidata.org/wiki/Q1394144“,”display_name“:”自动摘要“,”level“:2,”score“:0.64248943},{”id“:”https://openalex.org/C137293760,“wikidata”:https://www.wikidata.org/wiki/Q3621696“,”display_name“:”语言模型“,”level“:2,”score“:0.5912186},{”id“:”https://openalex.org/C2776359362,“wikidata”:https://www.wikidata.org/wiki/Q2145286“,”display_name“:”Representation(politics)“,”level“:3,”score“:0.45509338},{”id“:”https://openalex.org/C155281189,“wikidata”:https://www.wikidata.org/wiki/Q3518150“,”display_name“:”张量(内在定义)“,”level“:2,”score“:0.4220891},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.39491516},{”id“:”https://openalex.org/C11413529,“wikidata”:https://www.wikidata.org/wiki/Q8366“,”display_name“:”Algorithm“,”level“:1,”score“:0.36285388},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”Mathematics“,”level“:0,”score“:0.12342444},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.10689637},{”id“:”https://openalex.org/C165801399,“wikidata”:https://www.wikidata.org/wiki/Q25428“,”display_name“:”Voltage“,”level“:2,”score“:0.08127469},{”id“:”https://openalex.org/C94625758,“wikidata”:https://www.wikidata.org/wiki/Q7163“,”display_name“:”政治“,”级别“:2,”分数“:0.0},{”id“:”https://openalex.org/C202444582,“wikidata”:https://www.wikidata.org/wiki/Q837863“,”display_name“:”纯数学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C119599485,“wikidata”:https://www.wikidata.org/wiki/Q43035“,”display_name“:”电气工程“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:3,”location“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2306.02697“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},{”is_oa“:true,”landing_page_url“:”http://arxiv.org/abs/2306.02697,“pdf_url”:http://arxiv.org/pdf/2306.02697,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},{“is_oa”:false,“landing_page_url”:“https://api.datacite.org/dois/10.448550/arxiv.2306.02697“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4393179698“,”display_name“:”DataCite API“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I4210145204“,”“host_organization_name”:“DataCite”,“host_organization_lineage”:[“https://openalex.org/I4210145204“],”host_organization_lineage_names“:[”DataCite“],“type”:“metadata”},“license”:null,“licence_id”:null,“version”:null}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2306.02697“,”pdf_url“:空,”源“:{”id“:”https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:“cc-by”,“licence_id”:“https://openalex.org/licenses/cc-by“,”version“:”submittedVersion“,”is_accepted“:false,”is_published“:false},”sustainable_development_goals“:[{”display_name“:”素质教育“,”score“:0.7,”id“:”https://metadata.un.org/sdg/4“}],”grants“:[],”datasets“:[],”versions“:[】,”referenced_works_count“:0,”referrenced_works“:],”related_work斯“:[”https://openalex.org/W4322096525","https://openalex.org/W4287826556","https://openalex.org/W4281893144","https://openalex.org/W3049463507","https://openalex.org/W3013624417","https://openalex.org/W2787311093","https://openalex.org/W2551914602","https://openalex.org/W2252095989","https://openalex.org/W2169518243","https://openalex.org/W2105076537“],”ngrams_url“:”https://api.openalex.org/works/W4379539789/ngrams网站“,”“abstract_inverted_index”:{“Large-scale”:[0],“transformer”:[1],“models”:[2,13],“have”:[3],“show”:[4],“notificate”:[5],“performance”:[6],“in”:[7,21,37],“language”:[8,98],“modeling”:[9],“tasks.”:[10],“Wheer”:[11],“such”:[12],“feature”:[14],45,71],“参数”,:[17,84],“前导”:[18],“到”:[19,81,89107119],“困难”:[20],“他们的”:[22],“部署”:[23],“和”:[24,59,68100],“禁止”:[25],“培训”:[26],“成本”:[27],“来自”:[28],“从无到有。“:[29],”To“:[30],”reduce“:[31],”the“:[32,35,38,43,49,63,69,86,90,94103108],”number“:[33],”parameters“:[36],”GPT-2“:[39110],”architecture“:[40],”we“:[C1,56],”replace“:[42],”Matrix“:[44],”fully-connected“:[46],”layers“:[C7115],”with“:48],”responsiver“:[50],”Tensor“:[51],“训练”:[52],“矩阵~(TTM)”:[53],“结构。“:[54],”最后,“:[55],”自定义“:[57],”向前“:[58],”向后“:[60],”操作“:[61],”通过“:[62],”基于TTM“:[64],”层“:[65],”用于“:[66],”简单性“:[67],”稳定性“:[70],”进一步“:[72],”培训。“:[73],“%”:[74],“The”:[75112],“resulting”:[76],“GPT-2-based”:[77],“model”:[78104],“stores”:[79],“up”:[80],“40%”:[82],“lesser”:[83],“showing”:[85],“fuzzity”:[87],“comparable”:[88],“original”:[91109],“model”。“:[92111],“开”:[93],“下游”:[95],“任务”:[96],“包括”:[97],“理解”:[99],“文本”:[101],“摘要”:[102],“执行”:[105],“类似”:[106],“建议”:[113],“张量”:[114],“可以”:[116],“是”:[117],“使用”:[118],“有效”:[120],“预培训”:[121],“其他”:[122],“变压器”“:[123],”模型。“:[124]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4379539789“,”counts_by_year“:[],”updated_date“:”2024-05-28T08:25:25.096594“,”created_date:“2023-06-07”}“