{“id”:“https://openalex.org/W4392120419“,”doi“:”https://doi.org/10.48550/arxiv.2402.14073“,”title“:”Improving Language Understanding from Screenshots“,”display_name“:”Improving Language Understanting from screenshot“,”publication_year“:2024,”publiation_date“:”2024-02-21“,”ids“:{”openalex“:”https://openalex.org/W4392120419“,”doi“:”https://doi.org/10.48550/arxiv.2402.14073“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2402.14073,“pdf_url”:https://arxiv.org/pdf/2402.14073,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”type“:”preprint“,”type_crossref“:“posted-content”,“indexed_in”:[”arxiv“],‘open_access’:{”is_oa“:true,”“oa_status”:“green”,“oa_url”:“https://arxiv.org/pdf/2402.14073“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”first“,”author“:{”id“:”https://openalex.org/A5033296587“,”display_name“:”天宇高“,”兽人“:”https://orcid.org/0009-0008-0357-7709“},”机构“:[],”国家“:[],”is_correresponsing“:false,”raw_author_name“:”Gao,Tianyu“,”raw_affiation_strings“:[]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5004072156“,”display_name“:”王子瑞“,”兽人“:”https://orcid.org/0000-0003-2547-4619“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Wang,Zirui“,”raw关联字符串“:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5076577141“,”display_name“:”Adithia Bhaskar“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Bhaskard,Adithia“,”raw _affiliation_string“:[]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5051064208“,”display_name“:”陈丹琪“,”orcid“:”https://orcid.org/0000-0002-6226-6838“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”陈丹奇“,”raw关联字符串“:[]}],”countries_distict_count“:0,”机构区分计数“:0,“cited_by_percentile_year“:{“min”:0,“max”:92},“biblio”:{卷:null,“问题”:nullhttps://openalex.org/T12031“,”display_name“:”口语系统对话行为建模“,”score“:0.6402,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T12031“,”display_name“:”口语系统的对话行为建模“,”score“:0.6402,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T13083“,”“display_name”:“从文本数据中自动提取关键字”,“score”:0.5923,“subfield”:{“id”:“https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T12720“,”“display_name”:“了解社交电视观看和交互”,“score”:0.574,“subfield”:{“id”:“https://openalex.org/subfields/3312“,”display_name“:”社会学与政治学“},”field“:{”id“:”https://openalex.org/fields/33“,”display_name“:”社会科学“},”域“:{”id“:”https://openalex.org/domains/2“,”display_name“:”社会科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/semantic-processing“,”display_name“:”语义处理“,”score“:0.544937},{”id“:”https://openalex.org/keywords/user-simulation网站“,”display_name“:”用户模拟“,”score“:0.524697},{”id“:”https://openalex.org/keywords/multimedia-synchronization网站“,”display_name“:”多媒体同步“,”score“:0.516891},{”id“:”https://openalex.org/keywords/natural-language-generate网站“,”display_name“:”自然语言生成“,”score“:0.511083},{”id“:”https://openalex.org/keywords/语言知识“,”display_name“:”语言知识“,”score“:0.504309}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.59662116},{”id“:”https://openalex.org/C2522767166,“wikidata”:https://www.wikidata.org/wiki/Q2374463“,”display_name“:”数据科学“,”level“:1,”score“:0.37442675},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.36096957},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”编程语言“,”level“:1,”score“:0.35480195}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2402.14073,“pdf_url”:https://arxiv.org/pdf/2402.14073,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2402.14073,“pdf_url”:https://arxiv.org/pdf/2402.14073,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[],“grants”:[]https://openalex.org/W4391913857","https://openalex.org/W2748952813","https://openalex.org/W2530322880","https://openalex.org/W2478288626","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890“],”ngrams_url“:”https://api.openalex.org/works/W4392120419/ngrams网站“,”“abstract_inverted_index”:{“An”:[0],“emerging”:[1],“family”:[2],“of”:[3,8,81,99141],“language”:[4,40,54],“models”:[5,37,52168],“(LMs),”:[6],“capable”:[7],“processing”:[9],“both”:[10,96],“text”:[11,79102],“and”:[12,30,73,94101114164192],“images”:[13],“within”“:[14103],”a“:[15,63,86],”单个“:[16],”可视“:[17131],”视图“:[18],”有:[19],“the”:[20,67,78175],“promise”:[21],“to”:[22,3515059196],“unlock”:[23],“complex”:[24],“tasks”:[25144],“such”:[26],“as”:[27,38117119],“chart”:[28],“understanding”:[29,55],“UI”:[31],“navigation”。“:[32],”我们“:[33,84105],”参考“:[34],”这些“:[36],”屏幕截图“:[39,46,82162176190],”型号。“:[41],”尽管“:[42],”他们的“:[43194],”上诉“:[44],”现有“:[45],”LMs“:[47163191],”实质上“:[48],”滞后“:[49],”落后“:[50],”纯文本“:[51],”on“:[53,76111138187],”任务。“:[56],“To”:[57],“close”:[58],“this”:[59],“gap”:[60],“we”:【61,74156179】,“accept”:【62】,“simplified”:【64】,“setting”:〔65】,“where”:66】,“model”:【68】,“inputs”:【69】,“are”:70】,“plaint-text-rendered”:[71],“screenshots”,“:【72】,“focus”:75】,“improving”:【77122】,“能力”:[80],“LMs。“:[83],”提议“:[85],”新颖“:[87],”补丁和文本“:[88],”预测“:[89],”(PTP)“:[90],”目标“:[91],”哪个“:[92],”掩码“:[93],”恢复“:[95],”图像“:[97],”补丁“:[98],”屏幕截图“:[100],”屏幕截图“。“:[104],”也“:[106],”行为“:[107],”广泛“:[108],”消融“:[109],”研究“:[110],”掩蔽“:[112],”速率“:[113],”贴片“:[115],”大小“:[116],”良好“:[118],”设计“:[120],”用于“:[121],”训练“:[123],”稳定性。“:[124],“我们的”:[125],“预训练”:[126],“模型”,:[127],“while”:[128],“单独”:[129],“接受”:[130],“输入”:[132],“实现”:[133],“可比”:[134],“性能”:[135],“with”:%136],“BERT”:[137],“6”:[139],“out”:[140],“8”:[142],“GLUE”:/143],“(within”:[145],“2%)“:[146],”提高“:[148],”上升“:[149],”8%“:[151],”超过“:[152],”优先“:[153],”工作“:[154],“此外,”:[155],“扩展”:[157],“PTP”:[158],“训练”:[160],“自回归”:[161],“演示”:[165],“其”:[166],“有效性--我们的”:[167],“可以”:[169183],“显著”:[170],“减少”:[171],“困惑”:[172],“通过”:[173],“利用”:[174],“上下文”:[177],“一起”:[178],“希望”:[180],“我们的”:[181],“发现”:[182],“启发”:[184],“未来”:[185],“研究”:[186],“开发”:[188],“强大”:[189],“扩展”:[193],“范围”:[195],“更广泛”:[197],“应用程序”:[198]},“引用_by_api_url”:“https://api.openalex.org/works?filter=cites:W4392120419“,”counts_by_year“:[],”updated_date“:”2024-05-17T20:57:58.108713“,”created_date:“2024-02-24”}“