{“id”:“https://openalex.org/W4396832027“,”doi“:”https://doi.org/10.1145/3613905.3650798“,”title“:”自动直方图:“利用语言模型进行文本数据集探索”,“display_name”:“自动直方表:利用语言模型探索文本数据集”,“publication_year”:2024,“publiation_date”:“2024-05-11”,“ids”:{“openalex”:“https://openalex.org/W4396832027“,”doi“:”https://doi.org/10.1145/3613905.3650798“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1145/3613905.3650798,“pdf_url”:https://dl.acm.org/doi/pdf/10.1145/3613905.3650798“,”source“:null,”license“:null,”licence_id“:nul,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”type“:”article“,”type_crossref“:“proceedings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:true,”oa_status“:”青铜色“,”oa_url“:”https://dl.acm.org/doi/pdf/10.1145/3613905.3650798“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5019880413“,”display_name“:”Emily Reif“,”orcid“:”https://orcid.org/0000-0003-3572-6234},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]}],”countries“:[”US“],”is_corresponding“:false,”raw_author_name“:”Emily Reif“,”raw _affiliation_strings“:【”谷歌研究,美国“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5043246682“,”display_name“:”Crystal Qian“,”orcid“:”https://orcid.org/0000-0001-7716-7245},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]}],”countries“:[”US“],”is_corresponding“:false,”raw_author_name“:”Crystal Qian“,”raw_affiation_strings“:[”Google Research,United States“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5081809692“,”display_name“:”James Wexler“,”orcid“:”https://orcid.org/0009-0006-8105-6998},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]}],”国家“:[”美国“],”is_corresponding“:false,”raw_author_name“:”James Wexler“,”raw关联字符串“:[“谷歌研究,美国”]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5042350842“,”display_name“:”Minsuk Kahng“,”orcid“:”https://orcid.org/0000-0002-0291-6026},“机构”:[{“id”:https://openalex.org/I1291425158“,”display_name“:”谷歌(美国)“,”错误“:”https://ror.org/00njsd438“,”country_code“:”US“,”type“:“company”,”lineage“:[”https://openalex.org/I1291425158","https://openalex.org/I4210128969“]}],”countries“:[”US“],”is_corresponding“:false,”raw_author_name“:”Minsuk Kahng“,”raw _affiliation_strings“:【”People+AI Research(PAIR),Google,United States“】}],“countries_distict_count”:1,“institutions_disticenc_count”:“1,”corresponding_author_ids“:[],”correcponding_institution_ids“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:91},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9993,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.9993,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10181“,”display_name“:”统计机器翻译与自然语言处理“,”score“:0.994,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11710“,”display_name“:”生物医学本体论和文本挖掘“,”score“:0.9888,”subfield“:{”id“:”https://openalex.org/subfields/1312“,”display_name“:”Molecular Biology“},”field“:{”id“:”https://openalex.org/fields/13“,”“display_name”:“生物化学、遗传学和分子生物学”},“域”:{“id”:“https://openalex.org/domains/1“,”display_name“:”生命科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-modeling“,”display_name“:”语言建模“,”score“:0.532614},{”id“:”https://openalex.org/keywords/topic建模“,”display_name“:”主题建模“,”score“:0.529227},{”id“:”https://openalex.org/keywords/named-entity-recognition网站“,”display_name“:”命名实体识别“,”score“:0.512167},{”id“:”https://openalex.org/keywords/text-mining“,”display_name“:”文本挖掘“,”score“:0.505649},{”id“:”https://openalex.org/keywords/natural-language-processing“,”display_name“:”自然语言处理“,”score“:0.504857}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.82366514},{”id“:”https://openalex.org/C2780554381,“wikidata”:https://www.wikidata.org/wiki/Q2063340“,”display_name“:”Sensemaking“,”level“:2,”score“:0.74452335},{”id“:”https://openalex.org/C9652623,“wikidata”:https://www.wikidata.org/wiki/Q190109“,”display_name“:”Field(mathematics)“,”level“:2,”score“:0.6071963},{”id“:”https://openalex.org/C36464697,“wikidata”:https://www.wikidata.org/wiki/Q41553“,”display_name“:”可视化“,”级别“:2,”分数“:0.58126503},{”id“:”https://openalex.org/C36503486,“wikidata”:https://www.wikidata.org/wiki/Q11235244“,”display_name“:”域(数学分析)“,”level“:2,”score“:0.57345074},{”id“:”https://openalex.org/C23123220,“wikidata”:https://www.wikidata.org/wiki/Q816826“,”display_name“:”信息检索“,”level“:1,”score“:0.5285006},{”id“:”https://openalex.org/C2522767166,“wikidata”:https://www.wikidata.org/wiki/Q2374463“,”display_name“:”数据科学“,”level“:1,”score“:0.52583325},{”id“:”https://openalex.org/C124101348,“wikidata”:https://www.wikidata.org/wiki/Q172491网址“,”display_name“:”数据挖掘“,”level“:1,”score“:0.27438802},{”id“:”https://openalex.org/C107457646,“wikidata”:https://www.wikidata.org/wiki/Q207434“,”display_name“:”Human\u2013计算机交互“,”level“:1,”score“:0.17956272},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C202444582,“wikidata”:https://www.wikidata.org/wiki/Q837863“,”display_name“:”纯粹数学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1145/3613905.3650798,“pdf_url”:https://dl.acm.org/doi/pdf/10.1145/3613905.3650798“,”source“:null,”license“:null,”licence_id“:nul,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true}],”best_oa_location“:{”is_oa“:true,”landing_page_url“:”https://doi.org/10.1145/3613905.3650798,“pdf_url”:https://dl.acm.org/doi/pdf/10.1145/3613905.3650798“,”source“:null,”license“:null,”license_id“:null,”version“:”publishedVersion“,”is_accepted“:true,”is_published“:true},”sustainable_development_goals“:[{”id“:”https://metadata.un.org/sdg/4“,”display_name“:”素质教育“,”score“:0.79}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:13,”referrenced_works“:[”https://openalex.org/W1544268587","https://openalex.org/W1880262756","https://openalex.org/W2087382273","https://openalex.org/W2465309725","https://openalex.org/W2576683119","https://openalex.org/W2997591727","https://openalex.org/W3118813946","https://openalex.org/W3212368439","https://openalex.org/W3213241618","https://openalex.org/W4237375617","https://openalex.org/W4283155630","https://openalex.org/W4378908626","https://openalex.org/W4389519061“],”related_works“:[”https://openalex.org/W3045759591","https://openalex.org/W3002559787","https://openalex.org/W2795557596","https://openalex.org/W2596767525","https://openalex.org/W2331546953","https://openalex.org/W2100609754","https://openalex.org/W2050640900","https://openalex.org/W2049050102","https://openalex.org/W2023412717","https://openalex.org/W1886987011“],”ngrams_url“:”https://api.openalex.org/works/W4396832027/ngrams“,”“abstract_inverted_index”:{“Making”:[0],“sense”:[1],“of”:[2,25109142157],“unstructured”:[3],“text”:[4],“dataset”:[5],“is”:[6,73],“perenually”:[7],“harouble”:[8,76],“yet”:[9],“increased”:[10],“related”:%11,36,92],“with”:[12115],“Large”:[13],“Language”:[14],”模型。“:[15],“数据”:[16],“从业者”:[17,64],“经常”:[18,65],“依赖”:[19],“关于“:[20],”数据集“:[21105],”摘要“:[22],”特别是“:[23],”分布“:[24],”各种“:[26],”派生“:[27],”特征。“:[28],”一些“:[29],”特征“:[30,94],”像“:[31],”毒性“:[32],”或“:[33,54,77],”主题“:[34],”是“:[35,44],”到“:[37101125128133153],”许多“:[38,41],”数据集“:[39],”但是“:[40],”有趣“:[42],”特性“:[43],”域“:[45],”特定:“:[46],”工具“:[47],“和”:[48,56,75,97137149],“流派”:[49],“代表”:[50,58,69106],“a“:[51,59,84112139],“音乐”:[52],“数据集”:[53,71],“疾病”:[55],“症状”:[57],“医学”:[60],“数据库”。“:[61],”相应地,“:[62],”数据“:[63117],”运行“:[66],”自定义“:[67],”分析“:[68],”每个“:[70],”其中“:[72],”繁琐“:[74],”使用“:[78130144],”无监督“:[79],”方法。“:[80],”We“:[81],”present“:[82],”AutoHistograms“:[83129],”visualization“:[85],”tool“:[86132148],”levering“:[87],”LLM。“:[88],“AutoHistograms”:[89],“automatically”:[90],“identifies”:[91],“entity-based”:[93],“visualizes”:[95],“them”,“:[96],“allows”:[98],“the”:[99104131154],“user”:[100113150],“interactively”:[102],“query”:[103],“new”:%107],“categories”:[108],“entries”。“:[110],”In“:[111],”研究“:[114151],”(n=10)“:[116],”从业者“:[118],”我们“:[119],”观察“:[120],”that“:[121],”参与者“:[122],”were“:[123],”able“:[124],”quickly“:[126],”boarboard“:[127],”identified“:[134],”actionable“:%135],”insights“:[136],”conceptualization“:[138],”broad“:[140],“范围”:[141],“适用”:[143],“案例”。“:[145],”Together“,”:[146],”this“:[147],”contribute“:[152],”growing“:[155],”field“:[156],”LLM-assisted“:[158],”sensemaking“:[159],”tools“。“:[160]},”cited_by_api_url“:”https://api.openalex.org/works?filter=引用:W4396832027“,”counts_by_year“:[],”updated_date“:”2024-06-04T16:51:18.385898“,”created_date:“2024-05-12”}“