{“id”:“https://openalex.org/W4394868117“,”doi“:”https://doi.org/10.48550/arxiv.2404.09705“,”title“:“通过视觉语言模型增强机器人解释能力:通过解释视觉输入改善人机交互的初步研究”,“display_name”:“通过视觉语言模型增强机器人解释能力:通过解释视觉输入改善人机交互的初步研究,“publication_year”:2024,“publiation_date”:“2024-04-15”,“ids”:{“openalex”:“https://openalex.org/W4394868117“,”doi“:”https://doi.org/10.48550/arxiv.2404.09705“},”language“:”en“,”primary_location“:{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2404.09705,“pdf_url”:https://arxiv.org/pdf/2404.09705,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”Cornell University“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”type“:”preprint“,”type_crossref“:“posted-content”,“indexed_in”:[”arxiv“],‘open_access’:{”is_oa“:true,”“oa_status”:“green”,“oa_url”:“https://arxiv.org/pdf/2404.09705“,”any_repository_has_fulltext“:true},”authorships“:[{”author_position“:”第一“,”作者“:{”id“:”https://openalex.org/A5057930985“,”display_name“:”David Sobr\u00edn-Hidalgo“,”orcid“:”https://orcid.org/0009-0005-7673-5921“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Sobr\u00edn-Hidalgo,David“,”raw _ afiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5070413874“,”display_name“:”Miguel\u00c1。Gonz\u00e1lez-Santamarta“,”兽人“:”https://orcid.org/0000-0002-7658-8600“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Gonz\u00e1lez-Satamarta,Miguel\u00c1ngel“,”raw_affiliation_strings“:[],“affiliations”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5031255947“,”display_name“:”\u00c1ngel Manuel Guerrero\u2010Higueras“,”orcid“:”https://orcid.org/0000-0001-8277-0700“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Guerrero-Higueras,\u00c1ngel Manuel“,”raw_affiliation_strings“:[],“从属关系”:[]},{“author_position”:“middle”,“author”:{“id”:“https://openalex.org/A5056235549“,”display_name“:”Francisco J.Rodr\u00edguez-Lera“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Rodr\u 00edgue_Lera,Francisco.Javier“,”raw _affiliation_strings“:],”affiliations“:【】},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5070790812“,”display_name“:”Vicente Matell\u00e1n Olivera“,”orcid“:”https://orcid.org/0000-0001-7844-9658“},”机构“:[],”国家“:[[],”is_corresponding“:false,”raw_author_name“:”Matell\u00e1n-Olivera,Vicente“,”raw _ affiliation_strings“:[]],”从属关系“:[[]}],”countries _ distinct_count“:0,”机构区分计数“:0 has_fulltext“:false,”cited_by_count“:0,”cited_by_percentile_year“:{”min“:0”,“max”:91},“biblio”:{“volume”:null,“issue”:nul,“first_page”:null,“last_page”:null},”is_retracted“:false,”is_paratext“:false,”primary_topic“:”{“id”:“https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9991,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T11714“,”“display_name”:“图像和视频中的可视问答”,“score”:0.9991,“subfield”:{“id”:“https://openalex.org/subfields/1707“,”display_name“:”计算机视觉和模式识别“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11307“,”display_name“:”转移学习和领域适应的进展“,”score“:0.9731,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10028“,”display_name“:”自然语言处理“,”score“:0.97,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”Artificial Intelligence“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/language-understanding(https://openalex.org/keywords/language-understanding)“,”display_name“:”语言理解“,”score“:0.58092},{”id“:”https://openalex.org/keywords/visual-question-answering“,”display_name“:”可视问答“,”score“:0.559663},{”id“:”https://openalex.org/keywords/visual-recognition(https://openalex.org/keywords/visual-recognition)“,”display_name“:”视觉识别“,”score“:0.535037},{”id“:”https://openalex.org/keywords/representation-learning网站“,”display_name“:”表征学习“,”score“:0.520036},{”id“:”https://openalex.org/keywords/semantic-reasoning网站“,”display_name“:”语义推理“,”score“:0.518411}],”concepts“:[{”id“:”https://openalex.org/C90509273,“wikidata”:https://www.wikidata.org/wiki/Q11012“,”display_name“:”Robot“,”level“:2,”score“:0.70019114},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.69268197},{”id“:”https://openalex.org/C2776650193,“wikidata”:https://www.wikidata.org/wiki/Q264661“,”display_name“:”障碍“,”level“:2,”score“:0.6750803},{”id“:”https://openalex.org/C2779343474,“wikidata”:https://www.wikidata.org/wiki/Q3109175“,”display_name“:”Context(考古学)“,”level“:2,”score“:0.5885929},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.5869377},{”id“:”https://openalex.org/C107457646,“wikidata”:https://www.wikidata.org/wiki/Q207434“,”display_name“:”Human\u2013计算机交互“,”level“:1,”score“:0.5806333},{”id“:”https://openalex.org/C527412718,“wikidata”:https://www.wikidata.org/wiki/Q855395“,”display_name“:”解释(哲学)“,”级别“:2,”分数“:0.53959644},{”id“:”https://openalex.org/C2780451532,“wikidata”:https://www.wikidata.org/wiki/Q759676“,”display_name“:”Task(project management)“,”level“:2,”score“:0.5323342},{”id“:”https://openalex.org/C195324797,“wikidata”:https://www.wikidata.org/wiki/Q33742“,”display_name“:”自然语言“,”level“:2,”score“:0.47656918},{”id“:”https://openalex.org/C6683253,“wikidata”:https://www.wikidata.org/wiki/Q7075535“,”display_name“:”避障“,”level“:4,”score“:0.46863958},{”id“:”https://openalex.org/C145460709,“wikidata”:https://www.wikidata.org/wiki/Q859951“,”display_name“:”Human\u2013robot interaction“,”level“:3,”score“:0.44698313},{”id“:”https://openalex.org/C2983448237,“wikidata”:https://www.wikidata.org/wiki/Q1078276“,”display_name“:”语言理解“,”level“:2,”score“:0.4131971},{”id“:”https://openalex.org/C31972630,“wikidata”:https://www.wikidata.org/wiki/Q844240“,”display_name“:”计算机视觉“,”level“:1,”score“:0.37235457},{”id“:”https://openalex.org/C204321447,“wikidata”:https://www.wikidata.org/wiki/Q30642“,”display_name“:”自然语言处理“,”level“:1,”score“:0.35475063},{”id“:”https://openalex.org/C19966478,“wikidata”:https://www.wikidata.org/wiki/Q4810574“,”display_name“:”Mobile robot“,”level“:3,”score“:0.30307958},{”id“:”https://openalex.org/C127413603,“wikidata”:https://www.wikidata.org/wiki/Q11023“,”display_name“:”Engineering“,”level“:0,”score“:0.16091976},{”id“:”https://openalex.org/C151730666,“wikidata”:https://www.wikidata.org/wiki/Q7205“,”display_name“:”古生物学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C201995342,“wikidata”:https://www.wikidata.org/wiki/Q682496“,”display_name“:”系统工程“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C17744445,“wikidata”:https://www.wikidata.org/wiki/Q36442“,”display_name“:”政治学“,”level“:0,”score“:0.0},{”id“:”https://openalex.org/C199539241,“wikidata”:https://www.wikidata.org/wiki/Q7748“,”display_name“:”Law“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C86803240,“wikidata”:https://www.wikidata.org/wiki/Q420“,”display_name“:”生物学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C199360897,“wikidata”:https://www.wikidata.org/wiki/Q9143“,”display_name“:”Programming language“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1,”locations“:[{”is_oa“:true,”landing_page_url“:”https://arxiv.org/abs/2404.09705,“pdf_url”:https://arxiv.org/pdf/2404.09705,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false}],“best_oa_location”:{“is_oa”:true,“landing_page_url”:“https://arxiv.org/abs/2404.09705,“pdf_url”:https://arxiv.org/pdf/2404.09705,“源”:{“id”:https://openalex.org/S4306400194“,”display_name“:”arXiv(康奈尔大学)“,”issn_l“:null,”issn“:null,”is_oa“:true,”is_ in_doaj“:false,”host_organization“:”https://openalex.org/I205783295“,”“host_organization_name”:“康奈尔大学”,“host_organization_lineage”:[“https://openalex.org/I205783295“],”host_organization_lineage_names“:[”康奈尔大学“],“type”:“repository”},“license”:null,“licence_id”:null,“version”:“submittedVersion”,“is_accepted”:false,“is_published”:false},”sustainable_development_goals“:[{”score“:0.53,”id“:”https://metadata.un.org/sdg/4“,”display_name“:”素质教育“}],”grants“:[],”datasets“:【】,”versions“:【],”referenced_works_count“:0,”referrenced_works“:[],”related_work斯“:[”https://openalex.org/W4391249562","https://openalex.org/W4253519380","https://openalex.org/W3043170174","https://openalex.org/W2930076404","https://openalex.org/W2782776446","https://openalex.org/W2596413128","https://openalex.org/W2357323510","https://openalex.org/W2356867392","https://openalex.org/W2155948905","https://openalex.org/W2071957557“],”ngrams_url“:”https://api.openalex.org/works/W4394868117/ngrams网站“,”“abstract_inverted_index”:{“This”:[0,68],“paper”:[1],“presents”:[2],“an”:[3],“improved”:[4],“system”:[5,27,56,90],“based”:【6],“on”:[7,91],“our”:【8,47117】],“for”:[15,71],“autonomous”:[16],“robot”:[17,98],“actions”:[18],“during”:[19],“人类机器人“:[20],“交互”:[21],“(HRI)。“:[22],”先前,“:[23],”我们“:[24,45],”开发“:[25],”a“:[26,92102],”that“:[28,74112],”used“:[29],”大型“:[30],”语言“:[31],”模型“:[32,52],”(LLM)“:[33],”解释“:[35],”日志“:[36,60,80],”和“:[37,81124],”生产“:[38],”自然“:[39],“语言”:[40],“解释。“:[41],”In“:[42],”this“:[43,88108],”study“:[44],”expand“:[46],”approach“:48],”by“:[49120],”incorporating“:[50],”Vision-Language“:[51],”(VLM)“:[53],”enable“:[54],”the“:[55,62,78,82,97126129],”analyze“:[58],”textal“:[59],”with“:/61],”added“:[63],”context“:[64],”of“:[65128],”visual“:[66114],”输入。“:[67],”方法“:[69],”允许“:[70],”生成“:[72],”组合“:[75],”数据“:[76],”来自“:[77107],”机器人“:[79],”图像“:[83],”它“:[84],”捕获。“:[85],”我们“:[86],”测试“:[87],”增强“:[89],”基本“:[93],”导航“:[94],”任务“:[95],”其中“:[96],”需要“:[99],”避免“:[101],”人类“:[103],”障碍。提供“:[104],“The”:[105],“findings”:[106],“prepartial”:[109],“study”:[110],“indicate”:[111],“adding”:[113],“interpretation”:[115],“improved”:[116],“system's”:[118],“excifically”:[121],“identifying”:[122],“barriers”:[123],“increating”:%125],“accuracy”:[127]。“:[131]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W4394868117“,”counts_by_year“:[],”updated_date“:”2024-06-19T17:16:44.661630“,”created_date:“2024-04-17”}“