{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{“日期-部件”:[[2024,9,5]],“日期-时间”:“2024-09-05T13:53:40Z”,“时间戳”:1725544420740},“引用-计数”:53,“发布者”:“爱思唯尔BV”,“许可证”:[{“开始”:{-“日期-零件”:[[2021,6,1]],0:00Z“,”时间戳“:1622505600000},”内容-版本“:“tdm”,“delay-in-days”:0,“URL”:“https:\/\/www.elsevier.com//tdm\/userlicense\/1.0\/”},{“start”:{“date-parts”:[[2021,6,1]],“date-time”:“2021-06-01T00:00:00Z”,“timestamp”:1622505600000},“content-version”:“stm-asf”,“delay-in-days”:“0”,“URL“https:\\/doi.org\/1015223\/policy-017“},{“start”:{“date-parts”:[[2021,6,1]],“date-time”:“2021-06-01T00:00:00Z”,“timestamp”:1622505600000},“content-version”:“stm-asf”,“delay-in-days”:0,“URL”:“https:\/\/doi.org\/10.15223\/policy-037”},{“start”:{“date-parts”:[[2021,6,1]],“date-time”:“2021-06-01T00:00:00Z”,“timetamp”:622505600000},”content-versiion“:”stm-asf“,“delay-in-daies”:0、“URL”:“https:”\/\/doi.org\/10.15223\/policy-012“},{“start”:{“date-parts”:[[2021,6,1]],“date-time”:“2021-06-01T00:00:00Z”,“timestamp”:1622505600000},“content-version”:“stm-asf”,“delay-in-days”:0,“URL”:“https:\/\/doi.org\/10.15223\/policy-029”},{“start”:{“date-parts”:[[2021,6,1]],“datetime”:“2011-06-01T_00:00:0Z”,f“,”delay-in-days“:0,”URL“:”https:\/\/doi.org\/10.15223\/policy-004“}],“内容域”:{“域”:[“elsevier.com”,“sciencedirect.com”],“交叉标记限制”:true},“短容器标题”:[“模式识别字母”],“已发布的印刷品”:{“日期部分”:[[2021,6]]},“DOI”:“10.1016\/j.pare.2021.02.009”,“类型”:“期刊文章”,“创建的”:{“日期部分”:[[2021,2,16],“日期时间”:“2021-02-16T04:57Z”,“时间戳”:1613451437000},“page”:“70-76”,“update-policy”:”http://\/dx.doi.org\/10.1016\/elsevier_cm_policy“,”source“:”Crossref“,“is-referenced-by-count”:9,“special_numbering”:“C”,“title”:[“利用辅助图像描述进行密集视频字幕”],“prefix”:“10.1016”,”volume“:“146”,“author”:[{“给定”:“Emre”,“family”:“Boran”,”sequence“:”第一“,“affiliation”:[]},{“given”:“Aykut”,“family”:“Erdem”,“sequence”:“additional”,“afiliation”:[]},“sequence”:“additional”,“affiliation”:[]},{“given”:“Lucia”,“family”:“Specia”,“sequence”:“additional”,“affiliation”:[]}],“member”:“78”,“reference”:[{“issue”:“6”,“key”:“10.1016\/j.patrec.2021.009_bib0001”,“doi-asserted-by”:52“,”作者“:”Aafaq“,“year”:“2019”,“journal-title”:“ACM Compute.Surv.(CSUR)”},{“key”:“10.1016\/j.patrec.2021.009_bib0002”,“doi-asserted-by”:“crossref”,“first page”:”72347“,“doi”:“101109\/ACCES.2020.29878770”,“article-title“:”基于krawtchouk-tchebichef矩的快速时间视频分割“,”volume“:”8“,”author“:”Abdulhussain“,“年份”:“2020年”,“新闻标题”:“IEEE Access”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0003”,“series-title”:“2019年国际神经网络联合会议(IJCNN)”,“首页”:“1”,“文章-标题”:“图像和视频处理快速特征提取算法”,“作者”:“Abdulhussain”,“年份”:“199”}:“CVPR”,“首页”:“6077”,“文章标题”:“图像字幕和视觉问答自下而上的关注”,“作者”:“Anderson”,“年份”:“2018”},{“密钥”:“10.1016\/j.parec.20102.0009_bib0005”,“系列标题”:“CVPR”,“首页”:“961”,“文章标题”:“ActivityNet:人类活动理解的大型视频基准”,“author”:“Caba”,“year”:“2015”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0006”,“series-title”:“2017 IEEE计算机视觉与模式识别会议(CVPR)”,“首页”:“4724”,“article-title”:”Quo-vadis,动作识别?新模型和动力学数据集“,”author“:”Carreira“,”year“:”2017“}:“10.1016\/j.patrec.2021.02.009_bib0007”,“series-title”:“ICCV”,“首页”:“2970”,“article-title”:“通过条件GAN实现多样性和自然图像描述”,“author”:“Dai”,“year”:“2017”},{“key”::“Deng”,“year”:“2009”},{“key”:“10.1016\/j.patrec.2021.002.009_bib0009”,“series-title”:“统计机器翻译研讨会”,“首页”:“376”,“article-title”:”Meteor universal:任何目标语言的特定语言翻译评估“,“author”:“Denkowski”,“年份”:“2014”}、{“key”:”10.1016\/j.patarec.201.009_bib0010“,”series-ttle“:“EMNLP”,“首页”:“968”,“article-title”:“讲述社交媒体视频故事的数据集”,“author”:“Gella”,“year”:“2018”},{“key”:“10.1016\/j.patrec.2021.009_bib0011”,“series-title”:《NeurIPS》,“first-page”:“2672”,“article-title”:“Generative敌对网络”,“author”:“Goodfellor”,“year”:《2014》}:“10.1016\/j.patrec.2021.02.009_bib0012”,“series-title”:“ICCV”,“first page”:“2712”,“article-title”:”Youtube2text:使用语义层次和零快照识别识别和描述任意活动“,”author“:”Guadarrama“,”year“:”2013“},{”key“:”10.1016//j.patre.201.009_bib001“,”series-ttle“:”CVPR“,“first-page”:“6546”,“article-title”:“时空3D CNN能否追溯2DCNN和imagenet的历史?”,“author”:“Hara”,“year”:“2018”},{“key”:“10.1016\/j.patrec.2021.009_bib0014”,“series-title”:《CVPR》,“first page”:《770》,“artice-title》:“图像识别的深度剩余学习”,“author”:“He”,“年份”:“2016”}:“10.1016\/j.patrec.2021.02.009_bib0015”,“doi-asserted-by”:“crossref”,“first page”:“1735”,”doi“:”10.1162\/neco.1997.9.8.1735“,”article-title“:”长短期记忆“,”volume“:”9“,”author“:”Hochreiter“,”year“1997”,“journal-title”:“Neural Comput.”},{“key”:”10.1016\/j.paterec.2021.009_bip0016“,“连续时间”:“British Machine Vision Conference(BMVC)”,“article-title”:“更好地使用视听线索:使用双模变压器进行密集视频字幕”,“author”:“Iashin”,“year”:“2020”},{“key”:“10.1016\/j.patrec.2021.009_bib0017”,“series-title”:《CVPR Workshops》,“first page”:”:“958”,“article-title”:“Multi-modal密集视频字幕“,”author:“Iashin”,“year”:“2020”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0018”,“series-title”:“ACL”,“article-title”:”深度无序组合与文本分类的句法方法相竞争“,“author”:“Iyyer”,“year:”2015“},}“key:”10.1016\/j.patarec.201.009_bib001 9“,”series-ttle“:”ICLR“,”article-title“Adam:a method for randomic optimization”,“auth”:“Kingma”,“year”:“2015”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0020”,“series-title”:“ICCV”,“article-title”:”视频中的密集适应事件“,”author“:”Krishna“,”year“:”2017文本知识”,“作者”:“Krishnamoorthy”,“year”:“2013”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0022”,“series-title”:“ICML”,”first page“:”957“,”article-title“:”From word embeddings to document distances“,”author“:”Kusner“,”year“:”2015:“Mart:用于连贯视频段落标题的记忆增强递归变换器”,“author”:“Lei”,“year”:“2020”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0024”,“series-title”:“CVPR”,“first page”:”7492“,“article-title”:”联合定位和描述稠密视频标题事件“,”author“:”Li“,”year“:”2018“},”{“key”:“10.1016\/j.patrec.2021.02.009_bib0025”,“series-title”:“ICCV”,“首页”:“3362”,“article-title”:“视觉段落生成的递归主题转换GAN”,“作者”:“梁”,“年份”:“2017”},{“key”:”10.1016\/j.patarec.2021.009_bip0026“,”series-title“:”CVPR“,”首页“:”6790“,”article-title“:“参加并互动:视频理解的高阶对象互动”,“作者”:“Ma”,“年份”:“2018”},{“key”:“10.1016\/j.patrec.2021.0029_bib0027”,“series-title”:“CVPR”,《首页》:“6588”,“文章标题”:“流线型密集视频字幕”,“author”:“Mun”,“year”:“2019”}es-title“:”CVPR“,“first page”:“1029”,“article-title”:“视频表示的递阶递归神经编码器及其字幕应用”,“author”:“Pan”,“year”:“2016”},{“key”:”10.1016\/j.patrec.2021.009_bib0029“,“series-title”:”CVPR“,“first-page”:“4594”,“article-title”:“联合建模嵌入和翻译以桥接视频和语言”,“author”:“Pan”,“year”:“2016”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0030”,“series-title”:“CVPR”,”first page“:”6504“,”article-title“:”转移语义属性的视频字幕“,”author“:”Pan“,”year“:”2017“},”{“key”:”10.1016\/j.patarec.2021.002.009_bbb0031“,”series-ttle“:“ACL”,”首页“:”311“,文章标题“:“BLEU:自动评估机器翻译的方法”,“author”:“Papineni”,“year”:“2002”},{“key”:“10.1016\/j.patrec.2021.009_bib0032”,“series-title”:“CVPR”,“first page”:”6591“,”article-title“:”多段视频描述的对抗推理“,”author“:”Park“,”year“:”2019,“series-title”:“2018 IEEE口语技术研讨会(SLT)”,“首页”:“418”,“article-title”:“深度上下文:端到端上下文语音识别”,“作者”:“Pundak”,“年份”:“2018”},{“键”:“10.1016\/j.patrec.2021.009_bib0034”,“series-title“:”ICCV“,“首页面”:“433”,“article-titel”:“将视频内容转换为自然语言描述”,“作者”:“Rohrbach”,“年份”:“2013”},{“密钥”:“10.1016\/j.patrec.2021.02.009_bib0035”,“doi-asserted-by”:“crossref”,“首页”:“102754”,“doi”:“101016\/jvcir.2020.102754”,“author”:“Sasithradevi”,“year”:“2020”,“journal-title”:“J.Vis.Commun.Image Represents.”},{“key”:“10.1016\/J.patrec.2021.002.009_bib0036”,“series-title”:”ACL“,”first page“:”2556“,”article-title“:”概念性字幕:一个用于自动图像字幕的清理的、超名的图像alt-text数据集“,”author“:”Sharma“,”year“:”2018“},”{“key”:“10.1016\/j.patrec.2021.02.009_bib0037”,“series-title”:“ACM-MM”,“首页”:“1073”,“文章-标题”:“视频字幕生成的帧级和分段级特征和候选库评估”,“作者”:“Shetty”,“年份”:“2016”},{“key”:“10.116\/j-patrec.201.02.009_bib0088”,“系列-标题”:“ICCV”,“第一页”:”:“4135”,“论文-标题”:“说同一种语言:通过对抗性训练将机器字幕与人字幕匹配”,“作者”:“Shetty”,“年份”:“2017”},{“key”:“10.1016\/j.parec.20102.0009_bib0039”,“系列标题”:“ACL”,“首页”:“6382”,“文章标题”:“讲述教学视频中的密集过程字幕”,“作者”:“史”,“年份”:“2019”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0040”,“series-title”:“NeurIPS”,“首页”:“5998”,“article-title”:“注意就是你需要的”,“author”:“Vaswani”,“年份”:“2017”},{“key”:”10.1016\/j.patarec.201.009_bib0031“,”series-title“:”CVPR“,”首页“:”4566“,”article-title“CIDEr:基于共识的图像描述评估“,”作者“:”韦丹丹“,”年份“:“2015”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0042”,“series-title”:“ICCV”,“首页”:“4534”,“文章-标题”:“序列-视频-文本”,“作者”:“Venugopalan”,《年份》:“2015年”}:“展示、奖励和讲述:通过对抗性训练从照片流中自动生成叙事段落”,“作者”:“王”,“年份”:“2018”},{“关键”:“10.1016\/j.patrec.2021.002.009_bib0044”,“系列标题”:“CVPR”,“首页”:“7190”,“文章标题”:”双向关注融合,为密集视频字幕设置上下文门控“,”,“作家”:“王”,“年”:“2018”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0045”,“series-title”:“ECCV”,“首页”:“20”,“文章标题”:“时态段网络:走向深度行动识别的良好实践”,“作者”:“王”,“年份”:“2016”}“”:“通过分层强化学习进行视频字幕”,“author”:“Wang”,“year”:“2018”},{“key”:“10.1016\/j.patrec.2021.02.009_bib0047”,“series-title”:“ECCV”,“first page”:”468“,“article-title”:”Move forward and tell:a progressive generator of Video descriptions“,”author“:”Xiong“,”year“:”2018“},”{“密钥”:“101016\/j.patre.2021.009_bib 0048”,“series-title”:“WACV”,“first page”:“396”,“article-title”:”连续视频流中的联合事件检测和描述“,“author”:“Xu”,“year”:“2019”},{“key”:”10.1016\/j.patrec.2021.009_bib0049“,”series-tile“:”CVPR“,“first-page”:“4507”,“article-title”:“利用时间结构描述视频”,“au作者”:“Yao”,“年份”:“2015”}、{“key”:“10.1016\/j.patrec.2021.02.009_bib0050”,“series-title”:“CVPR”,“首页”:“4584”,“article-title”:“使用层次递归神经网络的视频段落标题”,“author”:“Yu”,“year”:“2016”},{“key”::“基于背景的视频字幕的时空注意模型”,“作者”:“Zanfir”,“年份”:“2016”},{“key”:“10.1016\/j.patrec.2021.002.009_bib0052”,“series-title”:“AAAI”,”article-title“:“从网络教学视频中自动学习程序”,“author”:“周”,“年”:“2018”}、{“key”::“CVPR”,“first page”:“8739”,“article-title”:“带屏蔽变压器的端到端密集视频字幕”,“author”:“Zhou”,“year”:“2018”}],“container-title“:[”Pattern Recognition Letters“],“original-tittle”:[],“language”:“en”,“link”:[{“URL”:“https:\/\/api.elsevier.com/content\/article\/PII:S0167865521000647?httpAccept=text\/xml”,“content-type”:“text\/xml”,“content-version”:“vor”,“预期应用程序”:“文本挖掘”},{“URL”:“https:\/\/api.elsevier.com/content\/article\/PII:S01678865521000647?httpAccept=text\/plain”,“内容类型”:“text\/plain”,“内容版本”:“vor”,“预期应用程序”:“文本挖掘”}],“存放”:{“日期部分”:[[2023,1,9]],“日期时间”:“2023-01-09T17:02:00Z”,“timestamp”:1673283720000},“score”:1,“resource”:{“primary”:{“URL”:“https:\/\/linkinghub.elsevier.com/retrieve\/pii\/S0167865521000647”}},”subtitle“:[],”shorttitle“:[],”issued“:{”date-parts“:[2021,6]},‘references-count’:53,”alternative-id“:[”S01678655021000647“],”URL“:”http://\/dx.doi.org \/10.1016 \/j.patrec.2021.02.009“,”关系“:{},”ISSN“:[“0167-8655”],“issn-type”:[{“value”:“0167-9655”,“type”:“print”}],“subject”:[],“published”:{“date-parts”:[[2021,6]]},“assertion”:[{“value”:“Elsevier”,“name”:“publisher”,“label”:“此文章由”}维护,{“value”:”利用辅助图像描述进行密集视频字幕“,”name“:”articletite“,”label“:”article Title“},{”value“:“Pattern Recognition Letters”,“name”:“journalttle”,“label”:“Journal Title”},{“value”:“https:\/\/doi.org\/101016\/j.patrec.2021.02.009”,“name”:“articlelink”,”label“:”CrossRef doi link to publisher maintained version“},”{“value”:“article”,“名称”:“content_type”,“标签”:“content-type”}、{“value”:”\u00a9 2021发布者Elsevier B.V.“,”name“:“copyright”,“label”:“版权”}]}}