{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{“日期部分”:[[2024,6,25]],“日期时间”:“2024-06-25T05:13:36Z”,“时间戳”:1719292416736},“参考计数”:104,“发布者”:“IEEE”,“许可证”:[{“开始”:}“日期部分“:[2023,6,1]],”日期时间“:”2023-06-01T00:00:00 Z“,”timestamp“:1685577600000},”content-version“:“stm-asf”,“delay-in-days”:0,“URL”:“https:\\/doi.org\/10.15223\/policy-029”},{“start”:{“date-parts”:[[2023,6,1]],“date-time”:“2023-06-01T00:00:00Z”,“timestamp”:1685577600000},“content-version”:“stm-asf”、“delay-in-days“:0,”URL“https://doi.org\/10.152 23\/plicy-0323”7“}],”内容域“:{”域“:[],”交叉标记限制“:false},“short-container-title”:[],“published-print”:{“date-parts”:[[2023,6]]},“DOI”:“10.1109\/cvpr52729.2023.01399”,“type”:“proceedings-article”,“created”:{“date-parts”:[[2023,8,22]],“date-time”:“2023-08-2T17:30:52Z”,“timestamp”:1692725452000},”source“Crossref”,“is-referenced-by-count”:27,“title”:[“DropMAE:Masked Autoencoders with Spatial-Atention Dropout for Tracking Tasks”],“prefix”:“10.1109”,“author”:[{“given”:“Qianqiang”,“family”:“Wu”,“sequence”:“first”,“affiliation”:[}“name”:“香港城市大学,计算机科学系”}]},{“Givent”:“Tianyu”:“国际数字经济学院”}]},{“given”:“紫泉”,“family”:“Liu”,“sequence”:“additional”,“affiliation”:[{“name”:“香港城市大学计算机科学系”}]{,}“giving”:“Baoyuan”,“家庭”:“Wu”,”sequence“:”additional“,”affiliance“:[{”name“:“深圳香港中文大学数据科学学院”}]},{“given”:“Ying”,“family”:“Shan”,“sequence”:“additional”,“affiliation”:[{“name”:“Tencent AI Lab”}]},{“fivent”:“Antoni B.”,“家人”:“Chan”,“序列”:“附加”,“从属关系”:[[{”name“:“香港城市大学计算机科学系”}]],“member”:“263”,“reference”:[}”key“ref1”,“doi-asserted-by”:”publisher“,“doi”:“10.1109\/ICCV48922.2021.00175”},{“key”:“ref2”,“文章标题”:“Beit:Bert图像转换器的预训练”,“作者”:“Bao”,“年份”:“2021”,“期刊标题”:“arXiv”},{“key”:“ref3”,“doi断言者”:“出版商”,“doi”:“10.1007\/978-3-319-48881-3_56”},{“key”:“ref4”,“首页”:“6182”,“文章标题”:“Lean-ring判别模型预测跟踪”,“volume-title”:“ICCV”,“author”:“Bhat”,“year”:“2019”},{“key”:“ref7”,“article-title”:“非透视视觉特征学习的参数化实例分类”,“volume-title”:“NeurIPS”,“author”:“Cao”,“year”:“2020”},{“key”:“ref8”,“article-title“:”关于kinetics-600的简短注释“,”author“:”Carreira“,”year“:”2018“,”journal-title,“author”:“Carreira”,“year”:“2019”,“journal-title”:“arXiv”},{“key”:“ref10”,“article-title(文章标题):“Back-bone is all your needs:A simplified architecture for visual object tracking”,“volume-title“:”ECCV“,”author“:”Chen“,”year“:”2022:“ICML”,“author”:“Chen”,“year”:“2020”},{“key”:“ref12”,“doi-asserted-by”:“publisher”,”doi“:”10.1109\/ICCV48922.2021.00950“},”{“key”:”ref13“,”doi-assert-by“:”publisher“,”doi:“10.1109\/CVPR46437.2021.00803”}8-3-031-19815-1_37“},{“键”:“参考15”,“首页”:“11781”,“文章标题”:“重新思考具有改进内存覆盖率的时空网络,以实现高效的视频对象分割”,“volume-title”:“NeurIPS”,“author”:“Cheng”,“year”:“2021”},{“key”:“ref16”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR.2018.00774”}18英寸,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR42600.2020.00633”},{“key”:“ref19”,“doi-asserted-by”:”publisher“,”doi“:”10.1109\/CVPR.2017.733“},“key“:”ref20“,”doi-assert-by“:”publister“,”doi“:I“:”10.1007\/978-3-319-46454-1_29“},{”key“:”ref22“,”article-title“:“语言模型是少数学习者”,“volume-title”:“NAACL”,“author”:“Devlin”,“year”:“2019”},{“key”:“ref23”,“doi-asserted-by”:“publisher”,”doi“:”10.1007\/978-3030-01261-8_28“},}”key“:”ref24“,”article-title“:”一个图像值16\u00d716个单词:图像识别的变形金刚”,“volume-tittle”:”ICLR“,”author“:”Dosovitski y“,”年“:“2021”},{“key”:“ref25”,“first-page”:“766”,“article-title”:“卷积神经网络的非监督鉴别特征学习”,“volume-title“:”NeurIPS“,”author“:”Dosovitskiy“,”year“:”2014“},”{“密钥”:“ref26”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR46437.2021.00585”}by“:”publisher“,”doi“:“10.1007\/s11263-020-01387-y”},{“key”:“ref28”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR.2019.00552”}ofer“,”year“:”2022“,”journal-title“:”arXiv“},{“key”:“ref31”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/ICCV.2017.129”}key“:”ref34“,”doi-asserted-by“:“publisher”,“DOI”:“10.1109\/ICCV.2017.196”},{“key”:“ref35”,“DOI-asserted-by”:“publicher”,“DOI”:”10.1109\/CVPR42600.2020.00975“},}“key”:”ref36“,”DOI-assert-by“:”publisher“,TPAMI.2014.2345390“},{“key”:“ref38”,“DOI-asserted-by”:“publisher”,“DOI”:“10.1007\/978-3-030-01237-3_4”},{“key”:“ref39”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/TPAMI.2019.2957464”},{“key”:“ref40”,“article-title”:“The dynamics human action video dataset”,“author”:“Kay”,“year”:“2017”,“journal-title“:”arXiv“}”,{”key“:”ref41“,”doi-assert-by“:”publisher“,“doi:”“10.1109\/CVPR.2019.00441”},{“键”:“参考42”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR.2018.00935”},{“key”:“ref43”,“doo-asserted-by”:”publisher“,”doi“:”10.1609\/aaaai.v33i01.33016706“},”{“key”:”ref44“,”article-title“:”一个信息跟踪基准“,”author“:”Li“,“year”:“2021”,“journal-title”:“arXiv”}“,{”key“:”ref45“,”doi-asserted-by“:”publisher“,”doi“:“10.1007\/978-3-031-20077-9_17”},{“key”:“ref46”,“doi断言者”:“publisher”,“doi”:“10.1145\/324058.3240709”},{“key”:“ref47”,“doi断言者”:“publisher”,“doi”:“10.1109\/TITS.2021.3103601”},{“key”:“ref48”,“文章标题”:“Swintrack:变压器跟踪的简单而有力的基线”,“作者”:“Lin”,“年份”:“2021”,“期刊标题”:“ar Xiv“},{“key”:“ref49”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3-319-10602-1_48”},{“key”:”ref50“,”doi-assert-by“:”publisher“,”doi“:”10.1109\/CVPR52688.2022.00142“},”key“:”ref51“,”doi-asserted-by“doi-asserted-by“:”publisher“,”doi“:”10.1109\/CVPR42600.2020.00716“},{”key“:“ref53”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR.2017.515”},{“key”:“ref54”,“article-title”:“没有时间信息的Gool.ideo对象分段”,“volume-title“:”TPAMI“,“author”:“Maninis”,“year”:“2018”}、{“key”:”ref55“doi-sserted-by“:”publisher“,”doi“:”10.1109\/ICCV48922.2021.01319“},}”key“:”ref56“,”doi-asserted-by“:”publisher“,“DOI”:“10.1109\/TPAMI.20192901464”},{“key”:“ref57”,“DOI断言者”:“publisher”,“DOI”:“10.1007\/978-3-030-01246-5_19”},{“key”:“ref58”,“DOI断言者”:“publisher”,“DOI”:“10.1109\/CVPR.2016.465”},{“key”:“ref59”,“DOI断言者”:“publisher”,“DOI”:“10.1007\/978-3-319-46466-4_5”},{“key”:“ref60”,“DOI断言者”:“publisher”,“DOI”:“10.1109\/ICCV.2019.00932”},{“key”:“ref61”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3-031-20047-2_33”},{“key”:“ref64”,“article-title”:“2017年戴维斯对视频对象分割的挑战”,“作者”:“Pont-Tuset”,“年份”:“2017”,“新闻标题”:“arXiv”},{“key”:“ref65”,“article-title”:“从自然语言监督中学习可转换的视觉模型”,“volume-title“:“ICML”,“author”:“Radford”,“year”:“2021”},“author”:“Ridnik”,“year”:“2021”,“journal-title”:“arXiv”},{“key”:“ref67”,“doi-asserted-by”:“publisher”,”doi“:”10.1109 \/CVPR42600.2020.00743“},”{“key”:”ref68“,”doi-assert-by“:”publisher“,”doi:“10.1007 \/s11263-015-0816-y”}“,{”key“:”ref69“,”article-title“:”无监督视频学习使用lstms表示“,”volume-title“:”ICML“,”author“:“Srivastava”,“year”:“2015”},{“key”:“ref70”,“doi-asserted-by”:“publisher”,”doi“:“10.1109\/CVPR.2016.158”}tle“:“训练通过注意力提取数据效率高的图像变换器”,“volume-title”:“ICML”,“author”:“Touvron”,《年份》:“2021”},{“key”:“ref73”,“doi-asserted-by”:“publisher”,”doi“:”10.1109\/ICCV48922.2021.00114“},”{“key”:”ref74“,”doi-assert-by“:”publisher“,”doi:“10.1109\/CVPR42600.2020.00661”}“,{”key“:”ref75“,”article le-title“:“使用场景动态生成视频”,“volume-title”:“NeurIPS”,“author”:“Vondrick”,“year”:“2016”},{“key”:“ref76”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR46437.2021.00162”}“:”publisher“,”doi“:”10.1109\/CVPR.2018.00511“},{”key“:“ref79”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/CVPR46437.2021.01355”},{“key”:“ref80”,“doi-assertd-by”:“publisher”,“DI:”10.1109\/ICCV.2019.00408“},}“key:”ref81“,”article-title“:”不同的跟踪任务需要不同的外观模型吗?“,”volume-title”:“NeurIPS”,“author”:“Wang”,“year”:“2021”}、{“key”:“ref82”,“doi-asserted-by”:“publisher”,“DOI”:“10.1109\/ICME51207.2021.9428441”},{“key”:“ref83”,“DOI-asserted-by”:“publicher”,“DOI”:”10.1109\/CVPR46437.2021.00301“},}“key:”ref84“,”DOI-assert-by“:”publisher“,”DOI“:”10.1007\/978-3-030-20873-8_8“}、{“key”:”ref85“,”DOI-asserted-by“”:”publicher“,”DI:“10.1109”109\/TPAMI.2014.2388226“},{“key”:“ref86”,“DOI-asserted-by”:“publisher”,“DOI”:“10.1109\/CVPR.2018.00393”},{“key”:“ref87”,“DOI-asserted-by”:“publisher”,“DOI:”10.1109\/CVPR52688.2022.00855“},“key“:”ref88“,”DOI-assert-by“:”publisher“,”DOI“:”10.1109\/CVPR46437.2021.01641“}、{“key”:”ref89“,”首页“:”9653“,”article-title“:”Sim-mim:简单框架用于蒙版图像建模”,“volume-title”:“CVPR”,“author”:“Xie”,“年份”:“2022”},{“key”:“ref90”,“article-title”:“Youtube-vos:一个大规模视频对象分割基准”,“author”:“Xu”,“year”:“2018”,“journal-title“:”arXiv“},}”key“:”ref91“,”doi-asserted-by“:”publisher“,”doi“:”10.1007\/978-3-031-19803-8_43“}10.1109\/ICCV48922.2021.01028“},{“键”:“参考93”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3-030-01240-3_10”},{“key”:“ref94”,“doi-asserted-by”:”publisher“,”doi“:”10.1109\/CVPR42600.2020.00675,“文章标题”:“将对象与用于视频对象分割的变压器相关联”,“卷时间”:“NeurIPS”,“作者”:“Yang”,“年份”:“2021”},{“key”:“ref97”,“doi-asserted-by”:“publisher”,“doi”:“10.1007\/978-3-031-20047-2_20”}2“},{”键“:“ref99”,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/ICCV.2019.00411”},{“key”:“ref100”,“article-title”:“图像着色”,“volume-title“:”ECCV“,”author“:”Zhang“,”year“:”2016“},“key“:”ref101“,”doi-assert-by“:”publisher“,“doi-asserted-by”:“publisher”,“doi”:“10.1109\/ICCV48922.2021.01309”},{“key”:“ref103”,“article-title”:“用于实时视觉跟踪的更深入和更广泛的暹罗网络”,“volume-title“:”CVPR“,”author“:”Zhang“,”year“:”2017“},{“key”:”ref104“,”doi-asserted-by“:”publisher“,“doi”:“10.1007\/978-3030-5858589-1_46”}],“event”:{“name”:“2023 IEEE\/CVF Computer Vision and Pattern Recognition(CVPR)Conference”,“location”:“加拿大不列颠哥伦比亚省温哥华”,“start”:{“date-parts”:[[2023,6,17]]},“end”:{“date-parts”:[[2023,6,24]]}},”container-title“:[”2023 IEEE\/CVF Computer Vision and Pattern Recognition(CVPR)会议“],“original-title”:[],“link”:[{“URL”:“http://\xplorestaging.IEEE.org\/ielx7\/102030337\/10203050\/10203159.pdf?arnumber=10203159“,”内容类型“:“unspecified”,“content-version”:“vor”,“intended-application”:“similarity-checking”}],“deposed”:{“date-parts”:[[2024,3,1]],“date-time”:“2024-03-01T17:14:33Z”,“timestamp”:1709313273000},“score”:1,“resource”:{primary“:{”URL“https:\/\/ieeexplore.iee.org\/document\/10203159\/”}},标题“:[],”发布“:{“日期部分”:[[2023,6]]},“references-count”:104,“URL”:“http://\/dx.doi.org\/10.109\/cvpr52729.2023.01399”,“relation”:{},“subject”:[],“published”:{“date-parts”:[2023,6]]}}}