Papers
- Back
Holocurtains: Programming Light Curtains via Binary Holography-
[pdf]
[supp]
[bibtex]@InProceedings{Chan_2022_CVPR,
  author    = {Chan, Dorian and Narasimhan, Srinivasa G. and O'Toole, Matthew},
  title     = {Holocurtains: Programming Light Curtains via Binary Holography},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17886--17895},
}
Learning Adaptive Warping for Real-World Rolling Shutter Correction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2022_CVPR,
  author    = {Cao, Mingdeng and Zhong, Zhihang and Wang, Jiahao and Zheng, Yinqiang and Yang, Yujiu},
  title     = {Learning Adaptive Warping for Real-World Rolling Shutter Correction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17785--17793},
}
Bongard-HOI: Benchmarking Few-Shot Visual Reasoning for Human-Object Interactions-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2022_CVPR,
  author    = {Jiang, Huaizu and Ma, Xiaojian and Nie, Weili and Yu, Zhiding and Zhu, Yuke and Anandkumar, Anima},
  title     = {{Bongard-HOI}: Benchmarking Few-Shot Visual Reasoning for Human-Object Interactions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19056--19065},
}
ZeroCap: Zero-Shot Image-to-Text Generation for Visual-Semantic Arithmetic-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tewel_2022_CVPR,
  author    = {Tewel, Yoad and Shalev, Yoav and Schwartz, Idan and Wolf, Lior},
  title     = {{ZeroCap}: Zero-Shot Image-to-Text Generation for Visual-Semantic Arithmetic},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17918--17928},
}
End-to-End Generative Pretraining for Multimodal Video Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Seo_2022_CVPR,
  author    = {Seo, Paul Hongsuck and Nagrani, Arsha and Arnab, Anurag and Schmid, Cordelia},
  title     = {End-to-End Generative Pretraining for Multimodal Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17959--17968},
}
Stochastic Trajectory Prediction via Motion Indeterminacy Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2022_CVPR,
  author    = {Gu, Tianpei and Chen, Guangyi and Li, Junlong and Lin, Chunze and Rao, Yongming and Zhou, Jie and Lu, Jiwen},
  title     = {Stochastic Trajectory Prediction via Motion Indeterminacy Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17113--17122},
}
Cross-Modal Clinical Graph Transformer for Ophthalmic Report Generation-
[pdf]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Mingjie and Cai, Wenjia and Verspoor, Karin and Pan, Shirui and Liang, Xiaodan and Chang, Xiaojun},
  title     = {Cross-Modal Clinical Graph Transformer for Ophthalmic Report Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20656--20665},
}
Human-Object Interaction Detection via Disentangled Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Desen and Liu, Zhichao and Wang, Jian and Wang, Leshan and Hu, Tao and Ding, Errui and Wang, Jingdong},
  title     = {Human-Object Interaction Detection via Disentangled Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19568--19577},
}
CVF-SID: Cyclic Multi-Variate Function for Self-Supervised Image Denoising by Disentangling Noise From Image-
[pdf]
[supp]
[bibtex]@InProceedings{Neshatavar_2022_CVPR,
  author    = {Neshatavar, Reyhaneh and Yavartanoo, Mohsen and Son, Sanghyun and Lee, Kyoung Mu},
  title     = {{CVF-SID}: Cyclic Multi-Variate Function for Self-Supervised Image Denoising by Disentangling Noise From Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17583--17591},
}
FaceFormer: Speech-Driven 3D Facial Animation With Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2022_CVPR,
  author    = {Fan, Yingruo and Lin, Zhaojiang and Saito, Jun and Wang, Wenping and Komura, Taku},
  title     = {{FaceFormer}: Speech-Driven {3D} Facial Animation With Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18770--18780},
}
Exploring Patch-Wise Semantic Relation for Contrastive Learning in Image-to-Image Translation Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jung_2022_CVPR,
  author    = {Jung, Chanyong and Kwon, Gihyun and Ye, Jong Chul},
  title     = {Exploring Patch-Wise Semantic Relation for Contrastive Learning in Image-to-Image Translation Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18260--18269},
}
Towards General Purpose Vision Systems: An End-to-End Task-Agnostic Vision-Language Architecture-
[pdf]
[supp]
[bibtex]@InProceedings{Gupta_2022_CVPR,
  author    = {Gupta, Tanmay and Kamath, Amita and Kembhavi, Aniruddha and Hoiem, Derek},
  title     = {Towards General Purpose Vision Systems: An End-to-End Task-Agnostic Vision-Language Architecture},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16399--16409},
}
LiT: Zero-Shot Transfer With Locked-Image Text Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2022_CVPR,
  author    = {Zhai, Xiaohua and Wang, Xiao and Mustafa, Basil and Steiner, Andreas and Keysers, Daniel and Kolesnikov, Alexander and Beyer, Lucas},
  title     = {{LiT}: Zero-Shot Transfer With Locked-Image Text Tuning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18123--18133},
}
GeoNeRF: Generalizing NeRF With Geometry Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Johari_2022_CVPR,
  author    = {Johari, Mohammad Mahdi and Lepoittevin, Yann and Fleuret, Fran{\c{c}}ois},
  title     = {{GeoNeRF}: Generalizing {NeRF} With Geometry Priors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18365--18375},
}
PhoCaL: A Multi-Modal Dataset for Category-Level Object Pose Estimation With Photometrically Challenging Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Pengyuan and Jung, HyunJun and Li, Yitong and Shen, Siyuan and Srikanth, Rahul Parthasarathy and Garattoni, Lorenzo and Meier, Sven and Navab, Nassir and Busam, Benjamin},
  title     = {{PhoCaL}: A Multi-Modal Dataset for Category-Level Object Pose Estimation With Photometrically Challenging Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21222--21231},
}
Uformer: A General U-Shaped Transformer for Image Restoration-
[pdf]
[supp]
% Key disambiguated: Wang_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Wang_2022_CVPR_Uformer,
  author    = {Wang, Zhendong and Cun, Xiaodong and Bao, Jianmin and Zhou, Wengang and Liu, Jianzhuang and Li, Houqiang},
  title     = {Uformer: A General {U}-Shaped Transformer for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17683--17693},
}
Bridge-Prompt: Towards Ordinal Action Understanding in Instructional Videos-
[pdf]
% Key disambiguated: Li_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Li_2022_CVPR_BridgePrompt,
  author    = {Li, Muheng and Chen, Lei and Duan, Yueqi and Hu, Zhilan and Feng, Jianjiang and Zhou, Jie and Lu, Jiwen},
  title     = {{Bridge-Prompt}: Towards Ordinal Action Understanding in Instructional Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19880--19889},
}
Cerberus Transformer: Joint Semantic, Affordance and Attribute Parsing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Xiaoxue and Liu, Tianyu and Zhao, Hao and Zhou, Guyue and Zhang, Ya-Qin},
  title     = {Cerberus Transformer: Joint Semantic, Affordance and Attribute Parsing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19649--19658},
}
Single-Photon Structured Light-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sundar_2022_CVPR,
  author    = {Sundar, Varun and Ma, Sizhuo and Sankaranarayanan, Aswin C. and Gupta, Mohit},
  title     = {Single-Photon Structured Light},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17865--17875},
}
Deblurring via Stochastic Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Whang_2022_CVPR,
  author    = {Whang, Jay and Delbracio, Mauricio and Talebi, Hossein and Saharia, Chitwan and Dimakis, Alexandros G. and Milanfar, Peyman},
  title     = {Deblurring via Stochastic Refinement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16293--16303},
}
3DJCG: A Unified Framework for Joint Dense Captioning and Visual Grounding on 3D Point Clouds-
[pdf]
[bibtex]@InProceedings{Cai_2022_CVPR,
  author    = {Cai, Daigang and Zhao, Lichen and Zhang, Jing and Sheng, Lu and Xu, Dong},
  title     = {{3DJCG}: A Unified Framework for Joint Dense Captioning and Visual Grounding on {3D} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16464--16473},
}
Abandoning the Bayer-Filter To See in the Dark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Xingbo and Xu, Wanyan and Miao, Zhihui and Ma, Lan and Zhang, Chao and Yang, Jiewen and Jin, Zhe and Teoh, Andrew Beng Jin and Shen, Jiajun},
  title     = {Abandoning the {Bayer}-Filter To See in the Dark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17431--17440},
}
Exploiting Temporal Relations on Radar Perception for Autonomous Driving-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Li_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Li_2022_CVPR_RadarPerception,
  author    = {Li, Peizhao and Wang, Pu and Berntorp, Karl and Liu, Hongfu},
  title     = {Exploiting Temporal Relations on Radar Perception for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17071--17080},
}
Forward Compatible Training for Large-Scale Embedding Retrieval Systems-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramanujan_2022_CVPR,
  author    = {Ramanujan, Vivek and Vasu, Pavan Kumar Anasosalu and Farhadi, Ali and Tuzel, Oncel and Pouransari, Hadi},
  title     = {Forward Compatible Training for Large-Scale Embedding Retrieval Systems},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19386--19395},
}
Everything at Once - Multi-Modal Fusion Transformer for Video Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shvetsova_2022_CVPR,
  author    = {Shvetsova, Nina and Chen, Brian and Rouditchenko, Andrew and Thomas, Samuel and Kingsbury, Brian and Feris, Rogerio S. and Harwath, David and Glass, James and Kuehne, Hilde},
  title     = {Everything at Once - Multi-Modal Fusion Transformer for Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20020--20029},
}
Neural Template: Topology-Aware Reconstruction and Disentangled Generation of 3D Meshes-
[pdf]
[supp]
[bibtex]@InProceedings{Hui_2022_CVPR,
  author    = {Hui, Ka-Hei and Li, Ruihui and Hu, Jingyu and Fu, Chi-Wing},
  title     = {Neural Template: Topology-Aware Reconstruction and Disentangled Generation of {3D} Meshes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18572--18582},
}
AdaFace: Quality Adaptive Margin for Face Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Minchul and Jain, Anil K. and Liu, Xiaoming},
  title     = {{AdaFace}: Quality Adaptive Margin for Face Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18750--18759},
}
Learning Soft Estimator of Keypoint Scale and Orientation With Probabilistic Covariant Loss-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2022_CVPR,
  author    = {Yan, Pei and Tan, Yihua and Xiong, Shengzhou and Tai, Yuan and Li, Yansheng},
  title     = {Learning Soft Estimator of Keypoint Scale and Orientation With Probabilistic Covariant Loss},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19406--19415},
}
Opening Up Open World Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Yang and Zulfikar, Idil Esen and Luiten, Jonathon and Dave, Achal and Ramanan, Deva and Leibe, Bastian and O{\v{s}}ep, Aljo{\v{s}}a and Leal-Taix{\'e}, Laura},
  title     = {Opening Up Open World Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19045--19055},
}
OSSO: Obtaining Skeletal Shape From Outside-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Keller_2022_CVPR,
  author    = {Keller, Marilyn and Zuffi, Silvia and Black, Michael J. and Pujades, Sergi},
  title     = {{OSSO}: Obtaining Skeletal Shape From Outside},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20492--20501},
}
Bayesian Invariant Risk Minimization-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Yong and Dong, Hanze and Wang, Hao and Zhang, Tong},
  title     = {Bayesian Invariant Risk Minimization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16021--16030},
}
Alleviating Semantics Distortion in Unsupervised Low-Level Image-to-Image Translation via Structure Consistency Constraint-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2022_CVPR,
  author    = {Guo, Jiaxian and Li, Jiachen and Fu, Huan and Gong, Mingming and Zhang, Kun and Tao, Dacheng},
  title     = {Alleviating Semantics Distortion in Unsupervised Low-Level Image-to-Image Translation via Structure Consistency Constraint},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18249--18259},
}
Uni-Perceiver: Pre-Training Unified Architecture for Generic Perception for Zero-Shot and Few-Shot Tasks-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2022_CVPR,
  author    = {Zhu, Xizhou and Zhu, Jinguo and Li, Hao and Wu, Xiaoshi and Li, Hongsheng and Wang, Xiaohua and Dai, Jifeng},
  title     = {{Uni-Perceiver}: Pre-Training Unified Architecture for Generic Perception for Zero-Shot and Few-Shot Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16804--16815},
}
The Auto Arborist Dataset: A Large-Scale Benchmark for Multiview Urban Forest Monitoring Under Domain Shift-
[pdf]
[supp]
[bibtex]@InProceedings{Beery_2022_CVPR,
  author    = {Beery, Sara and Wu, Guanhang and Edwards, Trevor and Pavetic, Filip and Majewski, Bo and Mukherjee, Shreyasee and Chan, Stanley and Morgan, John and Rathod, Vivek and Huang, Jonathan},
  title     = {The {Auto Arborist} Dataset: A Large-Scale Benchmark for Multiview Urban Forest Monitoring Under Domain Shift},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21294--21307},
}
Real-Time, Accurate, and Consistent Video Semantic Segmentation via Unsupervised Adaptation and Cross-Unit Deployment on Mobile Device-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2022_CVPR,
  author    = {Park, Hyojin and Yessenbayev, Alan and Singhal, Tushar and Adhikari, Navin Kumar and Zhang, Yizhe and Borse, Shubhankar Mangesh and Cai, Hong and Pandey, Nilesh Prasad and Yin, Fei and Mayer, Frank and Calidas, Balaji and Porikli, Fatih},
  title     = {Real-Time, Accurate, and Consistent Video Semantic Segmentation via Unsupervised Adaptation and Cross-Unit Deployment on Mobile Device},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21431--21438},
}
A Style-Aware Discriminator for Controllable Image Translation-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Kim_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Kim_2022_CVPR_StyleAwareDiscriminator,
  author    = {Kim, Kunhee and Park, Sanghun and Jeon, Eunyeong and Kim, Taehun and Kim, Daijin},
  title     = {A Style-Aware Discriminator for Controllable Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18239--18248},
}
Incremental Cross-View Mutual Distillation for Self-Supervised Medical CT Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Fang_2022_CVPR,
  author    = {Fang, Chaowei and Wang, Liang and Zhang, Dingwen and Xu, Jun and Yuan, Yixuan and Han, Junwei},
  title     = {Incremental Cross-View Mutual Distillation for Self-Supervised Medical {CT} Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20677--20686},
}
Moving Window Regression: A Novel Approach to Ordinal Regression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shin_2022_CVPR,
  author    = {Shin, Nyeong-Ho and Lee, Seon-Ho and Kim, Chang-Su},
  title     = {Moving Window Regression: A Novel Approach to Ordinal Regression},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18760--18769},
}
ACPL: Anti-Curriculum Pseudo-Labelling for Semi-Supervised Medical Image Classification-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Liu_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Liu_2022_CVPR_ACPL,
  author    = {Liu, Fengbei and Tian, Yu and Chen, Yuanhong and Liu, Yuyuan and Belagiannis, Vasileios and Carneiro, Gustavo},
  title     = {{ACPL}: Anti-Curriculum Pseudo-Labelling for Semi-Supervised Medical Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20697--20706},
}
Learning to Deblur Using Light Field Generated and Real Defocus Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ruan_2022_CVPR,
  author    = {Ruan, Lingyan and Chen, Bin and Li, Jizhou and Lam, Miuling},
  title     = {Learning to Deblur Using Light Field Generated and Real Defocus Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16304--16313},
}
PhotoScene: Photorealistic Material and Lighting Transfer for Indoor Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Yeh_2022_CVPR,
  author    = {Yeh, Yu-Ying and Li, Zhengqin and Hold-Geoffroy, Yannick and Zhu, Rui and Xu, Zexiang and Ha{\v{s}}an, Milo{\v{s}} and Sunkavalli, Kalyan and Chandraker, Manmohan},
  title     = {{PhotoScene}: Photorealistic Material and Lighting Transfer for Indoor Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18562--18571},
}
Versatile Multi-Modal Pre-Training for Human-Centric Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hong_2022_CVPR,
  author    = {Hong, Fangzhou and Pan, Liang and Cai, Zhongang and Liu, Ziwei},
  title     = {Versatile Multi-Modal Pre-Training for Human-Centric Perception},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16156--16166},
}
Contrastive Regression for Domain Adaptation on Gaze Estimation-
[pdf]
[supp]
% Key disambiguated: Wang_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Wang_2022_CVPR_ContrastiveRegression,
  author    = {Wang, Yaoming and Jiang, Yangzhou and Li, Jin and Ni, Bingbing and Dai, Wenrui and Li, Chenglin and Xiong, Hongkai and Li, Teng},
  title     = {Contrastive Regression for Domain Adaptation on Gaze Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19376--19385},
}
Multi-View Consistent Generative Adversarial Networks for 3D-Aware Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xuanmeng and Zheng, Zhedong and Gao, Daiheng and Zhang, Bang and Pan, Pan and Yang, Yi},
  title     = {Multi-View Consistent Generative Adversarial Networks for {3D}-Aware Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18450--18459},
}
Memory-Augmented Non-Local Attention for Video Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2022_CVPR,
  author    = {Yu, Jiyang and Liu, Jingen and Bo, Liefeng and Mei, Tao},
  title     = {Memory-Augmented Non-Local Attention for Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17834--17843},
}
Classification-Then-Grounding: Reformulating Video Scene Graphs As Temporal Bipartite Graphs-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2022_CVPR,
  author    = {Gao, Kaifeng and Chen, Long and Niu, Yulei and Shao, Jian and Xiao, Jun},
  title     = {Classification-Then-Grounding: Reformulating Video Scene Graphs As Temporal Bipartite Graphs},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19497--19506},
}
Transformer-Empowered Multi-Scale Contextual Matching and Aggregation for Multi-Contrast MRI Super-Resolution-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Li_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Li_2022_CVPR_MultiContrastMRI,
  author    = {Li, Guangyuan and Lv, Jun and Tian, Yapeng and Dou, Qi and Wang, Chengyan and Xu, Chenliang and Qin, Jing},
  title     = {Transformer-Empowered Multi-Scale Contextual Matching and Aggregation for Multi-Contrast {MRI} Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20636--20645},
}
GateHUB: Gated History Unit With Background Suppression for Online Action Detection-
[pdf]
[supp]
% Key disambiguated: Chen_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Chen_2022_CVPR_GateHUB,
  author    = {Chen, Junwen and Mittal, Gaurav and Yu, Ye and Kong, Yu and Chen, Mei},
  title     = {{GateHUB}: Gated History Unit With Background Suppression for Online Action Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19925--19934},
}
Bridging Video-Text Retrieval With Multiple Choice Questions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ge_2022_CVPR,
  author    = {Ge, Yuying and Ge, Yixiao and Liu, Xihui and Li, Dian and Shan, Ying and Qie, Xiaohu and Luo, Ping},
  title     = {Bridging Video-Text Retrieval With Multiple Choice Questions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16167--16176},
}
DF-GAN: A Simple and Effective Baseline for Text-to-Image Synthesis-
[pdf]
[bibtex]@InProceedings{Tao_2022_CVPR,
  author    = {Tao, Ming and Tang, Hao and Wu, Fei and Jing, Xiao-Yuan and Bao, Bing-Kun and Xu, Changsheng},
  title     = {{DF-GAN}: A Simple and Effective Baseline for Text-to-Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16515--16525},
}
CoNeRF: Controllable Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kania_2022_CVPR,
  author    = {Kania, Kacper and Yi, Kwang Moo and Kowalski, Marek and Trzci{\'n}ski, Tomasz and Tagliasacchi, Andrea},
  title     = {{CoNeRF}: Controllable Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18623--18632},
}
Noise2NoiseFlow: Realistic Camera Noise Modeling Without Clean Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Maleky_2022_CVPR,
  author    = {Maleky, Ali and Kousha, Shayan and Brown, Michael S. and Brubaker, Marcus A.},
  title     = {{Noise2NoiseFlow}: Realistic Camera Noise Modeling Without Clean Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17632--17641},
}
ZeroWaste Dataset: Towards Deformable Object Segmentation in Cluttered Scenes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bashkirova_2022_CVPR,
  author    = {Bashkirova, Dina and Abdelfattah, Mohamed and Zhu, Ziliang and Akl, James and Alladkani, Fadi and Hu, Ping and Ablavsky, Vitaly and Calli, Berk and Bargal, Sarah Adel and Saenko, Kate},
  title     = {{ZeroWaste} Dataset: Towards Deformable Object Segmentation in Cluttered Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21147--21157},
}
UNIST: Unpaired Neural Implicit Shape Translation Network-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Chen_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Chen_2022_CVPR_UNIST,
  author    = {Chen, Qimin and Merz, Johannes and Sanghi, Aditya and Shayani, Hooman and Mahdavi-Amiri, Ali and Zhang, Hao},
  title     = {{UNIST}: Unpaired Neural Implicit Shape Translation Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18614--18622},
}
Local-Adaptive Face Recognition via Graph-Based Meta-Clustering and Regularized Adaptation-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Zhu_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Zhu_2022_CVPR_LocalAdaptiveFace,
  author    = {Zhu, Wenbin and Wang, Chien-Yi and Tseng, Kuan-Lun and Lai, Shang-Hong and Wang, Baoyuan},
  title     = {Local-Adaptive Face Recognition via Graph-Based Meta-Clustering and Regularized Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20301--20310},
}
The DEVIL Is in the Details: A Diagnostic Evaluation Benchmark for Video Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Szeto_2022_CVPR,
  author    = {Szeto, Ryan and Corso, Jason J.},
  title     = {The {DEVIL} Is in the Details: A Diagnostic Evaluation Benchmark for Video Inpainting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21054--21063},
}
Generating Useful Accident-Prone Driving Scenarios via a Learned Traffic Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rempe_2022_CVPR,
  author    = {Rempe, Davis and Philion, Jonah and Guibas, Leonidas J. and Fidler, Sanja and Litany, Or},
  title     = {Generating Useful Accident-Prone Driving Scenarios via a Learned Traffic Prior},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17305--17315},
}
Efficient Geometry-Aware 3D Generative Adversarial Networks-
[pdf]
[supp]
[arXiv]
% Key disambiguated: Chan_2022_CVPR is already taken by an earlier entry, so BibTeX would drop this one as a repeated entry.
[bibtex]@InProceedings{Chan_2022_CVPR_GeometryAware3DGAN,
  author    = {Chan, Eric R. and Lin, Connor Z. and Chan, Matthew A. and Nagano, Koki and Pan, Boxiao and De Mello, Shalini and Gallo, Orazio and Guibas, Leonidas J. and Tremblay, Jonathan and Khamis, Sameh and Karras, Tero and Wetzstein, Gordon},
  title     = {Efficient Geometry-Aware {3D} Generative Adversarial Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16123--16133},
}
Dancing Under the Stars: Video Denoising in Starlight-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Monakhova_2022_CVPR,
  author    = {Monakhova, Kristina and Richter, Stephan R. and Waller, Laura and Koltun, Vladlen},
  title     = {Dancing Under the Stars: Video Denoising in Starlight},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16241--16251},
}
SPAct: Self-Supervised Privacy Preservation for Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dave_2022_CVPR,
  author    = {Dave, Ishan Rajendrakumar and Chen, Chen and Shah, Mubarak},
  title     = {{SPAct}: Self-Supervised Privacy Preservation for Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20164--20173},
}
De-Rendering 3D Objects in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wimbauer_2022_CVPR,
  author    = {Wimbauer, Felix and Wu, Shangzhe and Rupprecht, Christian},
  title     = {De-Rendering {3D} Objects in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18490--18499},
}
Representing 3D Shapes With Probabilistic Directed Distance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Aumentado-Armstrong_2022_CVPR,
  author    = {Aumentado-Armstrong, Tristan and Tsogkas, Stavros and Dickinson, Sven and Jepson, Allan D.},
  title     = {Representing {3D} Shapes With Probabilistic Directed Distance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19343--19354},
}
Learning ABCs: Approximate Bijective Correspondence for Isolating Factors of Variation With Weak Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Murphy_2022_CVPR,
  author    = {Murphy, Kieran A. and Jampani, Varun and Ramalingam, Srikumar and Makadia, Ameesh},
  title     = {Learning {ABCs}: Approximate Bijective Correspondence for Isolating Factors of Variation With Weak Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16010--16020},
}
ABO: Dataset and Benchmarks for Real-World 3D Object Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Collins_2022_CVPR,
  author    = {Collins, Jasmine and Goel, Shubham and Deng, Kenan and Luthra, Achleshwar and Xu, Leon and Gundogdu, Erhan and Zhang, Xi and Vicente, Tomas F. Yago and Dideriksen, Thomas and Arora, Himanshu and Guillaumin, Matthieu and Malik, Jitendra},
  title     = {{ABO}: Dataset and Benchmarks for Real-World {3D} Object Understanding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21126--21136},
}
MS-TCT: Multi-Scale Temporal ConvTransformer for Action Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Dai_2022_CVPR,
  author    = {Dai, Rui and Das, Srijan and Kahatapitiya, Kumara and Ryoo, Michael S. and Br{\'e}mond, Fran{\c{c}}ois},
  title     = {{MS-TCT}: Multi-Scale Temporal {ConvTransformer} for Action Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20041--20051},
}
Make It Move: Controllable Image-to-Video Generation With Text Descriptions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Yaosi and Luo, Chong and Chen, Zhenzhong},
  title     = {Make It Move: Controllable Image-to-Video Generation With Text Descriptions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18219--18228},
}
Neural Points: Point Cloud Representation With Neural Fields for Arbitrary Upsampling-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Wanquan and Li, Jin and Cai, Hongrui and Luo, Xiaonan and Zhang, Juyong},
  title     = {Neural Points: Point Cloud Representation With Neural Fields for Arbitrary Upsampling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18633--18642},
}
FIFO: Learning Fog-Invariant Features for Foggy Scene Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Sohyun and Son, Taeyoung and Kwak, Suha},
  title     = {{FIFO}: Learning Fog-Invariant Features for Foggy Scene Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18911--18921},
}
Unsupervised Visual Representation Learning by Online Constrained K-Means-
[pdf]
[supp]
[bibtex]@InProceedings{Qian_2022_CVPR,
  author    = {Qian, Qi and Xu, Yuanhong and Hu, Juhua and Li, Hao and Jin, Rong},
  title     = {Unsupervised Visual Representation Learning by Online Constrained {K-Means}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16640--16649},
}
Neural Point Light Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ost_2022_CVPR,
  author    = {Ost, Julian and Laradji, Issam and Newell, Alejandro and Bahat, Yuval and Heide, Felix},
  title     = {Neural Point Light Fields},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18419--18429},
}
Vehicle Trajectory Prediction Works, but Not Everywhere-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bahari_2022_CVPR,
  author    = {Bahari, Mohammadhossein and Saadatnejad, Saeed and Rahimi, Ahmad and Shaverdikondori, Mohammad and Shahidzadeh, Amir Hossein and Moosavi-Dezfooli, Seyed-Mohsen and Alahi, Alexandre},
  title     = {Vehicle Trajectory Prediction Works, but Not Everywhere},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17123--17133},
}
Instance-Wise Occlusion and Depth Orders in Natural Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Hyunmin and Park, Jaesik},
  title     = {Instance-Wise Occlusion and Depth Orders in Natural Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21210--21221},
}
Contour-Hugging Heatmaps for Landmark Detection-
[pdf]
[supp]
[bibtex]@InProceedings{McCouat_2022_CVPR,
  author    = {McCouat, James and Voiculescu, Irina},
  title     = {Contour-Hugging Heatmaps for Landmark Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20597--20605},
}
DisARM: Displacement Aware Relation Module for 3D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Duan_2022_CVPR,
  author    = {Duan, Yao and Zhu, Chenyang and Lan, Yuqing and Yi, Renjiao and Liu, Xinwang and Xu, Kai},
  title     = {{DisARM}: Displacement Aware Relation Module for {3D} Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16980--16989},
}
NeRF-Editing: Geometry Editing of Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Yuan_2022_CVPR,
  author    = {Yuan, Yu-Jie and Sun, Yang-Tian and Lai, Yu-Kun and Ma, Yuewen and Jia, Rongfei and Gao, Lin},
  title     = {{NeRF-Editing}: Geometry Editing of Neural Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18353--18364},
}
Optimal Correction Cost for Object Detection Evaluation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Otani_2022_CVPR,
  author    = {Otani, Mayu and Togashi, Riku and Nakashima, Yuta and Rahtu, Esa and Heikkil{\"a}, Janne and Satoh, Shin'ichi},
  title     = {Optimal Correction Cost for Object Detection Evaluation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21107--21115},
}
Artistic Style Discovery With Independent Components-
[pdf]
[bibtex]@InProceedings{Xie_2022_CVPR,
  author    = {Xie, Xin and Li, Yi and Huang, Huaibo and Fu, Haiyan and Wang, Wanwan and Guo, Yanqing},
  title     = {Artistic Style Discovery With Independent Components},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19870--19879},
}
HyperStyle: StyleGAN Inversion With HyperNetworks for Real Image Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alaluf_2022_CVPR,
  author    = {Alaluf, Yuval and Tov, Omer and Mokady, Ron and Gal, Rinon and Bermano, Amit},
  title     = {{HyperStyle}: {StyleGAN} Inversion With {HyperNetworks} for Real Image Editing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18511--18521},
}
LTP: Lane-Based Trajectory Prediction for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Jingke and Ye, Tengju and Gu, Ziqing and Chen, Junbo},
  title     = {{LTP}: Lane-Based Trajectory Prediction for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17134--17142},
}
AP-BSN: Self-Supervised Denoising for Real-World Images via Asymmetric PD and Blind-Spot Network-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Wooseok and Son, Sanghyun and Lee, Kyoung Mu},
  title     = {{AP-BSN}: Self-Supervised Denoising for Real-World Images via Asymmetric {PD} and Blind-Spot Network},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17725--17734},
}
Not All Points Are Equal: Learning Highly Efficient Point-Based Detectors for 3D LiDAR Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Yifan and Hu, Qingyong and Xu, Guoquan and Ma, Yanxin and Wan, Jianwei and Guo, Yulan},
  title     = {Not All Points Are Equal: Learning Highly Efficient Point-Based Detectors for {3D} {LiDAR} Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18953--18962},
}
RigNeRF: Fully Controllable Neural 3D Portraits-
[pdf]
[bibtex]@InProceedings{Athar_2022_CVPR,
  author    = {Athar, ShahRukh and Xu, Zexiang and Sunkavalli, Kalyan and Shechtman, Eli and Shu, Zhixin},
  title     = {{RigNeRF}: Fully Controllable Neural {3D} Portraits},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20364--20373},
}
CLIP-Forge: Towards Zero-Shot Text-To-Shape Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Sanghi_2022_CVPR,
  author    = {Sanghi, Aditya and Chu, Hang and Lambourne, Joseph G. and Wang, Ye and Cheng, Chin-Yi and Fumero, Marco and Malekshan, Kamal Rahimi},
  title     = {{CLIP-Forge}: Towards Zero-Shot Text-To-Shape Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18603--18613},
}
Instance-Dependent Label-Noise Learning With Manifold-Regularized Transition Matrix Estimation-
[pdf]
[bibtex]@InProceedings{Cheng_2022_CVPR,
  author    = {Cheng, De and Liu, Tongliang and Ning, Yixiong and Wang, Nannan and Han, Bo and Niu, Gang and Gao, Xinbo and Sugiyama, Masashi},
  title     = {Instance-Dependent Label-Noise Learning With Manifold-Regularized Transition Matrix Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16630--16639},
}
Rethinking the Augmentation Module in Contrastive Learning: Learning Hierarchical Augmentation Invariance With Expanded Views-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Junbo and Ma, Kaisheng},
  title     = {Rethinking the Augmentation Module in Contrastive Learning: Learning Hierarchical Augmentation Invariance With Expanded Views},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16650--16659},
}
Equivariant Point Cloud Analysis via Learning Orientations for Message Passing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Shitong and Li, Jiahan and Guan, Jiaqi and Su, Yufeng and Cheng, Chaoran and Peng, Jian and Ma, Jianzhu},
  title     = {Equivariant Point Cloud Analysis via Learning Orientations for Message Passing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18932--18941},
}
Node Representation Learning in Graph via Node-to-Neighbourhood Mutual Information Maximization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Wei and Wu, Junsheng and Luo, Yi and Ge, Zongyuan and Wang, Peng},
  title     = {Node Representation Learning in Graph via Node-to-Neighbourhood Mutual Information Maximization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16620--16629},
}
Point Cloud Pre-Training With Natural 3D Structures-
[pdf]
[supp]
[bibtex]@InProceedings{Yamada_2022_CVPR,
  author    = {Yamada, Ryosuke and Kataoka, Hirokatsu and Chiba, Naoya and Domae, Yukiyasu and Ogata, Tetsuya},
  title     = {Point Cloud Pre-Training With Natural {3D} Structures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21283--21293},
}
StyleT2I: Toward Compositional and High-Fidelity Text-to-Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Zhiheng and Min, Martin Renqiang and Li, Kai and Xu, Chenliang},
  title     = {{StyleT2I}: Toward Compositional and High-Fidelity Text-to-Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18197--18207},
}
V-Doc: Visual Questions Answers With Documents-
[pdf]
[bibtex]@InProceedings{Ding_2022_CVPR,
  author    = {Ding, Yihao and Huang, Zhe and Wang, Runlin and Zhang, YanHang and Chen, Xianru and Ma, Yuzhong and Chung, Hyunsuk and Han, Soyeon Caren},
  title     = {{V-Doc}: Visual Questions Answers With Documents},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21492--21498},
}
Uncertainty-Guided Probabilistic Transformer for Complex Action Recognition-
[pdf]
[bibtex]@InProceedings{Guo_2022_CVPR,
  author    = {Guo, Hongji and Wang, Hanjing and Ji, Qiang},
  title     = {Uncertainty-Guided Probabilistic Transformer for Complex Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20052--20061},
}
V2C: Visual Voice Cloning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Qi and Tan, Mingkui and Qi, Yuankai and Zhou, Jiaqiu and Li, Yuanqing and Wu, Qi},
  title     = {{V2C}: Visual Voice Cloning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21242--21251},
}
EvUnroll: Neuromorphic Events Based Rolling Shutter Image Correction-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Xinyu and Duan, Peiqi and Ma, Yi and Shi, Boxin},
  title     = {{EvUnroll}: Neuromorphic Events Based Rolling Shutter Image Correction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17775--17784},
}
Gait Recognition in the Wild With Dense 3D Representations and a Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2022_CVPR,
  author    = {Zheng, Jinkai and Liu, Xinchen and Liu, Wu and He, Lingxiao and Yan, Chenggang and Mei, Tao},
  title     = {Gait Recognition in the Wild With Dense {3D} Representations and a Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20228--20237},
}
Temporal Context Matters: Enhancing Single Image Prediction With Disease Progression Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Konwer_2022_CVPR,
  author    = {Konwer, Aishik and Xu, Xuan and Bae, Joseph and Chen, Chao and Prasanna, Prateek},
  title     = {Temporal Context Matters: Enhancing Single Image Prediction With Disease Progression Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18824--18835},
}
Learning From All Vehicles-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Dian and Kr{\"a}henb{\"u}hl, Philipp},
  title     = {Learning From All Vehicles},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17222--17231},
}
Towards Driving-Oriented Metric for Lane Detection Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sato_2022_CVPR,
  author    = {Sato, Takami and Chen, Qi Alfred},
  title     = {Towards Driving-Oriented Metric for Lane Detection Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17153--17162},
}
XYDeblur: Divide and Conquer for Single Image Deblurring-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2022_CVPR,
  author    = {Ji, Seo-Won and Lee, Jeongmin and Kim, Seung-Wook and Hong, Jun-Pyo and Baek, Seung-Jin and Jung, Seung-Won and Ko, Sung-Jea},
  title     = {{XYDeblur}: Divide and Conquer for Single Image Deblurring},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17421--17430},
}
STCrowd: A Multimodal Dataset for Pedestrian Perception in Crowded Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cong_2022_CVPR,
  author    = {Cong, Peishan and Zhu, Xinge and Qiao, Feng and Ren, Yiming and Peng, Xidong and Hou, Yuenan and Xu, Lan and Yang, Ruigang and Manocha, Dinesh and Ma, Yuexin},
  title     = {{STCrowd}: A Multimodal Dataset for Pedestrian Perception in Crowded Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19608--19617},
}
Deep Decomposition for Stochastic Normal-Abnormal Transport-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Peirong and Lee, Yueh and Aylward, Stephen and Niethammer, Marc},
  title     = {Deep Decomposition for Stochastic Normal-Abnormal Transport},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18791--18801},
}
Multimodal Material Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Liang_2022_CVPR,
  author    = {Liang, Yupeng and Wakaki, Ryosuke and Nobuhara, Shohei and Nishino, Ko},
  title     = {Multimodal Material Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19800--19808},
}
DynamicEarthNet: Daily Multi-Spectral Satellite Dataset for Semantic Change Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Toker_2022_CVPR,
  author    = {Toker, Aysim and Kondmann, Lukas and Weber, Mark and Eisenberger, Marvin and Camero, Andr{\'e}s and Hu, Jingliang and Hoderlein, Ariadna Pregel and {\c{S}}enaras, {\c{C}}a{\u{g}}lar and Davis, Timothy and Cremers, Daniel and Marchisio, Giovanni and Zhu, Xiao Xiang and Leal-Taix{\'e}, Laura},
  title     = {{DynamicEarthNet}: Daily Multi-Spectral Satellite Dataset for Semantic Change Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21158--21167},
}
Quantization-Aware Deep Optics for Diffractive Snapshot Hyperspectral Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Lingen and Wang, Lizhi and Song, Weitao and Zhang, Lei and Xiong, Zhiwei and Huang, Hua},
  title     = {Quantization-Aware Deep Optics for Diffractive Snapshot Hyperspectral Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19780--19789},
}
Improving Video Model Transfer With Dynamic Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Yi and Vasconcelos, Nuno},
  title     = {Improving Video Model Transfer With Dynamic Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19280--19291},
}
PIE-Net: Photometric Invariant Edge Guided Network for Intrinsic Image Decomposition-
[pdf]
[supp]
[bibtex]@InProceedings{Das_2022_CVPR,
  author    = {Das, Partha and Karaoglu, Sezer and Gevers, Theo},
  title     = {{PIE-Net}: Photometric Invariant Edge Guided Network for Intrinsic Image Decomposition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19790--19799},
}
QS-Attn: Query-Selected Attention for Contrastive Learning in I2I Translation-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Xueqi and Zhou, Xinyue and Huang, Qiusheng and Shi, Zhengyi and Sun, Li and Li, Qingli},
  title     = {{QS-Attn}: Query-Selected Attention for Contrastive Learning in {I2I} Translation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18291--18300},
}
Adaptive Gating for Single-Photon 3D Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Po_2022_CVPR,
  author    = {Po, Ryan and Pediredla, Adithya and Gkioulekas, Ioannis},
  title     = {Adaptive Gating for Single-Photon {3D} Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16354--16363},
}
H4D: Human 4D Modeling by Learning Neural Compositional Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2022_CVPR,
  author    = {Jiang, Boyan and Zhang, Yinda and Wei, Xingkui and Xue, Xiangyang and Fu, Yanwei},
  title     = {{H4D}: Human {4D} Modeling by Learning Neural Compositional Representation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19355--19365},
}
Cannot See the Forest for the Trees: Aggregating Multiple Viewpoints To Better Classify Objects in Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Hwang_2022_CVPR,
  author    = {Hwang, Sukjun and Heo, Miran and Oh, Seoung Wug and Kim, Seon Joo},
  title     = {Cannot See the Forest for the Trees: Aggregating Multiple Viewpoints To Better Classify Objects in Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17052--17061},
}
Learning Canonical F-Correlation Projection for Compact Multiview Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Yuan_2022_CVPR,
  author    = {Yuan, Yun-Hao and Li, Jin and Li, Yun and Qiang, Jipeng and Zhu, Yi and Shen, Xiaobo and Gou, Jianping},
  title     = {Learning Canonical {F-Correlation} Projection for Compact Multiview Representation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19260--19269},
}
DIFNet: Boosting Visual Information Flow for Image Captioning-
[pdf]
[bibtex]@InProceedings{Wu_2022_CVPR,
  author    = {Wu, Mingrui and Zhang, Xuying and Sun, Xiaoshuai and Zhou, Yiyi and Chen, Chao and Gu, Jiaxin and Sun, Xing and Ji, Rongrong},
  title     = {{DIFNet}: Boosting Visual Information Flow for Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18020--18029},
}
Tree Energy Loss: Towards Sparsely Annotated Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2022_CVPR,
  author    = {Liang, Zhiyuan and Wang, Tiancai and Zhang, Xiangyu and Sun, Jian and Shen, Jianbing},
  title     = {Tree Energy Loss: Towards Sparsely Annotated Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16907--16916},
}
Grounding Answers for Visual Questions Asked by Visually Impaired People-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Chongyan and Anjum, Samreen and Gurari, Danna},
  title     = {Grounding Answers for Visual Questions Asked by Visually Impaired People},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19098--19107},
}
Automatic Color Image Stitching Using Quaternion Rank-1 Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiaxue and Zhou, Yicong},
  title     = {Automatic Color Image Stitching Using Quaternion Rank-1 Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19720--19729},
}
VisualGPT: Data-Efficient Adaptation of Pretrained Language Models for Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Jun and Guo, Han and Yi, Kai and Li, Boyang and Elhoseiny, Mohamed},
  title     = {{VisualGPT}: Data-Efficient Adaptation of Pretrained Language Models for Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18030--18040},
}
All-Photon Polarimetric Time-of-Flight Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Baek_2022_CVPR,
  author    = {Baek, Seung-Hwan and Heide, Felix},
  title     = {All-Photon Polarimetric Time-of-Flight Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17876--17885},
}
Towards Implicit Text-Guided 3D Shape Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Zhengzhe and Wang, Yi and Qi, Xiaojuan and Fu, Chi-Wing},
  title     = {Towards Implicit Text-Guided {3D} Shape Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17896--17906},
}
A Versatile Multi-View Framework for LiDAR-Based 3D Object Detection With Guidance From Panoptic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fazlali_2022_CVPR,
  author    = {Fazlali, Hamidreza and Xu, Yixuan and Ren, Yuan and Liu, Bingbing},
  title     = {A Versatile Multi-View Framework for {LiDAR-Based} {3D} Object Detection With Guidance From Panoptic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17192--17201},
}
RFNet: Unsupervised Network for Mutually Reinforcing Multi-Modal Image Registration and Fusion-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Han and Ma, Jiayi and Yuan, Jiteng and Le, Zhuliang and Liu, Wei},
  title     = {{RFNet}: Unsupervised Network for Mutually Reinforcing Multi-Modal Image Registration and Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19679--19688},
}
CellTypeGraph: A New Geometric Computer Vision Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cerrone_2022_CVPR,
  author    = {Cerrone, Lorenzo and Vijayan, Athul and Mody, Tejasvinee and Schneitz, Kay and Hamprecht, Fred A.},
  title     = {{CellTypeGraph}: A New Geometric Computer Vision Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20897--20907},
}
Clustering Plotted Data by Image Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Naous_2022_CVPR,
  author    = {Naous, Tarek and Sarkar, Srinjay and Abid, Abubakar and Zou, James},
  title     = {Clustering Plotted Data by Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21499--21504},
}
Animal Kingdom: A Large and Diverse Dataset for Animal Behavior Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ng_2022_CVPR,
  author    = {Ng, Xun Long and Ong, Kian Eng and Zheng, Qichen and Ni, Yun and Yeo, Si Yong and Liu, Jun},
  title     = {Animal Kingdom: A Large and Diverse Dataset for Animal Behavior Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19023--19034},
}
EI-CLIP: Entity-Aware Interventional Contrastive Learning for E-Commerce Cross-Modal Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2022_CVPR,
  author    = {Ma, Haoyu and Zhao, Handong and Lin, Zhe and Kale, Ajinkya and Wang, Zhangyang and Yu, Tong and Gu, Jiuxiang and Choudhary, Sunav and Xie, Xiaohui},
  title     = {{EI-CLIP}: Entity-Aware Interventional Contrastive Learning for E-Commerce Cross-Modal Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18051--18061},
}
Multi-Dimensional, Nuanced and Subjective - Measuring the Perception of Facial Expressions-
[pdf]
[supp]
[bibtex]@InProceedings{Bryant_2022_CVPR,
  author    = {Bryant, De'Aira and Deng, Siqi and Sephus, Nashlie and Xia, Wei and Perona, Pietro},
  title     = {Multi-Dimensional, Nuanced and Subjective -- Measuring the Perception of Facial Expressions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20932--20941},
}
PyMiceTracking: An Open-Source Toolbox for Real-Time Behavioral Neuroscience Experiments-
[pdf]
[bibtex]@InProceedings{Menezes_2022_CVPR,
  author    = {Menezes, Richardson and de Miranda, Aron and Maia, Helton},
  title     = {{PyMiceTracking}: An Open-Source Toolbox for Real-Time Behavioral Neuroscience Experiments},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21459--21465},
}
Fine-Grained Temporal Contrastive Learning for Weakly-Supervised Temporal Action Localization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gao_2022_CVPR,
  author    = {Gao, Junyu and Chen, Mengyuan and Xu, Changsheng},
  title     = {Fine-Grained Temporal Contrastive Learning for Weakly-Supervised Temporal Action Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19999--20009},
}
UTC: A Unified Transformer With Inter-Task Contrastive Learning for Visual Dialog-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Cheng and Tan, Zhenshan and Cheng, Qingrong and Jiang, Xin and Liu, Qun and Zhu, Yudong and Gu, Xiaodong},
  title     = {{UTC}: A Unified Transformer With Inter-Task Contrastive Learning for Visual Dialog},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18103--18112},
}
Mimicking the Oracle: An Initial Phase Decorrelation Approach for Class Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Yujun and Zhou, Kuangqi and Liang, Jian and Jiang, Zihang and Feng, Jiashi and Torr, Philip H. S. and Bai, Song and Tan, Vincent Y. F.},
  title     = {Mimicking the Oracle: An Initial Phase Decorrelation Approach for Class Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16722--16731},
}
RIDDLE: Lidar Data Compression With Range Image Deep Delta Encoding-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Xuanyu and Qi, Charles R. and Zhou, Yin and Anguelov, Dragomir},
  title     = {{RIDDLE}: Lidar Data Compression With Range Image Deep Delta Encoding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17212--17221},
}
RelTransformer: A Transformer-Based Long-Tail Visual Relationship Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Jun and Agarwal, Aniket and Abdelkarim, Sherif and Zhu, Deyao and Elhoseiny, Mohamed},
  title     = {{RelTransformer}: A Transformer-Based Long-Tail Visual Relationship Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19507--19517},
}
RigidFlow: Self-Supervised Scene Flow Learning on Point Clouds by Local Rigidity Prior-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Ruibo and Zhang, Chi and Lin, Guosheng and Wang, Zhe and Shen, Chunhua},
  title     = {{RigidFlow}: Self-Supervised Scene Flow Learning on Point Clouds by Local Rigidity Prior},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16959--16968},
}
Personalized Image Aesthetics Assessment With Rich Attributes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Yuzhe and Xu, Liwu and Li, Leida and Qie, Nan and Li, Yaqian and Zhang, Peng and Guo, Yandong},
  title     = {Personalized Image Aesthetics Assessment With Rich Attributes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19861--19869},
}
HDNet: High-Resolution Dual-Domain Learning for Spectral Compressive Imaging-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Xiaowan and Cai, Yuanhao and Lin, Jing and Wang, Haoqian and Yuan, Xin and Zhang, Yulun and Timofte, Radu and Van Gool, Luc},
  title     = {{HDNet}: High-Resolution Dual-Domain Learning for Spectral Compressive Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17542--17551},
}
Amodal Panoptic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Mohan_2022_CVPR,
  author    = {Mohan, Rohit and Valada, Abhinav},
  title     = {Amodal Panoptic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21023--21032},
}
Gravitationally Lensed Black Hole Emission Tomography-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Levis_2022_CVPR,
  author    = {Levis, Aviad and Srinivasan, Pratul P. and Chael, Andrew A. and Ng, Ren and Bouman, Katherine L.},
  title     = {Gravitationally Lensed Black Hole Emission Tomography},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19841--19850},
}
3D-Aware Image Synthesis via Learning Structural and Textural Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Yinghao and Peng, Sida and Yang, Ceyuan and Shen, Yujun and Zhou, Bolei},
  title     = {{3D-Aware} Image Synthesis via Learning Structural and Textural Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18430--18439},
}
Text-to-Image Synthesis Based on Object-Guided Joint-Decoding Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2022_CVPR, author = {Wu, Fuxiang and Liu, Liu and Hao, Fusheng and He, Fengxiang and Cheng, Jun}, title = {Text-to-Image Synthesis Based on Object-Guided Joint-Decoding Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18113-18122} }
Unsupervised Vision-and-Language Pre-Training via Retrieval-Based Multi-Granular Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2022_CVPR, author = {Zhou, Mingyang and Yu, Licheng and Singh, Amanpreet and Wang, Mengjiao and Yu, Zhou and Zhang, Ning}, title = {Unsupervised Vision-and-Language Pre-Training via Retrieval-Based Multi-Granular Alignment}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16485-16494} }
PONI: Potential Functions for ObjectGoal Navigation With Interaction-Free Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ramakrishnan_2022_CVPR, author = {Ramakrishnan, Santhosh Kumar and Chaplot, Devendra Singh and Al-Halah, Ziad and Malik, Jitendra and Grauman, Kristen}, title = {PONI: Potential Functions for ObjectGoal Navigation With Interaction-Free Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18890-18900} }
Exploring Structure-Aware Transformer Over Interaction Proposals for Human-Object Interaction Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Yong and Pan, Yingwei and Yao, Ting and Huang, Rui and Mei, Tao and Chen, Chang-Wen}, title = {Exploring Structure-Aware Transformer Over Interaction Proposals for Human-Object Interaction Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19548-19557} }
Glass: Geometric Latent Augmentation for Shape Spaces-
[pdf]
[arXiv]
[bibtex]@InProceedings{Muralikrishnan_2022_CVPR, author = {Muralikrishnan, Sanjeev and Chaudhuri, Siddhartha and Aigerman, Noam and Kim, Vladimir G. and Fisher, Matthew and Mitra, Niloy J.}, title = {Glass: Geometric Latent Augmentation for Shape Spaces}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18552-18561} }
Evading the Simplicity Bias: Training a Diverse Set of Models Discovers Solutions With Superior OOD Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Teney_2022_CVPR, author = {Teney, Damien and Abbasnejad, Ehsan and Lucey, Simon and van den Hengel, Anton}, title = {Evading the Simplicity Bias: Training a Diverse Set of Models Discovers Solutions With Superior OOD Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16761-16772} }
Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sener_2022_CVPR, author = {Sener, Fadime and Chatterjee, Dibyadip and Shelepov, Daniel and He, Kun and Singhania, Dipika and Wang, Robert and Yao, Angela}, title = {Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21096-21106} }
DPICT: Deep Progressive Image Compression Using Trit-Planes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Jae-Han and Jeon, Seungmin and Choi, Kwang Pyo and Park, Youngo and Kim, Chang-Su}, title = {DPICT: Deep Progressive Image Compression Using Trit-Planes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16113-16122} }
Text to Image Generation With Semantic-Spatial Aware GAN-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liao_2022_CVPR, author = {Liao, Wentong and Hu, Kai and Yang, Michael Ying and Rosenhahn, Bodo}, title = {Text to Image Generation With Semantic-Spatial Aware GAN}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18187-18196} }
PixMix: Dreamlike Pictures Comprehensively Improve Safety Measures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hendrycks_2022_CVPR, author = {Hendrycks, Dan and Zou, Andy and Mazeika, Mantas and Tang, Leonard and Li, Bo and Song, Dawn and Steinhardt, Jacob}, title = {PixMix: Dreamlike Pictures Comprehensively Improve Safety Measures}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16783-16792} }
Generalizable Cross-Modality Medical Image Segmentation via Style Augmentation and Dual Normalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2022_CVPR, author = {Zhou, Ziqi and Qi, Lei and Yang, Xin and Ni, Dong and Shi, Yinghuan}, title = {Generalizable Cross-Modality Medical Image Segmentation via Style Augmentation and Dual Normalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20856-20865} }
TimeReplayer: Unlocking the Potential of Event Cameras for Video Interpolation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2022_CVPR, author = {He, Weihua and You, Kaichao and Qiao, Zhendong and Jia, Xu and Zhang, Ziyang and Wang, Wenhui and Lu, Huchuan and Wang, Yaoyuan and Liao, Jianxing}, title = {TimeReplayer: Unlocking the Potential of Event Cameras for Video Interpolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17804-17813} }
Interactive Segmentation and Visualization for Tiny Objects in Multi-Megapixel Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR, author = {Xu, Chengyuan and Dong, Boning and Stier, Noah and McCully, Curtis and Howell, D. Andrew and Sen, Pradeep and H{\"o}llerer, Tobias}, title = {Interactive Segmentation and Visualization for Tiny Objects in Multi-Megapixel Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21447-21452} }
Scaling Vision Transformers to Gigapixel Images via Hierarchical Self-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Richard J. and Chen, Chengkuan and Li, Yicong and Chen, Tiffany Y. and Trister, Andrew D. and Krishnan, Rahul G. and Mahmood, Faisal}, title = {Scaling Vision Transformers to Gigapixel Images via Hierarchical Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16144-16155} }
Neural Reflectance for Shape Recovery With Shadow Handling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Junxuan and Li, Hongdong}, title = {Neural Reflectance for Shape Recovery With Shadow Handling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16221-16230} }
Surface Representation for Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ran_2022_CVPR, author = {Ran, Haoxi and Liu, Jun and Wang, Chengjie}, title = {Surface Representation for Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18942-18952} }
DeepLIIF: An Online Platform for Quantification of Clinical Pathology Slides-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ghahremani_2022_CVPR, author = {Ghahremani, Parmida and Marino, Joseph and Dodds, Ricardo and Nadeem, Saad}, title = {DeepLIIF: An Online Platform for Quantification of Clinical Pathology Slides}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21399-21405} }
Joint Video Summarization and Moment Localization by Cross-Task Sample Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2022_CVPR, author = {Jiang, Hao and Mu, Yadong}, title = {Joint Video Summarization and Moment Localization by Cross-Task Sample Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16388-16398} }
Optical Flow Estimation for Spiking Camera-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2022_CVPR, author = {Hu, Liwen and Zhao, Rui and Ding, Ziluo and Ma, Lei and Shi, Boxin and Xiong, Ruiqin and Huang, Tiejun}, title = {Optical Flow Estimation for Spiking Camera}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17844-17853} }
InstaFormer: Instance-Aware Image-to-Image Translation With Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2022_CVPR, author = {Kim, Soohyun and Baek, Jongbeom and Park, Jihye and Kim, Gyeongnyeon and Kim, Seungryong}, title = {InstaFormer: Instance-Aware Image-to-Image Translation With Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18321-18331} }
3D-VField: Adversarial Augmentation of Point Clouds for Domain Generalization in 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Lehner_2022_CVPR, author = {Lehner, Alexander and Gasperini, Stefano and Marcos-Ramiro, Alvaro and Schmidt, Michael and Mahani, Mohammad-Ali Nikouei and Navab, Nassir and Busam, Benjamin and Tombari, Federico}, title = {3D-VField: Adversarial Augmentation of Point Clouds for Domain Generalization in 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17295-17304} }
AutoMine: An Unmanned Mine Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Yuchen and Li, Zixuan and Teng, Siyu and Zhang, Yu and Zhou, Yuhang and Zhu, Yuchang and Cao, Dongpu and Tian, Bin and Ai, Yunfeng and Xuanyuan, Zhe and Chen, Long}, title = {AutoMine: An Unmanned Mine Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21308-21317} }
Neural Data-Dependent Transform for Learned Image Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Dezhao and Yang, Wenhan and Hu, Yueyu and Liu, Jiaying}, title = {Neural Data-Dependent Transform for Learned Image Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17379-17388} }
Evaluation-Oriented Knowledge Distillation for Deep Face Recognition-
[pdf]
[bibtex]@InProceedings{Huang_2022_CVPR, author = {Huang, Yuge and Wu, Jiaxiang and Xu, Xingkun and Ding, Shouhong}, title = {Evaluation-Oriented Knowledge Distillation for Deep Face Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18740-18749} }
Improving Subgraph Recognition With Variational Graph Information Bottleneck-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yu_2022_CVPR, author = {Yu, Junchi and Cao, Jie and He, Ran}, title = {Improving Subgraph Recognition With Variational Graph Information Bottleneck}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19396-19405} }
Synthetic Generation of Face Videos With Plethysmograph Physiology-
[pdf]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Zhen and Ba, Yunhao and Chari, Pradyumna and Bozkurt, Oyku Deniz and Brown, Gianna and Patwa, Parth and Vaddi, Niranjan and Jalilian, Laleh and Kadambi, Achuta}, title = {Synthetic Generation of Face Videos With Plethysmograph Physiology}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20587-20596} }
TransRAC: Encoding Multi-Scale Temporal Correlation With Transformers for Repetitive Action Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2022_CVPR, author = {Hu, Huazhang and Dong, Sixun and Zhao, Yiqun and Lian, Dongze and Li, Zhengxin and Gao, Shenghua}, title = {TransRAC: Encoding Multi-Scale Temporal Correlation With Transformers for Repetitive Action Counting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19013-19022} }
AdaInt: Learning Adaptive Intervals for 3D Lookup Tables on Real-Time Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR, author = {Yang, Canqian and Jin, Meiguang and Jia, Xu and Xu, Yi and Chen, Ying}, title = {AdaInt: Learning Adaptive Intervals for 3D Lookup Tables on Real-Time Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17522-17531} }
RegionCLIP: Region-Based Language-Image Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2022_CVPR, author = {Zhong, Yiwu and Yang, Jianwei and Zhang, Pengchuan and Li, Chunyuan and Codella, Noel and Li, Liunian Harold and Zhou, Luowei and Dai, Xiyang and Yuan, Lu and Li, Yin and Gao, Jianfeng}, title = {RegionCLIP: Region-Based Language-Image Pretraining}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16793-16803} }
Video Frame Interpolation Transformer-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shi_2022_CVPR, author = {Shi, Zhihao and Xu, Xiangyu and Liu, Xiaohong and Chen, Jun and Yang, Ming-Hsuan}, title = {Video Frame Interpolation Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17482-17491} }
An Empirical Study of End-to-End Temporal Action Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Xiaolong and Bai, Song and Bai, Xiang}, title = {An Empirical Study of End-to-End Temporal Action Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20010-20019} }
Brain-Supervised Image Editing-
[pdf]
[supp]
[bibtex]@InProceedings{Davis_2022_CVPR, author = {Davis, III, Keith M. and de la Torre-Ortiz, Carlos and Ruotsalo, Tuukka}, title = {Brain-Supervised Image Editing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18480-18489} }
3D Shape Variational Autoencoder Latent Disentanglement via Mini-Batch Feature Swapping for Bodies and Faces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Foti_2022_CVPR, author = {Foti, Simone and Koo, Bongjin and Stoyanov, Danail and Clarkson, Matthew J.}, title = {3D Shape Variational Autoencoder Latent Disentanglement via Mini-Batch Feature Swapping for Bodies and Faces}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18730-18739} }
RestoreFormer: High-Quality Blind Face Restoration From Undegraded Key-Value Pairs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Zhouxia and Zhang, Jiawei and Chen, Runjian and Wang, Wenping and Luo, Ping}, title = {RestoreFormer: High-Quality Blind Face Restoration From Undegraded Key-Value Pairs}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17512-17521} }
Mask-Guided Spectral-Wise Transformer for Efficient Hyperspectral Image Reconstruction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cai_2022_CVPR, author = {Cai, Yuanhao and Lin, Jing and Hu, Xiaowan and Wang, Haoqian and Yuan, Xin and Zhang, Yulun and Timofte, Radu and Van Gool, Luc}, title = {Mask-Guided Spectral-Wise Transformer for Efficient Hyperspectral Image Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17502-17511} }
PPDL: Predicate Probability Distribution Based Loss for Unbiased Scene Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Wei and Zhang, Haiwei and Bai, Qijie and Zhao, Guoqing and Jiang, Ning and Yuan, Xiaojie}, title = {PPDL: Predicate Probability Distribution Based Loss for Unbiased Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19447-19456} }
Coupling Vision and Proprioception for Navigation of Legged Robots-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2022_CVPR, author = {Fu, Zipeng and Kumar, Ashish and Agarwal, Ananye and Qi, Haozhi and Malik, Jitendra and Pathak, Deepak}, title = {Coupling Vision and Proprioception for Navigation of Legged Robots}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17273-17283} }
Fine-Grained Predicates Learning for Scene Graph Generation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lyu_2022_CVPR, author = {Lyu, Xinyu and Gao, Lianli and Guo, Yuyu and Zhao, Zhou and Huang, Hao and Shen, Heng Tao and Song, Jingkuan}, title = {Fine-Grained Predicates Learning for Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19467-19475} }
Neural Head Avatars From Monocular RGB Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Grassal_2022_CVPR, author = {Grassal, Philip-William and Prinzler, Malte and Leistner, Titus and Rother, Carsten and Nie{\ss}ner, Matthias and Thies, Justus}, title = {Neural Head Avatars From Monocular RGB Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18653-18664} }
EMOCA: Emotion Driven Monocular Face Capture and Animation-
[pdf]
[supp]
[bibtex]@InProceedings{Danecek_2022_CVPR, author = {Dan{\v{e}}{\v{c}}ek, Radek and Black, Michael J. and Bolkart, Timo}, title = {EMOCA: Emotion Driven Monocular Face Capture and Animation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20311-20322} }
Towards Diverse and Natural Scene-Aware 3D Human Motion Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Jingbo and Rong, Yu and Liu, Jingyuan and Yan, Sijie and Lin, Dahua and Dai, Bo}, title = {Towards Diverse and Natural Scene-Aware 3D Human Motion Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20460-20469} }
How Much Does Input Data Type Impact Final Face Model Accuracy?-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2022_CVPR, author = {Luo, Jiahao and Khan, Fahim Hasan and Mori, Issei and de Silva, Akila and Ruezga, Eric Sandoval and Liu, Minghao and Pang, Alex and Davis, James}, title = {How Much Does Input Data Type Impact Final Face Model Accuracy?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18985-18994} }
HumanNeRF: Free-Viewpoint Rendering of Moving People From Monocular Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Weng_2022_CVPR, author = {Weng, Chung-Yi and Curless, Brian and Srinivasan, Pratul P. and Barron, Jonathan T. and Kemelmacher-Shlizerman, Ira}, title = {HumanNeRF: Free-Viewpoint Rendering of Moving People From Monocular Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16210-16220} }
Which Images To Label for Few-Shot Medical Landmark Detection?-
[pdf]
[arXiv]
[bibtex]@InProceedings{Quan_2022_CVPR, author = {Quan, Quan and Yao, Qingsong and Li, Jun and Zhou, S. Kevin}, title = {Which Images To Label for Few-Shot Medical Landmark Detection?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20606-20616} }
UBoCo: Unsupervised Boundary Contrastive Learning for Generic Event Boundary Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2022_CVPR, author = {Kang, Hyolim and Kim, Jinwoo and Kim, Taehyun and Kim, Seon Joo}, title = {UBoCo: Unsupervised Boundary Contrastive Learning for Generic Event Boundary Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20073-20082} }
Both Style and Fog Matter: Cumulative Domain Adaptation for Semantic Foggy Scene Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ma_2022_CVPR, author = {Ma, Xianzheng and Wang, Zhixiang and Zhan, Yacheng and Zheng, Yinqiang and Wang, Zheng and Dai, Dengxin and Lin, Chia-Wen}, title = {Both Style and Fog Matter: Cumulative Domain Adaptation for Semantic Foggy Scene Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18922-18931} }
Ev-TTA: Test-Time Adaptation for Event-Based Object Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2022_CVPR, author = {Kim, Junho and Hwang, Inwoo and Kim, Young Min}, title = {Ev-TTA: Test-Time Adaptation for Event-Based Object Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17745-17754} }
NODEO: A Neural Ordinary Differential Equation Based Optimization Framework for Deformable Image Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2022_CVPR, author = {Wu, Yifan and Jiahao, Tom Z. and Wang, Jiancong and Yushkevich, Paul A. and Hsieh, M. Ani and Gee, James C.}, title = {NODEO: A Neural Ordinary Differential Equation Based Optimization Framework for Deformable Image Registration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20804-20813} }
Pyramid Architecture for Multi-Scale Processing in Point Cloud Segmentation-
[pdf]
[bibtex]@InProceedings{Nie_2022_CVPR, author = {Nie, Dong and Lan, Rui and Wang, Ling and Ren, Xiaofeng}, title = {Pyramid Architecture for Multi-Scale Processing in Point Cloud Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17284-17294} }
Cross-Architecture Self-Supervised Video Representation Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Guo_2022_CVPR, author = {Guo, Sheng and Xiong, Zihua and Zhong, Yujie and Wang, Limin and Guo, Xiaobo and Han, Bing and Huang, Weilin}, title = {Cross-Architecture Self-Supervised Video Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19270-19279} }
High-Resolution Image Harmonization via Collaborative Dual Transformations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cong_2022_CVPR, author = {Cong, Wenyan and Tao, Xinhao and Niu, Li and Liang, Jing and Gao, Xuesong and Sun, Qihao and Zhang, Liqing}, title = {High-Resolution Image Harmonization via Collaborative Dual Transformations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18470-18479} }
MM-TTA: Multi-Modal Test-Time Adaptation for 3D Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2022_CVPR, author = {Shin, Inkyu and Tsai, Yi-Hsuan and Zhuang, Bingbing and Schulter, Samuel and Liu, Buyu and Garg, Sparsh and Kweon, In So and Yoon, Kuk-Jin}, title = {MM-TTA: Multi-Modal Test-Time Adaptation for 3D Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16928-16937} }
Towards Bidirectional Arbitrary Image Rescaling: Joint Optimization and Cycle Idempotence-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pan_2022_CVPR, author = {Pan, Zhihong and Li, Baopu and He, Dongliang and Yao, Mingde and Wu, Wenhao and Lin, Tianwei and Li, Xin and Ding, Errui}, title = {Towards Bidirectional Arbitrary Image Rescaling: Joint Optimization and Cycle Idempotence}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17389-17398} }
Topology Preserving Local Road Network Estimation From Single Onboard Camera Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Can_2022_CVPR, author = {Can, Yigit Baran and Liniger, Alexander and Paudel, Danda Pani and Van Gool, Luc}, title = {Topology Preserving Local Road Network Estimation From Single Onboard Camera Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17263-17272} }
Eigenlanes: Data-Driven Lane Descriptors for Structurally Diverse Lanes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2022_CVPR, author = {Jin, Dongkwon and Park, Wonhui and Jeong, Seong-Gyun and Kwon, Heeyeon and Kim, Chang-Su}, title = {Eigenlanes: Data-Driven Lane Descriptors for Structurally Diverse Lanes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17163-17171} }
SpaceEdit: Learning a Unified Editing Space for Open-Domain Image Color Editing-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2022_CVPR, author = {Shi, Jing and Xu, Ning and Zheng, Haitian and Smith, Alex and Luo, Jiebo and Xu, Chenliang}, title = {SpaceEdit: Learning a Unified Editing Space for Open-Domain Image Color Editing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19730-19739} }
Multi-Level Feature Learning for Contrastive Multi-View Clustering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR, author = {Xu, Jie and Tang, Huayi and Ren, Yazhou and Peng, Liang and Zhu, Xiaofeng and He, Lifang}, title = {Multi-Level Feature Learning for Contrastive Multi-View Clustering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16051-16060} }
Egocentric Prediction of Action Target in 3D-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Yiming and Cao, Ziang and Liang, Andrew and Liang, Benjamin and Chen, Luoyao and Zhao, Hang and Feng, Chen}, title = {Egocentric Prediction of Action Target in 3D}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21003-21012} }
Towards Real-World Navigation With Deep Differentiable Planners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ishida_2022_CVPR, author = {Ishida, Shu and Henriques, Jo{\~a}o F.}, title = {Towards Real-World Navigation With Deep Differentiable Planners}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17327-17336} }
Video K-Net: A Simple, Strong, and Unified Baseline for Video Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Xiangtai and Zhang, Wenwei and Pang, Jiangmiao and Chen, Kai and Cheng, Guangliang and Tong, Yunhai and Loy, Chen Change}, title = {Video K-Net: A Simple, Strong, and Unified Baseline for Video Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18847-18857} }
NeRFReN: Neural Radiance Fields With Reflections-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2022_CVPR, author = {Guo, Yuan-Chen and Kang, Di and Bao, Linchao and He, Yu and Zhang, Song-Hai}, title = {NeRFReN: Neural Radiance Fields With Reflections}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18409-18418} }
SCS-Co: Self-Consistent Style Contrastive Learning for Image Harmonization-
[pdf]
[supp]
[bibtex]@InProceedings{Hang_2022_CVPR, author = {Hang, Yucheng and Xia, Bin and Yang, Wenming and Liao, Qingmin}, title = {SCS-Co: Self-Consistent Style Contrastive Learning for Image Harmonization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19710-19719} }
Neural Convolutional Surfaces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Morreale_2022_CVPR, author = {Morreale, Luca and Aigerman, Noam and Guerrero, Paul and Kim, Vladimir G. and Mitra, Niloy J.}, title = {Neural Convolutional Surfaces}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19333-19342} }
HyperSegNAS: Bridging One-Shot Neural Architecture Search With 3D Medical Image Segmentation Using HyperNet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2022_CVPR, author = {Peng, Cheng and Myronenko, Andriy and Hatamizadeh, Ali and Nath, Vishwesh and Siddiquee, Md Mahfuzur Rahman and He, Yufan and Xu, Daguang and Chellappa, Rama and Yang, Dong}, title = {HyperSegNAS: Bridging One-Shot Neural Architecture Search With 3D Medical Image Segmentation Using HyperNet}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20741-20751} }
A Comprehensive Study of Image Classification Model Sensitivity to Foregrounds, Backgrounds, and Visual Attributes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Moayeri_2022_CVPR, author = {Moayeri, Mazda and Pope, Phillip and Balaji, Yogesh and Feizi, Soheil}, title = {A Comprehensive Study of Image Classification Model Sensitivity to Foregrounds, Backgrounds, and Visual Attributes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19087-19097} }
ConDor: Self-Supervised Canonicalization of 3D Pose for Partial Shapes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sajnani_2022_CVPR, author = {Sajnani, Rahul and Poulenard, Adrien and Jain, Jivitesh and Dua, Radhika and Guibas, Leonidas J. and Sridhar, Srinath}, title = {ConDor: Self-Supervised Canonicalization of 3D Pose for Partial Shapes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16969-16979} }
Exploring Endogenous Shift for Cross-Domain Detection: A Large-Scale Benchmark and Perturbation Suppression Network-
[pdf]
[bibtex]@InProceedings{Tao_2022_CVPR, author = {Tao, Renshuai and Li, Hainan and Wang, Tianbo and Wei, Yanlu and Ding, Yifu and Jin, Bowei and Zhi, Hongping and Liu, Xianglong and Liu, Aishan}, title = {Exploring Endogenous Shift for Cross-Domain Detection: A Large-Scale Benchmark and Perturbation Suppression Network}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21189-21199} }
VisCUIT: Visual Auditor for Bias in CNN Image Classifier-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Seongmin and Wang, Zijie J. and Hoffman, Judy and Chau, Duen Horng (Polo)}, title = {VisCUIT: Visual Auditor for Bias in CNN Image Classifier}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21475-21483} }
DirecFormer: A Directed Attention in Transformer Approach to Robust Action Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Truong_2022_CVPR, author = {Truong, Thanh-Dat and Bui, Quoc-Huy and Duong, Chi Nhan and Seo, Han-Seok and Phung, Son Lam and Li, Xin and Luu, Khoa}, title = {DirecFormer: A Directed Attention in Transformer Approach to Robust Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20030-20040} }
Robust Egocentric Photo-Realistic Facial Expression Transfer for Virtual Reality-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jourabloo_2022_CVPR, author = {Jourabloo, Amin and De la Torre, Fernando and Saragih, Jason and Wei, Shih-En and Lombardi, Stephen and Wang, Te-Li and Belko, Danielle and Trimble, Autumn and Badino, Hernan}, title = {Robust Egocentric Photo-Realistic Facial Expression Transfer for Virtual Reality}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20323-20332} }
Distillation Using Oracle Queries for Transformer-Based Human-Object Interaction Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Qu_2022_CVPR, author = {Qu, Xian and Ding, Changxing and Li, Xingao and Zhong, Xubin and Tao, Dacheng}, title = {Distillation Using Oracle Queries for Transformer-Based Human-Object Interaction Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19558-19567} }
Learning Video Representations of Human Motion From Synthetic Data-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2022_CVPR, author = {Guo, Xi and Wu, Wei and Wang, Dongliang and Su, Jing and Su, Haisheng and Gan, Weihao and Huang, Jian and Yang, Qin}, title = {Learning Video Representations of Human Motion From Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20197-20207} }
BoostMIS: Boosting Medical Image Semi-Supervised Learning With Adaptive Pseudo Labeling and Informative Active Annotation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Wenqiao and Zhu, Lei and Hallinan, James and Zhang, Shengyu and Makmur, Andrew and Cai, Qingpeng and Ooi, Beng Chin}, title = {BoostMIS: Boosting Medical Image Semi-Supervised Learning With Adaptive Pseudo Labeling and Informative Active Annotation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20666-20676} }
HOI4D: A 4D Egocentric Dataset for Category-Level Human-Object Interaction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Yunze and Liu, Yun and Jiang, Che and Lyu, Kangbo and Wan, Weikang and Shen, Hao and Liang, Boqiang and Fu, Zhoujie and Wang, He and Yi, Li}, title = {HOI4D: A 4D Egocentric Dataset for Category-Level Human-Object Interaction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21013-21022} }
Collaborative Transformers for Grounded Situation Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2022_CVPR, author = {Cho, Junhyeong and Yoon, Youngseok and Kwak, Suha}, title = {Collaborative Transformers for Grounded Situation Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19659-19668} }
Vox2Cortex: Fast Explicit Reconstruction of Cortical Surfaces From 3D MRI Scans With Geometric Deep Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Bongratz_2022_CVPR, author = {Bongratz, Fabian and Rickmann, Anne-Marie and P\"olsterl, Sebastian and Wachinger, Christian}, title = {Vox2Cortex: Fast Explicit Reconstruction of Cortical Surfaces From 3D MRI Scans With Geometric Deep Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20773-20783} }
ScanQA: 3D Question Answering for Spatial Scene Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Azuma_2022_CVPR, author = {Azuma, Daichi and Miyanishi, Taiki and Kurita, Shuhei and Kawanabe, Motoaki}, title = {ScanQA: 3D Question Answering for Spatial Scene Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19129-19139} }
Class-Incremental Learning by Knowledge Distillation With Adaptive Feature Consolidation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2022_CVPR, author = {Kang, Minsoo and Park, Jaeyoo and Han, Bohyung}, title = {Class-Incremental Learning by Knowledge Distillation With Adaptive Feature Consolidation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16071-16080} }
Learning Program Representations for Food Images and Cooking Recipes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Papadopoulos_2022_CVPR, author = {Papadopoulos, Dim P. and Mora, Enrique and Chepurko, Nadiia and Huang, Kuan Wei and Ofli, Ferda and Torralba, Antonio}, title = {Learning Program Representations for Food Images and Cooking Recipes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16559-16569} }
Directional Self-Supervised Learning for Heavy Image Augmentations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2022_CVPR, author = {Bai, Yalong and Yang, Yifan and Zhang, Wei and Mei, Tao}, title = {Directional Self-Supervised Learning for Heavy Image Augmentations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16692-16701} }
No-Reference Point Cloud Quality Assessment via Domain Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR, author = {Yang, Qi and Liu, Yipeng and Chen, Siheng and Xu, Yiling and Sun, Jun}, title = {No-Reference Point Cloud Quality Assessment via Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21179-21188} }
Comprehending and Ordering Semantics for Image Captioning-
[pdf]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Yehao and Pan, Yingwei and Yao, Ting and Mei, Tao}, title = {Comprehending and Ordering Semantics for Image Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17990-17999} }
A Large-Scale Comprehensive Dataset and Copy-Overlap Aware Evaluation Protocol for Segment-Level Video Copy Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2022_CVPR, author = {He, Sifeng and Yang, Xudong and Jiang, Chen and Liang, Gang and Zhang, Wei and Pan, Tan and Wang, Qing and Xu, Furong and Li, Chunguang and Liu, JinXiong and Xu, Hui and Huang, Kaiming and Cheng, Yuan and Qian, Feng and Zhang, Xiaobo and Yang, Lei}, title = {A Large-Scale Comprehensive Dataset and Copy-Overlap Aware Evaluation Protocol for Segment-Level Video Copy Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21086-21095} }
GaTector: A Unified Framework for Gaze Object Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Binglu and Hu, Tao and Li, Baoshan and Chen, Xiaojuan and Zhang, Zhijie}, title = {GaTector: A Unified Framework for Gaze Object Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19588-19597} }
LaTr: Layout-Aware Transformer for Scene-Text VQA-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Biten_2022_CVPR, author = {Biten, Ali Furkan and Litman, Ron and Xie, Yusheng and Appalaraju, Srikar and Manmatha, R.}, title = {LaTr: Layout-Aware Transformer for Scene-Text VQA}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16548-16558} }
HeadNeRF: A Real-Time NeRF-Based Parametric Head Model-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hong_2022_CVPR, author = {Hong, Yang and Peng, Bo and Xiao, Haiyao and Liu, Ligang and Zhang, Juyong}, title = {HeadNeRF: A Real-Time NeRF-Based Parametric Head Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20374-20384} }
Replacing Labeled Real-Image Datasets With Auto-Generated Contours-
[pdf]
[bibtex]@InProceedings{Kataoka_2022_CVPR, author = {Kataoka, Hirokatsu and Hayamizu, Ryo and Yamada, Ryosuke and Nakashima, Kodai and Takashima, Sora and Zhang, Xinyu and Martinez-Noriega, Edgar Josafat and Inoue, Nakamasa and Yokota, Rio}, title = {Replacing Labeled Real-Image Datasets With Auto-Generated Contours}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21232-21241} }
WebQA: Multihop and Multimodal QA-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chang_2022_CVPR, author = {Chang, Yingshan and Narang, Mridu and Suzuki, Hisami and Cao, Guihong and Gao, Jianfeng and Bisk, Yonatan}, title = {WebQA: Multihop and Multimodal QA}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16495-16504} }
Towards Language-Free Training for Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2022_CVPR, author = {Zhou, Yufan and Zhang, Ruiyi and Chen, Changyou and Li, Chunyuan and Tensmeyer, Chris and Yu, Tong and Gu, Jiuxiang and Xu, Jinhui and Sun, Tong}, title = {Towards Language-Free Training for Text-to-Image Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17907-17917} }
Learning Affinity From Attention: End-to-End Weakly-Supervised Semantic Segmentation With Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ru_2022_CVPR, author = {Ru, Lixiang and Zhan, Yibing and Yu, Baosheng and Du, Bo}, title = {Learning Affinity From Attention: End-to-End Weakly-Supervised Semantic Segmentation With Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16846-16855} }
FERV39k: A Large-Scale Multi-Scene Dataset for Facial Expression Recognition in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Yan and Sun, Yixuan and Huang, Yiwen and Liu, Zhongying and Gao, Shuyong and Zhang, Wei and Ge, Weifeng and Zhang, Wenqiang}, title = {FERV39k: A Large-Scale Multi-Scene Dataset for Facial Expression Recognition in Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20922-20931} }
Omnivore: A Single Model for Many Visual Modalities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Girdhar_2022_CVPR, author = {Girdhar, Rohit and Singh, Mannat and Ravi, Nikhila and van der Maaten, Laurens and Joulin, Armand and Misra, Ishan}, title = {Omnivore: A Single Model for Many Visual Modalities}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16102-16112} }
DAIR-V2X: A Large-Scale Dataset for Vehicle-Infrastructure Cooperative 3D Object Detection-
[pdf]
[bibtex]@InProceedings{Yu_2022_CVPR, author = {Yu, Haibao and Luo, Yizhen and Shu, Mao and Huo, Yiyi and Yang, Zebang and Shi, Yifeng and Guo, Zhenglong and Li, Hanyu and Hu, Xing and Yuan, Jirui and Nie, Zaiqing}, title = {DAIR-V2X: A Large-Scale Dataset for Vehicle-Infrastructure Cooperative 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21361-21370} }
Uncertainty-Aware Adaptation for Self-Supervised 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kundu_2022_CVPR, author = {Kundu, Jogendra Nath and Seth, Siddharth and YM, Pradyumna and Jampani, Varun and Chakraborty, Anirban and Babu, R. Venkatesh}, title = {Uncertainty-Aware Adaptation for Self-Supervised 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20448-20459} }
Semi-Supervised Wide-Angle Portraits Correction by Multi-Scale Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2022_CVPR, author = {Zhu, Fushun and Zhao, Shan and Wang, Peng and Wang, Hao and Yan, Hua and Liu, Shuaicheng}, title = {Semi-Supervised Wide-Angle Portraits Correction by Multi-Scale Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19689-19698} }
Is Mapping Necessary for Realistic PointGoal Navigation?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Partsey_2022_CVPR, author = {Partsey, Ruslan and Wijmans, Erik and Yokoyama, Naoki and Dobosevych, Oles and Batra, Dhruv and Maksymets, Oleksandr}, title = {Is Mapping Necessary for Realistic PointGoal Navigation?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17232-17241} }
Node-Aligned Graph Convolutional Network for Whole-Slide Image Representation and Classification-
[pdf]
[bibtex]@InProceedings{Guan_2022_CVPR, author = {Guan, Yonghang and Zhang, Jun and Tian, Kuan and Yang, Sen and Dong, Pei and Xiang, Jinxi and Yang, Wei and Huang, Junzhou and Zhang, Yuyao and Han, Xiao}, title = {Node-Aligned Graph Convolutional Network for Whole-Slide Image Representation and Classification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18813-18823} }
Object-Relation Reasoning Graph for Action Recognition-
[pdf]
[bibtex]@InProceedings{Ou_2022_CVPR, author = {Ou, Yangjun and Mi, Li and Chen, Zhenzhong}, title = {Object-Relation Reasoning Graph for Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20133-20142} }
FaceVerse: A Fine-Grained and Detail-Controllable 3D Face Morphable Model From a Hybrid Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Lizhen and Chen, Zhiyuan and Yu, Tao and Ma, Chenguang and Li, Liang and Liu, Yebin}, title = {FaceVerse: A Fine-Grained and Detail-Controllable 3D Face Morphable Model From a Hybrid Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20333-20342} }
Bring Evanescent Representations to Life in Lifelong Class Incremental Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Toldo_2022_CVPR, author = {Toldo, Marco and Ozay, Mete}, title = {Bring Evanescent Representations to Life in Lifelong Class Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16732-16741} }
Look Back and Forth: Video Super-Resolution With Explicit Temporal Difference Modeling-
[pdf]
[arXiv]
[bibtex]@InProceedings{Isobe_2022_CVPR, author = {Isobe, Takashi and Jia, Xu and Tao, Xin and Li, Changlin and Li, Ruihuang and Shi, Yongjie and Mu, Jing and Lu, Huchuan and Tai, Yu-Wing}, title = {Look Back and Forth: Video Super-Resolution With Explicit Temporal Difference Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17411-17420} }
A Stitch in Time Saves Nine: A Train-Time Regularizing Loss for Improved Neural Network Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hebbalaguppe_2022_CVPR, author = {Hebbalaguppe, Ramya and Prakash, Jatin and Madan, Neelabh and Arora, Chetan}, title = {A Stitch in Time Saves Nine: A Train-Time Regularizing Loss for Improved Neural Network Calibration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16081-16090} }
Deep Image-Based Illumination Harmonization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bao_2022_CVPR, author = {Bao, Zhongyun and Long, Chengjiang and Fu, Gang and Liu, Daquan and Li, Yuanzhen and Wu, Jiaming and Xiao, Chunxia}, title = {Deep Image-Based Illumination Harmonization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18542-18551} }
Harmony: A Generic Unsupervised Approach for Disentangling Semantic Content From Parameterized Transformations-
[pdf]
[supp]
[bibtex]@InProceedings{Uddin_2022_CVPR, author = {Uddin, Mostofa Rafid and Howe, Gregory and Zeng, Xiangrui and Xu, Min}, title = {Harmony: A Generic Unsupervised Approach for Disentangling Semantic Content From Parameterized Transformations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20646-20655} }
Talking Face Generation With Multilingual TTS-
[pdf]
[arXiv]
[bibtex]@InProceedings{Song_2022_CVPR, author = {Song, Hyoung-Kyu and Woo, Sang Hoon and Lee, Junhyeok and Yang, Seungmin and Cho, Hyunjae and Lee, Youseong and Choi, Dongho and Kim, Kang-wook}, title = {Talking Face Generation With Multilingual TTS}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21425-21430} }
Kernelized Few-Shot Object Detection With Efficient Integral Aggregation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Shan and Wang, Lei and Murray, Naila and Koniusz, Piotr}, title = {Kernelized Few-Shot Object Detection With Efficient Integral Aggregation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19207-19216} }
Context-Aware Video Reconstruction for Rolling Shutter Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2022_CVPR, author = {Fan, Bin and Dai, Yuchao and Zhang, Zhiyuan and Liu, Qi and He, Mingyi}, title = {Context-Aware Video Reconstruction for Rolling Shutter Cameras}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17572-17582} }
Robust Contrastive Learning Against Noisy Views-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chuang_2022_CVPR, author = {Chuang, Ching-Yao and Hjelm, R Devon and Wang, Xin and Vineet, Vibhav and Joshi, Neel and Torralba, Antonio and Jegelka, Stefanie and Song, Yale}, title = {Robust Contrastive Learning Against Noisy Views}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16670-16681} }
RSTT: Real-Time Spatial Temporal Transformer for Space-Time Video Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Geng_2022_CVPR, author = {Geng, Zhicheng and Liang, Luming and Ding, Tianyu and Zharkov, Ilya}, title = {RSTT: Real-Time Spatial Temporal Transformer for Space-Time Video Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17441-17451} }
Learning Memory-Augmented Unidirectional Metrics for Cross-Modality Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Jialun and Sun, Yifan and Zhu, Feng and Pei, Hongbin and Yang, Yi and Li, Wenhui}, title = {Learning Memory-Augmented Unidirectional Metrics for Cross-Modality Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19366-19375} }
Partial Class Activation Attention for Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Sun-Ao and Xie, Hongtao and Xu, Hai and Zhang, Yongdong and Tian, Qi}, title = {Partial Class Activation Attention for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16836-16845} }
SkinningNet: Two-Stream Graph Convolutional Neural Network for Skinning Prediction of Synthetic Characters-
[pdf]
[supp]
[bibtex]@InProceedings{Mosella-Montoro_2022_CVPR, author = {Mosella-Montoro, Albert and Ruiz-Hidalgo, Javier}, title = {SkinningNet: Two-Stream Graph Convolutional Neural Network for Skinning Prediction of Synthetic Characters}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18593-18602} }
Cross-Modal Representation Learning for Zero-Shot Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2022_CVPR, author = {Lin, Chung-Ching and Lin, Kevin and Wang, Lijuan and Liu, Zicheng and Li, Linjie}, title = {Cross-Modal Representation Learning for Zero-Shot Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19978-19988} }
Conditional Prompt Learning for Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2022_CVPR, author = {Zhou, Kaiyang and Yang, Jingkang and Loy, Chen Change and Liu, Ziwei}, title = {Conditional Prompt Learning for Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16816-16825} }
Affine Medical Image Registration With Coarse-To-Fine Vision Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mok_2022_CVPR, author = {Mok, Tony C. W. and Chung, Albert C. S.}, title = {Affine Medical Image Registration With Coarse-To-Fine Vision Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20835-20844} }
SMPL-A: Modeling Person-Specific Deformable Anatomy-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2022_CVPR, author = {Guo, Hengtao and Planche, Benjamin and Zheng, Meng and Karanam, Srikrishna and Chen, Terrence and Wu, Ziyan}, title = {SMPL-A: Modeling Person-Specific Deformable Anatomy}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20814-20823} }
A Differentiable Two-Stage Alignment Scheme for Burst Image Reconstruction With Large Shift-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2022_CVPR, author = {Guo, Shi and Yang, Xi and Ma, Jianqi and Ren, Gaofeng and Zhang, Lei}, title = {A Differentiable Two-Stage Alignment Scheme for Burst Image Reconstruction With Large Shift}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17472-17481} }
Unifying Panoptic Segmentation for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Zendel_2022_CVPR, author = {Zendel, Oliver and Sch\"orghuber, Matthias and Rainer, Bernhard and Murschitz, Markus and Beleznai, Csaba}, title = {Unifying Panoptic Segmentation for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21351-21360} }
On the Road to Online Adaptation for Semantic Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Volpi_2022_CVPR, author = {Volpi, Riccardo and De Jorge, Pau and Larlus, Diane and Csurka, Gabriela}, title = {On the Road to Online Adaptation for Semantic Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19184-19195} }
Masked Autoencoders Are Scalable Vision Learners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2022_CVPR, author = {He, Kaiming and Chen, Xinlei and Xie, Saining and Li, Yanghao and Doll\'ar, Piotr and Girshick, Ross}, title = {Masked Autoencoders Are Scalable Vision Learners}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16000-16009} }
Point-BERT: Pre-Training 3D Point Cloud Transformers With Masked Point Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2022_CVPR, author = {Yu, Xumin and Tang, Lulu and Rao, Yongming and Huang, Tiejun and Zhou, Jie and Lu, Jiwen}, title = {Point-BERT: Pre-Training 3D Point Cloud Transformers With Masked Point Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19313-19322} }
Crowd Counting in the Frequency Domain-
[pdf]
[supp]
[bibtex]@InProceedings{Shu_2022_CVPR, author = {Shu, Weibo and Wan, Jia and Tan, Kay Chen and Kwong, Sam and Chan, Antoni B.}, title = {Crowd Counting in the Frequency Domain}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19618-19627} }
Aladdin: Joint Atlas Building and Diffeomorphic Registration Learning With Pairwise Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2022_CVPR, author = {Ding, Zhipeng and Niethammer, Marc}, title = {Aladdin: Joint Atlas Building and Diffeomorphic Registration Learning With Pairwise Alignment}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20784-20793} }
Learning sRGB-to-Raw-RGB De-Rendering With Content-Aware Metadata-
[pdf]
[supp]
[bibtex]@InProceedings{Nam_2022_CVPR, author = {Nam, Seonghyeon and Punnappurath, Abhijith and Brubaker, Marcus A. and Brown, Michael S.}, title = {Learning sRGB-to-Raw-RGB De-Rendering With Content-Aware Metadata}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17704-17713} }
Point Cloud Color Constancy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xing_2022_CVPR, author = {Xing, Xiaoyan and Qian, Yanlin and Feng, Sibo and Dong, Yuhan and Matas, Ji\v{r}{\'\i}}, title = {Point Cloud Color Constancy}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19750-19759} }
Towards an End-to-End Framework for Flow-Guided Video Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Zhen and Lu, Cheng-Ze and Qin, Jianhua and Guo, Chun-Le and Cheng, Ming-Ming}, title = {Towards an End-to-End Framework for Flow-Guided Video Inpainting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17562-17571} }
CrossLoc: Scalable Aerial Localization Assisted by Multimodal Synthetic Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2022_CVPR, author = {Yan, Qi and Zheng, Jianhao and Reding, Simon and Li, Shanci and Doytchinov, Iordan}, title = {CrossLoc: Scalable Aerial Localization Assisted by Multimodal Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17358-17368} }
On Learning Contrastive Representations for Learning With Noisy Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yi_2022_CVPR, author = {Yi, Li and Liu, Sheng and She, Qi and McLeod, A. Ian and Wang, Boyu}, title = {On Learning Contrastive Representations for Learning With Noisy Labels}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16682-16691} }
Modeling Indirect Illumination for Inverse Rendering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Yuanqing and Sun, Jiaming and He, Xingyi and Fu, Huan and Jia, Rongfei and Zhou, Xiaowei}, title = {Modeling Indirect Illumination for Inverse Rendering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18643-18652} }
BACON: Band-Limited Coordinate Networks for Multiscale Scene Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lindell_2022_CVPR, author = {Lindell, David B. and Van Veen, Dave and Park, Jeong Joon and Wetzstein, Gordon}, title = {BACON: Band-Limited Coordinate Networks for Multiscale Scene Representation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16252-16262} }
Modeling sRGB Camera Noise With Normalizing Flows-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kousha_2022_CVPR, author = {Kousha, Shayan and Maleky, Ali and Brown, Michael S. and Brubaker, Marcus A.}, title = {Modeling sRGB Camera Noise With Normalizing Flows}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17463-17471} }
Reference-Based Video Super-Resolution Using Multi-Camera Video Triplets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Junyong and Lee, Myeonghee and Cho, Sunghyun and Lee, Seungyong}, title = {Reference-Based Video Super-Resolution Using Multi-Camera Video Triplets}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17824-17833} }
Self-Supervised Image Representation Learning With Geometric Set Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Nenglun and Chu, Lei and Pan, Hao and Lu, Yan and Wang, Wenping}, title = {Self-Supervised Image Representation Learning With Geometric Set Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19292-19302} }
GEN-VLKT: Simplify Association and Enhance Interaction Understanding for HOI Detection-
[pdf]
[bibtex]@InProceedings{Liao_2022_CVPR, author = {Liao, Yue and Zhang, Aixi and Lu, Miao and Wang, Yongliang and Li, Xiaobo and Liu, Si}, title = {GEN-VLKT: Simplify Association and Enhance Interaction Understanding for HOI Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20123-20132} }
Global Matching With Overlapping Attention for Optical Flow Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2022_CVPR,
  author    = {Zhao, Shiyu and Zhao, Long and Zhang, Zhixing and Zhou, Enyu and Metaxas, Dimitris},
  title     = {Global Matching With Overlapping Attention for Optical Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17592--17601},
}
Rethinking Efficient Lane Detection via Curve Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Zhengyang and Guo, Shaohua and Tan, Xin and Xu, Ke and Wang, Min and Ma, Lizhuang},
  title     = {Rethinking Efficient Lane Detection via Curve Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17062--17070},
}
Co-Advise: Cross Inductive Bias Distillation-
[pdf]
[bibtex]@InProceedings{Ren_2022_CVPR,
  author    = {Ren, Sucheng and Gao, Zhengqi and Hua, Tianyu and Xue, Zihui and Tian, Yonglong and He, Shengfeng and Zhao, Hang},
  title     = {{Co-Advise}: Cross Inductive Bias Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16773--16782},
}
DTFD-MIL: Double-Tier Feature Distillation Multiple Instance Learning for Histopathology Whole Slide Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Hongrun and Meng, Yanda and Zhao, Yitian and Qiao, Yihong and Yang, Xiaoyun and Coupland, Sarah E. and Zheng, Yalin},
  title     = {{DTFD-MIL}: Double-Tier Feature Distillation Multiple Instance Learning for Histopathology Whole Slide Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18802--18812},
}
Deep Generalized Unfolding Networks for Image Restoration-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mou_2022_CVPR,
  author    = {Mou, Chong and Wang, Qian and Zhang, Jian},
  title     = {Deep Generalized Unfolding Networks for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17399--17410},
}
Robust Cross-Modal Representation Learning With Progressive Self-Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Andonian_2022_CVPR,
  author    = {Andonian, Alex and Chen, Shixing and Hamid, Raffay},
  title     = {Robust Cross-Modal Representation Learning With Progressive Self-Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16430--16441},
}
Compressive Single-Photon 3D Cameras-
[pdf]
[supp]
[bibtex]@InProceedings{Gutierrez-Barragan_2022_CVPR,
  author    = {Gutierrez-Barragan, Felipe and Ingle, Atul and Seets, Trevor and Gupta, Mohit and Velten, Andreas},
  title     = {Compressive Single-Photon {3D} Cameras},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17854--17864},
}
Rethinking Controllable Variational Autoencoders-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2022_CVPR,
  author    = {Shao, Huajie and Yang, Yifei and Lin, Haohong and Lin, Longzhong and Chen, Yizhuo and Yang, Qinmin and Zhao, Han},
  title     = {Rethinking Controllable Variational Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19250--19259},
}
Boosting Crowd Counting via Multifaceted Attention-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Hui and Ma, Zhiheng and Ji, Rongrong and Wang, Yaowei and Hong, Xiaopeng},
  title     = {Boosting Crowd Counting via Multifaceted Attention},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19628--19637},
}
BigDL 2.0: Seamless Scaling of AI Pipelines From Laptops to Distributed Cluster-
[pdf]
[supp]
[bibtex]@InProceedings{Dai_2022_CVPR,
  author    = {Dai, Jason (Jinquan) and Ding, Ding and Shi, Dongjie and Huang, Shengsheng and Wang, Jiao and Qiu, Xin and Huang, Kai and Song, Guoqiong and Wang, Yang and Gong, Qiyuan and Song, Jiaming and Yu, Shan and Zheng, Le and Chen, Yina and Deng, Junwei and Song, Ge},
  title     = {{BigDL} 2.0: Seamless Scaling of {AI} Pipelines From Laptops to Distributed Cluster},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21439--21446},
}
Acquiring a Dynamic Light Field Through a Single-Shot Coded Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mizuno_2022_CVPR,
  author    = {Mizuno, Ryoya and Takahashi, Keita and Yoshida, Michitaka and Tsutake, Chihiro and Fujii, Toshiaki and Nagahara, Hajime},
  title     = {Acquiring a Dynamic Light Field Through a Single-Shot Coded Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19830--19840},
}
Attentive Fine-Grained Structured Sparsity for Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Oh_2022_CVPR,
  author    = {Oh, Junghun and Kim, Heewon and Nah, Seungjun and Hong, Cheeun and Choi, Jonghyun and Lee, Kyoung Mu},
  title     = {Attentive Fine-Grained Structured Sparsity for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17673--17682},
}
StylizedNeRF: Consistent 3D Scene Stylization As Stylized NeRF via 2D-3D Mutual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2022_CVPR,
  author    = {Huang, Yi-Hua and He, Yue and Yuan, Yu-Jie and Lai, Yu-Kun and Gao, Lin},
  title     = {{StylizedNeRF}: Consistent {3D} Scene Stylization As Stylized {NeRF} via {2D-3D} Mutual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18342--18352},
}
NightLab: A Dual-Level Architecture With Hardness Detection for Segmentation at Night-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deng_2022_CVPR,
  author    = {Deng, Xueqing and Wang, Peng and Lian, Xiaochen and Newsam, Shawn},
  title     = {{NightLab}: A Dual-Level Architecture With Hardness Detection for Segmentation at Night},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16938--16948},
}
InfoGCN: Representation Learning for Human Skeleton-Based Action Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Chi_2022_CVPR,
  author    = {Chi, Hyung-gun and Ha, Myoung Hoon and Chi, Seunggeun and Lee, Sang Wan and Huang, Qixing and Ramani, Karthik},
  title     = {{InfoGCN}: Representation Learning for Human Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20186--20196},
}
Sparse to Dense Dynamic 3D Facial Expression Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Otberdout_2022_CVPR,
  author    = {Otberdout, Naima and Ferrari, Claudio and Daoudi, Mohamed and Berretti, Stefano and Del Bimbo, Alberto},
  title     = {Sparse to Dense Dynamic {3D} Facial Expression Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20385--20394},
}
Crafting Better Contrastive Views for Siamese Representation Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Peng_2022_CVPR,
  author    = {Peng, Xiangyu and Wang, Kai and Zhu, Zheng and Wang, Mang and You, Yang},
  title     = {Crafting Better Contrastive Views for {Siamese} Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16031--16040},
}
Continual Learning for Visual Search With Backward Consistent Feature Embedding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wan_2022_CVPR,
  author    = {Wan, Timmy S. T. and Chen, Jun-Cheng and Wu, Tzer-Yi and Chen, Chu-Song},
  title     = {Continual Learning for Visual Search With Backward Consistent Feature Embedding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16702--16711},
}
EyePAD++: A Distillation-Based Approach for Joint Eye Authentication and Presentation Attack Detection Using Periocular Images-
[pdf]
[supp]
[bibtex]@InProceedings{Dhar_2022_CVPR,
  author    = {Dhar, Prithviraj and Kumar, Amit and Kaplan, Kirsten and Gupta, Khushi and Ranjan, Rakesh and Chellappa, Rama},
  title     = {{EyePAD++}: A Distillation-Based Approach for Joint Eye Authentication and Presentation Attack Detection Using Periocular Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20218--20227},
}
Efficient Two-Stage Detection of Human-Object Interactions With a Novel Unary-Pairwise Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Frederic Z. and Campbell, Dylan and Gould, Stephen},
  title     = {Efficient Two-Stage Detection of Human-Object Interactions With a Novel Unary-Pairwise Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20104--20112},
}
A Low-Cost & Real-Time Motion Capture System-
[pdf]
[bibtex]@InProceedings{Chatzitofis_2022_CVPR,
  author    = {Chatzitofis, Anargyros and Albanis, Georgios and Zioulis, Nikolaos and Thermos, Spyridon},
  title     = {A Low-Cost \& Real-Time Motion Capture System},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21453--21458},
}
Unified Contrastive Learning in Image-Text-Label Space-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Jianwei and Li, Chunyuan and Zhang, Pengchuan and Xiao, Bin and Liu, Ce and Yuan, Lu and Gao, Jianfeng},
  title     = {Unified Contrastive Learning in Image-Text-Label Space},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19163--19173},
}
Unifying Motion Deblurring and Frame Interpolation With Events-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xiang and Yu, Lei},
  title     = {Unifying Motion Deblurring and Frame Interpolation With Events},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17765--17774},
}
Fast Point Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2022_CVPR,
  author    = {Park, Chunghyun and Jeong, Yoonwoo and Cho, Minsu and Park, Jaesik},
  title     = {Fast Point Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16949--16958},
}
Unimodal-Concentrated Loss: Fully Adaptive Label Distribution Learning for Ordinal Regression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Qiang and Wang, Jingjing and Yao, Zhaoliang and Li, Yachun and Yang, Pengju and Yan, Jingwei and Wang, Chunmao and Pu, Shiliang},
  title     = {Unimodal-Concentrated Loss: Fully Adaptive Label Distribution Learning for Ordinal Regression},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20513--20522},
}
Deep Stereo Image Compression via Bi-Directional Coding-
[pdf]
[bibtex]@InProceedings{Lei_2022_CVPR,
  author    = {Lei, Jianjun and Liu, Xiangrui and Peng, Bo and Jin, Dengchao and Li, Wanqing and Gu, Jingxiao},
  title     = {Deep Stereo Image Compression via Bi-Directional Coding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19669--19678},
}
How Good Is Aesthetic Ability of a Fashion Model?-
[pdf]
[supp]
[bibtex]@InProceedings{Zou_2022_CVPR,
  author    = {Zou, Xingxing and Pang, Kaicheng and Zhang, Wen and Wong, Waikeung},
  title     = {How Good Is Aesthetic Ability of a Fashion Model?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21200--21209},
}
Mining Multi-View Information: A Strong Self-Supervised Framework for Depth-Based 3D Hand Pose and Mesh Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Ren_2022_CVPR,
  author    = {Ren, Pengfei and Sun, Haifeng and Hao, Jiachang and Wang, Jingyu and Qi, Qi and Liao, Jianxin},
  title     = {Mining Multi-View Information: A Strong Self-Supervised Framework for Depth-Based {3D} Hand Pose and Mesh Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20555--20565},
}
BTS: A Bi-Lingual Benchmark for Text Segmentation in the Wild-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Xixi and Qi, Zhongang and Ma, Jianqi and Zhang, Honglun and Shan, Ying and Qie, Xiaohu},
  title     = {{BTS}: A Bi-Lingual Benchmark for Text Segmentation in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19152--19162},
}
Hierarchical Modular Network for Video Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2022_CVPR,
  author    = {Ye, Hanhua and Li, Guorong and Qi, Yuankai and Wang, Shuhui and Huang, Qingming and Yang, Ming-Hsuan},
  title     = {Hierarchical Modular Network for Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17939--17948},
}
Alignment-Uniformity Aware Representation Learning for Zero-Shot Video Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pu_2022_CVPR,
  author    = {Pu, Shi and Zhao, Kaili and Zheng, Mao},
  title     = {Alignment-Uniformity Aware Representation Learning for Zero-Shot Video Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19968--19977},
}
LiDARCap: Long-Range Marker-Less 3D Human Motion Capture With LiDAR Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Jialian and Zhang, Jingyi and Wang, Zhiyong and Shen, Siqi and Wen, Chenglu and Ma, Yuexin and Xu, Lan and Yu, Jingyi and Wang, Cheng},
  title     = {{LiDARCap}: Long-Range Marker-Less {3D} Human Motion Capture With {LiDAR} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20502--20512},
}
GeoEngine: A Platform for Production-Ready Geospatial Research-
[pdf]
[bibtex]@InProceedings{Verma_2022_CVPR,
  author    = {Verma, Sagar and Gupta, Siddharth and Shin, Hal and Panigrahi, Akash and Goswami, Shubham and Pardeshi, Shweta and Exe, Natanael and Dutta, Ujwal and Joshi, Tanka Raj and Bhojwani, Nitin},
  title     = {{GeoEngine}: A Platform for Production-Ready Geospatial Research},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21416--21424},
}
GroupViT: Semantic Segmentation Emerges From Text Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Jiarui and De Mello, Shalini and Liu, Sifei and Byeon, Wonmin and Breuel, Thomas and Kautz, Jan and Wang, Xiaolong},
  title     = {{GroupViT}: Semantic Segmentation Emerges From Text Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18134--18144},
}
Occlusion-Aware Cost Constructor for Light Field Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Yingqian and Wang, Longguang and Liang, Zhengyu and Yang, Jungang and An, Wei and Guo, Yulan},
  title     = {Occlusion-Aware Cost Constructor for Light Field Depth Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19809--19818},
}
SmartPortraits: Depth Powered Handheld Smartphone Dataset of Human Portraits for State Estimation, Reconstruction and Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kornilova_2022_CVPR,
  author    = {Kornilova, Anastasiia and Faizullin, Marsel and Pakulev, Konstantin and Sadkov, Andrey and Kukushkin, Denis and Akhmetyanov, Azat and Akhtyamov, Timur and Taherinejad, Hekmat and Ferrer, Gonzalo},
  title     = {{SmartPortraits}: Depth Powered Handheld Smartphone Dataset of Human Portraits for State Estimation, Reconstruction and Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21318--21329},
}
Stacked Hybrid-Attention and Group Collaborative Learning for Unbiased Scene Graph Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Xingning and Gan, Tian and Song, Xuemeng and Wu, Jianlong and Cheng, Yuan and Nie, Liqiang},
  title     = {Stacked Hybrid-Attention and Group Collaborative Learning for Unbiased Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19427--19436},
}
Topology-Preserving Shape Reconstruction and Registration via Neural Diffeomorphic Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Shanlin and Han, Kun and Kong, Deying and Tang, Hao and Yan, Xiangyi and Xie, Xiaohui},
  title     = {Topology-Preserving Shape Reconstruction and Registration via Neural Diffeomorphic Flow},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20845--20855},
}
Learning Part Segmentation Through Unsupervised Domain Adaptation From Synthetic Vehicles-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Qing and Kortylewski, Adam and Zhang, Zhishuai and Li, Zizhang and Guo, Mengqi and Liu, Qihao and Yuan, Xiaoding and Mu, Jiteng and Qiu, Weichao and Yuille, Alan},
  title     = {Learning Part Segmentation Through Unsupervised Domain Adaptation From Synthetic Vehicles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19140--19151},
}
Learning Object Context for Novel-View Scene Layout Generation-
[pdf]
[bibtex]@InProceedings{Qiao_2022_CVPR,
  author    = {Qiao, Xiaotian and Hancke, Gerhard P. and Lau, Rynson W. H.},
  title     = {Learning Object Context for Novel-View Scene Layout Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16990--16999},
}
Neural Fields As Learnable Kernels for 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Williams_2022_CVPR,
  author    = {Williams, Francis and Gojcic, Zan and Khamis, Sameh and Zorin, Denis and Bruna, Joan and Fidler, Sanja and Litany, Or},
  title     = {Neural Fields As Learnable Kernels for {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18500--18510},
}
Detector-Free Weakly Supervised Group Activity Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Dongkeun and Lee, Jinsung and Cho, Minsu and Kwak, Suha},
  title     = {Detector-Free Weakly Supervised Group Activity Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20083--20093},
}
HairCLIP: Design Your Hair by Text and Reference Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2022_CVPR,
  author    = {Wei, Tianyi and Chen, Dongdong and Zhou, Wenbo and Liao, Jing and Tan, Zhentao and Yuan, Lu and Zhang, Weiming and Yu, Nenghai},
  title     = {{HairCLIP}: Design Your Hair by Text and Reference Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18072--18081},
}
OakInk: A Large-Scale Knowledge Repository for Understanding Hand-Object Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Lixin and Li, Kailin and Zhan, Xinyu and Wu, Fei and Xu, Anran and Liu, Liu and Lu, Cewu},
  title     = {{OakInk}: A Large-Scale Knowledge Repository for Understanding Hand-Object Interaction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20953--20962},
}
SwinBERT: End-to-End Transformers With Sparse Attention for Video Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Kevin and Li, Linjie and Lin, Chung-Ching and Ahmed, Faisal and Gan, Zhe and Liu, Zicheng and Lu, Yumao and Wang, Lijuan},
  title     = {{SwinBERT}: End-to-End Transformers With Sparse Attention for Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17949--17958},
}
Maximum Spatial Perturbation Consistency for Unpaired Image-to-Image Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Yanwu and Xie, Shaoan and Wu, Wenhao and Zhang, Kun and Gong, Mingming and Batmanghelich, Kayhan},
  title     = {Maximum Spatial Perturbation Consistency for Unpaired Image-to-Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18311--18320},
}
Bringing Old Films Back to Life-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wan_2022_CVPR,
  author    = {Wan, Ziyu and Zhang, Bo and Chen, Dongdong and Liao, Jing},
  title     = {Bringing Old Films Back to Life},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17694--17703},
}
E2(GO)MOTION: Motion Augmented Event Stream for Egocentric Action Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Plizzari_2022_CVPR,
  author    = {Plizzari, Chiara and Planamente, Mirco and Goletto, Gabriele and Cannici, Marco and Gusso, Emanuele and Matteucci, Matteo and Caputo, Barbara},
  title     = {{E2(GO)MOTION}: Motion Augmented Event Stream for Egocentric Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19935--19947},
}
An Empirical Study of Training End-to-End Vision-and-Language Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dou_2022_CVPR,
  author    = {Dou, Zi-Yi and Xu, Yichong and Gan, Zhe and Wang, Jianfeng and Wang, Shuohang and Wang, Lijuan and Zhu, Chenguang and Zhang, Pengchuan and Yuan, Lu and Peng, Nanyun and Liu, Zicheng and Zeng, Michael},
  title     = {An Empirical Study of Training End-to-End Vision-and-Language Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18166--18176},
}
Multimodal Dynamics: Dynamical Fusion for Trustworthy Multimodal Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2022_CVPR,
  author    = {Han, Zongbo and Yang, Fan and Huang, Junzhou and Zhang, Changqing and Yao, Jianhua},
  title     = {Multimodal Dynamics: Dynamical Fusion for Trustworthy Multimodal Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20707--20717},
}
Unsupervised Homography Estimation With Coplanarity-Aware GAN-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2022_CVPR,
  author    = {Hong, Mingbo and Lu, Yuhang and Ye, Nianjin and Lin, Chunyu and Zhao, Qijun and Liu, Shuaicheng},
  title     = {Unsupervised Homography Estimation With Coplanarity-Aware {GAN}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17663--17672},
}
LIFT: Learning 4D LiDAR Image Fusion Transformer for 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2022_CVPR,
  author    = {Zeng, Yihan and Zhang, Da and Wang, Chunwei and Miao, Zhenwei and Liu, Ting and Zhan, Xin and Hao, Dayang and Ma, Chao},
  title     = {{LIFT}: Learning {4D} {LiDAR} Image Fusion Transformer for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17172--17181},
}
PatchNet: A Simple Face Anti-Spoofing Framework via Fine-Grained Patch Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Chien-Yi and Lu, Yu-Ding and Yang, Shang-Ta and Lai, Shang-Hong},
  title     = {{PatchNet}: A Simple Face Anti-Spoofing Framework via Fine-Grained Patch Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20281--20290},
}
Rethinking Minimal Sufficient Representation in Contrastive Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Haoqing and Guo, Xun and Deng, Zhi-Hong and Lu, Yan},
  title     = {Rethinking Minimal Sufficient Representation in Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16041--16050},
}
Effective Conditioned and Composed Image Retrieval Combining CLIP-Based Features-
[pdf]
[bibtex]@InProceedings{Baldrati_2022_CVPR,
  author    = {Baldrati, Alberto and Bertini, Marco and Uricchio, Tiberio and Del Bimbo, Alberto},
  title     = {Effective Conditioned and Composed Image Retrieval Combining {CLIP}-Based Features},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21466--21474},
}
Practical Stereo Matching via Cascaded Recurrent Network With Adaptive Correlation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiankun and Wang, Peisen and Xiong, Pengfei and Cai, Tao and Yan, Ziwei and Yang, Lei and Liu, Jiangyu and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {Practical Stereo Matching via Cascaded Recurrent Network With Adaptive Correlation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16263--16272},
}
D-Grasp: Physically Plausible Dynamic Grasp Synthesis for Hand-Object Interactions-
[pdf]
[supp]
[bibtex]@InProceedings{Christen_2022_CVPR,
  author    = {Christen, Sammy and Kocabas, Muhammed and Aksan, Emre and Hwangbo, Jemin and Song, Jie and Hilliges, Otmar},
  title     = {{D-Grasp}: Physically Plausible Dynamic Grasp Synthesis for Hand-Object Interactions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20577--20586},
}
Show, Deconfound and Tell: Image Captioning With Causal Inference-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Bing and Wang, Dong and Yang, Xu and Zhou, Yong and Yao, Rui and Shao, Zhiwen and Zhao, Jiaqi},
  title     = {Show, Deconfound and Tell: Image Captioning With Causal Inference},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18041--18050},
}
ImFace: A Nonlinear 3D Morphable Face Model With Implicit Neural Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2022_CVPR,
  author    = {Zheng, Mingwu and Yang, Hongyu and Huang, Di and Chen, Liming},
  title     = {{ImFace}: A Nonlinear {3D} Morphable Face Model With Implicit Neural Representations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20343--20352},
}
MobRecon: Mobile-Friendly Hand Mesh Reconstruction From Monocular Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Xingyu and Liu, Yufeng and Dong, Yajiao and Zhang, Xiong and Ma, Chongyang and Xiong, Yanmin and Zhang, Yuan and Guo, Xiaoyan},
  title     = {{MobRecon}: Mobile-Friendly Hand Mesh Reconstruction From Monocular Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20544--20554},
}
AlignMixup: Improving Representations by Interpolating Aligned Features-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Venkataramanan_2022_CVPR,
  author    = {Venkataramanan, Shashanka and Kijak, Ewa and Amsaleg, Laurent and Avrithis, Yannis},
  title     = {{AlignMixup}: Improving Representations by Interpolating Aligned Features},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19174--19183},
}
HerosNet: Hyperspectral Explicable Reconstruction and Optimal Sampling Deep Network for Snapshot Compressive Imaging-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xuanyu and Zhang, Yongbing and Xiong, Ruiqin and Sun, Qilin and Zhang, Jian},
  title     = {{HerosNet}: Hyperspectral Explicable Reconstruction and Optimal Sampling Deep Network for Snapshot Compressive Imaging},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17532--17541},
}
Detecting Deepfakes With Self-Blended Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shiohara_2022_CVPR,
  author    = {Shiohara, Kaede and Yamasaki, Toshihiko},
  title     = {Detecting Deepfakes With Self-Blended Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18720--18729},
}
Learnable Irrelevant Modality Dropout for Multimodal Action Recognition on Modality-Specific Annotated Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alfasly_2022_CVPR,
  author    = {Alfasly, Saghir and Lu, Jian and Xu, Chen and Zou, Yuru},
  title     = {Learnable Irrelevant Modality Dropout for Multimodal Action Recognition on Modality-Specific Annotated Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20208--20217},
}
Bi-Level Doubly Variational Learning for Energy-Based Latent Variable Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kan_2022_CVPR,
  author    = {Kan, Ge and L{\"u}, Jinhu and Wang, Tian and Zhang, Baochang and Zhu, Aichun and Huang, Lei and Guo, Guodong and Snoussi, Hichem},
  title     = {Bi-Level Doubly Variational Learning for Energy-Based Latent Variable Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18460--18469},
}
AxIoU: An Axiomatically Justified Measure for Video Moment Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Togashi_2022_CVPR,
  author    = {Togashi, Riku and Otani, Mayu and Nakashima, Yuta and Rahtu, Esa and Heikkil{\"a}, Janne and Sakai, Tetsuya},
  title     = {{AxIoU}: An Axiomatically Justified Measure for Video Moment Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21076--21085},
}
NOC-REK: Novel Object Captioning With Retrieved Vocabulary From External Knowledge-
[pdf]
[supp]
[bibtex]@InProceedings{Vo_2022_CVPR, author = {Vo, Duc Minh and Chen, Hong and Sugimoto, Akihiro and Nakayama, Hideki}, title = {NOC-REK: Novel Object Captioning With Retrieved Vocabulary From External Knowledge}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18000-18008} }
Speech Driven Tongue Animation-
[pdf]
[supp]
[bibtex]@InProceedings{Medina_2022_CVPR, author = {Medina, Salvador and Tome, Denis and Stoll, Carsten and Tiede, Mark and Munhall, Kevin and Hauptmann, Alexander G. and Matthews, Iain}, title = {Speech Driven Tongue Animation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20406-20416} }
Hybrid Relation Guided Set Matching for Few-Shot Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Xiang and Zhang, Shiwei and Qing, Zhiwu and Tang, Mingqian and Zuo, Zhengrong and Gao, Changxin and Jin, Rong and Sang, Nong}, title = {Hybrid Relation Guided Set Matching for Few-Shot Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19948-19957} }
SHIFT: A Synthetic Driving Dataset for Continuous Multi-Task Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2022_CVPR, author = {Sun, Tao and Segu, Mattia and Postels, Janis and Wang, Yuxuan and Van Gool, Luc and Schiele, Bernt and Tombari, Federico and Yu, Fisher}, title = {SHIFT: A Synthetic Driving Dataset for Continuous Multi-Task Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21371-21382} }
FlexIT: Towards Flexible Semantic Image Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Couairon_2022_CVPR, author = {Couairon, Guillaume and Grechka, Asya and Verbeek, Jakob and Schwenk, Holger and Cord, Matthieu}, title = {FlexIT: Towards Flexible Semantic Image Translation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18270-18279} }
Face2Exp: Combating Data Biases for Facial Expression Recognition-
[pdf]
[bibtex]@InProceedings{Zeng_2022_CVPR, author = {Zeng, Dan and Lin, Zhiyuan and Yan, Xiao and Liu, Yuting and Wang, Fei and Tang, Bo}, title = {Face2Exp: Combating Data Biases for Facial Expression Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20291-20300} }
PINA: Learning a Personalized Implicit Neural Avatar From a Single RGB-D Video Sequence-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2022_CVPR, author = {Dong, Zijian and Guo, Chen and Song, Jie and Chen, Xu and Geiger, Andreas and Hilliges, Otmar}, title = {PINA: Learning a Personalized Implicit Neural Avatar From a Single RGB-D Video Sequence}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20470-20480} }
Forecasting From LiDAR via Future Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peri_2022_CVPR, author = {Peri, Neehar and Luiten, Jonathon and Li, Mengtian and O{\v{s}}ep, Aljo{\v{s}}a and Leal-Taix{\'e}, Laura and Ramanan, Deva}, title = {Forecasting From LiDAR via Future Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17202-17211} }
CRAFT: Cross-Attentional Flow Transformer for Robust Optical Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sui_2022_CVPR, author = {Sui, Xiuchao and Li, Shaohua and Geng, Xue and Wu, Yan and Xu, Xinxing and Liu, Yong and Goh, Rick and Zhu, Hongyuan}, title = {CRAFT: Cross-Attentional Flow Transformer for Robust Optical Flow}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17602-17611} }
Privacy Preserving Partial Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Geppert_2022_CVPR, author = {Geppert, Marcel and Larsson, Viktor and Sch{\"o}nberger, Johannes L. and Pollefeys, Marc}, title = {Privacy Preserving Partial Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17337-17347} }
Cross-Modal Background Suppression for Audio-Visual Event Localization-
[pdf]
[bibtex]@InProceedings{Xia_2022_CVPR, author = {Xia, Yan and Zhao, Zhou}, title = {Cross-Modal Background Suppression for Audio-Visual Event Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19989-19998} }
Lagrange Motion Analysis and View Embeddings for Improved Gait Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Chai_2022_CVPR, author = {Chai, Tianrui and Li, Annan and Zhang, Shaoxiong and Li, Zilong and Wang, Yunhong}, title = {Lagrange Motion Analysis and View Embeddings for Improved Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20249-20258} }
Neural Mesh Simplification-
[pdf]
[supp]
[bibtex]@InProceedings{Potamias_2022_CVPR, author = {Potamias, Rolandos Alexandros and Ploumpis, Stylianos and Zafeiriou, Stefanos}, title = {Neural Mesh Simplification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18583-18592} }
Deep Hyperspectral-Depth Reconstruction Using Single Color-Dot Projection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Chunyu and Monno, Yusuke and Okutomi, Masatoshi}, title = {Deep Hyperspectral-Depth Reconstruction Using Single Color-Dot Projection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19770-19779} }
M3T: Three-Dimensional Medical Image Classifier Using Multi-Plane and Multi-Slice Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Jang_2022_CVPR, author = {Jang, Jinseong and Hwang, Dosik}, title = {M3T: Three-Dimensional Medical Image Classifier Using Multi-Plane and Multi-Slice Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20718-20729} }
3MASSIV: Multilingual, Multimodal and Multi-Aspect Dataset of Social Media Short Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2022_CVPR, author = {Gupta, Vikram and Mittal, Trisha and Mathur, Puneet and Mishra, Vaibhav and Maheshwari, Mayank and Bera, Aniket and Mukherjee, Debdoot and Manocha, Dinesh}, title = {3MASSIV: Multilingual, Multimodal and Multi-Aspect Dataset of Social Media Short Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21064-21075} }
Structured Sparse R-CNN for Direct Scene Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Teng_2022_CVPR, author = {Teng, Yao and Wang, Limin}, title = {Structured Sparse R-CNN for Direct Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19437-19446} }
Multi-Grained Spatio-Temporal Features Perceived Network for Event-Based Lip-Reading-
[pdf]
[supp]
[bibtex]@InProceedings{Tan_2022_CVPR, author = {Tan, Ganchao and Wang, Yang and Han, Han and Cao, Yang and Wu, Feng and Zha, Zheng-Jun}, title = {Multi-Grained Spatio-Temporal Features Perceived Network for Event-Based Lip-Reading}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20094-20103} }
AnyFace: Free-Style Text-To-Face Synthesis and Manipulation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sun_2022_CVPR, author = {Sun, Jianxin and Deng, Qiyao and Li, Qi and Sun, Muyi and Ren, Min and Sun, Zhenan}, title = {AnyFace: Free-Style Text-To-Face Synthesis and Manipulation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18687-18696} }
HL-Net: Heterophily Learning Network for Scene Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2022_CVPR, author = {Lin, Xin and Ding, Changxing and Zhan, Yibing and Li, Zijian and Tao, Dacheng}, title = {HL-Net: Heterophily Learning Network for Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19476-19485} }
MERLOT Reserve: Neural Script Knowledge Through Vision and Language and Sound-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zellers_2022_CVPR, author = {Zellers, Rowan and Lu, Jiasen and Lu, Ximing and Yu, Youngjae and Zhao, Yanpeng and Salehi, Mohammadreza and Kusupati, Aditya and Hessel, Jack and Farhadi, Ali and Choi, Yejin}, title = {MERLOT Reserve: Neural Script Knowledge Through Vision and Language and Sound}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16375-16387} }
A Conservative Approach for Unbiased Learning on Unknown Biases-
[pdf]
[supp]
[bibtex]@InProceedings{Jeon_2022_CVPR, author = {Jeon, Myeongho and Kim, Daekyung and Lee, Woochul and Kang, Myungjoo and Lee, Joonseok}, title = {A Conservative Approach for Unbiased Learning on Unknown Biases}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16752-16760} }
Large-Scale Video Panoptic Segmentation in the Wild: A Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{Miao_2022_CVPR, author = {Miao, Jiaxu and Wang, Xiaohan and Wu, Yu and Li, Wei and Zhang, Xu and Wei, Yunchao and Yang, Yi}, title = {Large-Scale Video Panoptic Segmentation in the Wild: A Benchmark}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21033-21043} }
GrainSpace: A Large-Scale Dataset for Fine-Grained and Domain-Adaptive Recognition of Cereal Grains-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2022_CVPR, author = {Fan, Lei and Ding, Yiwen and Fan, Dongdong and Di, Donglin and Pagnucco, Maurice and Song, Yang}, title = {GrainSpace: A Large-Scale Dataset for Fine-Grained and Domain-Adaptive Recognition of Cereal Grains}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21116-21125} }
BokehMe: When Neural Rendering Meets Classical Rendering-
[pdf]
[supp]
[bibtex]@InProceedings{Peng_2022_CVPR, author = {Peng, Juewen and Cao, Zhiguo and Luo, Xianrui and Lu, Hao and Xian, Ke and Zhang, Jianming}, title = {BokehMe: When Neural Rendering Meets Classical Rendering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16283-16292} }
Learning Modal-Invariant and Temporal-Memory for Video-Based Visible-Infrared Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2022_CVPR, author = {Lin, Xinyu and Li, Jinxing and Ma, Zeyu and Li, Huafeng and Li, Shuang and Xu, Kaixiong and Lu, Guangming and Zhang, David}, title = {Learning Modal-Invariant and Temporal-Memory for Video-Based Visible-Infrared Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20973-20982} }
BigDatasetGAN: Synthesizing ImageNet With Pixel-Wise Annotations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Daiqing and Ling, Huan and Kim, Seung Wook and Kreis, Karsten and Fidler, Sanja and Torralba, Antonio}, title = {BigDatasetGAN: Synthesizing ImageNet With Pixel-Wise Annotations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21330-21340} }
Align Representations With Base: A New Approach to Self-Supervised Learning-
[pdf]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Shaofeng and Qiu, Lyn and Zhu, Feng and Yan, Junchi and Zhang, Hengrui and Zhao, Rui and Li, Hongyang and Yang, Xiaokang}, title = {Align Representations With Base: A New Approach to Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16600-16609} }
Exploring Denoised Cross-Video Contrast for Weakly-Supervised Temporal Action Localization-
[pdf]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Jingjing and Yang, Tianyu and Ji, Wei and Wang, Jue and Cheng, Li}, title = {Exploring Denoised Cross-Video Contrast for Weakly-Supervised Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19914-19924} }
SVIP: Sequence VerIfication for Procedures in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qian_2022_CVPR, author = {Qian, Yicheng and Luo, Weixin and Lian, Dongze and Tang, Xu and Zhao, Peilin and Gao, Shenghua}, title = {SVIP: Sequence VerIfication for Procedures in Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19890-19902} }
Low-Resource Adaptation for Personalized Co-Speech Gesture Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Ahuja_2022_CVPR, author = {Ahuja, Chaitanya and Lee, Dong Won and Morency, Louis-Philippe}, title = {Low-Resource Adaptation for Personalized Co-Speech Gesture Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20566-20576} }
HDR-NeRF: High Dynamic Range Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2022_CVPR, author = {Huang, Xin and Zhang, Qi and Feng, Ying and Li, Hongdong and Wang, Xuan and Wang, Qing}, title = {HDR-NeRF: High Dynamic Range Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18398-18408} }
Neural Emotion Director: Speech-Preserving Semantic Control of Facial Expressions in "In-the-Wild" Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Papantoniou_2022_CVPR, author = {Papantoniou, Foivos Paraperas and Filntisis, Panagiotis P. and Maragos, Petros and Roussos, Anastasios}, title = {Neural Emotion Director: Speech-Preserving Semantic Control of Facial Expressions in ``In-the-Wild'' Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18781-18790} }
Learning To Listen: Modeling Non-Deterministic Dyadic Facial Motion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ng_2022_CVPR, author = {Ng, Evonne and Joo, Hanbyul and Hu, Liwen and Li, Hao and Darrell, Trevor and Kanazawa, Angjoo and Ginosar, Shiry}, title = {Learning To Listen: Modeling Non-Deterministic Dyadic Facial Motion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20395-20405} }
3PSDF: Three-Pole Signed Distance Function for Learning Surfaces With Arbitrary Topologies-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Weikai and Lin, Cheng and Li, Weiyang and Yang, Bo}, title = {3PSDF: Three-Pole Signed Distance Function for Learning Surfaces With Arbitrary Topologies}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18522-18531} }
GIRAFFE HD: A High-Resolution 3D-Aware Generative Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xue_2022_CVPR, author = {Xue, Yang and Li, Yuheng and Singh, Krishna Kumar and Lee, Yong Jae}, title = {GIRAFFE HD: A High-Resolution 3D-Aware Generative Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18440-18449} }
Knowledge-Driven Self-Supervised Representation Learning for Facial Action Unit Recognition-
[pdf]
[bibtex]@InProceedings{Chang_2022_CVPR, author = {Chang, Yanan and Wang, Shangfei}, title = {Knowledge-Driven Self-Supervised Representation Learning for Facial Action Unit Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20417-20426} }
Learning Second Order Local Anomaly for General Face Forgery Detection-
[pdf]
[bibtex]@InProceedings{Fei_2022_CVPR, author = {Fei, Jianwei and Dai, Yunshu and Yu, Peipeng and Shen, Tianrun and Xia, Zhihua and Weng, Jian}, title = {Learning Second Order Local Anomaly for General Face Forgery Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20270-20280} }
ADAS: A Direct Adaptation Strategy for Multi-Target Domain Adaptive Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Seunghun and Choi, Wonhyeok and Kim, Changjae and Choi, Minwoo and Im, Sunghoon}, title = {ADAS: A Direct Adaptation Strategy for Multi-Target Domain Adaptive Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19196-19206} }
The Devil Is in the Labels: Noisy Label Correction for Robust Scene Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Lin and Chen, Long and Huang, Yifeng and Zhang, Zhimeng and Zhang, Songyang and Xiao, Jun}, title = {The Devil Is in the Labels: Noisy Label Correction for Robust Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18869-18878} }
LAVT: Language-Aware Vision Transformer for Referring Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR, author = {Yang, Zhao and Wang, Jiaqi and Tang, Yansong and Chen, Kai and Zhao, Hengshuang and Torr, Philip H. S.}, title = {LAVT: Language-Aware Vision Transformer for Referring Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18155-18165} }
Video Demoireing With Relation-Based Temporal Consistency-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dai_2022_CVPR, author = {Dai, Peng and Yu, Xin and Ma, Lan and Zhang, Baoheng and Li, Jia and Li, Wenbo and Shen, Jiajun and Qi, Xiaojuan}, title = {Video Demoireing With Relation-Based Temporal Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17622-17631} }
GraFormer: Graph-Oriented Transformer for 3D Pose Estimation-
[pdf]
[bibtex]@InProceedings{Zhao_2022_CVPR, author = {Zhao, Weixi and Wang, Weiqiang and Tian, Yunjie}, title = {GraFormer: Graph-Oriented Transformer for 3D Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20438-20447} }
DeepCurrents: Learning Implicit Representations of Shapes With Boundaries-
[pdf]
[arXiv]
[bibtex]@InProceedings{Palmer_2022_CVPR, author = {Palmer, David and Smirnov, Dmitriy and Wang, Stephanie and Chern, Albert and Solomon, Justin}, title = {DeepCurrents: Learning Implicit Representations of Shapes With Boundaries}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18665-18675} }
Zero Experience Required: Plug & Play Modular Transfer Learning for Semantic Visual Navigation-
[pdf]
[supp]
[bibtex]@InProceedings{Al-Halah_2022_CVPR, author = {Al-Halah, Ziad and Ramakrishnan, Santhosh Kumar and Grauman, Kristen}, title = {Zero Experience Required: Plug \& Play Modular Transfer Learning for Semantic Visual Navigation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17031-17041} }
The Wanderings of Odysseus in 3D Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Yan and Tang, Siyu}, title = {The Wanderings of Odysseus in 3D Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20481-20491} }
All-in-One Image Restoration for Unknown Corruption-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Boyun and Liu, Xiao and Hu, Peng and Wu, Zhongqin and Lv, Jiancheng and Peng, Xi}, title = {All-in-One Image Restoration for Unknown Corruption}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17452-17462} }
Optimizing Video Prediction via Video Frame Interpolation-
[pdf]
[bibtex]@InProceedings{Wu_2022_CVPR, author = {Wu, Yue and Wen, Qiang and Chen, Qifeng}, title = {Optimizing Video Prediction via Video Frame Interpolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17814-17823} }
Episodic Memory Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Datta_2022_CVPR, author = {Datta, Samyak and Dharur, Sameer and Cartillier, Vincent and Desai, Ruta and Khanna, Mukul and Batra, Dhruv and Parikh, Devi}, title = {Episodic Memory Question Answering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19119-19128} }
Continual Stereo Matching of Continuous Driving Scenes With Growing Architecture-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Chenghao and Tian, Kun and Fan, Bin and Meng, Gaofeng and Zhang, Zhaoxiang and Pan, Chunhong}, title = {Continual Stereo Matching of Continuous Driving Scenes With Growing Architecture}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18901-18910} }
Learning To Zoom Inside Camera Imaging Pipeline-
[pdf]
[supp]
[bibtex]@InProceedings{Tang_2022_CVPR, author = {Tang, Chengzhou and Yang, Yuqiang and Zeng, Bing and Tan, Ping and Liu, Shuaicheng}, title = {Learning To Zoom Inside Camera Imaging Pipeline}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17552-17561} }
gDNA: Towards Generative Detailed Neural Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Xu and Jiang, Tianjian and Song, Jie and Yang, Jinlong and Black, Michael J. and Geiger, Andreas and Hilliges, Otmar}, title = {gDNA: Towards Generative Detailed Neural Avatars}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20427-20437} }
Degree-of-Linear-Polarization-Based Color Constancy-
[pdf]
[supp]
[bibtex]@InProceedings{Ono_2022_CVPR, author = {Ono, Taishi and Kondo, Yuhi and Sun, Legong and Kurita, Teppei and Moriuchi, Yusuke}, title = {Degree-of-Linear-Polarization-Based Color Constancy}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19740-19749} }
On the Importance of Asymmetry for Siamese Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Xiao and Fan, Haoqi and Tian, Yuandong and Kihara, Daisuke and Chen, Xinlei}, title = {On the Importance of Asymmetry for Siamese Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16570-16579} }
Probing Representation Forgetting in Supervised and Unsupervised Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Davari_2022_CVPR, author = {Davari, MohammadReza and Asadi, Nader and Mudur, Sudhir and Aljundi, Rahaf and Belilovsky, Eugene}, title = {Probing Representation Forgetting in Supervised and Unsupervised Continual Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16712-16721} }
DenseCLIP: Language-Guided Dense Prediction With Context-Aware Prompting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rao_2022_CVPR, author = {Rao, Yongming and Zhao, Wenliang and Chen, Guangyi and Tang, Yansong and Zhu, Zheng and Huang, Guan and Zhou, Jie and Lu, Jiwen}, title = {DenseCLIP: Language-Guided Dense Prediction With Context-Aware Prompting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18082-18091} }
JRDB-Act: A Large-Scale Dataset for Spatio-Temporal Action, Social Group and Activity Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Ehsanpour_2022_CVPR, author = {Ehsanpour, Mahsa and Saleh, Fatemeh and Savarese, Silvio and Reid, Ian and Rezatofighi, Hamid}, title = {JRDB-Act: A Large-Scale Dataset for Spatio-Temporal Action, Social Group and Activity Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20983-20992} }
AR-NeRF: Unsupervised Learning of Depth and Defocus Effects From Natural Images With Aperture Rendering Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Kaneko_2022_CVPR, author = {Kaneko, Takuhiro}, title = {AR-NeRF: Unsupervised Learning of Depth and Defocus Effects From Natural Images With Aperture Rendering Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18387-18397} }
Decoupling and Recoupling Spatiotemporal Representation for RGB-D-Based Motion Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2022_CVPR, author = {Zhou, Benjia and Wang, Pichao and Wan, Jun and Liang, Yanyan and Wang, Fan and Zhang, Du and Lei, Zhen and Li, Hao and Jin, Rong}, title = {Decoupling and Recoupling Spatiotemporal Representation for RGB-D-Based Motion Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20154-20163} }
Towards Robust and Adaptive Motion Forecasting: A Causal Representation Perspective-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Yuejiang and Cadei, Riccardo and Schweizer, Jonas and Bahmani, Sherwin and Alahi, Alexandre}, title = {Towards Robust and Adaptive Motion Forecasting: A Causal Representation Perspective}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17081-17092} }
Escaping Data Scarcity for High-Resolution Heterogeneous Face Hallucination-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mei_2022_CVPR, author = {Mei, Yiqun and Guo, Pengfei and Patel, Vishal M.}, title = {Escaping Data Scarcity for High-Resolution Heterogeneous Face Hallucination}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18676-18686} }
Visual Acoustic Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Changan and Gao, Ruohan and Calamia, Paul and Grauman, Kristen}, title = {Visual Acoustic Matching}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18858-18868} }
Unified Multivariate Gaussian Mixture for Efficient Neural Image Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2022_CVPR, author = {Zhu, Xiaosu and Song, Jingkuan and Gao, Lianli and Zheng, Feng and Shen, Heng Tao}, title = {Unified Multivariate Gaussian Mixture for Efficient Neural Image Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17612-17621} }
3D Photo Stylization: Learning To Generate Stylized Novel Views From a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mu_2022_CVPR, author = {Mu, Fangzhou and Wang, Jian and Wu, Yicheng and Li, Yin}, title = {3D Photo Stylization: Learning To Generate Stylized Novel Views From a Single Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16273-16282} }
SelfD: Self-Learning Large-Scale Driving Policies From the Web-
[pdf]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Jimuyang and Zhu, Ruizhao and Ohn-Bar, Eshed}, title = {SelfD: Self-Learning Large-Scale Driving Policies From the Web}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17316-17326} }
"The Pedestrian Next to the Lamppost" Adaptive Object Graphs for Better Instantaneous Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saha_2022_CVPR, author = {Saha, Avishkar and Mendez, Oscar and Russell, Chris and Bowden, Richard}, title = {``The Pedestrian Next to the Lamppost'' Adaptive Object Graphs for Better Instantaneous Mapping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19528-19537} }
Surpassing the Human Accuracy: Detecting Gallbladder Cancer From USG Images With Curriculum Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Basu_2022_CVPR, author = {Basu, Soumen and Gupta, Mayank and Rana, Pratyaksha and Gupta, Pankaj and Arora, Chetan}, title = {Surpassing the Human Accuracy: Detecting Gallbladder Cancer From USG Images With Curriculum Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20886-20896} }
Autofocus for Event Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2022_CVPR, author = {Lin, Shijie and Zhang, Yinqiang and Yu, Lei and Zhou, Bin and Luo, Xiaowei and Pan, Jia}, title = {Autofocus for Event Cameras}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16344-16353} }
Learning Multiple Adverse Weather Removal via Two-Stage Knowledge Learning and Multi-Contrastive Regularization: Toward a Unified Model-
[pdf]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Wei-Ting and Huang, Zhi-Kai and Tsai, Cheng-Che and Yang, Hao-Hsiang and Ding, Jian-Jiun and Kuo, Sy-Yen}, title = {Learning Multiple Adverse Weather Removal via Two-Stage Knowledge Learning and Multi-Contrastive Regularization: Toward a Unified Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17653-17662} }
L-Verse: Bidirectional Generation Between Image and Text-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2022_CVPR, author = {Kim, Taehoon and Song, Gwangmo and Lee, Sihaeng and Kim, Sangyun and Seo, Yewon and Lee, Soonyoung and Kim, Seung Hwan and Lee, Honglak and Bae, Kyunghoon}, title = {L-Verse: Bidirectional Generation Between Image and Text}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16526-16536} }
Self-Supervised Learning of Adversarial Example: Towards Good Generalizations for Deepfake Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Liang and Zhang, Yong and Song, Yibing and Liu, Lingqiao and Wang, Jue}, title = {Self-Supervised Learning of Adversarial Example: Towards Good Generalizations for Deepfake Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18710-18719} }
Ego4D: Around the World in 3,000 Hours of Egocentric Video-
[pdf]
[supp]
[bibtex]@InProceedings{Grauman_2022_CVPR, author = {Grauman, Kristen and Westbury, Andrew and Byrne, Eugene and Chavis, Zachary and Furnari, Antonino and Girdhar, Rohit and Hamburger, Jackson and Jiang, Hao and Liu, Miao and Liu, Xingyu and Martin, Miguel and Nagarajan, Tushar and Radosavovic, Ilija and Ramakrishnan, Santhosh Kumar and Ryan, Fiona and Sharma, Jayant and Wray, Michael and Xu, Mengmeng and Xu, Eric Zhongcong and Zhao, Chen and Bansal, Siddhant and Batra, Dhruv and Cartillier, Vincent and Crane, Sean and Do, Tien and Doulaty, Morrie and Erapalli, Akshay and Feichtenhofer, Christoph and Fragomeni, Adriano and Fu, Qichen and Gebreselasie, Abrham and Gonz\'alez, Cristina and Hillis, James and Huang, Xuhua and Huang, Yifei and Jia, Wenqi and Khoo, Weslie and Kol\'a\v{r}, J\'achym and Kottur, Satwik and Kumar, Anurag and Landini, Federico and Li, Chao and Li, Yanghao and Li, Zhenqiang and Mangalam, Karttikeya and Modhugu, Raghava and Munro, Jonathan and Murrell, Tullie and Nishiyasu, Takumi and Price, Will and Ruiz, Paola and Ramazanova, Merey and Sari, Leda and Somasundaram, Kiran and Southerland, Audrey and Sugano, Yusuke and Tao, Ruijie and Vo, Minh and Wang, Yuchen and Wu, Xindi and Yagi, Takuma and Zhao, Ziwei and Zhu, Yunyi and Arbel\'aez, Pablo and Crandall, David and Damen, Dima and Farinella, Giovanni Maria and Fuegen, Christian and Ghanem, Bernard and Ithapu, Vamsi Krishna and Jawahar, C. V. and Joo, Hanbyul and Kitani, Kris and Li, Haizhou and Newcombe, Richard and Oliva, Aude and Park, Hyun Soo and Rehg, James M. and Sato, Yoichi and Shi, Jianbo and Shou, Mike Zheng and Torralba, Antonio and Torresani, Lorenzo and Yan, Mingfei and Malik, Jitendra}, title = {Ego4D: Around the World in 3,000 Hours of Egocentric Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18995-19012} }
Self-Supervised Pre-Training of Swin Transformers for 3D Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2022_CVPR, author = {Tang, Yucheng and Yang, Dong and Li, Wenqi and Roth, Holger R. and Landman, Bennett and Xu, Daguang and Nath, Vishwesh and Hatamizadeh, Ali}, title = {Self-Supervised Pre-Training of Swin Transformers for 3D Medical Image Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20730-20740} }
Camera-Conditioned Stable Feature Generation for Isolated Camera Supervised Person Re-IDentification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wu_2022_CVPR, author = {Wu, Chao and Ge, Wenhang and Wu, Ancong and Chang, Xiaobin}, title = {Camera-Conditioned Stable Feature Generation for Isolated Camera Supervised Person Re-IDentification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20238-20248} }
Weakly Supervised Semantic Segmentation Using Out-of-Distribution Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Jungbeom and Oh, Seong Joon and Yun, Sangdoo and Choe, Junsuk and Kim, Eunji and Yoon, Sungroh}, title = {Weakly Supervised Semantic Segmentation Using Out-of-Distribution Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16897-16906} }
Point-Level Region Contrast for Object Detection Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2022_CVPR, author = {Bai, Yutong and Chen, Xinlei and Kirillov, Alexander and Yuille, Alan and Berg, Alexander C.}, title = {Point-Level Region Contrast for Object Detection Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16061-16070} }
Spatial-Temporal Parallel Transformer for Arm-Hand Dynamic Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Shuying and Wu, Wenbin and Wu, Jiaxian and Lin, Yue}, title = {Spatial-Temporal Parallel Transformer for Arm-Hand Dynamic Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20523-20532} }
Failure Modes of Domain Generalization Algorithms-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Galstyan_2022_CVPR, author = {Galstyan, Tigran and Harutyunyan, Hrayr and Khachatrian, Hrant and Ver Steeg, Greg and Galstyan, Aram}, title = {Failure Modes of Domain Generalization Algorithms}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19077-19086} }
Class Similarity Weighted Knowledge Distillation for Continual Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Phan_2022_CVPR, author = {Phan, Minh Hieu and Ta, The-Anh and Phung, Son Lam and Tran-Thanh, Long and Bouzerdoum, Abdesselam}, title = {Class Similarity Weighted Knowledge Distillation for Continual Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16866-16875} }
DAD-3DHeads: A Large-Scale Dense, Accurate and Diverse Dataset for 3D Head Alignment From a Single Image-
[pdf]
[supp]
[bibtex]@InProceedings{Martyniuk_2022_CVPR, author = {Martyniuk, Tetiana and Kupyn, Orest and Kurlyak, Yana and Krashenyi, Igor and Matas, Ji\v{r}{\'\i} and Sharmanska, Viktoriia}, title = {DAD-3DHeads: A Large-Scale Dense, Accurate and Diverse Dataset for 3D Head Alignment From a Single Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20942-20952} }
vCLIMB: A Novel Video Class Incremental Learning Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Villa_2022_CVPR, author = {Villa, Andr\'es and Alhamoud, Kumail and Escorcia, Victor and Caba, Fabian and Alc\'azar, Juan Le\'on and Ghanem, Bernard}, title = {vCLIMB: A Novel Video Class Incremental Learning Benchmark}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19035-19044} }
Bending Reality: Distortion-Aware Transformers for Adapting to Panoramic Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Jiaming and Yang, Kailun and Ma, Chaoxiang and Rei{\ss}, Simon and Peng, Kunyu and Stiefelhagen, Rainer}, title = {Bending Reality: Distortion-Aware Transformers for Adapting to Panoramic Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16917-16927} }
INS-Conv: Incremental Sparse Convolution for Online 3D Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Leyao and Zheng, Tian and Lin, Yun-Jou and Ni, Kai and Fang, Lu}, title = {INS-Conv: Incremental Sparse Convolution for Online 3D Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18975-18984} }
Visual Vibration Tomography: Estimating Interior Material Properties From Monocular Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2022_CVPR, author = {Feng, Berthy T. and Ogren, Alexander C. and Daraio, Chiara and Bouman, Katherine L.}, title = {Visual Vibration Tomography: Estimating Interior Material Properties From Monocular Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16231-16240} }
Rope3D: The Roadside Perception Dataset for Autonomous Driving and Monocular 3D Object Detection Task-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2022_CVPR, author = {Ye, Xiaoqing and Shu, Mao and Li, Hanyu and Shi, Yifeng and Li, Yingying and Wang, Guangjie and Tan, Xiao and Ding, Errui}, title = {Rope3D: The Roadside Perception Dataset for Autonomous Driving and Monocular 3D Object Detection Task}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21341-21350} }
Noisy Boundaries: Lemon or Lemonade for Semi-Supervised Instance Segmentation?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Zhenyu and Li, Yali and Wang, Shengjin}, title = {Noisy Boundaries: Lemon or Lemonade for Semi-Supervised Instance Segmentation?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16826-16835} }
Boosting View Synthesis With Residual Transfer-
[pdf]
[bibtex]@InProceedings{Rong_2022_CVPR, author = {Rong, Xuejian and Huang, Jia-Bin and Saraf, Ayush and Kim, Changil and Kopf, Johannes}, title = {Boosting View Synthesis With Residual Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19760-19769} }
Think Global, Act Local: Dual-Scale Graph Transformer for Vision-and-Language Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Shizhe and Guhur, Pierre-Louis and Tapaswi, Makarand and Schmid, Cordelia and Laptev, Ivan}, title = {Think Global, Act Local: Dual-Scale Graph Transformer for Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16537-16547} }
Towards Layer-Wise Image Vectorization-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2022_CVPR, author = {Ma, Xu and Zhou, Yuqian and Xu, Xingqian and Sun, Bin and Filev, Valerii and Orlov, Nikita and Fu, Yun and Shi, Humphrey}, title = {Towards Layer-Wise Image Vectorization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16314-16323} }
Scenic: A JAX Library for Computer Vision Research and Beyond-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dehghani_2022_CVPR, author = {Dehghani, Mostafa and Gritsenko, Alexey and Arnab, Anurag and Minderer, Matthias and Tay, Yi}, title = {Scenic: A JAX Library for Computer Vision Research and Beyond}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21393-21398} }
CNN Filter DB: An Empirical Investigation of Trained Convolutional Filters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gavrikov_2022_CVPR, author = {Gavrikov, Paul and Keuper, Janis}, title = {CNN Filter DB: An Empirical Investigation of Trained Convolutional Filters}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19066-19076} }
ScePT: Scene-Consistent, Policy-Based Trajectory Predictions for Planning-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2022_CVPR, author = {Chen, Yuxiao and Ivanovic, Boris and Pavone, Marco}, title = {ScePT: Scene-Consistent, Policy-Based Trajectory Predictions for Planning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17103-17112} }
Deep Saliency Prior for Reducing Visual Distraction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Aberman_2022_CVPR, author = {Aberman, Kfir and He, Junfeng and Gandelsman, Yossi and Mosseri, Inbar and Jacobs, David E. and Kohlhoff, Kai and Pritch, Yael and Rubinstein, Michael}, title = {Deep Saliency Prior for Reducing Visual Distraction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19851-19860} }
Efficient Large-Scale Localization by Global Instance Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Xue_2022_CVPR, author = {Xue, Fei and Budvytis, Ignas and Olmeda Reino, Daniel and Cipolla, Roberto}, title = {Efficient Large-Scale Localization by Global Instance Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17348-17357} }
Spatial Commonsense Graph for Object Localisation in Partial Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Giuliari_2022_CVPR, author = {Giuliari, Francesco and Skenderi, Geri and Cristani, Marco and Wang, Yiming and Del Bue, Alessio}, title = {Spatial Commonsense Graph for Object Localisation in Partial Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19518-19527} }
Physically-Guided Disentangled Implicit Rendering for 3D Face Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Zhenyu and Ge, Yanhao and Tai, Ying and Cao, Weijian and Chen, Renwang and Liu, Kunlin and Tang, Hao and Huang, Xiaoming and Wang, Chengjie and Xie, Zhifeng and Huang, Dongjin}, title = {Physically-Guided Disentangled Implicit Rendering for 3D Face Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20353-20363} }
M5Product: Self-Harmonized Contrastive Learning for E-Commercial Multi-Modal Pretraining-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2022_CVPR, author = {Dong, Xiao and Zhan, Xunlin and Wu, Yangxin and Wei, Yunchao and Kampffmeyer, Michael C. and Wei, Xiaoyong and Lu, Minlong and Wang, Yaowei and Liang, Xiaodan}, title = {M5Product: Self-Harmonized Contrastive Learning for E-Commercial Multi-Modal Pretraining}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21252-21262} }
On Guiding Visual Attention With Language Specification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Petryk_2022_CVPR, author = {Petryk, Suzanne and Dunlap, Lisa and Nasseri, Keyan and Gonzalez, Joseph and Darrell, Trevor and Rohrbach, Anna}, title = {On Guiding Visual Attention With Language Specification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18092-18102} }
ReSTR: Convolution-Free Referring Image Segmentation Using Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2022_CVPR, author = {Kim, Namyup and Kim, Dongwon and Lan, Cuiling and Zeng, Wenjun and Kwak, Suha}, title = {ReSTR: Convolution-Free Referring Image Segmentation Using Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18145-18154} }
Use All the Labels: A Hierarchical Multi-Label Contrastive Learning Framework-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Shu and Xu, Ran and Xiong, Caiming and Ramaiah, Chetan}, title = {Use All the Labels: A Hierarchical Multi-Label Contrastive Learning Framework}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16660-16669} }
SGTR: End-to-End Scene Graph Generation With Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Rongjie and Zhang, Songyang and He, Xuming}, title = {SGTR: End-to-End Scene Graph Generation With Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19486-19496} }
Set-Supervised Action Learning in Procedural Task Videos via Pairwise Order Consistency-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2022_CVPR, author = {Lu, Zijia and Elhamifar, Ehsan}, title = {Set-Supervised Action Learning in Procedural Task Videos via Pairwise Order Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19903-19913} }
DeepFusion: Lidar-Camera Deep Fusion for Multi-Modal 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Yingwei and Yu, Adams Wei and Meng, Tianjian and Caine, Ben and Ngiam, Jiquan and Peng, Daiyi and Shen, Junyang and Lu, Yifeng and Zhou, Denny and Le, Quoc V. and Yuille, Alan and Tan, Mingxing}, title = {DeepFusion: Lidar-Camera Deep Fusion for Multi-Modal 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17182-17191} }
DeepFace-EMD: Re-Ranking Using Patch-Wise Earth Mover's Distance Improves Out-of-Distribution Face Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Phan_2022_CVPR, author = {Phan, Hai and Nguyen, Anh}, title = {DeepFace-EMD: Re-Ranking Using Patch-Wise Earth Mover's Distance Improves Out-of-Distribution Face Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20259-20269} }
General Facial Representation Learning in a Visual-Linguistic Manner-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2022_CVPR, author = {Zheng, Yinglin and Yang, Hao and Zhang, Ting and Bao, Jianmin and Chen, Dongdong and Huang, Yangyu and Yuan, Lu and Chen, Dong and Zeng, Ming and Wen, Fang}, title = {General Facial Representation Learning in a Visual-Linguistic Manner}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18697-18709} }
Improving Segmentation of the Inferior Alveolar Nerve Through Deep Label Propagation-
[pdf]
[bibtex]@InProceedings{Cipriano_2022_CVPR, author = {Cipriano, Marco and Allegretti, Stefano and Bolelli, Federico and Pollastri, Federico and Grana, Costantino}, title = {Improving Segmentation of the Inferior Alveolar Nerve Through Deep Label Propagation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {21137-21146} }
Dual-Shutter Optical Vibration Sensing-
[pdf]
[supp]
[bibtex]@InProceedings{Sheinin_2022_CVPR, author = {Sheinin, Mark and Chan, Dorian and O'Toole, Matthew and Narasimhan, Srinivasa G.}, title = {Dual-Shutter Optical Vibration Sensing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16324-16333} }
Interactiveness Field in Human-Object Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Xinpeng and Li, Yong-Lu and Wu, Xiaoqian and Tai, Yu-Wing and Lu, Cewu and Tang, Chi-Keung}, title = {Interactiveness Field in Human-Object Interactions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20113-20122} }
Self-Supervised Dense Consistency Regularization for Image-to-Image Translation-
[pdf]
[supp]
[bibtex]@InProceedings{Ko_2022_CVPR, author = {Ko, Minsu and Cha, Eunju and Suh, Sungjoo and Lee, Huijin and Han, Jae-Joon and Shin, Jinwoo and Han, Bohyung}, title = {Self-Supervised Dense Consistency Regularization for Image-to-Image Translation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18301-18310} }
The Devil Is in the Details: Window-Based Attention for Image Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zou_2022_CVPR, author = {Zou, Renjie and Song, Chunfeng and Zhang, Zhaoxiang}, title = {The Devil Is in the Details: Window-Based Attention for Image Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17492-17501} }
Category-Aware Transformer Network for Better Human-Object Interaction Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2022_CVPR, author = {Dong, Leizhen and Li, Zhimin and Xu, Kunlun and Zhang, Zhijun and Yan, Luxin and Zhong, Sheng and Zou, Xu}, title = {Category-Aware Transformer Network for Better Human-Object Interaction Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19538-19547} }
LARGE: Latent-Based Regression Through GAN Semantics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nitzan_2022_CVPR, author = {Nitzan, Yotam and Gal, Rinon and Brenner, Ofir and Cohen-Or, Daniel}, title = {LARGE: Latent-Based Regression Through GAN Semantics}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19239-19249} }
Are Multimodal Transformers Robust to Missing Modality?-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ma_2022_CVPR, author = {Ma, Mengmeng and Ren, Jian and Zhao, Long and Testuggine, Davide and Peng, Xi}, title = {Are Multimodal Transformers Robust to Missing Modality?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18177-18186} }
Fisher Information Guidance for Learned Time-of-Flight Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Jiaqu and Yue, Tao and Zhao, Sijie and Hu, Xuemei}, title = {Fisher Information Guidance for Learned Time-of-Flight Imaging}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16334-16343} }
VRDFormer: End-to-End Video Visual Relation Detection With Transformers-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2022_CVPR, author = {Zheng, Sipeng and Chen, Shizhe and Jin, Qin}, title = {VRDFormer: End-to-End Video Visual Relation Detection With Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18836-18846} }
CLIPstyler: Image Style Transfer With a Single Text Condition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kwon_2022_CVPR, author = {Kwon, Gihyun and Ye, Jong Chul}, title = {CLIPstyler: Image Style Transfer With a Single Text Condition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18062-18071} }
Ray Priors Through Reprojection: Improving Neural Radiance Fields for Novel View Extrapolation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR, author = {Zhang, Jian and Zhang, Yuanqing and Fu, Huan and Zhou, Xiaowei and Cai, Bowen and Huang, Jinchi and Jia, Rongfei and Zhao, Binqiang and Tang, Xing}, title = {Ray Priors Through Reprojection: Improving Neural Radiance Fields for Novel View Extrapolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18376-18386} }
Spatio-Temporal Relation Modeling for Few-Shot Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thatipelli_2022_CVPR, author = {Thatipelli, Anirudh and Narayan, Sanath and Khan, Salman and Anwer, Rao Muhammad and Khan, Fahad Shahbaz and Ghanem, Bernard}, title = {Spatio-Temporal Relation Modeling for Few-Shot Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19958-19967} }
Pop-Out Motion: 3D-Aware Image Deformation via Learning the Shape Laplacian-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2022_CVPR, author = {Lee, Jihyun and Sung, Minhyuk and Kim, Hyunjin and Kim, Tae-Kyun}, title = {Pop-Out Motion: 3D-Aware Image Deformation via Learning the Shape Laplacian}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18532-18541} }
Towards Noiseless Object Contours for Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2022_CVPR, author = {Li, Jing and Fan, Junsong and Zhang, Zhaoxiang}, title = {Towards Noiseless Object Contours for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16856-16865} }
Unsupervised Image-to-Image Translation With Generative Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR, author = {Yang, Shuai and Jiang, Liming and Liu, Ziwei and Loy, Chen Change}, title = {Unsupervised Image-to-Image Translation With Generative Prior}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18332-18341} }
Multi-Marginal Contrastive Learning for Multi-Label Subcellular Protein Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2022_CVPR, author = {Liu, Ziyi and Wang, Zengmao and Du, Bo}, title = {Multi-Marginal Contrastive Learning for Multi-Label Subcellular Protein Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20626-20635} }
Predict, Prevent, and Evaluate: Disentangled Text-Driven Image Manipulation Empowered by Pre-Trained Vision-Language Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2022_CVPR, author = {Xu, Zipeng and Lin, Tianwei and Tang, Hao and Li, Fu and He, Dongliang and Sebe, Nicu and Timofte, Radu and Van Gool, Luc and Ding, Errui}, title = {Predict, Prevent, and Evaluate: Disentangled Text-Driven Image Manipulation Empowered by Pre-Trained Vision-Language Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {18229-18238} }
RU-Net: Regularized Unrolling Network for Scene Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2022_CVPR, author = {Lin, Xin and Ding, Changxing and Zhang, Jing and Zhan, Yibing and Tao, Dacheng}, title = {RU-Net: Regularized Unrolling Network for Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19457-19466} }
Integrating Language Guidance Into Vision-Based Deep Metric Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roth_2022_CVPR, author = {Roth, Karsten and Vinyals, Oriol and Akata, Zeynep}, title = {Integrating Language Guidance Into Vision-Based Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16177-16189} }
PartGlot: Learning Shape Part Segmentation From Language Reference Games-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Koo_2022_CVPR, author = {Koo, Juil and Huang, Ian and Achlioptas, Panos and Guibas, Leonidas J. and Sung, Minhyuk}, title = {PartGlot: Learning Shape Part Segmentation From Language Reference Games}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16505-16514} }
DIVeR: Real-Time and Accurate Neural Radiance Fields With Deterministic Integration for Volume Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2022_CVPR, author = {Wu, Liwen and Lee, Jae Yong and Bhattad, Anand and Wang, Yu-Xiong and Forsyth, David}, title = {DIVeR: Real-Time and Accurate Neural Radiance Fields With Deterministic Integration for Volume Rendering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16200-16209} }
ContIG: Self-Supervised Multimodal Contrastive Learning for Medical Imaging With Genetics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Taleb_2022_CVPR, author = {Taleb, Aiham and Kirchler, Matthias and Monti, Remo and Lippert, Christoph}, title = {ContIG: Self-Supervised Multimodal Contrastive Learning for Medical Imaging With Genetics}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20908-20921} }
Disentangling Visual and Written Concepts in CLIP-
[pdf]
[bibtex]@InProceedings{Materzynska_2022_CVPR, author = {Materzy\'nska, Joanna and Torralba, Antonio and Bau, David}, title = {Disentangling Visual and Written Concepts in CLIP}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {16410-16419} }
Bilateral Video Magnification Filter-
[pdf]
[supp]
[bibtex]@InProceedings{Takeda_2022_CVPR, author = {Takeda, Shoichiro and Niwa, Kenta and Isogawa, Mariko and Shimizu, Shinya and Okami, Kazuki and Aono, Yushi}, title = {Bilateral Video Magnification Filter}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17369-17378} }
AdaFocus V2: End-to-End Training of Spatial Dynamic Networks for Video Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2022_CVPR, author = {Wang, Yulin and Yue, Yang and Lin, Yuanze and Jiang, Haojun and Lai, Zihang and Kulikov, Victor and Orlov, Nikita and Shi, Humphrey and Huang, Gao}, title = {AdaFocus V2: End-to-End Training of Spatial Dynamic Networks for Video Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {20062-20072} }
Neural Mean Discrepancy for Efficient Out-of-Distribution Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2022_CVPR, author = {Dong, Xin and Guo, Junfeng and Li, Ang and Ting, Wei-Te and Liu, Cong and Kung, H. T.}, title = {Neural Mean Discrepancy for Efficient Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {19217-19227} }
Time Lens++: Event-Based Frame Interpolation With Parametric Non-Linear Flow and Multi-Scale Fusion-
[pdf]
[supp]
[bibtex]@InProceedings{Tulyakov_2022_CVPR, author = {Tulyakov, Stepan and Bochicchio, Alfredo and Gehrig, Daniel and Georgoulis, Stamatios and Li, Yuanyou and Scaramuzza, Davide}, title = {Time Lens++: Event-Based Frame Interpolation With Parametric Non-Linear Flow and Multi-Scale Fusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2022}, pages = {17755-17764} }
It Is Okay To Not Be Okay: Overcoming Emotional Bias in Affective Image Captioning by Contrastive Data Collection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mohamed_2022_CVPR,
  author    = {Mohamed, Youssef and Khan, Faizan Farooq and Haydarov, Kilichbek and Elhoseiny, Mohamed},
  title     = {It Is Okay To Not Be Okay: Overcoming Emotional Bias in Affective Image Captioning by Contrastive Data Collection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21263--21272},
}
Neural Global Shutter: Learn To Restore Video From a Rolling Shutter Camera With Global Reset Feature-
[pdf]
[arXiv]
% NOTE(review): citation key Wang_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhixiang and Ji, Xiang and Huang, Jia-Bin and Satoh, Shin'ichi and Zhou, Xiao and Zheng, Yinqiang},
  title     = {Neural Global Shutter: Learn To Restore Video From a Rolling Shutter Camera With Global Reset Feature},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17794--17803},
}
DiRA: Discriminative, Restorative, and Adversarial Learning for Self-Supervised Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Haghighi_2022_CVPR,
  author    = {Haghighi, Fatemeh and Taher, Mohammad Reza Hosseinzadeh and Gotway, Michael B. and Liang, Jianming},
  title     = {{DiRA}: Discriminative, Restorative, and Adversarial Learning for Self-Supervised Medical Image Analysis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20824--20834},
}
Open Challenges in Deep Stereo: The Booster Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Ramirez_2022_CVPR,
  author    = {Ramirez, Pierluigi Zama and Tosi, Fabio and Poggi, Matteo and Salti, Samuele and Mattoccia, Stefano and Di Stefano, Luigi},
  title     = {Open Challenges in Deep Stereo: The {Booster} Dataset},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21168--21178},
}
Self-Supervised Bulk Motion Artifact Removal in Optical Coherence Tomography Angiography-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ren_2022_CVPR,
  author    = {Ren, Jiaxiang and Park, Kicheon and Pan, Yingtian and Ling, Haibin},
  title     = {Self-Supervised Bulk Motion Artifact Removal in Optical Coherence Tomography Angiography},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20617--20625},
}
PoseTrack21: A Dataset for Person Search, Multi-Object Tracking and Multi-Person Pose Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Doring_2022_CVPR,
  author    = {D{\"o}ring, Andreas and Chen, Di and Zhang, Shanshan and Schiele, Bernt and Gall, J{\"u}rgen},
  title     = {{PoseTrack21}: A Dataset for Person Search, Multi-Object Tracking and Multi-Person Pose Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20963--20972},
}
Ithaca365: Dataset and Driving Perception Under Repeated and Challenging Weather Conditions-
[pdf]
[supp]
[bibtex]@InProceedings{Diaz-Ruiz_2022_CVPR,
  author    = {Diaz-Ruiz, Carlos A. and Xia, Youya and You, Yurong and Nino, Jose and Chen, Junan and Monica, Josephine and Chen, Xiangyu and Luo, Katie and Wang, Yan and Emond, Marc and Chao, Wei-Lun and Hariharan, Bharath and Weinberger, Kilian Q. and Campbell, Mark},
  title     = {Ithaca365: Dataset and Driving Perception Under Repeated and Challenging Weather Conditions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21383--21392},
}
YouMVOS: An Actor-Centric Multi-Shot Video Object Segmentation Dataset-
[pdf]
[bibtex]@InProceedings{Wei_2022_CVPR,
  author    = {Wei, Donglai and Kharbanda, Siddhant and Arora, Sarthak and Roy, Roshan and Jain, Nishant and Palrecha, Akash and Shah, Tanav and Mathur, Shray and Mathur, Ritik and Kemkar, Abhijay and Chakravarthy, Anirudh and Lin, Zudi and Jang, Won-Dong and Tang, Yansong and Bai, Song and Tompkin, James and Torr, Philip H. S. and Pfister, Hanspeter},
  title     = {{YouMVOS}: An Actor-Centric Multi-Shot Video Object Segmentation Dataset},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21044--21053},
}
Rethinking Spatial Invariance of Convolutional Networks for Object Counting-
[pdf]
[bibtex]@InProceedings{Cheng_2022_CVPR,
  author    = {Cheng, Zhi-Qi and Dai, Qi and Li, Hong and Song, Jingkuan and Wu, Xiao and Hauptmann, Alexander G.},
  title     = {Rethinking Spatial Invariance of Convolutional Networks for Object Counting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19638--19648},
}
Geometric Anchor Correspondence Mining With Uncertainty Modeling for Universal Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Liang and Lou, Yihang and He, Jianzhong and Bai, Tao and Deng, Minghua},
  title     = {Geometric Anchor Correspondence Mining With Uncertainty Modeling for Universal Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16134--16143},
}
Coopernaut: End-to-End Driving With Cooperative Perception for Networked Vehicles-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cui_2022_CVPR,
  author    = {Cui, Jiaxun and Qiu, Hang and Chen, Dian and Stone, Peter and Zhu, Yuke},
  title     = {Coopernaut: End-to-End Driving With Cooperative Perception for Networked Vehicles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17252--17262},
}
Few-Shot Keypoint Detection With Uncertainty Learning for Unseen Species-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2022_CVPR,
  author    = {Lu, Changsheng and Koniusz, Piotr},
  title     = {Few-Shot Keypoint Detection With Uncertainty Learning for Unseen Species},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19416--19426},
}
3D-SPS: Single-Stage 3D Visual Grounding via Referred Point Progressive Selection-
[pdf]
% NOTE(review): citation key Luo_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Junyu and Fu, Jiahui and Kong, Xianghao and Gao, Chen and Ren, Haibing and Shen, Hao and Xia, Huaxia and Liu, Si},
  title     = {{3D-SPS}: Single-Stage {3D} Visual Grounding via Referred Point Progressive Selection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16454--16463},
}
Learning Multiple Dense Prediction Tasks From Partially Annotated Data-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Li_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Wei-Hong and Liu, Xialei and Bilen, Hakan},
  title     = {Learning Multiple Dense Prediction Tasks From Partially Annotated Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18879--18889},
}
Towards Low-Cost and Efficient Malaria Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sultani_2022_CVPR,
  author    = {Sultani, Waqas and Nawaz, Wajahat and Javed, Syed and Danish, Muhammad Sohail and Saadia, Asma and Ali, Mohsen},
  title     = {Towards Low-Cost and Efficient Malaria Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20687--20696},
}
Learning Neural Light Fields With Ray-Space Embedding-
[pdf]
[supp]
[bibtex]@InProceedings{Attal_2022_CVPR,
  author    = {Attal, Benjamin and Huang, Jia-Bin and Zollh{\"o}fer, Michael and Kopf, Johannes and Kim, Changil},
  title     = {Learning Neural Light Fields With Ray-Space Embedding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19819--19829},
}
Clean Implicit 3D Structure From Noisy 2D STEM Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kniesel_2022_CVPR,
  author    = {Kniesel, Hannah and Ropinski, Timo and Bergner, Tim and Devan, Kavitha Shaga and Read, Clarissa and Walther, Paul and Ritschel, Tobias and Hermosilla, Pedro},
  title     = {Clean Implicit {3D} Structure From Noisy {2D} {STEM} Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20762--20772},
}
UKPGAN: A General Self-Supervised Keypoint Detector-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{You_2022_CVPR,
  author    = {You, Yang and Liu, Wenhai and Ze, Yanjie and Li, Yong-Lu and Wang, Weiming and Lu, Cewu},
  title     = {{UKPGAN}: A General Self-Supervised Keypoint Detector},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17042--17051},
}
Learning Optimal K-Space Acquisition and Reconstruction Using Physics-Informed Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Peng_2022_CVPR,
  author    = {Peng, Wei and Feng, Li and Zhao, Guoying and Liu, Fang},
  title     = {Learning Optimal K-Space Acquisition and Reconstruction Using Physics-Informed Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20794--20803},
}
Raw High-Definition Radar for Multi-Task Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rebut_2022_CVPR,
  author    = {Rebut, Julien and Ouaknine, Arthur and Malik, Waqas and P{\'e}rez, Patrick},
  title     = {Raw High-Definition Radar for Multi-Task Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17021--17030},
}
Exploring Set Similarity for Dense Self-Supervised Representation Learning-
[pdf]
[arXiv]
% NOTE(review): citation key Wang_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhaoqing and Li, Qiang and Zhang, Guoxin and Wan, Pengfei and Zheng, Wen and Wang, Nannan and Gong, Mingming and Liu, Tongliang},
  title     = {Exploring Set Similarity for Dense Self-Supervised Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16590--16599},
}
ONCE-3DLanes: Building Monocular 3D Lane Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2022_CVPR,
  author    = {Yan, Fan and Nie, Ming and Cai, Xinyue and Han, Jianhua and Xu, Hang and Yang, Zhen and Ye, Chaoqiang and Fu, Yanwei and Mi, Michael Bi and Zhang, Li},
  title     = {{ONCE-3DLanes}: Building Monocular {3D} Lane Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17143--17152},
}
Weakly but Deeply Supervised Occlusion-Reasoned Parametric Road Layouts-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Liu_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Buyu and Zhuang, Bingbing and Chandraker, Manmohan},
  title     = {Weakly but Deeply Supervised Occlusion-Reasoned Parametric Road Layouts},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17000--17009},
}
Modulated Contrast for Versatile Image Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhan_2022_CVPR,
  author    = {Zhan, Fangneng and Zhang, Jiahui and Yu, Yingchen and Wu, Rongliang and Lu, Shijian},
  title     = {Modulated Contrast for Versatile Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18280--18290},
}
Identifying Ambiguous Similarity Conditions via Semantic Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2022_CVPR,
  author    = {Ye, Han-Jia and Shi, Yi and Zhan, De-Chuan},
  title     = {Identifying Ambiguous Similarity Conditions via Semantic Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16610--16619},
}
MSTR: Multi-Scale Transformer for End-to-End Human-Object Interaction Detection-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Kim_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Bumsoo and Mun, Jonghwan and On, Kyoung-Woon and Shin, Minchul and Lee, Junhyun and Kim, Eun-Sol},
  title     = {{MSTR}: Multi-Scale Transformer for End-to-End Human-Object Interaction Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19578--19587},
}
DetectorDetective: Investigating the Effects of Adversarial Examples on Object Detectors-
[pdf]
[bibtex]@InProceedings{Vellaichamy_2022_CVPR,
  author    = {Vellaichamy, Sivapriya and Hull, Matthew and Wang, Zijie J. and Das, Nilaksh and Peng, ShengYun and Park, Haekyu and Chau, Duen Horng (Polo)},
  title     = {{DetectorDetective}: Investigating the Effects of Adversarial Examples on Object Detectors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21484--21491},
}
EMScore: Evaluating Video Captioning via Coarse-Grained and Fine-Grained Embedding Matching-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Shi_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Yaya and Yang, Xu and Xu, Haiyang and Yuan, Chunfeng and Li, Bing and Hu, Weiming and Zha, Zheng-Jun},
  title     = {{EMScore}: Evaluating Video Captioning via Coarse-Grained and Fine-Grained Embedding Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17929--17938},
}
SNR-Aware Low-Light Image Enhancement-
[pdf]
% NOTE(review): citation key Xu_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Xiaogang and Wang, Ruixing and Fu, Chi-Wing and Jia, Jiaya},
  title     = {{SNR}-Aware Low-Light Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17714--17724},
}
3D Common Corruptions and Data Augmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kar_2022_CVPR,
  author    = {Kar, O{\u{g}}uzhan Fatih and Yeo, Teresa and Atanov, Andrei and Zamir, Amir},
  title     = {{3D} Common Corruptions and Data Augmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18963--18974},
}
Injecting Semantic Concepts Into End-to-End Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fang_2022_CVPR,
  author    = {Fang, Zhiyuan and Wang, Jianfeng and Hu, Xiaowei and Liang, Lin and Gan, Zhe and Wang, Lijuan and Yang, Yezhou and Liu, Zicheng},
  title     = {Injecting Semantic Concepts Into End-to-End Image Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18009--18019},
}
L2G: A Simple Local-to-Global Knowledge Transfer Framework for Weakly Supervised Semantic Segmentation-
[pdf]
[arXiv]
% NOTE(review): citation key Jiang_2022_CVPR is reused by another entry in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Jiang_2022_CVPR,
  author    = {Jiang, Peng-Tao and Yang, Yuqi and Hou, Qibin and Wei, Yunchao},
  title     = {{L2G}: A Simple Local-to-Global Knowledge Transfer Framework for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16886--16896},
}
VL-InterpreT: An Interactive Visualization Tool for Interpreting Vision-Language Transformers-
[pdf]
[bibtex]@InProceedings{Aflalo_2022_CVPR,
  author    = {Aflalo, Estelle and Du, Meng and Tseng, Shao-Yen and Liu, Yongfei and Wu, Chenfei and Duan, Nan and Lal, Vasudev},
  title     = {{VL-InterpreT}: An Interactive Visualization Tool for Interpreting Vision-Language Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21406--21415},
}
LiDAR Snowfall Simulation for Robust 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hahner_2022_CVPR,
  author    = {Hahner, Martin and Sakaridis, Christos and Bijelic, Mario and Heide, Felix and Yu, Fisher and Dai, Dengxin and Van Gool, Luc},
  title     = {{LiDAR} Snowfall Simulation for Robust {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16364--16374},
}
Structural and Statistical Texture Knowledge Distillation for Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Ji_2022_CVPR,
  author    = {Ji, Deyi and Wang, Haoran and Tao, Mingyuan and Huang, Jianqiang and Hua, Xian-Sheng and Lu, Hongtao},
  title     = {Structural and Statistical Texture Knowledge Distillation for Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16876--16885},
}
Blended Diffusion for Text-Driven Editing of Natural Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Avrahami_2022_CVPR,
  author    = {Avrahami, Omri and Lischinski, Dani and Fried, Ohad},
  title     = {Blended Diffusion for Text-Driven Editing of Natural Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18208--18218},
}
BE-STI: Spatial-Temporal Integrated Network for Class-Agnostic Motion Prediction With Bidirectional Enhancement-
[pdf]
[supp]
% NOTE(review): citation key Wang_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Yunlong and Pan, Hongyu and Zhu, Jun and Wu, Yu-Huan and Zhan, Xin and Jiang, Kun and Yang, Diange},
  title     = {{BE-STI}: Spatial-Temporal Integrated Network for Class-Agnostic Motion Prediction With Bidirectional Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17093--17102},
}
A Structured Dictionary Perspective on Implicit Neural Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Yuce_2022_CVPR,
  author    = {Y{\"u}ce, Gizem and Ortiz-Jim{\'e}nez, Guillermo and Besbinar, Beril and Frossard, Pascal},
  title     = {A Structured Dictionary Perspective on Implicit Neural Representations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19228--19238},
}
Learning To Answer Questions in Dynamic Audio-Visual Scenarios-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Li_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Guangyao and Wei, Yake and Tian, Yapeng and Xu, Chenliang and Wen, Ji-Rong and Hu, Di},
  title     = {Learning To Answer Questions in Dynamic Audio-Visual Scenarios},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19108--19118},
}
Synthetic Aperture Imaging With Events and Frames-
[pdf]
[supp]
[bibtex]@InProceedings{Liao_2022_CVPR,
  author    = {Liao, Wei and Zhang, Xiang and Yu, Lei and Lin, Shijie and Yang, Wen and Qiao, Ning},
  title     = {Synthetic Aperture Imaging With Events and Frames},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17735--17744},
}
CLIP-Event: Connecting Text and Images With Event Structures-
[pdf]
[supp]
% NOTE(review): citation key Li_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Manling and Xu, Ruochen and Wang, Shuohang and Zhou, Luowei and Lin, Xudong and Zhu, Chenguang and Zeng, Michael and Ji, Heng and Chang, Shih-Fu},
  title     = {{CLIP-Event}: Connecting Text and Images With Event Structures},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16420--16429},
}
Scaling Up Vision-Language Pre-Training for Image Captioning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Xiaowei and Gan, Zhe and Wang, Jianfeng and Yang, Zhengyuan and Liu, Zicheng and Lu, Yumao and Wang, Lijuan},
  title     = {Scaling Up Vision-Language Pre-Training for Image Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17980--17989},
}
Unsupervised Action Segmentation by Joint Representation Learning and Online Clustering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kumar_2022_CVPR,
  author    = {Kumar, Sateesh and Haresh, Sanjay and Ahmed, Awais and Konin, Andrey and Zia, M. Zeeshan and Tran, Quoc-Huy},
  title     = {Unsupervised Action Segmentation by Joint Representation Learning and Online Clustering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20174--20185},
}
LISA: Learning Implicit Shape and Appearance of Hands-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Corona_2022_CVPR,
  author    = {Corona, Enric and Hodan, Tomas and Vo, Minh and Moreno-Noguer, Francesc and Sweeney, Chris and Newcombe, Richard and Ma, Lingni},
  title     = {{LISA}: Learning Implicit Shape and Appearance of Hands},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20533--20543},
}
DiGS: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Ben-Shabat_2022_CVPR,
  author    = {Ben-Shabat, Yizhak and Koneputugodage, Chamin Hewa and Gould, Stephen},
  title     = {{DiGS}: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19323--19332},
}
Semi-Supervised Learning of Semantic Correspondence With Pseudo-Labels-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Kim_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Jiwon and Ryoo, Kwangrok and Seo, Junyoung and Lee, Gyuseong and Kim, Daehwan and Cho, Hansang and Kim, Seungryong},
  title     = {Semi-Supervised Learning of Semantic Correspondence With Pseudo-Labels},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19699--19709},
}
HLRTF: Hierarchical Low-Rank Tensor Factorization for Inverse Problems in Multi-Dimensional Imaging-
[pdf]
[supp]
% NOTE(review): citation key Luo_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Yisi and Zhao, Xi-Le and Meng, Deyu and Jiang, Tai-Xiang},
  title     = {{HLRTF}: Hierarchical Low-Rank Tensor Factorization for Inverse Problems in Multi-Dimensional Imaging},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19303--19312},
}
FIBA: Frequency-Injection Based Backdoor Attack in Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Yu and Ma, Benteng and Zhang, Jing and Zhao, Shanshan and Xia, Yong and Tao, Dacheng},
  title     = {{FIBA}: Frequency-Injection Based Backdoor Attack in Medical Image Analysis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20876--20885},
}
Deep Constrained Least Squares for Blind Image Super-Resolution-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Luo_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Ziwei and Huang, Haibin and Yu, Lei and Li, Youwei and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {Deep Constrained Least Squares for Blind Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17642--17652},
}
Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kuo_2022_CVPR,
  author    = {Kuo, Chia-Wen and Kira, Zsolt},
  title     = {Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17969--17979},
}
Symmetry-Aware Neural Architecture for Embodied Visual Exploration-
[pdf]
[supp]
% NOTE(review): citation key Liu_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Shuang and Okatani, Takayuki},
  title     = {Symmetry-Aware Neural Architecture for Embodied Visual Exploration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17242--17251},
}
From Representation to Reasoning: Towards Both Evidence and Commonsense Reasoning for Video Question-Answering-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Li_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiangtong and Niu, Li and Zhang, Liqing},
  title     = {From Representation to Reasoning: Towards Both Evidence and Commonsense Reasoning for Video Question-Answering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21273--21282},
}
DanceTrack: Multi-Object Tracking in Uniform Appearance and Diverse Motion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Peize and Cao, Jinkun and Jiang, Yi and Yuan, Zehuan and Bai, Song and Kitani, Kris and Luo, Ping},
  title     = {{DanceTrack}: Multi-Object Tracking in Uniform Appearance and Diverse Motion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20993--21002},
}
Unsupervised Learning of Debiased Representations With Pseudo-Attributes-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Seo_2022_CVPR is reused by another entry in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Seo_2022_CVPR,
  author    = {Seo, Seonguk and Lee, Joon-Young and Han, Bohyung},
  title     = {Unsupervised Learning of Debiased Representations With Pseudo-Attributes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16742--16751},
}
TubeDETR: Spatio-Temporal Video Grounding With Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Antoine and Miech, Antoine and Sivic, Josef and Laptev, Ivan and Schmid, Cordelia},
  title     = {{TubeDETR}: Spatio-Temporal Video Grounding With Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16442--16453},
}
SLIC: Self-Supervised Learning With Iterative Clustering for Human Action Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Khorasgani_2022_CVPR,
  author    = {Khorasgani, Salar Hosseini and Chen, Yuxuan and Shkurti, Florian},
  title     = {{SLIC}: Self-Supervised Learning With Iterative Clustering for Human Action Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16091--16101},
}
UBnormal: New Benchmark for Supervised Open-Set Video Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Acsintoae_2022_CVPR,
  author    = {Acsintoae, Andra and Florescu, Andrei and Georgescu, Mariana-Iuliana and Mare, Tudor and Sumedrea, Paul and Ionescu, Radu Tudor and Khan, Fahad Shahbaz and Shah, Mubarak},
  title     = {{UBnormal}: New Benchmark for Supervised Open-Set Video Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20143--20153},
}
Beyond Cross-View Image Retrieval: Highly Accurate Vehicle Localization Using Satellite Image-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Shi_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Yujiao and Li, Hongdong},
  title     = {Beyond Cross-View Image Retrieval: Highly Accurate Vehicle Localization Using Satellite Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17010--17020},
}
Closing the Generalization Gap of Cross-Silo Federated Medical Image Segmentation-
[pdf]
[supp]
[arXiv]
% NOTE(review): citation key Xu_2022_CVPR is reused by other entries in this file; give each a unique key before loading them into one bibliography.
[bibtex]@InProceedings{Xu_2022_CVPR,
  author    = {Xu, An and Li, Wenqi and Guo, Pengfei and Yang, Dong and Roth, Holger R. and Hatamizadeh, Ali and Zhao, Can and Xu, Daguang and Huang, Heng and Xu, Ziyue},
  title     = {Closing the Generalization Gap of Cross-Silo Federated Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20866--20875},
}
Leverage Your Local and Global Representations: A New Self-Supervised Learning Strategy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Tong and Qiu, Congpei and Ke, Wei and S{\"u}sstrunk, Sabine and Salzmann, Mathieu},
  title     = {Leverage Your Local and Global Representations: A New Self-Supervised Learning Strategy},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16580--16589},
}
NeRF in the Dark: High Dynamic Range View Synthesis From Noisy Raw Images-
[pdf]
[supp]
[bibtex]@InProceedings{Mildenhall_2022_CVPR,
  author    = {Mildenhall, Ben and Hedman, Peter and Martin-Brualla, Ricardo and Srinivasan, Pratul P. and Barron, Jonathan T.},
  title     = {{NeRF} in the Dark: High Dynamic Range View Synthesis From Noisy Raw Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16190--16199},
}
DArch: Dental Arch Prior-Assisted 3D Tooth Instance Segmentation With Weak Annotations-
[pdf]
[bibtex]@InProceedings{Qiu_2022_CVPR,
  author    = {Qiu, Liangdong and Ye, Chongjie and Chen, Pei and Liu, Yunbi and Han, Xiaoguang and Cui, Shuguang},
  title     = {{DArch}: Dental Arch Prior-Assisted {3D} Tooth Instance Segmentation With Weak Annotations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20752--20761},
}
Globetrotter: Connecting Languages by Connecting Images-
[pdf]
[supp]
[bibtex]@InProceedings{Suris_2022_CVPR,
  author    = {Sur{\'\i}s, D{\'\i}dac and Epstein, Dave and Vondrick, Carl},
  title     = {Globetrotter: Connecting Languages by Connecting Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16474--16484},
}
Back