CVPR 2022 Open Access Repository

Papers

Back
Holocurtains: Programming Light Curtains via Binary Holography: Dorian Chan,

Srinivasa G. Narasimhan,

Matthew O'Toole; [pdf] [supp]
[bibtex]
@InProceedings{Chan_2022_CVPR,
  author    = {Chan, Dorian and Narasimhan, Srinivasa G. and O'Toole, Matthew},
  title     = {Holocurtains: Programming Light Curtains via Binary Holography},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17886--17895},
}
Learning Adaptive Warping for Real-World Rolling Shutter Correction: Mingdeng Cao,

Zhihang Zhong,

Jiahao Wang,

Yinqiang Zheng,

Yujiu Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2022_CVPR,
  author    = {Cao, Mingdeng and Zhong, Zhihang and Wang, Jiahao and Zheng, Yinqiang and Yang, Yujiu},
  title     = {Learning Adaptive Warping for Real-World Rolling Shutter Correction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17785--17793},
}
Bongard-HOI: Benchmarking Few-Shot Visual Reasoning for Human-Object Interactions: Huaizu Jiang,

Xiaojian Ma,

Weili Nie,

Zhiding Yu,

Yuke Zhu,

Anima Anandkumar; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2022_CVPR,
  author    = {Jiang, Huaizu and Ma, Xiaojian and Nie, Weili and Yu, Zhiding and Zhu, Yuke and Anandkumar, Anima},
  title     = {{Bongard-HOI}: Benchmarking Few-Shot Visual Reasoning for Human-Object Interactions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19056--19065},
}
ZeroCap: Zero-Shot Image-to-Text Generation for Visual-Semantic Arithmetic: Yoad Tewel,

Yoav Shalev,

Idan Schwartz,

Lior Wolf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tewel_2022_CVPR,
  author    = {Tewel, Yoad and Shalev, Yoav and Schwartz, Idan and Wolf, Lior},
  title     = {{ZeroCap}: Zero-Shot Image-to-Text Generation for Visual-Semantic Arithmetic},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17918--17928},
}
End-to-End Generative Pretraining for Multimodal Video Captioning: Paul Hongsuck Seo,

Arsha Nagrani,

Anurag Arnab,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Seo_2022_CVPR,
  author    = {Seo, Paul Hongsuck and Nagrani, Arsha and Arnab, Anurag and Schmid, Cordelia},
  title     = {End-to-End Generative Pretraining for Multimodal Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17959--17968},
}
Stochastic Trajectory Prediction via Motion Indeterminacy Diffusion: Tianpei Gu,

Guangyi Chen,

Junlong Li,

Chunze Lin,

Yongming Rao,

Jie Zhou,

Jiwen Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gu_2022_CVPR,
  author    = {Gu, Tianpei and Chen, Guangyi and Li, Junlong and Lin, Chunze and Rao, Yongming and Zhou, Jie and Lu, Jiwen},
  title     = {Stochastic Trajectory Prediction via Motion Indeterminacy Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17113--17122},
}
Cross-Modal Clinical Graph Transformer for Ophthalmic Report Generation: Mingjie Li,

Wenjia Cai,

Karin Verspoor,

Shirui Pan,

Xiaodan Liang,

Xiaojun Chang; [pdf]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Mingjie and Cai, Wenjia and Verspoor, Karin and Pan, Shirui and Liang, Xiaodan and Chang, Xiaojun},
  title     = {Cross-Modal Clinical Graph Transformer for Ophthalmic Report Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20656--20665},
}
Human-Object Interaction Detection via Disentangled Transformer: Desen Zhou,

Zhichao Liu,

Jian Wang,

Leshan Wang,

Tao Hu,

Errui Ding,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Desen and Liu, Zhichao and Wang, Jian and Wang, Leshan and Hu, Tao and Ding, Errui and Wang, Jingdong},
  title     = {Human-Object Interaction Detection via Disentangled Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19568--19577},
}
CVF-SID: Cyclic Multi-Variate Function for Self-Supervised Image Denoising by Disentangling Noise From Image: Reyhaneh Neshatavar,

Mohsen Yavartanoo,

Sanghyun Son,

Kyoung Mu Lee; [pdf] [supp]
[bibtex]
@InProceedings{Neshatavar_2022_CVPR,
  author    = {Neshatavar, Reyhaneh and Yavartanoo, Mohsen and Son, Sanghyun and Lee, Kyoung Mu},
  title     = {{CVF-SID}: Cyclic Multi-Variate Function for Self-Supervised Image Denoising by Disentangling Noise From Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17583--17591},
}
FaceFormer: Speech-Driven 3D Facial Animation With Transformers: Yingruo Fan,

Zhaojiang Lin,

Jun Saito,

Wenping Wang,

Taku Komura; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2022_CVPR,
  author    = {Fan, Yingruo and Lin, Zhaojiang and Saito, Jun and Wang, Wenping and Komura, Taku},
  title     = {{FaceFormer}: Speech-Driven {3D} Facial Animation With Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18770--18780},
}
Exploring Patch-Wise Semantic Relation for Contrastive Learning in Image-to-Image Translation Tasks: Chanyong Jung,

Gihyun Kwon,

Jong Chul Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jung_2022_CVPR,
  author    = {Jung, Chanyong and Kwon, Gihyun and Ye, Jong Chul},
  title     = {Exploring Patch-Wise Semantic Relation for Contrastive Learning in Image-to-Image Translation Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18260--18269},
}
Towards General Purpose Vision Systems: An End-to-End Task-Agnostic Vision-Language Architecture: Tanmay Gupta,

Amita Kamath,

Aniruddha Kembhavi,

Derek Hoiem; [pdf] [supp]
[bibtex]
@InProceedings{Gupta_2022_CVPR,
  author    = {Gupta, Tanmay and Kamath, Amita and Kembhavi, Aniruddha and Hoiem, Derek},
  title     = {Towards General Purpose Vision Systems: An End-to-End Task-Agnostic Vision-Language Architecture},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16399--16409},
}
LiT: Zero-Shot Transfer With Locked-Image Text Tuning: Xiaohua Zhai,

Xiao Wang,

Basil Mustafa,

Andreas Steiner,

Daniel Keysers,

Alexander Kolesnikov,

Lucas Beyer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2022_CVPR,
  author    = {Zhai, Xiaohua and Wang, Xiao and Mustafa, Basil and Steiner, Andreas and Keysers, Daniel and Kolesnikov, Alexander and Beyer, Lucas},
  title     = {{LiT}: Zero-Shot Transfer With Locked-Image Text Tuning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18123--18133},
}
GeoNeRF: Generalizing NeRF With Geometry Priors: Mohammad Mahdi Johari,

Yann Lepoittevin,

François Fleuret; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Johari_2022_CVPR,
  author    = {Johari, Mohammad Mahdi and Lepoittevin, Yann and Fleuret, Fran{\c{c}}ois},
  title     = {{GeoNeRF}: Generalizing {NeRF} With Geometry Priors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18365--18375},
}
PhoCaL: A Multi-Modal Dataset for Category-Level Object Pose Estimation With Photometrically Challenging Objects: Pengyuan Wang,

HyunJun Jung,

Yitong Li,

Siyuan Shen,

Rahul Parthasarathy Srikanth,

Lorenzo Garattoni,

Sven Meier,

Nassir Navab,

Benjamin Busam; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Pengyuan and Jung, HyunJun and Li, Yitong and Shen, Siyuan and Srikanth, Rahul Parthasarathy and Garattoni, Lorenzo and Meier, Sven and Navab, Nassir and Busam, Benjamin},
  title     = {{PhoCaL}: A Multi-Modal Dataset for Category-Level Object Pose Estimation With Photometrically Challenging Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21222--21231},
}
Uformer: A General U-Shaped Transformer for Image Restoration: Zhendong Wang,

Xiaodong Cun,

Jianmin Bao,

Wengang Zhou,

Jianzhuang Liu,

Houqiang Li; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhendong and Cun, Xiaodong and Bao, Jianmin and Zhou, Wengang and Liu, Jianzhuang and Li, Houqiang},
  title     = {Uformer: A General {U}-Shaped Transformer for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17683--17693},
}
Bridge-Prompt: Towards Ordinal Action Understanding in Instructional Videos: Muheng Li,

Lei Chen,

Yueqi Duan,

Zhilan Hu,

Jianjiang Feng,

Jie Zhou,

Jiwen Lu; [pdf]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Muheng and Chen, Lei and Duan, Yueqi and Hu, Zhilan and Feng, Jianjiang and Zhou, Jie and Lu, Jiwen},
  title     = {{Bridge-Prompt}: Towards Ordinal Action Understanding in Instructional Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19880--19889},
}
Cerberus Transformer: Joint Semantic, Affordance and Attribute Parsing: Xiaoxue Chen,

Tianyu Liu,

Hao Zhao,

Guyue Zhou,

Ya-Qin Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Xiaoxue and Liu, Tianyu and Zhao, Hao and Zhou, Guyue and Zhang, Ya-Qin},
  title     = {Cerberus Transformer: Joint Semantic, Affordance and Attribute Parsing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19649--19658},
}
Single-Photon Structured Light: Varun Sundar,

Sizhuo Ma,

Aswin C. Sankaranarayanan,

Mohit Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sundar_2022_CVPR,
  author    = {Sundar, Varun and Ma, Sizhuo and Sankaranarayanan, Aswin C. and Gupta, Mohit},
  title     = {Single-Photon Structured Light},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17865--17875},
}
Deblurring via Stochastic Refinement: Jay Whang,

Mauricio Delbracio,

Hossein Talebi,

Chitwan Saharia,

Alexandros G. Dimakis,

Peyman Milanfar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Whang_2022_CVPR,
  author    = {Whang, Jay and Delbracio, Mauricio and Talebi, Hossein and Saharia, Chitwan and Dimakis, Alexandros G. and Milanfar, Peyman},
  title     = {Deblurring via Stochastic Refinement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16293--16303},
}
3DJCG: A Unified Framework for Joint Dense Captioning and Visual Grounding on 3D Point Clouds: Daigang Cai,

Lichen Zhao,

Jing Zhang,

Lu Sheng,

Dong Xu; [pdf]
[bibtex]
@InProceedings{Cai_2022_CVPR,
  author    = {Cai, Daigang and Zhao, Lichen and Zhang, Jing and Sheng, Lu and Xu, Dong},
  title     = {{3DJCG}: A Unified Framework for Joint Dense Captioning and Visual Grounding on {3D} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16464--16473},
}
Abandoning the Bayer-Filter To See in the Dark: Xingbo Dong,

Wanyan Xu,

Zhihui Miao,

Lan Ma,

Chao Zhang,

Jiewen Yang,

Zhe Jin,

Andrew Beng Jin Teoh,

Jiajun Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Xingbo and Xu, Wanyan and Miao, Zhihui and Ma, Lan and Zhang, Chao and Yang, Jiewen and Jin, Zhe and Teoh, Andrew Beng Jin and Shen, Jiajun},
  title     = {Abandoning the {Bayer}-Filter To See in the Dark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17431--17440},
}
Exploiting Temporal Relations on Radar Perception for Autonomous Driving: Peizhao Li,

Pu Wang,

Karl Berntorp,

Hongfu Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Peizhao and Wang, Pu and Berntorp, Karl and Liu, Hongfu},
  title     = {Exploiting Temporal Relations on Radar Perception for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17071--17080},
}
Forward Compatible Training for Large-Scale Embedding Retrieval Systems: Vivek Ramanujan,

Pavan Kumar Anasosalu Vasu,

Ali Farhadi,

Oncel Tuzel,

Hadi Pouransari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ramanujan_2022_CVPR,
  author    = {Ramanujan, Vivek and Vasu, Pavan Kumar Anasosalu and Farhadi, Ali and Tuzel, Oncel and Pouransari, Hadi},
  title     = {Forward Compatible Training for Large-Scale Embedding Retrieval Systems},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19386--19395},
}
Everything at Once - Multi-Modal Fusion Transformer for Video Retrieval: Nina Shvetsova,

Brian Chen,

Andrew Rouditchenko,

Samuel Thomas,

Brian Kingsbury,

Rogerio S. Feris,

David Harwath,

James Glass,

Hilde Kuehne; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shvetsova_2022_CVPR,
  author    = {Shvetsova, Nina and Chen, Brian and Rouditchenko, Andrew and Thomas, Samuel and Kingsbury, Brian and Feris, Rogerio S. and Harwath, David and Glass, James and Kuehne, Hilde},
  title     = {Everything at Once - Multi-Modal Fusion Transformer for Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20020--20029},
}
Neural Template: Topology-Aware Reconstruction and Disentangled Generation of 3D Meshes: Ka-Hei Hui,

Ruihui Li,

Jingyu Hu,

Chi-Wing Fu; [pdf] [supp]
[bibtex]
@InProceedings{Hui_2022_CVPR,
  author    = {Hui, Ka-Hei and Li, Ruihui and Hu, Jingyu and Fu, Chi-Wing},
  title     = {Neural Template: Topology-Aware Reconstruction and Disentangled Generation of {3D} Meshes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18572--18582},
}
AdaFace: Quality Adaptive Margin for Face Recognition: Minchul Kim,

Anil K. Jain,

Xiaoming Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Minchul and Jain, Anil K. and Liu, Xiaoming},
  title     = {{AdaFace}: Quality Adaptive Margin for Face Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18750--18759},
}
Learning Soft Estimator of Keypoint Scale and Orientation With Probabilistic Covariant Loss: Pei Yan,

Yihua Tan,

Shengzhou Xiong,

Yuan Tai,

Yansheng Li; [pdf] [supp]
[bibtex]
@InProceedings{Yan_2022_CVPR,
  author    = {Yan, Pei and Tan, Yihua and Xiong, Shengzhou and Tai, Yuan and Li, Yansheng},
  title     = {Learning Soft Estimator of Keypoint Scale and Orientation With Probabilistic Covariant Loss},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19406--19415},
}
Opening Up Open World Tracking: Yang Liu,

Idil Esen Zulfikar,

Jonathon Luiten,

Achal Dave,

Deva Ramanan,

Bastian Leibe,

Aljoša Ošep,

Laura Leal-Taixé; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Yang and Zulfikar, Idil Esen and Luiten, Jonathon and Dave, Achal and Ramanan, Deva and Leibe, Bastian and O{\v{s}}ep, Aljo{\v{s}}a and Leal-Taix{\'e}, Laura},
  title     = {Opening Up Open World Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19045--19055},
}
OSSO: Obtaining Skeletal Shape From Outside: Marilyn Keller,

Silvia Zuffi,

Michael J. Black,

Sergi Pujades; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Keller_2022_CVPR,
  author    = {Keller, Marilyn and Zuffi, Silvia and Black, Michael J. and Pujades, Sergi},
  title     = {{OSSO}: Obtaining Skeletal Shape From Outside},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20492--20501},
}
Bayesian Invariant Risk Minimization: Yong Lin,

Hanze Dong,

Hao Wang,

Tong Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Yong and Dong, Hanze and Wang, Hao and Zhang, Tong},
  title     = {Bayesian Invariant Risk Minimization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16021--16030},
}
Alleviating Semantics Distortion in Unsupervised Low-Level Image-to-Image Translation via Structure Consistency Constraint: Jiaxian Guo,

Jiachen Li,

Huan Fu,

Mingming Gong,

Kun Zhang,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2022_CVPR,
  author    = {Guo, Jiaxian and Li, Jiachen and Fu, Huan and Gong, Mingming and Zhang, Kun and Tao, Dacheng},
  title     = {Alleviating Semantics Distortion in Unsupervised Low-Level Image-to-Image Translation via Structure Consistency Constraint},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18249--18259},
}
Uni-Perceiver: Pre-Training Unified Architecture for Generic Perception for Zero-Shot and Few-Shot Tasks: Xizhou Zhu,

Jinguo Zhu,

Hao Li,

Xiaoshi Wu,

Hongsheng Li,

Xiaohua Wang,

Jifeng Dai; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2022_CVPR,
  author    = {Zhu, Xizhou and Zhu, Jinguo and Li, Hao and Wu, Xiaoshi and Li, Hongsheng and Wang, Xiaohua and Dai, Jifeng},
  title     = {{Uni-Perceiver}: Pre-Training Unified Architecture for Generic Perception for Zero-Shot and Few-Shot Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16804--16815},
}
The Auto Arborist Dataset: A Large-Scale Benchmark for Multiview Urban Forest Monitoring Under Domain Shift: Sara Beery,

Guanhang Wu,

Trevor Edwards,

Filip Pavetic,

Bo Majewski,

Shreyasee Mukherjee,

Stanley Chan,

John Morgan,

Vivek Rathod,

Jonathan Huang; [pdf] [supp]
[bibtex]
@InProceedings{Beery_2022_CVPR,
  author    = {Beery, Sara and Wu, Guanhang and Edwards, Trevor and Pavetic, Filip and Majewski, Bo and Mukherjee, Shreyasee and Chan, Stanley and Morgan, John and Rathod, Vivek and Huang, Jonathan},
  title     = {The {Auto Arborist} Dataset: A Large-Scale Benchmark for Multiview Urban Forest Monitoring Under Domain Shift},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21294--21307},
}
Real-Time, Accurate, and Consistent Video Semantic Segmentation via Unsupervised Adaptation and Cross-Unit Deployment on Mobile Device: Hyojin Park,

Alan Yessenbayev,

Tushar Singhal,

Navin Kumar Adhikari,

Yizhe Zhang,

Shubhankar Mangesh Borse,

Hong Cai,

Nilesh Prasad Pandey,

Fei Yin,

Frank Mayer,

Balaji Calidas,

Fatih Porikli; [pdf] [supp]
[bibtex]
@InProceedings{Park_2022_CVPR,
  author    = {Park, Hyojin and Yessenbayev, Alan and Singhal, Tushar and Adhikari, Navin Kumar and Zhang, Yizhe and Borse, Shubhankar Mangesh and Cai, Hong and Pandey, Nilesh Prasad and Yin, Fei and Mayer, Frank and Calidas, Balaji and Porikli, Fatih},
  title     = {Real-Time, Accurate, and Consistent Video Semantic Segmentation via Unsupervised Adaptation and Cross-Unit Deployment on Mobile Device},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21431--21438},
}
A Style-Aware Discriminator for Controllable Image Translation: Kunhee Kim,

Sanghun Park,

Eunyeong Jeon,

Taehun Kim,

Daijin Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Kunhee and Park, Sanghun and Jeon, Eunyeong and Kim, Taehun and Kim, Daijin},
  title     = {A Style-Aware Discriminator for Controllable Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18239--18248},
}
Incremental Cross-View Mutual Distillation for Self-Supervised Medical CT Synthesis: Chaowei Fang,

Liang Wang,

Dingwen Zhang,

Jun Xu,

Yixuan Yuan,

Junwei Han; [pdf] [arXiv]
[bibtex]
@InProceedings{Fang_2022_CVPR,
  author    = {Fang, Chaowei and Wang, Liang and Zhang, Dingwen and Xu, Jun and Yuan, Yixuan and Han, Junwei},
  title     = {Incremental Cross-View Mutual Distillation for Self-Supervised Medical {CT} Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20677--20686},
}
Moving Window Regression: A Novel Approach to Ordinal Regression: Nyeong-Ho Shin,

Seon-Ho Lee,

Chang-Su Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shin_2022_CVPR,
  author    = {Shin, Nyeong-Ho and Lee, Seon-Ho and Kim, Chang-Su},
  title     = {Moving Window Regression: A Novel Approach to Ordinal Regression},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18760--18769},
}
ACPL: Anti-Curriculum Pseudo-Labelling for Semi-Supervised Medical Image Classification: Fengbei Liu,

Yu Tian,

Yuanhong Chen,

Yuyuan Liu,

Vasileios Belagiannis,

Gustavo Carneiro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Fengbei and Tian, Yu and Chen, Yuanhong and Liu, Yuyuan and Belagiannis, Vasileios and Carneiro, Gustavo},
  title     = {{ACPL}: Anti-Curriculum Pseudo-Labelling for Semi-Supervised Medical Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20697--20706},
}
Learning to Deblur Using Light Field Generated and Real Defocus Images: Lingyan Ruan,

Bin Chen,

Jizhou Li,

Miuling Lam; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ruan_2022_CVPR,
  author    = {Ruan, Lingyan and Chen, Bin and Li, Jizhou and Lam, Miuling},
  title     = {Learning to Deblur Using Light Field Generated and Real Defocus Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16304--16313},
}
PhotoScene: Photorealistic Material and Lighting Transfer for Indoor Scenes: Yu-Ying Yeh,

Zhengqin Li,

Yannick Hold-Geoffroy,

Rui Zhu,

Zexiang Xu,

Miloš Hašan,

Kalyan Sunkavalli,

Manmohan Chandraker; [pdf] [supp]
[bibtex]
@InProceedings{Yeh_2022_CVPR,
  author    = {Yeh, Yu-Ying and Li, Zhengqin and Hold-Geoffroy, Yannick and Zhu, Rui and Xu, Zexiang and Ha{\v{s}}an, Milo{\v{s}} and Sunkavalli, Kalyan and Chandraker, Manmohan},
  title     = {{PhotoScene}: Photorealistic Material and Lighting Transfer for Indoor Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18562--18571},
}
Versatile Multi-Modal Pre-Training for Human-Centric Perception: Fangzhou Hong,

Liang Pan,

Zhongang Cai,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Hong_2022_CVPR,
  author    = {Hong, Fangzhou and Pan, Liang and Cai, Zhongang and Liu, Ziwei},
  title     = {Versatile Multi-Modal Pre-Training for Human-Centric Perception},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16156--16166},
}
Contrastive Regression for Domain Adaptation on Gaze Estimation: Yaoming Wang,

Yangzhou Jiang,

Jin Li,

Bingbing Ni,

Wenrui Dai,

Chenglin Li,

Hongkai Xiong,

Teng Li; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Yaoming and Jiang, Yangzhou and Li, Jin and Ni, Bingbing and Dai, Wenrui and Li, Chenglin and Xiong, Hongkai and Li, Teng},
  title     = {Contrastive Regression for Domain Adaptation on Gaze Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19376--19385},
}
Multi-View Consistent Generative Adversarial Networks for 3D-Aware Image Synthesis: Xuanmeng Zhang,

Zhedong Zheng,

Daiheng Gao,

Bang Zhang,

Pan Pan,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xuanmeng and Zheng, Zhedong and Gao, Daiheng and Zhang, Bang and Pan, Pan and Yang, Yi},
  title     = {Multi-View Consistent Generative Adversarial Networks for {3D}-Aware Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18450--18459},
}
Memory-Augmented Non-Local Attention for Video Super-Resolution: Jiyang Yu,

Jingen Liu,

Liefeng Bo,

Tao Mei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2022_CVPR,
  author    = {Yu, Jiyang and Liu, Jingen and Bo, Liefeng and Mei, Tao},
  title     = {Memory-Augmented Non-Local Attention for Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17834--17843},
}
Classification-Then-Grounding: Reformulating Video Scene Graphs As Temporal Bipartite Graphs: Kaifeng Gao,

Long Chen,

Yulei Niu,

Jian Shao,

Jun Xiao; [pdf] [supp]
[bibtex]
@InProceedings{Gao_2022_CVPR,
  author    = {Gao, Kaifeng and Chen, Long and Niu, Yulei and Shao, Jian and Xiao, Jun},
  title     = {Classification-Then-Grounding: Reformulating Video Scene Graphs As Temporal Bipartite Graphs},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19497--19506},
}
Transformer-Empowered Multi-Scale Contextual Matching and Aggregation for Multi-Contrast MRI Super-Resolution: Guangyuan Li,

Jun Lv,

Yapeng Tian,

Qi Dou,

Chengyan Wang,

Chenliang Xu,

Jing Qin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Guangyuan and Lv, Jun and Tian, Yapeng and Dou, Qi and Wang, Chengyan and Xu, Chenliang and Qin, Jing},
  title     = {Transformer-Empowered Multi-Scale Contextual Matching and Aggregation for Multi-Contrast {MRI} Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20636--20645},
}
GateHUB: Gated History Unit With Background Suppression for Online Action Detection: Junwen Chen,

Gaurav Mittal,

Ye Yu,

Yu Kong,

Mei Chen; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Junwen and Mittal, Gaurav and Yu, Ye and Kong, Yu and Chen, Mei},
  title     = {{GateHUB}: Gated History Unit With Background Suppression for Online Action Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19925--19934},
}
Bridging Video-Text Retrieval With Multiple Choice Questions: Yuying Ge,

Yixiao Ge,

Xihui Liu,

Dian Li,

Ying Shan,

Xiaohu Qie,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ge_2022_CVPR,
  author    = {Ge, Yuying and Ge, Yixiao and Liu, Xihui and Li, Dian and Shan, Ying and Qie, Xiaohu and Luo, Ping},
  title     = {Bridging Video-Text Retrieval With Multiple Choice Questions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16167--16176},
}
DF-GAN: A Simple and Effective Baseline for Text-to-Image Synthesis: Ming Tao,

Hao Tang,

Fei Wu,

Xiao-Yuan Jing,

Bing-Kun Bao,

Changsheng Xu; [pdf]
[bibtex]
@InProceedings{Tao_2022_CVPR,
  author    = {Tao, Ming and Tang, Hao and Wu, Fei and Jing, Xiao-Yuan and Bao, Bing-Kun and Xu, Changsheng},
  title     = {{DF-GAN}: A Simple and Effective Baseline for Text-to-Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16515--16525},
}
CoNeRF: Controllable Neural Radiance Fields: Kacper Kania,

Kwang Moo Yi,

Marek Kowalski,

Tomasz Trzciński,

Andrea Tagliasacchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kania_2022_CVPR,
  author    = {Kania, Kacper and Yi, Kwang Moo and Kowalski, Marek and Trzci{\'n}ski, Tomasz and Tagliasacchi, Andrea},
  title     = {{CoNeRF}: Controllable Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18623--18632},
}
Noise2NoiseFlow: Realistic Camera Noise Modeling Without Clean Images: Ali Maleky,

Shayan Kousha,

Michael S. Brown,

Marcus A. Brubaker; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Maleky_2022_CVPR,
  author    = {Maleky, Ali and Kousha, Shayan and Brown, Michael S. and Brubaker, Marcus A.},
  title     = {{Noise2NoiseFlow}: Realistic Camera Noise Modeling Without Clean Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17632--17641},
}
ZeroWaste Dataset: Towards Deformable Object Segmentation in Cluttered Scenes: Dina Bashkirova,

Mohamed Abdelfattah,

Ziliang Zhu,

James Akl,

Fadi Alladkani,

Ping Hu,

Vitaly Ablavsky,

Berk Calli,

Sarah Adel Bargal,

Kate Saenko; [pdf] [arXiv]
[bibtex]
@InProceedings{Bashkirova_2022_CVPR,
  author    = {Bashkirova, Dina and Abdelfattah, Mohamed and Zhu, Ziliang and Akl, James and Alladkani, Fadi and Hu, Ping and Ablavsky, Vitaly and Calli, Berk and Bargal, Sarah Adel and Saenko, Kate},
  title     = {{ZeroWaste} Dataset: Towards Deformable Object Segmentation in Cluttered Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21147--21157},
}
UNIST: Unpaired Neural Implicit Shape Translation Network: Qimin Chen,

Johannes Merz,

Aditya Sanghi,

Hooman Shayani,

Ali Mahdavi-Amiri,

Hao Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Qimin and Merz, Johannes and Sanghi, Aditya and Shayani, Hooman and Mahdavi-Amiri, Ali and Zhang, Hao},
  title     = {{UNIST}: Unpaired Neural Implicit Shape Translation Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18614--18622},
}
Local-Adaptive Face Recognition via Graph-Based Meta-Clustering and Regularized Adaptation: Wenbin Zhu,

Chien-Yi Wang,

Kuan-Lun Tseng,

Shang-Hong Lai,

Baoyuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2022_CVPR,
  author    = {Zhu, Wenbin and Wang, Chien-Yi and Tseng, Kuan-Lun and Lai, Shang-Hong and Wang, Baoyuan},
  title     = {Local-Adaptive Face Recognition via Graph-Based Meta-Clustering and Regularized Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20301--20310},
}
The DEVIL Is in the Details: A Diagnostic Evaluation Benchmark for Video Inpainting: Ryan Szeto,

Jason J. Corso; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Szeto_2022_CVPR,
    author    = {Szeto, Ryan and Corso, Jason J.},
    title     = {The {DEVIL} Is in the Details: A Diagnostic Evaluation Benchmark for Video Inpainting},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21054--21063}
}
Generating Useful Accident-Prone Driving Scenarios via a Learned Traffic Prior: Davis Rempe,

Jonah Philion,

Leonidas J. Guibas,

Sanja Fidler,

Or Litany; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rempe_2022_CVPR,
    author    = {Rempe, Davis and Philion, Jonah and Guibas, Leonidas J. and Fidler, Sanja and Litany, Or},
    title     = {Generating Useful Accident-Prone Driving Scenarios via a Learned Traffic Prior},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17305--17315}
}
Efficient Geometry-Aware 3D Generative Adversarial Networks: Eric R. Chan,

Connor Z. Lin,

Matthew A. Chan,

Koki Nagano,

Boxiao Pan,

Shalini De Mello,

Orazio Gallo,

Leonidas J. Guibas,

Jonathan Tremblay,

Sameh Khamis,

Tero Karras,

Gordon Wetzstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chan_2022_CVPR,
    author    = {Chan, Eric R. and Lin, Connor Z. and Chan, Matthew A. and Nagano, Koki and Pan, Boxiao and De Mello, Shalini and Gallo, Orazio and Guibas, Leonidas J. and Tremblay, Jonathan and Khamis, Sameh and Karras, Tero and Wetzstein, Gordon},
    title     = {Efficient Geometry-Aware {3D} Generative Adversarial Networks},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16123--16133}
}
Dancing Under the Stars: Video Denoising in Starlight: Kristina Monakhova,

Stephan R. Richter,

Laura Waller,

Vladlen Koltun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Monakhova_2022_CVPR,
    author    = {Monakhova, Kristina and Richter, Stephan R. and Waller, Laura and Koltun, Vladlen},
    title     = {Dancing Under the Stars: Video Denoising in Starlight},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16241--16251}
}
SPAct: Self-Supervised Privacy Preservation for Action Recognition: Ishan Rajendrakumar Dave,

Chen Chen,

Mubarak Shah; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dave_2022_CVPR,
    author    = {Dave, Ishan Rajendrakumar and Chen, Chen and Shah, Mubarak},
    title     = {{SPAct}: Self-Supervised Privacy Preservation for Action Recognition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20164--20173}
}
De-Rendering 3D Objects in the Wild: Felix Wimbauer,

Shangzhe Wu,

Christian Rupprecht; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wimbauer_2022_CVPR,
    author    = {Wimbauer, Felix and Wu, Shangzhe and Rupprecht, Christian},
    title     = {De-Rendering {3D} Objects in the Wild},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18490--18499}
}
Representing 3D Shapes With Probabilistic Directed Distance Fields: Tristan Aumentado-Armstrong,

Stavros Tsogkas,

Sven Dickinson,

Allan D. Jepson; [pdf] [supp]
[bibtex]
@InProceedings{Aumentado-Armstrong_2022_CVPR,
    author    = {Aumentado-Armstrong, Tristan and Tsogkas, Stavros and Dickinson, Sven and Jepson, Allan D.},
    title     = {Representing {3D} Shapes With Probabilistic Directed Distance Fields},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19343--19354}
}
Learning ABCs: Approximate Bijective Correspondence for Isolating Factors of Variation With Weak Supervision: Kieran A. Murphy,

Varun Jampani,

Srikumar Ramalingam,

Ameesh Makadia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Murphy_2022_CVPR,
    author    = {Murphy, Kieran A. and Jampani, Varun and Ramalingam, Srikumar and Makadia, Ameesh},
    title     = {Learning {ABCs}: Approximate Bijective Correspondence for Isolating Factors of Variation With Weak Supervision},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16010--16020}
}
ABO: Dataset and Benchmarks for Real-World 3D Object Understanding: Jasmine Collins,

Shubham Goel,

Kenan Deng,

Achleshwar Luthra,

Leon Xu,

Erhan Gundogdu,

Xi Zhang,

Tomas F. Yago Vicente,

Thomas Dideriksen,

Himanshu Arora,

Matthieu Guillaumin,

Jitendra Malik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Collins_2022_CVPR,
    author    = {Collins, Jasmine and Goel, Shubham and Deng, Kenan and Luthra, Achleshwar and Xu, Leon and Gundogdu, Erhan and Zhang, Xi and Vicente, Tomas F. Yago and Dideriksen, Thomas and Arora, Himanshu and Guillaumin, Matthieu and Malik, Jitendra},
    title     = {{ABO}: Dataset and Benchmarks for Real-World {3D} Object Understanding},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21126--21136}
}
MS-TCT: Multi-Scale Temporal ConvTransformer for Action Detection: Rui Dai,

Srijan Das,

Kumara Kahatapitiya,

Michael S. Ryoo,

François Brémond; [pdf] [supp]
[bibtex]
@InProceedings{Dai_2022_CVPR,
    author    = {Dai, Rui and Das, Srijan and Kahatapitiya, Kumara and Ryoo, Michael S. and Br{\'e}mond, Fran{\c{c}}ois},
    title     = {{MS-TCT}: Multi-Scale Temporal {ConvTransformer} for Action Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20041--20051}
}
Make It Move: Controllable Image-to-Video Generation With Text Descriptions: Yaosi Hu,

Chong Luo,

Zhenzhong Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2022_CVPR,
    author    = {Hu, Yaosi and Luo, Chong and Chen, Zhenzhong},
    title     = {Make It Move: Controllable Image-to-Video Generation With Text Descriptions},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18219--18228}
}
Neural Points: Point Cloud Representation With Neural Fields for Arbitrary Upsampling: Wanquan Feng,

Jin Li,

Hongrui Cai,

Xiaonan Luo,

Juyong Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2022_CVPR,
    author    = {Feng, Wanquan and Li, Jin and Cai, Hongrui and Luo, Xiaonan and Zhang, Juyong},
    title     = {Neural Points: Point Cloud Representation With Neural Fields for Arbitrary Upsampling},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18633--18642}
}
FIFO: Learning Fog-Invariant Features for Foggy Scene Segmentation: Sohyun Lee,

Taeyoung Son,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
    author    = {Lee, Sohyun and Son, Taeyoung and Kwak, Suha},
    title     = {{FIFO}: Learning Fog-Invariant Features for Foggy Scene Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18911--18921}
}
Unsupervised Visual Representation Learning by Online Constrained K-Means: Qi Qian,

Yuanhong Xu,

Juhua Hu,

Hao Li,

Rong Jin; [pdf] [supp]
[bibtex]
@InProceedings{Qian_2022_CVPR,
    author    = {Qian, Qi and Xu, Yuanhong and Hu, Juhua and Li, Hao and Jin, Rong},
    title     = {Unsupervised Visual Representation Learning by Online Constrained {K}-Means},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16640--16649}
}
Neural Point Light Fields: Julian Ost,

Issam Laradji,

Alejandro Newell,

Yuval Bahat,

Felix Heide; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ost_2022_CVPR,
    author    = {Ost, Julian and Laradji, Issam and Newell, Alejandro and Bahat, Yuval and Heide, Felix},
    title     = {Neural Point Light Fields},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18419--18429}
}
Vehicle Trajectory Prediction Works, but Not Everywhere: Mohammadhossein Bahari,

Saeed Saadatnejad,

Ahmad Rahimi,

Mohammad Shaverdikondori,

Amir Hossein Shahidzadeh,

Seyed-Mohsen Moosavi-Dezfooli,

Alexandre Alahi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bahari_2022_CVPR,
    author    = {Bahari, Mohammadhossein and Saadatnejad, Saeed and Rahimi, Ahmad and Shaverdikondori, Mohammad and Shahidzadeh, Amir Hossein and Moosavi-Dezfooli, Seyed-Mohsen and Alahi, Alexandre},
    title     = {Vehicle Trajectory Prediction Works, but Not Everywhere},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17123--17133}
}
Instance-Wise Occlusion and Depth Orders in Natural Scenes: Hyunmin Lee,

Jaesik Park; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
    author    = {Lee, Hyunmin and Park, Jaesik},
    title     = {Instance-Wise Occlusion and Depth Orders in Natural Scenes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21210--21221}
}
Contour-Hugging Heatmaps for Landmark Detection: James McCouat,

Irina Voiculescu; [pdf] [supp]
[bibtex]
@InProceedings{McCouat_2022_CVPR,
    author    = {McCouat, James and Voiculescu, Irina},
    title     = {Contour-Hugging Heatmaps for Landmark Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20597--20605}
}
DisARM: Displacement Aware Relation Module for 3D Detection: Yao Duan,

Chenyang Zhu,

Yuqing Lan,

Renjiao Yi,

Xinwang Liu,

Kai Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Duan_2022_CVPR,
    author    = {Duan, Yao and Zhu, Chenyang and Lan, Yuqing and Yi, Renjiao and Liu, Xinwang and Xu, Kai},
    title     = {{DisARM}: Displacement Aware Relation Module for {3D} Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16980--16989}
}
NeRF-Editing: Geometry Editing of Neural Radiance Fields: Yu-Jie Yuan,

Yang-Tian Sun,

Yu-Kun Lai,

Yuewen Ma,

Rongfei Jia,

Lin Gao; [pdf] [supp]
[bibtex]
@InProceedings{Yuan_2022_CVPR,
    author    = {Yuan, Yu-Jie and Sun, Yang-Tian and Lai, Yu-Kun and Ma, Yuewen and Jia, Rongfei and Gao, Lin},
    title     = {{NeRF-Editing}: Geometry Editing of Neural Radiance Fields},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18353--18364}
}
Optimal Correction Cost for Object Detection Evaluation: Mayu Otani,

Riku Togashi,

Yuta Nakashima,

Esa Rahtu,

Janne Heikkilä,

Shin'ichi Satoh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Otani_2022_CVPR,
    author    = {Otani, Mayu and Togashi, Riku and Nakashima, Yuta and Rahtu, Esa and Heikkil{\"a}, Janne and Satoh, Shin'ichi},
    title     = {Optimal Correction Cost for Object Detection Evaluation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21107--21115}
}
Artistic Style Discovery With Independent Components: Xin Xie,

Yi Li,

Huaibo Huang,

Haiyan Fu,

Wanwan Wang,

Yanqing Guo; [pdf]
[bibtex]
@InProceedings{Xie_2022_CVPR,
    author    = {Xie, Xin and Li, Yi and Huang, Huaibo and Fu, Haiyan and Wang, Wanwan and Guo, Yanqing},
    title     = {Artistic Style Discovery With Independent Components},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19870--19879}
}
HyperStyle: StyleGAN Inversion With HyperNetworks for Real Image Editing: Yuval Alaluf,

Omer Tov,

Ron Mokady,

Rinon Gal,

Amit Bermano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alaluf_2022_CVPR,
    author    = {Alaluf, Yuval and Tov, Omer and Mokady, Ron and Gal, Rinon and Bermano, Amit},
    title     = {{HyperStyle}: {StyleGAN} Inversion With {HyperNetworks} for Real Image Editing},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18511--18521}
}
LTP: Lane-Based Trajectory Prediction for Autonomous Driving: Jingke Wang,

Tengju Ye,

Ziqing Gu,

Junbo Chen; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2022_CVPR,
    author    = {Wang, Jingke and Ye, Tengju and Gu, Ziqing and Chen, Junbo},
    title     = {{LTP}: Lane-Based Trajectory Prediction for Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17134--17142}
}
AP-BSN: Self-Supervised Denoising for Real-World Images via Asymmetric PD and Blind-Spot Network: Wooseok Lee,

Sanghyun Son,

Kyoung Mu Lee; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2022_CVPR,
    author    = {Lee, Wooseok and Son, Sanghyun and Lee, Kyoung Mu},
    title     = {{AP-BSN}: Self-Supervised Denoising for Real-World Images via Asymmetric {PD} and Blind-Spot Network},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17725--17734}
}
Not All Points Are Equal: Learning Highly Efficient Point-Based Detectors for 3D LiDAR Point Clouds: Yifan Zhang,

Qingyong Hu,

Guoquan Xu,

Yanxin Ma,

Jianwei Wan,

Yulan Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
    author    = {Zhang, Yifan and Hu, Qingyong and Xu, Guoquan and Ma, Yanxin and Wan, Jianwei and Guo, Yulan},
    title     = {Not All Points Are Equal: Learning Highly Efficient Point-Based Detectors for {3D} {LiDAR} Point Clouds},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18953--18962}
}
RigNeRF: Fully Controllable Neural 3D Portraits: ShahRukh Athar,

Zexiang Xu,

Kalyan Sunkavalli,

Eli Shechtman,

Zhixin Shu; [pdf]
[bibtex]
@InProceedings{Athar_2022_CVPR,
    author    = {Athar, ShahRukh and Xu, Zexiang and Sunkavalli, Kalyan and Shechtman, Eli and Shu, Zhixin},
    title     = {{RigNeRF}: Fully Controllable Neural {3D} Portraits},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20364--20373}
}
CLIP-Forge: Towards Zero-Shot Text-To-Shape Generation: Aditya Sanghi,

Hang Chu,

Joseph G. Lambourne,

Ye Wang,

Chin-Yi Cheng,

Marco Fumero,

Kamal Rahimi Malekshan; [pdf] [supp]
[bibtex]
@InProceedings{Sanghi_2022_CVPR,
    author    = {Sanghi, Aditya and Chu, Hang and Lambourne, Joseph G. and Wang, Ye and Cheng, Chin-Yi and Fumero, Marco and Malekshan, Kamal Rahimi},
    title     = {{CLIP-Forge}: Towards Zero-Shot Text-To-Shape Generation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18603--18613}
}
Instance-Dependent Label-Noise Learning With Manifold-Regularized Transition Matrix Estimation: De Cheng,

Tongliang Liu,

Yixiong Ning,

Nannan Wang,

Bo Han,

Gang Niu,

Xinbo Gao,

Masashi Sugiyama; [pdf]
[bibtex]
@InProceedings{Cheng_2022_CVPR,
    author    = {Cheng, De and Liu, Tongliang and Ning, Yixiong and Wang, Nannan and Han, Bo and Niu, Gang and Gao, Xinbo and Sugiyama, Masashi},
    title     = {Instance-Dependent Label-Noise Learning With Manifold-Regularized Transition Matrix Estimation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16630--16639}
}
Rethinking the Augmentation Module in Contrastive Learning: Learning Hierarchical Augmentation Invariance With Expanded Views: Junbo Zhang,

Kaisheng Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
    author    = {Zhang, Junbo and Ma, Kaisheng},
    title     = {Rethinking the Augmentation Module in Contrastive Learning: Learning Hierarchical Augmentation Invariance With Expanded Views},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16650--16659}
}
Equivariant Point Cloud Analysis via Learning Orientations for Message Passing: Shitong Luo,

Jiahan Li,

Jiaqi Guan,

Yufeng Su,

Chaoran Cheng,

Jian Peng,

Jianzhu Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2022_CVPR,
    author    = {Luo, Shitong and Li, Jiahan and Guan, Jiaqi and Su, Yufeng and Cheng, Chaoran and Peng, Jian and Ma, Jianzhu},
    title     = {Equivariant Point Cloud Analysis via Learning Orientations for Message Passing},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18932--18941}
}
Node Representation Learning in Graph via Node-to-Neighbourhood Mutual Information Maximization: Wei Dong,

Junsheng Wu,

Yi Luo,

Zongyuan Ge,

Peng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2022_CVPR,
    author    = {Dong, Wei and Wu, Junsheng and Luo, Yi and Ge, Zongyuan and Wang, Peng},
    title     = {Node Representation Learning in Graph via Node-to-Neighbourhood Mutual Information Maximization},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16620--16629}
}
Point Cloud Pre-Training With Natural 3D Structures: Ryosuke Yamada,

Hirokatsu Kataoka,

Naoya Chiba,

Yukiyasu Domae,

Tetsuya Ogata; [pdf] [supp]
[bibtex]
@InProceedings{Yamada_2022_CVPR,
    author    = {Yamada, Ryosuke and Kataoka, Hirokatsu and Chiba, Naoya and Domae, Yukiyasu and Ogata, Tetsuya},
    title     = {Point Cloud Pre-Training With Natural {3D} Structures},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21283--21293}
}
StyleT2I: Toward Compositional and High-Fidelity Text-to-Image Synthesis: Zhiheng Li,

Martin Renqiang Min,

Kai Li,

Chenliang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
    author    = {Li, Zhiheng and Min, Martin Renqiang and Li, Kai and Xu, Chenliang},
    title     = {{StyleT2I}: Toward Compositional and High-Fidelity Text-to-Image Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18197--18207}
}
V-Doc: Visual Questions Answers With Documents: Yihao Ding,

Zhe Huang,

Runlin Wang,

YanHang Zhang,

Xianru Chen,

Yuzhong Ma,

Hyunsuk Chung,

Soyeon Caren Han; [pdf]
[bibtex]
@InProceedings{Ding_2022_CVPR,
    author    = {Ding, Yihao and Huang, Zhe and Wang, Runlin and Zhang, YanHang and Chen, Xianru and Ma, Yuzhong and Chung, Hyunsuk and Han, Soyeon Caren},
    title     = {{V-Doc}: Visual Questions Answers With Documents},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21492--21498}
}
Uncertainty-Guided Probabilistic Transformer for Complex Action Recognition: Hongji Guo,

Hanjing Wang,

Qiang Ji; [pdf]
[bibtex]
@InProceedings{Guo_2022_CVPR,
    author    = {Guo, Hongji and Wang, Hanjing and Ji, Qiang},
    title     = {Uncertainty-Guided Probabilistic Transformer for Complex Action Recognition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20052--20061}
}
V2C: Visual Voice Cloning: Qi Chen,

Mingkui Tan,

Yuankai Qi,

Jiaqiu Zhou,

Yuanqing Li,

Qi Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
    author    = {Chen, Qi and Tan, Mingkui and Qi, Yuankai and Zhou, Jiaqiu and Li, Yuanqing and Wu, Qi},
    title     = {{V2C}: Visual Voice Cloning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21242--21251}
}
EvUnroll: Neuromorphic Events Based Rolling Shutter Image Correction: Xinyu Zhou,

Peiqi Duan,

Yi Ma,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
    author    = {Zhou, Xinyu and Duan, Peiqi and Ma, Yi and Shi, Boxin},
    title     = {{EvUnroll}: Neuromorphic Events Based Rolling Shutter Image Correction},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17775--17784}
}
Gait Recognition in the Wild With Dense 3D Representations and a Benchmark: Jinkai Zheng,

Xinchen Liu,

Wu Liu,

Lingxiao He,

Chenggang Yan,

Tao Mei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2022_CVPR,
    author    = {Zheng, Jinkai and Liu, Xinchen and Liu, Wu and He, Lingxiao and Yan, Chenggang and Mei, Tao},
    title     = {Gait Recognition in the Wild With Dense {3D} Representations and a Benchmark},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20228--20237}
}
Temporal Context Matters: Enhancing Single Image Prediction With Disease Progression Representations: Aishik Konwer,

Xuan Xu,

Joseph Bae,

Chao Chen,

Prateek Prasanna; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Konwer_2022_CVPR,
    author    = {Konwer, Aishik and Xu, Xuan and Bae, Joseph and Chen, Chao and Prasanna, Prateek},
    title     = {Temporal Context Matters: Enhancing Single Image Prediction With Disease Progression Representations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18824--18835}
}
Learning From All Vehicles: Dian Chen,

Philipp Krähenbühl; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2022_CVPR,
    author    = {Chen, Dian and Kr{\"a}henb{\"u}hl, Philipp},
    title     = {Learning From All Vehicles},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17222--17231}
}
Towards Driving-Oriented Metric for Lane Detection Models: Takami Sato,

Qi Alfred Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sato_2022_CVPR,
    author    = {Sato, Takami and Chen, Qi Alfred},
    title     = {Towards Driving-Oriented Metric for Lane Detection Models},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17153--17162}
}
XYDeblur: Divide and Conquer for Single Image Deblurring: Seo-Won Ji,

Jeongmin Lee,

Seung-Wook Kim,

Jun-Pyo Hong,

Seung-Jin Baek,

Seung-Won Jung,

Sung-Jea Ko; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2022_CVPR,
    author    = {Ji, Seo-Won and Lee, Jeongmin and Kim, Seung-Wook and Hong, Jun-Pyo and Baek, Seung-Jin and Jung, Seung-Won and Ko, Sung-Jea},
    title     = {{XYDeblur}: Divide and Conquer for Single Image Deblurring},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17421--17430}
}
STCrowd: A Multimodal Dataset for Pedestrian Perception in Crowded Scenes: Peishan Cong,

Xinge Zhu,

Feng Qiao,

Yiming Ren,

Xidong Peng,

Yuenan Hou,

Lan Xu,

Ruigang Yang,

Dinesh Manocha,

Yuexin Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cong_2022_CVPR,
    author    = {Cong, Peishan and Zhu, Xinge and Qiao, Feng and Ren, Yiming and Peng, Xidong and Hou, Yuenan and Xu, Lan and Yang, Ruigang and Manocha, Dinesh and Ma, Yuexin},
    title     = {{STCrowd}: A Multimodal Dataset for Pedestrian Perception in Crowded Scenes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19608--19617}
}
Deep Decomposition for Stochastic Normal-Abnormal Transport: Peirong Liu,

Yueh Lee,

Stephen Aylward,

Marc Niethammer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
    author    = {Liu, Peirong and Lee, Yueh and Aylward, Stephen and Niethammer, Marc},
    title     = {Deep Decomposition for Stochastic Normal-Abnormal Transport},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18791--18801}
}
Multimodal Material Segmentation: Yupeng Liang,

Ryosuke Wakaki,

Shohei Nobuhara,

Ko Nishino; [pdf] [supp]
[bibtex]
@InProceedings{Liang_2022_CVPR,
    author    = {Liang, Yupeng and Wakaki, Ryosuke and Nobuhara, Shohei and Nishino, Ko},
    title     = {Multimodal Material Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19800--19808}
}
DynamicEarthNet: Daily Multi-Spectral Satellite Dataset for Semantic Change Segmentation: Aysim Toker,

Lukas Kondmann,

Mark Weber,

Marvin Eisenberger,

Andrés Camero,

Jingliang Hu,

Ariadna Pregel Hoderlein,

Çağlar Şenaras,

Timothy Davis,

Daniel Cremers,

Giovanni Marchisio,

Xiao Xiang Zhu,

Laura Leal-Taixé; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Toker_2022_CVPR,
    author    = {Toker, Aysim and Kondmann, Lukas and Weber, Mark and Eisenberger, Marvin and Camero, Andr{\'e}s and Hu, Jingliang and Hoderlein, Ariadna Pregel and {\c{S}}enaras, {\c{C}}a{\u{g}}lar and Davis, Timothy and Cremers, Daniel and Marchisio, Giovanni and Zhu, Xiao Xiang and Leal-Taix{\'e}, Laura},
    title     = {{DynamicEarthNet}: Daily Multi-Spectral Satellite Dataset for Semantic Change Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21158--21167}
}
Quantization-Aware Deep Optics for Diffractive Snapshot Hyperspectral Imaging: Lingen Li,

Lizhi Wang,

Weitao Song,

Lei Zhang,

Zhiwei Xiong,

Hua Huang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
    author    = {Li, Lingen and Wang, Lizhi and Song, Weitao and Zhang, Lei and Xiong, Zhiwei and Huang, Hua},
    title     = {Quantization-Aware Deep Optics for Diffractive Snapshot Hyperspectral Imaging},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19780--19789}
}
Improving Video Model Transfer With Dynamic Representation Learning: Yi Li,

Nuno Vasconcelos; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
    author    = {Li, Yi and Vasconcelos, Nuno},
    title     = {Improving Video Model Transfer With Dynamic Representation Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19280--19291}
}
PIE-Net: Photometric Invariant Edge Guided Network for Intrinsic Image Decomposition: Partha Das,

Sezer Karaoglu,

Theo Gevers; [pdf] [supp]
[bibtex]
@InProceedings{Das_2022_CVPR,
    author    = {Das, Partha and Karaoglu, Sezer and Gevers, Theo},
    title     = {{PIE-Net}: Photometric Invariant Edge Guided Network for Intrinsic Image Decomposition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19790--19799}
}
QS-Attn: Query-Selected Attention for Contrastive Learning in I2I Translation: Xueqi Hu,

Xinyue Zhou,

Qiusheng Huang,

Zhengyi Shi,

Li Sun,

Qingli Li; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2022_CVPR,
    author    = {Hu, Xueqi and Zhou, Xinyue and Huang, Qiusheng and Shi, Zhengyi and Sun, Li and Li, Qingli},
    title     = {{QS-Attn}: Query-Selected Attention for Contrastive Learning in {I2I} Translation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18291--18300}
}
Adaptive Gating for Single-Photon 3D Imaging: Ryan Po,

Adithya Pediredla,

Ioannis Gkioulekas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Po_2022_CVPR,
    author    = {Po, Ryan and Pediredla, Adithya and Gkioulekas, Ioannis},
    title     = {Adaptive Gating for Single-Photon {3D} Imaging},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16354--16363}
}
H4D: Human 4D Modeling by Learning Neural Compositional Representation: Boyan Jiang,

Yinda Zhang,

Xingkui Wei,

Xiangyang Xue,

Yanwei Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2022_CVPR,
    author    = {Jiang, Boyan and Zhang, Yinda and Wei, Xingkui and Xue, Xiangyang and Fu, Yanwei},
    title     = {{H4D}: Human {4D} Modeling by Learning Neural Compositional Representation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19355--19365}
}
Cannot See the Forest for the Trees: Aggregating Multiple Viewpoints To Better Classify Objects in Videos: Sukjun Hwang,

Miran Heo,

Seoung Wug Oh,

Seon Joo Kim; [pdf] [supp]
[bibtex]
@InProceedings{Hwang_2022_CVPR,
    author    = {Hwang, Sukjun and Heo, Miran and Oh, Seoung Wug and Kim, Seon Joo},
    title     = {Cannot See the Forest for the Trees: Aggregating Multiple Viewpoints To Better Classify Objects in Videos},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17052--17061}
}
Learning Canonical F-Correlation Projection for Compact Multiview Representation: Yun-Hao Yuan,

Jin Li,

Yun Li,

Jipeng Qiang,

Yi Zhu,

Xiaobo Shen,

Jianping Gou; [pdf] [supp]
[bibtex]
@InProceedings{Yuan_2022_CVPR,
    author    = {Yuan, Yun-Hao and Li, Jin and Li, Yun and Qiang, Jipeng and Zhu, Yi and Shen, Xiaobo and Gou, Jianping},
    title     = {Learning Canonical {F}-Correlation Projection for Compact Multiview Representation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19260--19269}
}
DIFNet: Boosting Visual Information Flow for Image Captioning: Mingrui Wu,

Xuying Zhang,

Xiaoshuai Sun,

Yiyi Zhou,

Chao Chen,

Jiaxin Gu,

Xing Sun,

Rongrong Ji; [pdf]
[bibtex]
@InProceedings{Wu_2022_CVPR,
    author    = {Wu, Mingrui and Zhang, Xuying and Sun, Xiaoshuai and Zhou, Yiyi and Chen, Chao and Gu, Jiaxin and Sun, Xing and Ji, Rongrong},
    title     = {{DIFNet}: Boosting Visual Information Flow for Image Captioning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18020--18029}
}
Tree Energy Loss: Towards Sparsely Annotated Semantic Segmentation: Zhiyuan Liang,

Tiancai Wang,

Xiangyu Zhang,

Jian Sun,

Jianbing Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2022_CVPR,
    author    = {Liang, Zhiyuan and Wang, Tiancai and Zhang, Xiangyu and Sun, Jian and Shen, Jianbing},
    title     = {Tree Energy Loss: Towards Sparsely Annotated Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16907--16916}
}
Grounding Answers for Visual Questions Asked by Visually Impaired People: Chongyan Chen,

Samreen Anjum,

Danna Gurari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
    author    = {Chen, Chongyan and Anjum, Samreen and Gurari, Danna},
    title     = {Grounding Answers for Visual Questions Asked by Visually Impaired People},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19098--19107}
}
Automatic Color Image Stitching Using Quaternion Rank-1 Alignment: Jiaxue Li,

Yicong Zhou; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
    author    = {Li, Jiaxue and Zhou, Yicong},
    title     = {Automatic Color Image Stitching Using Quaternion Rank-1 Alignment},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19720--19729}
}
VisualGPT: Data-Efficient Adaptation of Pretrained Language Models for Image Captioning: Jun Chen,

Han Guo,

Kai Yi,

Boyang Li,

Mohamed Elhoseiny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Jun and Guo, Han and Yi, Kai and Li, Boyang and Elhoseiny, Mohamed},
  title     = {{VisualGPT}: Data-Efficient Adaptation of Pretrained Language Models for Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18030--18040},
}
All-Photon Polarimetric Time-of-Flight Imaging: Seung-Hwan Baek,

Felix Heide; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Baek_2022_CVPR,
  author    = {Baek, Seung-Hwan and Heide, Felix},
  title     = {All-Photon Polarimetric Time-of-Flight Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17876--17885},
}
Towards Implicit Text-Guided 3D Shape Generation: Zhengzhe Liu,

Yi Wang,

Xiaojuan Qi,

Chi-Wing Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Zhengzhe and Wang, Yi and Qi, Xiaojuan and Fu, Chi-Wing},
  title     = {Towards Implicit Text-Guided {3D} Shape Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17896--17906},
}
A Versatile Multi-View Framework for LiDAR-Based 3D Object Detection With Guidance From Panoptic Segmentation: Hamidreza Fazlali,

Yixuan Xu,

Yuan Ren,

Bingbing Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fazlali_2022_CVPR,
  author    = {Fazlali, Hamidreza and Xu, Yixuan and Ren, Yuan and Liu, Bingbing},
  title     = {A Versatile Multi-View Framework for {LiDAR}-Based {3D} Object Detection With Guidance From Panoptic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17192--17201},
}
RFNet: Unsupervised Network for Mutually Reinforcing Multi-Modal Image Registration and Fusion: Han Xu,

Jiayi Ma,

Jiteng Yuan,

Zhuliang Le,

Wei Liu; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Han and Ma, Jiayi and Yuan, Jiteng and Le, Zhuliang and Liu, Wei},
  title     = {{RFNet}: Unsupervised Network for Mutually Reinforcing Multi-Modal Image Registration and Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19679--19688},
}
CellTypeGraph: A New Geometric Computer Vision Benchmark: Lorenzo Cerrone,

Athul Vijayan,

Tejasvinee Mody,

Kay Schneitz,

Fred A. Hamprecht; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cerrone_2022_CVPR,
  author    = {Cerrone, Lorenzo and Vijayan, Athul and Mody, Tejasvinee and Schneitz, Kay and Hamprecht, Fred A.},
  title     = {{CellTypeGraph}: A New Geometric Computer Vision Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20897--20907},
}
Clustering Plotted Data by Image Segmentation: Tarek Naous,

Srinjay Sarkar,

Abubakar Abid,

James Zou; [pdf] [arXiv]
[bibtex]
@InProceedings{Naous_2022_CVPR,
  author    = {Naous, Tarek and Sarkar, Srinjay and Abid, Abubakar and Zou, James},
  title     = {Clustering Plotted Data by Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21499--21504},
}
Animal Kingdom: A Large and Diverse Dataset for Animal Behavior Understanding: Xun Long Ng,

Kian Eng Ong,

Qichen Zheng,

Yun Ni,

Si Yong Yeo,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ng_2022_CVPR,
  author    = {Ng, Xun Long and Ong, Kian Eng and Zheng, Qichen and Ni, Yun and Yeo, Si Yong and Liu, Jun},
  title     = {{Animal Kingdom}: A Large and Diverse Dataset for Animal Behavior Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19023--19034},
}
EI-CLIP: Entity-Aware Interventional Contrastive Learning for E-Commerce Cross-Modal Retrieval: Haoyu Ma,

Handong Zhao,

Zhe Lin,

Ajinkya Kale,

Zhangyang Wang,

Tong Yu,

Jiuxiang Gu,

Sunav Choudhary,

Xiaohui Xie; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2022_CVPR,
  author    = {Ma, Haoyu and Zhao, Handong and Lin, Zhe and Kale, Ajinkya and Wang, Zhangyang and Yu, Tong and Gu, Jiuxiang and Choudhary, Sunav and Xie, Xiaohui},
  title     = {{EI-CLIP}: Entity-Aware Interventional Contrastive Learning for E-Commerce Cross-Modal Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18051--18061},
}
Multi-Dimensional, Nuanced and Subjective - Measuring the Perception of Facial Expressions: De'Aira Bryant,

Siqi Deng,

Nashlie Sephus,

Wei Xia,

Pietro Perona; [pdf] [supp]
[bibtex]
@InProceedings{Bryant_2022_CVPR,
  author    = {Bryant, De'Aira and Deng, Siqi and Sephus, Nashlie and Xia, Wei and Perona, Pietro},
  title     = {Multi-Dimensional, Nuanced and Subjective - Measuring the Perception of Facial Expressions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20932--20941},
}
PyMiceTracking: An Open-Source Toolbox for Real-Time Behavioral Neuroscience Experiments: Richardson Menezes,

Aron de Miranda,

Helton Maia; [pdf]
[bibtex]
@InProceedings{Menezes_2022_CVPR,
  author    = {Menezes, Richardson and de Miranda, Aron and Maia, Helton},
  title     = {{PyMiceTracking}: An Open-Source Toolbox for Real-Time Behavioral Neuroscience Experiments},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21459--21465},
}
Fine-Grained Temporal Contrastive Learning for Weakly-Supervised Temporal Action Localization: Junyu Gao,

Mengyuan Chen,

Changsheng Xu; [pdf] [arXiv]
[bibtex]
@InProceedings{Gao_2022_CVPR,
  author    = {Gao, Junyu and Chen, Mengyuan and Xu, Changsheng},
  title     = {Fine-Grained Temporal Contrastive Learning for Weakly-Supervised Temporal Action Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19999--20009},
}
UTC: A Unified Transformer With Inter-Task Contrastive Learning for Visual Dialog: Cheng Chen,

Zhenshan Tan,

Qingrong Cheng,

Xin Jiang,

Qun Liu,

Yudong Zhu,

Xiaodong Gu; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Cheng and Tan, Zhenshan and Cheng, Qingrong and Jiang, Xin and Liu, Qun and Zhu, Yudong and Gu, Xiaodong},
  title     = {{UTC}: A Unified Transformer With Inter-Task Contrastive Learning for Visual Dialog},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18103--18112},
}
Mimicking the Oracle: An Initial Phase Decorrelation Approach for Class Incremental Learning: Yujun Shi,

Kuangqi Zhou,

Jian Liang,

Zihang Jiang,

Jiashi Feng,

Philip H.S. Torr,

Song Bai,

Vincent Y. F. Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Yujun and Zhou, Kuangqi and Liang, Jian and Jiang, Zihang and Feng, Jiashi and Torr, Philip H. S. and Bai, Song and Tan, Vincent Y. F.},
  title     = {Mimicking the Oracle: An Initial Phase Decorrelation Approach for Class Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16722--16731},
}
RIDDLE: Lidar Data Compression With Range Image Deep Delta Encoding: Xuanyu Zhou,

Charles R. Qi,

Yin Zhou,

Dragomir Anguelov; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Xuanyu and Qi, Charles R. and Zhou, Yin and Anguelov, Dragomir},
  title     = {{RIDDLE}: Lidar Data Compression With Range Image Deep Delta Encoding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17212--17221},
}
RelTransformer: A Transformer-Based Long-Tail Visual Relationship Recognition: Jun Chen,

Aniket Agarwal,

Sherif Abdelkarim,

Deyao Zhu,

Mohamed Elhoseiny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Jun and Agarwal, Aniket and Abdelkarim, Sherif and Zhu, Deyao and Elhoseiny, Mohamed},
  title     = {{RelTransformer}: A Transformer-Based Long-Tail Visual Relationship Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19507--19517},
}
RigidFlow: Self-Supervised Scene Flow Learning on Point Clouds by Local Rigidity Prior: Ruibo Li,

Chi Zhang,

Guosheng Lin,

Zhe Wang,

Chunhua Shen; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Ruibo and Zhang, Chi and Lin, Guosheng and Wang, Zhe and Shen, Chunhua},
  title     = {{RigidFlow}: Self-Supervised Scene Flow Learning on Point Clouds by Local Rigidity Prior},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16959--16968},
}
Personalized Image Aesthetics Assessment With Rich Attributes: Yuzhe Yang,

Liwu Xu,

Leida Li,

Nan Qie,

Yaqian Li,

Peng Zhang,

Yandong Guo; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Yuzhe and Xu, Liwu and Li, Leida and Qie, Nan and Li, Yaqian and Zhang, Peng and Guo, Yandong},
  title     = {Personalized Image Aesthetics Assessment With Rich Attributes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19861--19869},
}
HDNet: High-Resolution Dual-Domain Learning for Spectral Compressive Imaging: Xiaowan Hu,

Yuanhao Cai,

Jing Lin,

Haoqian Wang,

Xin Yuan,

Yulun Zhang,

Radu Timofte,

Luc Van Gool; [pdf] [arXiv]
[bibtex]
@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Xiaowan and Cai, Yuanhao and Lin, Jing and Wang, Haoqian and Yuan, Xin and Zhang, Yulun and Timofte, Radu and Van Gool, Luc},
  title     = {{HDNet}: High-Resolution Dual-Domain Learning for Spectral Compressive Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17542--17551},
}
Amodal Panoptic Segmentation: Rohit Mohan,

Abhinav Valada; [pdf] [supp]
[bibtex]
@InProceedings{Mohan_2022_CVPR,
  author    = {Mohan, Rohit and Valada, Abhinav},
  title     = {Amodal Panoptic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21023--21032},
}
Gravitationally Lensed Black Hole Emission Tomography: Aviad Levis,

Pratul P. Srinivasan,

Andrew A. Chael,

Ren Ng,

Katherine L. Bouman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Levis_2022_CVPR,
  author    = {Levis, Aviad and Srinivasan, Pratul P. and Chael, Andrew A. and Ng, Ren and Bouman, Katherine L.},
  title     = {Gravitationally Lensed Black Hole Emission Tomography},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19841--19850},
}
3D-Aware Image Synthesis via Learning Structural and Textural Representations: Yinghao Xu,

Sida Peng,

Ceyuan Yang,

Yujun Shen,

Bolei Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Yinghao and Peng, Sida and Yang, Ceyuan and Shen, Yujun and Zhou, Bolei},
  title     = {{3D}-Aware Image Synthesis via Learning Structural and Textural Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18430--18439},
}
Text-to-Image Synthesis Based on Object-Guided Joint-Decoding Transformer: Fuxiang Wu,

Liu Liu,

Fusheng Hao,

Fengxiang He,

Jun Cheng; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2022_CVPR,
  author    = {Wu, Fuxiang and Liu, Liu and Hao, Fusheng and He, Fengxiang and Cheng, Jun},
  title     = {Text-to-Image Synthesis Based on Object-Guided Joint-Decoding Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18113--18122},
}
Unsupervised Vision-and-Language Pre-Training via Retrieval-Based Multi-Granular Alignment: Mingyang Zhou,

Licheng Yu,

Amanpreet Singh,

Mengjiao Wang,

Zhou Yu,

Ning Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Mingyang and Yu, Licheng and Singh, Amanpreet and Wang, Mengjiao and Yu, Zhou and Zhang, Ning},
  title     = {Unsupervised Vision-and-Language Pre-Training via Retrieval-Based Multi-Granular Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16485--16494},
}
PONI: Potential Functions for ObjectGoal Navigation With Interaction-Free Learning: Santhosh Kumar Ramakrishnan,

Devendra Singh Chaplot,

Ziad Al-Halah,

Jitendra Malik,

Kristen Grauman; [pdf] [supp]
[bibtex]
@InProceedings{Ramakrishnan_2022_CVPR,
  author    = {Ramakrishnan, Santhosh Kumar and Chaplot, Devendra Singh and Al-Halah, Ziad and Malik, Jitendra and Grauman, Kristen},
  title     = {{PONI}: Potential Functions for {ObjectGoal} Navigation With Interaction-Free Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18890--18900},
}
Exploring Structure-Aware Transformer Over Interaction Proposals for Human-Object Interaction Detection: Yong Zhang,

Yingwei Pan,

Ting Yao,

Rui Huang,

Tao Mei,

Chang-Wen Chen; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Yong and Pan, Yingwei and Yao, Ting and Huang, Rui and Mei, Tao and Chen, Chang-Wen},
  title     = {Exploring Structure-Aware Transformer Over Interaction Proposals for Human-Object Interaction Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19548--19557},
}
Glass: Geometric Latent Augmentation for Shape Spaces: Sanjeev Muralikrishnan,

Siddhartha Chaudhuri,

Noam Aigerman,

Vladimir G. Kim,

Matthew Fisher,

Niloy J. Mitra; [pdf] [arXiv]
[bibtex]
@InProceedings{Muralikrishnan_2022_CVPR,
  author    = {Muralikrishnan, Sanjeev and Chaudhuri, Siddhartha and Aigerman, Noam and Kim, Vladimir G. and Fisher, Matthew and Mitra, Niloy J.},
  title     = {Glass: Geometric Latent Augmentation for Shape Spaces},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18552--18561},
}
Evading the Simplicity Bias: Training a Diverse Set of Models Discovers Solutions With Superior OOD Generalization: Damien Teney,

Ehsan Abbasnejad,

Simon Lucey,

Anton van den Hengel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Teney_2022_CVPR,
  author    = {Teney, Damien and Abbasnejad, Ehsan and Lucey, Simon and van den Hengel, Anton},
  title     = {Evading the Simplicity Bias: Training a Diverse Set of Models Discovers Solutions With Superior {OOD} Generalization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16761--16772},
}
Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities: Fadime Sener,

Dibyadip Chatterjee,

Daniel Shelepov,

Kun He,

Dipika Singhania,

Robert Wang,

Angela Yao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sener_2022_CVPR,
  author    = {Sener, Fadime and Chatterjee, Dibyadip and Shelepov, Daniel and He, Kun and Singhania, Dipika and Wang, Robert and Yao, Angela},
  title     = {Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21096--21106},
}
DPICT: Deep Progressive Image Compression Using Trit-Planes: Jae-Han Lee,

Seungmin Jeon,

Kwang Pyo Choi,

Youngo Park,

Chang-Su Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Jae-Han and Jeon, Seungmin and Choi, Kwang Pyo and Park, Youngo and Kim, Chang-Su},
  title     = {{DPICT}: Deep Progressive Image Compression Using Trit-Planes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16113--16122},
}
Text to Image Generation With Semantic-Spatial Aware GAN: Wentong Liao,

Kai Hu,

Michael Ying Yang,

Bodo Rosenhahn; [pdf] [arXiv]
[bibtex]
@InProceedings{Liao_2022_CVPR,
  author    = {Liao, Wentong and Hu, Kai and Yang, Michael Ying and Rosenhahn, Bodo},
  title     = {Text to Image Generation With Semantic-Spatial Aware {GAN}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18187--18196},
}
PixMix: Dreamlike Pictures Comprehensively Improve Safety Measures: Dan Hendrycks,

Andy Zou,

Mantas Mazeika,

Leonard Tang,

Bo Li,

Dawn Song,

Jacob Steinhardt; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hendrycks_2022_CVPR,
  author    = {Hendrycks, Dan and Zou, Andy and Mazeika, Mantas and Tang, Leonard and Li, Bo and Song, Dawn and Steinhardt, Jacob},
  title     = {{PixMix}: Dreamlike Pictures Comprehensively Improve Safety Measures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16783--16792},
}
Generalizable Cross-Modality Medical Image Segmentation via Style Augmentation and Dual Normalization: Ziqi Zhou,

Lei Qi,

Xin Yang,

Dong Ni,

Yinghuan Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Ziqi and Qi, Lei and Yang, Xin and Ni, Dong and Shi, Yinghuan},
  title     = {Generalizable Cross-Modality Medical Image Segmentation via Style Augmentation and Dual Normalization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20856--20865},
}
TimeReplayer: Unlocking the Potential of Event Cameras for Video Interpolation: Weihua He,

Kaichao You,

Zhendong Qiao,

Xu Jia,

Ziyang Zhang,

Wenhui Wang,

Huchuan Lu,

Yaoyuan Wang,

Jianxing Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2022_CVPR,
  author    = {He, Weihua and You, Kaichao and Qiao, Zhendong and Jia, Xu and Zhang, Ziyang and Wang, Wenhui and Lu, Huchuan and Wang, Yaoyuan and Liao, Jianxing},
  title     = {{TimeReplayer}: Unlocking the Potential of Event Cameras for Video Interpolation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17804--17813},
}
Interactive Segmentation and Visualization for Tiny Objects in Multi-Megapixel Images: Chengyuan Xu,

Boning Dong,

Noah Stier,

Curtis McCully,

D. Andrew Howell,

Pradeep Sen,

Tobias Höllerer; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Chengyuan and Dong, Boning and Stier, Noah and McCully, Curtis and Howell, D. Andrew and Sen, Pradeep and H{\"o}llerer, Tobias},
  title     = {Interactive Segmentation and Visualization for Tiny Objects in Multi-Megapixel Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21447--21452},
}
Scaling Vision Transformers to Gigapixel Images via Hierarchical Self-Supervised Learning: Richard J. Chen,

Chengkuan Chen,

Yicong Li,

Tiffany Y. Chen,

Andrew D. Trister,

Rahul G. Krishnan,

Faisal Mahmood; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Richard J. and Chen, Chengkuan and Li, Yicong and Chen, Tiffany Y. and Trister, Andrew D. and Krishnan, Rahul G. and Mahmood, Faisal},
  title     = {Scaling Vision Transformers to Gigapixel Images via Hierarchical Self-Supervised Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16144--16155},
}
Neural Reflectance for Shape Recovery With Shadow Handling: Junxuan Li,

Hongdong Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Junxuan and Li, Hongdong},
  title     = {Neural Reflectance for Shape Recovery With Shadow Handling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16221--16230},
}
Surface Representation for Point Clouds: Haoxi Ran,

Jun Liu,

Chengjie Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ran_2022_CVPR,
  author    = {Ran, Haoxi and Liu, Jun and Wang, Chengjie},
  title     = {Surface Representation for Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18942--18952},
}
DeepLIIF: An Online Platform for Quantification of Clinical Pathology Slides: Parmida Ghahremani,

Joseph Marino,

Ricardo Dodds,

Saad Nadeem; [pdf] [arXiv]
[bibtex]
@InProceedings{Ghahremani_2022_CVPR,
  author    = {Ghahremani, Parmida and Marino, Joseph and Dodds, Ricardo and Nadeem, Saad},
  title     = {{DeepLIIF}: An Online Platform for Quantification of Clinical Pathology Slides},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21399--21405},
}
Joint Video Summarization and Moment Localization by Cross-Task Sample Transfer: Hao Jiang,

Yadong Mu; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2022_CVPR,
  author    = {Jiang, Hao and Mu, Yadong},
  title     = {Joint Video Summarization and Moment Localization by Cross-Task Sample Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16388--16398},
}
Optical Flow Estimation for Spiking Camera: Liwen Hu,

Rui Zhao,

Ziluo Ding,

Lei Ma,

Boxin Shi,

Ruiqin Xiong,

Tiejun Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Liwen and Zhao, Rui and Ding, Ziluo and Ma, Lei and Shi, Boxin and Xiong, Ruiqin and Huang, Tiejun},
  title     = {Optical Flow Estimation for Spiking Camera},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17844--17853},
}
InstaFormer: Instance-Aware Image-to-Image Translation With Transformer: Soohyun Kim,

Jongbeom Baek,

Jihye Park,

Gyeongnyeon Kim,

Seungryong Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Soohyun and Baek, Jongbeom and Park, Jihye and Kim, Gyeongnyeon and Kim, Seungryong},
  title     = {{InstaFormer}: Instance-Aware Image-to-Image Translation With Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18321--18331},
}
3D-VField: Adversarial Augmentation of Point Clouds for Domain Generalization in 3D Object Detection: Alexander Lehner,

Stefano Gasperini,

Alvaro Marcos-Ramiro,

Michael Schmidt,

Mohammad-Ali Nikouei Mahani,

Nassir Navab,

Benjamin Busam,

Federico Tombari; [pdf] [supp]
[bibtex]
@InProceedings{Lehner_2022_CVPR,
  author    = {Lehner, Alexander and Gasperini, Stefano and Marcos-Ramiro, Alvaro and Schmidt, Michael and Mahani, Mohammad-Ali Nikouei and Navab, Nassir and Busam, Benjamin and Tombari, Federico},
  title     = {{3D-VField}: Adversarial Augmentation of Point Clouds for Domain Generalization in {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17295--17304},
}
AutoMine: An Unmanned Mine Dataset: Yuchen Li,

Zixuan Li,

Siyu Teng,

Yu Zhang,

Yuhang Zhou,

Yuchang Zhu,

Dongpu Cao,

Bin Tian,

Yunfeng Ai,

Zhe Xuanyuan,

Long Chen; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Yuchen and Li, Zixuan and Teng, Siyu and Zhang, Yu and Zhou, Yuhang and Zhu, Yuchang and Cao, Dongpu and Tian, Bin and Ai, Yunfeng and Xuanyuan, Zhe and Chen, Long},
  title     = {{AutoMine}: An Unmanned Mine Dataset},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21308--21317},
}
Neural Data-Dependent Transform for Learned Image Compression: Dezhao Wang,

Wenhan Yang,

Yueyu Hu,

Jiaying Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Dezhao and Yang, Wenhan and Hu, Yueyu and Liu, Jiaying},
  title     = {Neural Data-Dependent Transform for Learned Image Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17379--17388},
}
Evaluation-Oriented Knowledge Distillation for Deep Face Recognition: Yuge Huang,

Jiaxiang Wu,

Xingkun Xu,

Shouhong Ding; [pdf]
[bibtex]
@InProceedings{Huang_2022_CVPR,
  author    = {Huang, Yuge and Wu, Jiaxiang and Xu, Xingkun and Ding, Shouhong},
  title     = {Evaluation-Oriented Knowledge Distillation for Deep Face Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18740--18749},
}
Improving Subgraph Recognition With Variational Graph Information Bottleneck: Junchi Yu,

Jie Cao,

Ran He; [pdf] [arXiv]
[bibtex]
@InProceedings{Yu_2022_CVPR,
  author    = {Yu, Junchi and Cao, Jie and He, Ran},
  title     = {Improving Subgraph Recognition With Variational Graph Information Bottleneck},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19396--19405},
}
Synthetic Generation of Face Videos With Plethysmograph Physiology: Zhen Wang,

Yunhao Ba,

Pradyumna Chari,

Oyku Deniz Bozkurt,

Gianna Brown,

Parth Patwa,

Niranjan Vaddi,

Laleh Jalilian,

Achuta Kadambi; [pdf]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhen and Ba, Yunhao and Chari, Pradyumna and Bozkurt, Oyku Deniz and Brown, Gianna and Patwa, Parth and Vaddi, Niranjan and Jalilian, Laleh and Kadambi, Achuta},
  title     = {Synthetic Generation of Face Videos With Plethysmograph Physiology},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20587--20596},
}
TransRAC: Encoding Multi-Scale Temporal Correlation With Transformers for Repetitive Action Counting: Huazhang Hu,

Sixun Dong,

Yiqun Zhao,

Dongze Lian,

Zhengxin Li,

Shenghua Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Huazhang and Dong, Sixun and Zhao, Yiqun and Lian, Dongze and Li, Zhengxin and Gao, Shenghua},
  title     = {{TransRAC}: Encoding Multi-Scale Temporal Correlation With Transformers for Repetitive Action Counting},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19013--19022},
}
AdaInt: Learning Adaptive Intervals for 3D Lookup Tables on Real-Time Image Enhancement: Canqian Yang,

Meiguang Jin,

Xu Jia,

Yi Xu,

Ying Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Canqian and Jin, Meiguang and Jia, Xu and Xu, Yi and Chen, Ying},
  title     = {{AdaInt}: Learning Adaptive Intervals for {3D} Lookup Tables on Real-Time Image Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17522--17531},
}
RegionCLIP: Region-Based Language-Image Pretraining: Yiwu Zhong,

Jianwei Yang,

Pengchuan Zhang,

Chunyuan Li,

Noel Codella,

Liunian Harold Li,

Luowei Zhou,

Xiyang Dai,

Lu Yuan,

Yin Li,

Jianfeng Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhong_2022_CVPR,
  author    = {Zhong, Yiwu and Yang, Jianwei and Zhang, Pengchuan and Li, Chunyuan and Codella, Noel and Li, Liunian Harold and Zhou, Luowei and Dai, Xiyang and Yuan, Lu and Li, Yin and Gao, Jianfeng},
  title     = {{RegionCLIP}: Region-Based Language-Image Pretraining},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16793--16803},
}
Video Frame Interpolation Transformer: Zhihao Shi,

Xiangyu Xu,

Xiaohong Liu,

Jun Chen,

Ming-Hsuan Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Zhihao and Xu, Xiangyu and Liu, Xiaohong and Chen, Jun and Yang, Ming-Hsuan},
  title     = {Video Frame Interpolation Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17482--17491},
}
An Empirical Study of End-to-End Temporal Action Detection: Xiaolong Liu,

Song Bai,

Xiang Bai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Xiaolong and Bai, Song and Bai, Xiang},
  title     = {An Empirical Study of End-to-End Temporal Action Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20010--20019},
}
Brain-Supervised Image Editing: Keith M. Davis III,

Carlos de la Torre-Ortiz,

Tuukka Ruotsalo; [pdf] [supp]
[bibtex]
@InProceedings{Davis_2022_CVPR,
  author    = {Davis, III, Keith M. and de la Torre-Ortiz, Carlos and Ruotsalo, Tuukka},
  title     = {Brain-Supervised Image Editing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18480--18489},
}
3D Shape Variational Autoencoder Latent Disentanglement via Mini-Batch Feature Swapping for Bodies and Faces: Simone Foti,

Bongjin Koo,

Danail Stoyanov,

Matthew J. Clarkson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Foti_2022_CVPR,
  author    = {Foti, Simone and Koo, Bongjin and Stoyanov, Danail and Clarkson, Matthew J.},
  title     = {{3D} Shape Variational Autoencoder Latent Disentanglement via Mini-Batch Feature Swapping for Bodies and Faces},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18730--18739},
}
RestoreFormer: High-Quality Blind Face Restoration From Undegraded Key-Value Pairs: Zhouxia Wang,

Jiawei Zhang,

Runjian Chen,

Wenping Wang,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhouxia and Zhang, Jiawei and Chen, Runjian and Wang, Wenping and Luo, Ping},
  title     = {{RestoreFormer}: High-Quality Blind Face Restoration From Undegraded Key-Value Pairs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17512--17521},
}
Mask-Guided Spectral-Wise Transformer for Efficient Hyperspectral Image Reconstruction: Yuanhao Cai,

Jing Lin,

Xiaowan Hu,

Haoqian Wang,

Xin Yuan,

Yulun Zhang,

Radu Timofte,

Luc Van Gool; [pdf] [arXiv]
[bibtex]
@InProceedings{Cai_2022_CVPR,
  author    = {Cai, Yuanhao and Lin, Jing and Hu, Xiaowan and Wang, Haoqian and Yuan, Xin and Zhang, Yulun and Timofte, Radu and Van Gool, Luc},
  title     = {Mask-Guided Spectral-Wise Transformer for Efficient Hyperspectral Image Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17502--17511},
}
PPDL: Predicate Probability Distribution Based Loss for Unbiased Scene Graph Generation: Wei Li,

Haiwei Zhang,

Qijie Bai,

Guoqing Zhao,

Ning Jiang,

Xiaojie Yuan; [pdf] [supp]
[bibtex]
% NOTE(review): key Li_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Li_2022_CVPR,
    author    = {Li, Wei and Zhang, Haiwei and Bai, Qijie and Zhao, Guoqing and Jiang, Ning and Yuan, Xiaojie},
    title     = {{PPDL}: Predicate Probability Distribution Based Loss for Unbiased Scene Graph Generation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19447--19456},
}
Coupling Vision and Proprioception for Navigation of Legged Robots: Zipeng Fu,

Ashish Kumar,

Ananye Agarwal,

Haozhi Qi,

Jitendra Malik,

Deepak Pathak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2022_CVPR,
    author    = {Fu, Zipeng and Kumar, Ashish and Agarwal, Ananye and Qi, Haozhi and Malik, Jitendra and Pathak, Deepak},
    title     = {Coupling Vision and Proprioception for Navigation of Legged Robots},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17273--17283},
}
Fine-Grained Predicates Learning for Scene Graph Generation: Xinyu Lyu,

Lianli Gao,

Yuyu Guo,

Zhou Zhao,

Hao Huang,

Heng Tao Shen,

Jingkuan Song; [pdf] [arXiv]
[bibtex]
@InProceedings{Lyu_2022_CVPR,
    author    = {Lyu, Xinyu and Gao, Lianli and Guo, Yuyu and Zhao, Zhou and Huang, Hao and Shen, Heng Tao and Song, Jingkuan},
    title     = {Fine-Grained Predicates Learning for Scene Graph Generation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19467--19475},
}
Neural Head Avatars From Monocular RGB Videos: Philip-William Grassal,

Malte Prinzler,

Titus Leistner,

Carsten Rother,

Matthias Nießner,

Justus Thies; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Grassal_2022_CVPR,
    author    = {Grassal, Philip-William and Prinzler, Malte and Leistner, Titus and Rother, Carsten and Nie{\ss}ner, Matthias and Thies, Justus},
    title     = {Neural Head Avatars From Monocular {RGB} Videos},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18653--18664},
}
EMOCA: Emotion Driven Monocular Face Capture and Animation: Radek Daněček,

Michael J. Black,

Timo Bolkart; [pdf] [supp]
[bibtex]
@InProceedings{Danecek_2022_CVPR,
    author    = {Dan{\v{e}}{\v{c}}ek, Radek and Black, Michael J. and Bolkart, Timo},
    title     = {{EMOCA}: Emotion Driven Monocular Face Capture and Animation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20311--20322},
}
Towards Diverse and Natural Scene-Aware 3D Human Motion Synthesis: Jingbo Wang,

Yu Rong,

Jingyuan Liu,

Sijie Yan,

Dahua Lin,

Bo Dai; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Wang_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Wang_2022_CVPR,
    author    = {Wang, Jingbo and Rong, Yu and Liu, Jingyuan and Yan, Sijie and Lin, Dahua and Dai, Bo},
    title     = {Towards Diverse and Natural Scene-Aware {3D} Human Motion Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20460--20469},
}
How Much Does Input Data Type Impact Final Face Model Accuracy?: Jiahao Luo,

Fahim Hasan Khan,

Issei Mori,

Akila de Silva,

Eric Sandoval Ruezga,

Minghao Liu,

Alex Pang,

James Davis; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2022_CVPR,
    author    = {Luo, Jiahao and Khan, Fahim Hasan and Mori, Issei and de Silva, Akila and Ruezga, Eric Sandoval and Liu, Minghao and Pang, Alex and Davis, James},
    title     = {How Much Does Input Data Type Impact Final Face Model Accuracy?},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18985--18994},
}
HumanNeRF: Free-Viewpoint Rendering of Moving People From Monocular Video: Chung-Yi Weng,

Brian Curless,

Pratul P. Srinivasan,

Jonathan T. Barron,

Ira Kemelmacher-Shlizerman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Weng_2022_CVPR,
    author    = {Weng, Chung-Yi and Curless, Brian and Srinivasan, Pratul P. and Barron, Jonathan T. and Kemelmacher-Shlizerman, Ira},
    title     = {{HumanNeRF}: Free-Viewpoint Rendering of Moving People From Monocular Video},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16210--16220},
}
Which Images To Label for Few-Shot Medical Landmark Detection?: Quan Quan,

Qingsong Yao,

Jun Li,

S. Kevin Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Quan_2022_CVPR,
    author    = {Quan, Quan and Yao, Qingsong and Li, Jun and Zhou, S. Kevin},
    title     = {Which Images To Label for Few-Shot Medical Landmark Detection?},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20606--20616},
}
UBoCo: Unsupervised Boundary Contrastive Learning for Generic Event Boundary Detection: Hyolim Kang,

Jinwoo Kim,

Taehyun Kim,

Seon Joo Kim; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Kang_2022_CVPR is shared by another entry in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Kang_2022_CVPR,
    author    = {Kang, Hyolim and Kim, Jinwoo and Kim, Taehyun and Kim, Seon Joo},
    title     = {{UBoCo}: Unsupervised Boundary Contrastive Learning for Generic Event Boundary Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20073--20082},
}
Both Style and Fog Matter: Cumulative Domain Adaptation for Semantic Foggy Scene Understanding: Xianzheng Ma,

Zhixiang Wang,

Yacheng Zhan,

Yinqiang Zheng,

Zheng Wang,

Dengxin Dai,

Chia-Wen Lin; [pdf] [arXiv]
[bibtex]
@InProceedings{Ma_2022_CVPR,
    author    = {Ma, Xianzheng and Wang, Zhixiang and Zhan, Yacheng and Zheng, Yinqiang and Wang, Zheng and Dai, Dengxin and Lin, Chia-Wen},
    title     = {Both Style and Fog Matter: Cumulative Domain Adaptation for Semantic Foggy Scene Understanding},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18922--18931},
}
Ev-TTA: Test-Time Adaptation for Event-Based Object Recognition: Junho Kim,

Inwoo Hwang,

Young Min Kim; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2022_CVPR,
    author    = {Kim, Junho and Hwang, Inwoo and Kim, Young Min},
    title     = {{Ev-TTA}: Test-Time Adaptation for Event-Based Object Recognition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17745--17754},
}
NODEO: A Neural Ordinary Differential Equation Based Optimization Framework for Deformable Image Registration: Yifan Wu,

Tom Z. Jiahao,

Jiancong Wang,

Paul A. Yushkevich,

M. Ani Hsieh,

James C. Gee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2022_CVPR,
    author    = {Wu, Yifan and Jiahao, Tom Z. and Wang, Jiancong and Yushkevich, Paul A. and Hsieh, M. Ani and Gee, James C.},
    title     = {{NODEO}: A Neural Ordinary Differential Equation Based Optimization Framework for Deformable Image Registration},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20804--20813},
}
Pyramid Architecture for Multi-Scale Processing in Point Cloud Segmentation: Dong Nie,

Rui Lan,

Ling Wang,

Xiaofeng Ren; [pdf]
[bibtex]
@InProceedings{Nie_2022_CVPR,
    author    = {Nie, Dong and Lan, Rui and Wang, Ling and Ren, Xiaofeng},
    title     = {Pyramid Architecture for Multi-Scale Processing in Point Cloud Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17284--17294},
}
Cross-Architecture Self-Supervised Video Representation Learning: Sheng Guo,

Zihua Xiong,

Yujie Zhong,

Limin Wang,

Xiaobo Guo,

Bing Han,

Weilin Huang; [pdf] [arXiv]
[bibtex]
% NOTE(review): key Guo_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Guo_2022_CVPR,
    author    = {Guo, Sheng and Xiong, Zihua and Zhong, Yujie and Wang, Limin and Guo, Xiaobo and Han, Bing and Huang, Weilin},
    title     = {Cross-Architecture Self-Supervised Video Representation Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19270--19279},
}
High-Resolution Image Harmonization via Collaborative Dual Transformations: Wenyan Cong,

Xinhao Tao,

Li Niu,

Jing Liang,

Xuesong Gao,

Qihao Sun,

Liqing Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cong_2022_CVPR,
    author    = {Cong, Wenyan and Tao, Xinhao and Niu, Li and Liang, Jing and Gao, Xuesong and Sun, Qihao and Zhang, Liqing},
    title     = {High-Resolution Image Harmonization via Collaborative Dual Transformations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18470--18479},
}
MM-TTA: Multi-Modal Test-Time Adaptation for 3D Semantic Segmentation: Inkyu Shin,

Yi-Hsuan Tsai,

Bingbing Zhuang,

Samuel Schulter,

Buyu Liu,

Sparsh Garg,

In So Kweon,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Shin_2022_CVPR,
    author    = {Shin, Inkyu and Tsai, Yi-Hsuan and Zhuang, Bingbing and Schulter, Samuel and Liu, Buyu and Garg, Sparsh and Kweon, In So and Yoon, Kuk-Jin},
    title     = {{MM-TTA}: Multi-Modal Test-Time Adaptation for {3D} Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16928--16937},
}
Towards Bidirectional Arbitrary Image Rescaling: Joint Optimization and Cycle Idempotence: Zhihong Pan,

Baopu Li,

Dongliang He,

Mingde Yao,

Wenhao Wu,

Tianwei Lin,

Xin Li,

Errui Ding; [pdf] [arXiv]
[bibtex]
@InProceedings{Pan_2022_CVPR,
    author    = {Pan, Zhihong and Li, Baopu and He, Dongliang and Yao, Mingde and Wu, Wenhao and Lin, Tianwei and Li, Xin and Ding, Errui},
    title     = {Towards Bidirectional Arbitrary Image Rescaling: Joint Optimization and Cycle Idempotence},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17389--17398},
}
Topology Preserving Local Road Network Estimation From Single Onboard Camera Image: Yigit Baran Can,

Alexander Liniger,

Danda Pani Paudel,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Can_2022_CVPR,
    author    = {Can, Yigit Baran and Liniger, Alexander and Paudel, Danda Pani and Van Gool, Luc},
    title     = {Topology Preserving Local Road Network Estimation From Single Onboard Camera Image},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17263--17272},
}
Eigenlanes: Data-Driven Lane Descriptors for Structurally Diverse Lanes: Dongkwon Jin,

Wonhui Park,

Seong-Gyun Jeong,

Heeyeon Kwon,

Chang-Su Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2022_CVPR,
    author    = {Jin, Dongkwon and Park, Wonhui and Jeong, Seong-Gyun and Kwon, Heeyeon and Kim, Chang-Su},
    title     = {Eigenlanes: Data-Driven Lane Descriptors for Structurally Diverse Lanes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17163--17171},
}
SpaceEdit: Learning a Unified Editing Space for Open-Domain Image Color Editing: Jing Shi,

Ning Xu,

Haitian Zheng,

Alex Smith,

Jiebo Luo,

Chenliang Xu; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2022_CVPR,
    author    = {Shi, Jing and Xu, Ning and Zheng, Haitian and Smith, Alex and Luo, Jiebo and Xu, Chenliang},
    title     = {{SpaceEdit}: Learning a Unified Editing Space for Open-Domain Image Color Editing},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19730--19739},
}
Multi-Level Feature Learning for Contrastive Multi-View Clustering: Jie Xu,

Huayi Tang,

Yazhou Ren,

Liang Peng,

Xiaofeng Zhu,

Lifang He; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
    author    = {Xu, Jie and Tang, Huayi and Ren, Yazhou and Peng, Liang and Zhu, Xiaofeng and He, Lifang},
    title     = {Multi-Level Feature Learning for Contrastive Multi-View Clustering},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16051--16060},
}
Egocentric Prediction of Action Target in 3D: Yiming Li,

Ziang Cao,

Andrew Liang,

Benjamin Liang,

Luoyao Chen,

Hang Zhao,

Chen Feng; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Li_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Li_2022_CVPR,
    author    = {Li, Yiming and Cao, Ziang and Liang, Andrew and Liang, Benjamin and Chen, Luoyao and Zhao, Hang and Feng, Chen},
    title     = {Egocentric Prediction of Action Target in {3D}},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21003--21012},
}
Towards Real-World Navigation With Deep Differentiable Planners: Shu Ishida,

João F. Henriques; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ishida_2022_CVPR,
    author    = {Ishida, Shu and Henriques, Jo{\~a}o F.},
    title     = {Towards Real-World Navigation With Deep Differentiable Planners},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17327--17336},
}
Video K-Net: A Simple, Strong, and Unified Baseline for Video Segmentation: Xiangtai Li,

Wenwei Zhang,

Jiangmiao Pang,

Kai Chen,

Guangliang Cheng,

Yunhai Tong,

Chen Change Loy; [pdf] [supp]
[bibtex]
% NOTE(review): key Li_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Li_2022_CVPR,
    author    = {Li, Xiangtai and Zhang, Wenwei and Pang, Jiangmiao and Chen, Kai and Cheng, Guangliang and Tong, Yunhai and Loy, Chen Change},
    title     = {Video {K-Net}: A Simple, Strong, and Unified Baseline for Video Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18847--18857},
}
NeRFReN: Neural Radiance Fields With Reflections: Yuan-Chen Guo,

Di Kang,

Linchao Bao,

Yu He,

Song-Hai Zhang; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Guo_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Guo_2022_CVPR,
    author    = {Guo, Yuan-Chen and Kang, Di and Bao, Linchao and He, Yu and Zhang, Song-Hai},
    title     = {{NeRFReN}: Neural Radiance Fields With Reflections},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {18409--18418},
}
SCS-Co: Self-Consistent Style Contrastive Learning for Image Harmonization: Yucheng Hang,

Bin Xia,

Wenming Yang,

Qingmin Liao; [pdf] [supp]
[bibtex]
@InProceedings{Hang_2022_CVPR,
    author    = {Hang, Yucheng and Xia, Bin and Yang, Wenming and Liao, Qingmin},
    title     = {{SCS-Co}: Self-Consistent Style Contrastive Learning for Image Harmonization},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19710--19719},
}
Neural Convolutional Surfaces: Luca Morreale,

Noam Aigerman,

Paul Guerrero,

Vladimir G. Kim,

Niloy J. Mitra; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Morreale_2022_CVPR,
    author    = {Morreale, Luca and Aigerman, Noam and Guerrero, Paul and Kim, Vladimir G. and Mitra, Niloy J.},
    title     = {Neural Convolutional Surfaces},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19333--19342},
}
HyperSegNAS: Bridging One-Shot Neural Architecture Search With 3D Medical Image Segmentation Using HyperNet: Cheng Peng,

Andriy Myronenko,

Ali Hatamizadeh,

Vishwesh Nath,

Md Mahfuzur Rahman Siddiquee,

Yufan He,

Daguang Xu,

Rama Chellappa,

Dong Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2022_CVPR,
    author    = {Peng, Cheng and Myronenko, Andriy and Hatamizadeh, Ali and Nath, Vishwesh and Siddiquee, Md Mahfuzur Rahman and He, Yufan and Xu, Daguang and Chellappa, Rama and Yang, Dong},
    title     = {{HyperSegNAS}: Bridging One-Shot Neural Architecture Search With {3D} Medical Image Segmentation Using {HyperNet}},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20741--20751},
}
A Comprehensive Study of Image Classification Model Sensitivity to Foregrounds, Backgrounds, and Visual Attributes: Mazda Moayeri,

Phillip Pope,

Yogesh Balaji,

Soheil Feizi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moayeri_2022_CVPR,
    author    = {Moayeri, Mazda and Pope, Phillip and Balaji, Yogesh and Feizi, Soheil},
    title     = {A Comprehensive Study of Image Classification Model Sensitivity to Foregrounds, Backgrounds, and Visual Attributes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19087--19097},
}
ConDor: Self-Supervised Canonicalization of 3D Pose for Partial Shapes: Rahul Sajnani,

Adrien Poulenard,

Jivitesh Jain,

Radhika Dua,

Leonidas J. Guibas,

Srinath Sridhar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sajnani_2022_CVPR,
    author    = {Sajnani, Rahul and Poulenard, Adrien and Jain, Jivitesh and Dua, Radhika and Guibas, Leonidas J. and Sridhar, Srinath},
    title     = {{ConDor}: Self-Supervised Canonicalization of {3D} Pose for Partial Shapes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16969--16979},
}
Exploring Endogenous Shift for Cross-Domain Detection: A Large-Scale Benchmark and Perturbation Suppression Network: Renshuai Tao,

Hainan Li,

Tianbo Wang,

Yanlu Wei,

Yifu Ding,

Bowei Jin,

Hongping Zhi,

Xianglong Liu,

Aishan Liu; [pdf]
[bibtex]
@InProceedings{Tao_2022_CVPR,
    author    = {Tao, Renshuai and Li, Hainan and Wang, Tianbo and Wei, Yanlu and Ding, Yifu and Jin, Bowei and Zhi, Hongping and Liu, Xianglong and Liu, Aishan},
    title     = {Exploring Endogenous Shift for Cross-Domain Detection: A Large-Scale Benchmark and Perturbation Suppression Network},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21189--21199},
}
VisCUIT: Visual Auditor for Bias in CNN Image Classifier: Seongmin Lee,

Zijie J. Wang,

Judy Hoffman,

Duen Horng (Polo) Chau; [pdf] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
    author    = {Lee, Seongmin and Wang, Zijie J. and Hoffman, Judy and Chau, Duen Horng (Polo)},
    title     = {{VisCUIT}: Visual Auditor for Bias in {CNN} Image Classifier},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21475--21483},
}
DirecFormer: A Directed Attention in Transformer Approach to Robust Action Recognition: Thanh-Dat Truong,

Quoc-Huy Bui,

Chi Nhan Duong,

Han-Seok Seo,

Son Lam Phung,

Xin Li,

Khoa Luu; [pdf] [arXiv]
[bibtex]
@InProceedings{Truong_2022_CVPR,
    author    = {Truong, Thanh-Dat and Bui, Quoc-Huy and Duong, Chi Nhan and Seo, Han-Seok and Phung, Son Lam and Li, Xin and Luu, Khoa},
    title     = {{DirecFormer}: A Directed Attention in Transformer Approach to Robust Action Recognition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20030--20040},
}
Robust Egocentric Photo-Realistic Facial Expression Transfer for Virtual Reality: Amin Jourabloo,

Fernando De la Torre,

Jason Saragih,

Shih-En Wei,

Stephen Lombardi,

Te-Li Wang,

Danielle Belko,

Autumn Trimble,

Hernan Badino; [pdf] [arXiv]
[bibtex]
@InProceedings{Jourabloo_2022_CVPR,
    author    = {Jourabloo, Amin and De la Torre, Fernando and Saragih, Jason and Wei, Shih-En and Lombardi, Stephen and Wang, Te-Li and Belko, Danielle and Trimble, Autumn and Badino, Hernan},
    title     = {Robust Egocentric Photo-Realistic Facial Expression Transfer for Virtual Reality},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20323--20332},
}
Distillation Using Oracle Queries for Transformer-Based Human-Object Interaction Detection: Xian Qu,

Changxing Ding,

Xingao Li,

Xubin Zhong,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Qu_2022_CVPR,
    author    = {Qu, Xian and Ding, Changxing and Li, Xingao and Zhong, Xubin and Tao, Dacheng},
    title     = {Distillation Using Oracle Queries for Transformer-Based Human-Object Interaction Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19558--19567},
}
Learning Video Representations of Human Motion From Synthetic Data: Xi Guo,

Wei Wu,

Dongliang Wang,

Jing Su,

Haisheng Su,

Weihao Gan,

Jian Huang,

Qin Yang; [pdf] [supp]
[bibtex]
% NOTE(review): key Guo_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Guo_2022_CVPR,
    author    = {Guo, Xi and Wu, Wei and Wang, Dongliang and Su, Jing and Su, Haisheng and Gan, Weihao and Huang, Jian and Yang, Qin},
    title     = {Learning Video Representations of Human Motion From Synthetic Data},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20197--20207},
}
BoostMIS: Boosting Medical Image Semi-Supervised Learning With Adaptive Pseudo Labeling and Informative Active Annotation: Wenqiao Zhang,

Lei Zhu,

James Hallinan,

Shengyu Zhang,

Andrew Makmur,

Qingpeng Cai,

Beng Chin Ooi; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
    author    = {Zhang, Wenqiao and Zhu, Lei and Hallinan, James and Zhang, Shengyu and Makmur, Andrew and Cai, Qingpeng and Ooi, Beng Chin},
    title     = {{BoostMIS}: Boosting Medical Image Semi-Supervised Learning With Adaptive Pseudo Labeling and Informative Active Annotation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20666--20676},
}
HOI4D: A 4D Egocentric Dataset for Category-Level Human-Object Interaction: Yunze Liu,

Yun Liu,

Che Jiang,

Kangbo Lyu,

Weikang Wan,

Hao Shen,

Boqiang Liang,

Zhoujie Fu,

He Wang,

Li Yi; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
    author    = {Liu, Yunze and Liu, Yun and Jiang, Che and Lyu, Kangbo and Wan, Weikang and Shen, Hao and Liang, Boqiang and Fu, Zhoujie and Wang, He and Yi, Li},
    title     = {{HOI4D}: A {4D} Egocentric Dataset for Category-Level Human-Object Interaction},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21013--21022},
}
Collaborative Transformers for Grounded Situation Recognition: Junhyeong Cho,

Youngseok Yoon,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2022_CVPR,
    author    = {Cho, Junhyeong and Yoon, Youngseok and Kwak, Suha},
    title     = {Collaborative Transformers for Grounded Situation Recognition},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19659--19668},
}
Vox2Cortex: Fast Explicit Reconstruction of Cortical Surfaces From 3D MRI Scans With Geometric Deep Neural Networks: Fabian Bongratz,

Anne-Marie Rickmann,

Sebastian Pölsterl,

Christian Wachinger; [pdf] [supp]
[bibtex]
@InProceedings{Bongratz_2022_CVPR,
    author    = {Bongratz, Fabian and Rickmann, Anne-Marie and P{\"o}lsterl, Sebastian and Wachinger, Christian},
    title     = {{Vox2Cortex}: Fast Explicit Reconstruction of Cortical Surfaces From {3D} {MRI} Scans With Geometric Deep Neural Networks},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20773--20783},
}
ScanQA: 3D Question Answering for Spatial Scene Understanding: Daichi Azuma,

Taiki Miyanishi,

Shuhei Kurita,

Motoaki Kawanabe; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Azuma_2022_CVPR,
    author    = {Azuma, Daichi and Miyanishi, Taiki and Kurita, Shuhei and Kawanabe, Motoaki},
    title     = {{ScanQA}: {3D} Question Answering for Spatial Scene Understanding},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19129--19139},
}
Class-Incremental Learning by Knowledge Distillation With Adaptive Feature Consolidation: Minsoo Kang,

Jaeyoo Park,

Bohyung Han; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Kang_2022_CVPR is shared by another entry in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Kang_2022_CVPR,
    author    = {Kang, Minsoo and Park, Jaeyoo and Han, Bohyung},
    title     = {Class-Incremental Learning by Knowledge Distillation With Adaptive Feature Consolidation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16071--16080},
}
Learning Program Representations for Food Images and Cooking Recipes: Dim P. Papadopoulos,

Enrique Mora,

Nadiia Chepurko,

Kuan Wei Huang,

Ferda Ofli,

Antonio Torralba; [pdf] [arXiv]
[bibtex]
@InProceedings{Papadopoulos_2022_CVPR,
    author    = {Papadopoulos, Dim P. and Mora, Enrique and Chepurko, Nadiia and Huang, Kuan Wei and Ofli, Ferda and Torralba, Antonio},
    title     = {Learning Program Representations for Food Images and Cooking Recipes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16559--16569},
}
Directional Self-Supervised Learning for Heavy Image Augmentations: Yalong Bai,

Yifan Yang,

Wei Zhang,

Tao Mei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bai_2022_CVPR,
    author    = {Bai, Yalong and Yang, Yifan and Zhang, Wei and Mei, Tao},
    title     = {Directional Self-Supervised Learning for Heavy Image Augmentations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16692--16701},
}
No-Reference Point Cloud Quality Assessment via Domain Adaptation: Qi Yang,

Yipeng Liu,

Siheng Chen,

Yiling Xu,

Jun Sun; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
    author    = {Yang, Qi and Liu, Yipeng and Chen, Siheng and Xu, Yiling and Sun, Jun},
    title     = {No-Reference Point Cloud Quality Assessment via Domain Adaptation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21179--21188},
}
Comprehending and Ordering Semantics for Image Captioning: Yehao Li,

Yingwei Pan,

Ting Yao,

Tao Mei; [pdf]
[bibtex]
% NOTE(review): key Li_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Li_2022_CVPR,
    author    = {Li, Yehao and Pan, Yingwei and Yao, Ting and Mei, Tao},
    title     = {Comprehending and Ordering Semantics for Image Captioning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17990--17999},
}
A Large-Scale Comprehensive Dataset and Copy-Overlap Aware Evaluation Protocol for Segment-Level Video Copy Detection: Sifeng He,

Xudong Yang,

Chen Jiang,

Gang Liang,

Wei Zhang,

Tan Pan,

Qing Wang,

Furong Xu,

Chunguang Li,

JinXiong Liu,

Hui Xu,

Kaiming Huang,

Yuan Cheng,

Feng Qian,

Xiaobo Zhang,

Lei Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2022_CVPR,
    author    = {He, Sifeng and Yang, Xudong and Jiang, Chen and Liang, Gang and Zhang, Wei and Pan, Tan and Wang, Qing and Xu, Furong and Li, Chunguang and Liu, JinXiong and Xu, Hui and Huang, Kaiming and Cheng, Yuan and Qian, Feng and Zhang, Xiaobo and Yang, Lei},
    title     = {A Large-Scale Comprehensive Dataset and Copy-Overlap Aware Evaluation Protocol for Segment-Level Video Copy Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21086--21095},
}
GaTector: A Unified Framework for Gaze Object Prediction: Binglu Wang,

Tao Hu,

Baoshan Li,

Xiaojuan Chen,

Zhijie Zhang; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): key Wang_2022_CVPR is shared by other entries in this listing; BibTeX reports a repeated entry unless keys are disambiguated.
@InProceedings{Wang_2022_CVPR,
    author    = {Wang, Binglu and Hu, Tao and Li, Baoshan and Chen, Xiaojuan and Zhang, Zhijie},
    title     = {{GaTector}: A Unified Framework for Gaze Object Prediction},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {19588--19597},
}
LaTr: Layout-Aware Transformer for Scene-Text VQA: Ali Furkan Biten,

Ron Litman,

Yusheng Xie,

Srikar Appalaraju,

R. Manmatha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Biten_2022_CVPR,
    author    = {Biten, Ali Furkan and Litman, Ron and Xie, Yusheng and Appalaraju, Srikar and Manmatha, R.},
    title     = {{LaTr}: Layout-Aware Transformer for Scene-Text {VQA}},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16548--16558},
}
HeadNeRF: A Real-Time NeRF-Based Parametric Head Model: Yang Hong,

Bo Peng,

Haiyao Xiao,

Ligang Liu,

Juyong Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Hong_2022_CVPR,
    author    = {Hong, Yang and Peng, Bo and Xiao, Haiyao and Liu, Ligang and Zhang, Juyong},
    title     = {{HeadNeRF}: A Real-Time {NeRF-Based} Parametric Head Model},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {20374--20384},
}
Replacing Labeled Real-Image Datasets With Auto-Generated Contours: Hirokatsu Kataoka,

Ryo Hayamizu,

Ryosuke Yamada,

Kodai Nakashima,

Sora Takashima,

Xinyu Zhang,

Edgar Josafat Martinez-Noriega,

Nakamasa Inoue,

Rio Yokota; [pdf]
[bibtex]
@InProceedings{Kataoka_2022_CVPR,
    author    = {Kataoka, Hirokatsu and Hayamizu, Ryo and Yamada, Ryosuke and Nakashima, Kodai and Takashima, Sora and Zhang, Xinyu and Martinez-Noriega, Edgar Josafat and Inoue, Nakamasa and Yokota, Rio},
    title     = {Replacing Labeled Real-Image Datasets With Auto-Generated Contours},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {21232--21241},
}
WebQA: Multihop and Multimodal QA: Yingshan Chang,

Mridu Narang,

Hisami Suzuki,

Guihong Cao,

Jianfeng Gao,

Yonatan Bisk; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chang_2022_CVPR,
    author    = {Chang, Yingshan and Narang, Mridu and Suzuki, Hisami and Cao, Guihong and Gao, Jianfeng and Bisk, Yonatan},
    title     = {{WebQA}: Multihop and Multimodal {QA}},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16495--16504},
}
Towards Language-Free Training for Text-to-Image Generation: Yufan Zhou,

Ruiyi Zhang,

Changyou Chen,

Chunyuan Li,

Chris Tensmeyer,

Tong Yu,

Jiuxiang Gu,

Jinhui Xu,

Tong Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
    author    = {Zhou, Yufan and Zhang, Ruiyi and Chen, Changyou and Li, Chunyuan and Tensmeyer, Chris and Yu, Tong and Gu, Jiuxiang and Xu, Jinhui and Sun, Tong},
    title     = {Towards Language-Free Training for Text-to-Image Generation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {17907--17917},
}
Learning Affinity From Attention: End-to-End Weakly-Supervised Semantic Segmentation With Transformers: Lixiang Ru,

Yibing Zhan,

Baosheng Yu,

Bo Du; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ru_2022_CVPR,
    author    = {Ru, Lixiang and Zhan, Yibing and Yu, Baosheng and Du, Bo},
    title     = {Learning Affinity From Attention: End-to-End Weakly-Supervised Semantic Segmentation With Transformers},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2022},
    pages     = {16846--16855},
}
FERV39k: A Large-Scale Multi-Scene Dataset for Facial Expression Recognition in Videos: Yan Wang,

Yixuan Sun,

Yiwen Huang,

Zhongying Liu,

Shuyong Gao,

Wei Zhang,

Weifeng Ge,

Wenqiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Yan and Sun, Yixuan and Huang, Yiwen and Liu, Zhongying and Gao, Shuyong and Zhang, Wei and Ge, Weifeng and Zhang, Wenqiang},
  title     = {{FERV39k}: A Large-Scale Multi-Scene Dataset for Facial Expression Recognition in Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20922--20931}
}
Omnivore: A Single Model for Many Visual Modalities: Rohit Girdhar,

Mannat Singh,

Nikhila Ravi,

Laurens van der Maaten,

Armand Joulin,

Ishan Misra; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Girdhar_2022_CVPR,
  author    = {Girdhar, Rohit and Singh, Mannat and Ravi, Nikhila and van der Maaten, Laurens and Joulin, Armand and Misra, Ishan},
  title     = {Omnivore: A Single Model for Many Visual Modalities},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16102--16112}
}
DAIR-V2X: A Large-Scale Dataset for Vehicle-Infrastructure Cooperative 3D Object Detection: Haibao Yu,

Yizhen Luo,

Mao Shu,

Yiyi Huo,

Zebang Yang,

Yifeng Shi,

Zhenglong Guo,

Hanyu Li,

Xing Hu,

Jirui Yuan,

Zaiqing Nie; [pdf]
[bibtex]
@InProceedings{Yu_2022_CVPR,
  author    = {Yu, Haibao and Luo, Yizhen and Shu, Mao and Huo, Yiyi and Yang, Zebang and Shi, Yifeng and Guo, Zhenglong and Li, Hanyu and Hu, Xing and Yuan, Jirui and Nie, Zaiqing},
  title     = {{DAIR-V2X}: A Large-Scale Dataset for Vehicle-Infrastructure Cooperative {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21361--21370}
}
Uncertainty-Aware Adaptation for Self-Supervised 3D Human Pose Estimation: Jogendra Nath Kundu,

Siddharth Seth,

Pradyumna YM,

Varun Jampani,

Anirban Chakraborty,

R. Venkatesh Babu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kundu_2022_CVPR,
  author    = {Kundu, Jogendra Nath and Seth, Siddharth and YM, Pradyumna and Jampani, Varun and Chakraborty, Anirban and Babu, R. Venkatesh},
  title     = {Uncertainty-Aware Adaptation for Self-Supervised {3D} Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20448--20459}
}
Semi-Supervised Wide-Angle Portraits Correction by Multi-Scale Transformer: Fushun Zhu,

Shan Zhao,

Peng Wang,

Hao Wang,

Hua Yan,

Shuaicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2022_CVPR,
  author    = {Zhu, Fushun and Zhao, Shan and Wang, Peng and Wang, Hao and Yan, Hua and Liu, Shuaicheng},
  title     = {Semi-Supervised Wide-Angle Portraits Correction by Multi-Scale Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19689--19698}
}
Is Mapping Necessary for Realistic PointGoal Navigation?: Ruslan Partsey,

Erik Wijmans,

Naoki Yokoyama,

Oles Dobosevych,

Dhruv Batra,

Oleksandr Maksymets; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Partsey_2022_CVPR,
  author    = {Partsey, Ruslan and Wijmans, Erik and Yokoyama, Naoki and Dobosevych, Oles and Batra, Dhruv and Maksymets, Oleksandr},
  title     = {Is Mapping Necessary for Realistic {PointGoal} Navigation?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17232--17241}
}
Node-Aligned Graph Convolutional Network for Whole-Slide Image Representation and Classification: Yonghang Guan,

Jun Zhang,

Kuan Tian,

Sen Yang,

Pei Dong,

Jinxi Xiang,

Wei Yang,

Junzhou Huang,

Yuyao Zhang,

Xiao Han; [pdf]
[bibtex]
@InProceedings{Guan_2022_CVPR,
  author    = {Guan, Yonghang and Zhang, Jun and Tian, Kuan and Yang, Sen and Dong, Pei and Xiang, Jinxi and Yang, Wei and Huang, Junzhou and Zhang, Yuyao and Han, Xiao},
  title     = {Node-Aligned Graph Convolutional Network for Whole-Slide Image Representation and Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18813--18823}
}
Object-Relation Reasoning Graph for Action Recognition: Yangjun Ou,

Li Mi,

Zhenzhong Chen; [pdf]
[bibtex]
@InProceedings{Ou_2022_CVPR,
  author    = {Ou, Yangjun and Mi, Li and Chen, Zhenzhong},
  title     = {Object-Relation Reasoning Graph for Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20133--20142}
}
FaceVerse: A Fine-Grained and Detail-Controllable 3D Face Morphable Model From a Hybrid Dataset: Lizhen Wang,

Zhiyuan Chen,

Tao Yu,

Chenguang Ma,

Liang Li,

Yebin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Lizhen and Chen, Zhiyuan and Yu, Tao and Ma, Chenguang and Li, Liang and Liu, Yebin},
  title     = {{FaceVerse}: A Fine-Grained and Detail-Controllable {3D} Face Morphable Model From a Hybrid Dataset},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20333--20342}
}
Bring Evanescent Representations to Life in Lifelong Class Incremental Learning: Marco Toldo,

Mete Ozay; [pdf] [supp]
[bibtex]
@InProceedings{Toldo_2022_CVPR,
  author    = {Toldo, Marco and Ozay, Mete},
  title     = {Bring Evanescent Representations to Life in Lifelong Class Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16732--16741}
}
Look Back and Forth: Video Super-Resolution With Explicit Temporal Difference Modeling: Takashi Isobe,

Xu Jia,

Xin Tao,

Changlin Li,

Ruihuang Li,

Yongjie Shi,

Jing Mu,

Huchuan Lu,

Yu-Wing Tai; [pdf] [arXiv]
[bibtex]
@InProceedings{Isobe_2022_CVPR,
  author    = {Isobe, Takashi and Jia, Xu and Tao, Xin and Li, Changlin and Li, Ruihuang and Shi, Yongjie and Mu, Jing and Lu, Huchuan and Tai, Yu-Wing},
  title     = {Look Back and Forth: Video Super-Resolution With Explicit Temporal Difference Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17411--17420}
}
A Stitch in Time Saves Nine: A Train-Time Regularizing Loss for Improved Neural Network Calibration: Ramya Hebbalaguppe,

Jatin Prakash,

Neelabh Madan,

Chetan Arora; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hebbalaguppe_2022_CVPR,
  author    = {Hebbalaguppe, Ramya and Prakash, Jatin and Madan, Neelabh and Arora, Chetan},
  title     = {A Stitch in Time Saves Nine: A Train-Time Regularizing Loss for Improved Neural Network Calibration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16081--16090}
}
Deep Image-Based Illumination Harmonization: Zhongyun Bao,

Chengjiang Long,

Gang Fu,

Daquan Liu,

Yuanzhen Li,

Jiaming Wu,

Chunxia Xiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2022_CVPR,
  author    = {Bao, Zhongyun and Long, Chengjiang and Fu, Gang and Liu, Daquan and Li, Yuanzhen and Wu, Jiaming and Xiao, Chunxia},
  title     = {Deep Image-Based Illumination Harmonization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18542--18551}
}
Harmony: A Generic Unsupervised Approach for Disentangling Semantic Content From Parameterized Transformations: Mostofa Rafid Uddin,

Gregory Howe,

Xiangrui Zeng,

Min Xu; [pdf] [supp]
[bibtex]
@InProceedings{Uddin_2022_CVPR,
  author    = {Uddin, Mostofa Rafid and Howe, Gregory and Zeng, Xiangrui and Xu, Min},
  title     = {Harmony: A Generic Unsupervised Approach for Disentangling Semantic Content From Parameterized Transformations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20646--20655}
}
Talking Face Generation With Multilingual TTS: Hyoung-Kyu Song,

Sang Hoon Woo,

Junhyeok Lee,

Seungmin Yang,

Hyunjae Cho,

Youseong Lee,

Dongho Choi,

Kang-wook Kim; [pdf] [arXiv]
[bibtex]
@InProceedings{Song_2022_CVPR,
  author    = {Song, Hyoung-Kyu and Woo, Sang Hoon and Lee, Junhyeok and Yang, Seungmin and Cho, Hyunjae and Lee, Youseong and Choi, Dongho and Kim, Kang-wook},
  title     = {Talking Face Generation With Multilingual {TTS}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21425--21430}
}
Kernelized Few-Shot Object Detection With Efficient Integral Aggregation: Shan Zhang,

Lei Wang,

Naila Murray,

Piotr Koniusz; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Shan and Wang, Lei and Murray, Naila and Koniusz, Piotr},
  title     = {Kernelized Few-Shot Object Detection With Efficient Integral Aggregation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19207--19216}
}
Context-Aware Video Reconstruction for Rolling Shutter Cameras: Bin Fan,

Yuchao Dai,

Zhiyuan Zhang,

Qi Liu,

Mingyi He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2022_CVPR,
  author    = {Fan, Bin and Dai, Yuchao and Zhang, Zhiyuan and Liu, Qi and He, Mingyi},
  title     = {Context-Aware Video Reconstruction for Rolling Shutter Cameras},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17572--17582}
}
Robust Contrastive Learning Against Noisy Views: Ching-Yao Chuang,

R Devon Hjelm,

Xin Wang,

Vibhav Vineet,

Neel Joshi,

Antonio Torralba,

Stefanie Jegelka,

Yale Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chuang_2022_CVPR,
  author    = {Chuang, Ching-Yao and Hjelm, R Devon and Wang, Xin and Vineet, Vibhav and Joshi, Neel and Torralba, Antonio and Jegelka, Stefanie and Song, Yale},
  title     = {Robust Contrastive Learning Against Noisy Views},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16670--16681}
}
RSTT: Real-Time Spatial Temporal Transformer for Space-Time Video Super-Resolution: Zhicheng Geng,

Luming Liang,

Tianyu Ding,

Ilya Zharkov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Geng_2022_CVPR,
  author    = {Geng, Zhicheng and Liang, Luming and Ding, Tianyu and Zharkov, Ilya},
  title     = {{RSTT}: Real-Time Spatial Temporal Transformer for Space-Time Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17441--17451}
}
Learning Memory-Augmented Unidirectional Metrics for Cross-Modality Person Re-Identification: Jialun Liu,

Yifan Sun,

Feng Zhu,

Hongbin Pei,

Yi Yang,

Wenhui Li; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Jialun and Sun, Yifan and Zhu, Feng and Pei, Hongbin and Yang, Yi and Li, Wenhui},
  title     = {Learning Memory-Augmented Unidirectional Metrics for Cross-Modality Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19366--19375}
}
Partial Class Activation Attention for Semantic Segmentation: Sun-Ao Liu,

Hongtao Xie,

Hai Xu,

Yongdong Zhang,

Qi Tian; [pdf]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Sun-Ao and Xie, Hongtao and Xu, Hai and Zhang, Yongdong and Tian, Qi},
  title     = {Partial Class Activation Attention for Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16836--16845}
}
SkinningNet: Two-Stream Graph Convolutional Neural Network for Skinning Prediction of Synthetic Characters: Albert Mosella-Montoro,

Javier Ruiz-Hidalgo; [pdf] [supp]
[bibtex]
@InProceedings{Mosella-Montoro_2022_CVPR,
  author    = {Mosella-Montoro, Albert and Ruiz-Hidalgo, Javier},
  title     = {{SkinningNet}: Two-Stream Graph Convolutional Neural Network for Skinning Prediction of Synthetic Characters},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18593--18602}
}
Cross-Modal Representation Learning for Zero-Shot Action Recognition: Chung-Ching Lin,

Kevin Lin,

Lijuan Wang,

Zicheng Liu,

Linjie Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Chung-Ching and Lin, Kevin and Wang, Lijuan and Liu, Zicheng and Li, Linjie},
  title     = {Cross-Modal Representation Learning for Zero-Shot Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19978--19988}
}
Conditional Prompt Learning for Vision-Language Models: Kaiyang Zhou,

Jingkang Yang,

Chen Change Loy,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Kaiyang and Yang, Jingkang and Loy, Chen Change and Liu, Ziwei},
  title     = {Conditional Prompt Learning for Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16816--16825}
}
Affine Medical Image Registration With Coarse-To-Fine Vision Transformer: Tony C. W. Mok,

Albert C. S. Chung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mok_2022_CVPR,
  author    = {Mok, Tony C. W. and Chung, Albert C. S.},
  title     = {Affine Medical Image Registration With Coarse-To-Fine Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20835--20844}
}
SMPL-A: Modeling Person-Specific Deformable Anatomy: Hengtao Guo,

Benjamin Planche,

Meng Zheng,

Srikrishna Karanam,

Terrence Chen,

Ziyan Wu; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2022_CVPR,
  author    = {Guo, Hengtao and Planche, Benjamin and Zheng, Meng and Karanam, Srikrishna and Chen, Terrence and Wu, Ziyan},
  title     = {{SMPL-A}: Modeling Person-Specific Deformable Anatomy},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20814--20823}
}
A Differentiable Two-Stage Alignment Scheme for Burst Image Reconstruction With Large Shift: Shi Guo,

Xi Yang,

Jianqi Ma,

Gaofeng Ren,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2022_CVPR,
  author    = {Guo, Shi and Yang, Xi and Ma, Jianqi and Ren, Gaofeng and Zhang, Lei},
  title     = {A Differentiable Two-Stage Alignment Scheme for Burst Image Reconstruction With Large Shift},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17472--17481}
}
Unifying Panoptic Segmentation for Autonomous Driving: Oliver Zendel,

Matthias Schörghuber,

Bernhard Rainer,

Markus Murschitz,

Csaba Beleznai; [pdf] [supp]
[bibtex]
@InProceedings{Zendel_2022_CVPR,
  author    = {Zendel, Oliver and Sch{\"o}rghuber, Matthias and Rainer, Bernhard and Murschitz, Markus and Beleznai, Csaba},
  title     = {Unifying Panoptic Segmentation for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21351--21360}
}
On the Road to Online Adaptation for Semantic Image Segmentation: Riccardo Volpi,

Pau De Jorge,

Diane Larlus,

Gabriela Csurka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Volpi_2022_CVPR,
  author    = {Volpi, Riccardo and De Jorge, Pau and Larlus, Diane and Csurka, Gabriela},
  title     = {On the Road to Online Adaptation for Semantic Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19184--19195}
}
Masked Autoencoders Are Scalable Vision Learners: Kaiming He,

Xinlei Chen,

Saining Xie,

Yanghao Li,

Piotr Dollár,

Ross Girshick; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2022_CVPR,
  author    = {He, Kaiming and Chen, Xinlei and Xie, Saining and Li, Yanghao and Doll{\'a}r, Piotr and Girshick, Ross},
  title     = {Masked Autoencoders Are Scalable Vision Learners},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16000--16009}
}
Point-BERT: Pre-Training 3D Point Cloud Transformers With Masked Point Modeling: Xumin Yu,

Lulu Tang,

Yongming Rao,

Tiejun Huang,

Jie Zhou,

Jiwen Lu; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2022_CVPR,
  author    = {Yu, Xumin and Tang, Lulu and Rao, Yongming and Huang, Tiejun and Zhou, Jie and Lu, Jiwen},
  title     = {{Point-BERT}: Pre-Training {3D} Point Cloud Transformers With Masked Point Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19313--19322}
}
Crowd Counting in the Frequency Domain: Weibo Shu,

Jia Wan,

Kay Chen Tan,

Sam Kwong,

Antoni B. Chan; [pdf] [supp]
[bibtex]
@InProceedings{Shu_2022_CVPR,
  author    = {Shu, Weibo and Wan, Jia and Tan, Kay Chen and Kwong, Sam and Chan, Antoni B.},
  title     = {Crowd Counting in the Frequency Domain},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19618--19627}
}
Aladdin: Joint Atlas Building and Diffeomorphic Registration Learning With Pairwise Alignment: Zhipeng Ding,

Marc Niethammer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ding_2022_CVPR,
  author    = {Ding, Zhipeng and Niethammer, Marc},
  title     = {Aladdin: Joint Atlas Building and Diffeomorphic Registration Learning With Pairwise Alignment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20784--20793}
}
Learning sRGB-to-Raw-RGB De-Rendering With Content-Aware Metadata: Seonghyeon Nam,

Abhijith Punnappurath,

Marcus A. Brubaker,

Michael S. Brown; [pdf] [supp]
[bibtex]
@InProceedings{Nam_2022_CVPR,
  author    = {Nam, Seonghyeon and Punnappurath, Abhijith and Brubaker, Marcus A. and Brown, Michael S.},
  title     = {Learning {sRGB-to-Raw-RGB} De-Rendering With Content-Aware Metadata},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17704--17713}
}
Point Cloud Color Constancy: Xiaoyan Xing,

Yanlin Qian,

Sibo Feng,

Yuhan Dong,

Jiří Matas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xing_2022_CVPR,
  author    = {Xing, Xiaoyan and Qian, Yanlin and Feng, Sibo and Dong, Yuhan and Matas, Ji{\v{r}}{\'\i}},
  title     = {Point Cloud Color Constancy},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19750--19759}
}
Towards an End-to-End Framework for Flow-Guided Video Inpainting: Zhen Li,

Cheng-Ze Lu,

Jianhua Qin,

Chun-Le Guo,

Ming-Ming Cheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Zhen and Lu, Cheng-Ze and Qin, Jianhua and Guo, Chun-Le and Cheng, Ming-Ming},
  title     = {Towards an End-to-End Framework for Flow-Guided Video Inpainting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17562--17571}
}
CrossLoc: Scalable Aerial Localization Assisted by Multimodal Synthetic Data: Qi Yan,

Jianhao Zheng,

Simon Reding,

Shanci Li,

Iordan Doytchinov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2022_CVPR,
  author    = {Yan, Qi and Zheng, Jianhao and Reding, Simon and Li, Shanci and Doytchinov, Iordan},
  title     = {{CrossLoc}: Scalable Aerial Localization Assisted by Multimodal Synthetic Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17358--17368}
}
On Learning Contrastive Representations for Learning With Noisy Labels: Li Yi,

Sheng Liu,

Qi She,

A. Ian McLeod,

Boyu Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yi_2022_CVPR,
  author    = {Yi, Li and Liu, Sheng and She, Qi and McLeod, A. Ian and Wang, Boyu},
  title     = {On Learning Contrastive Representations for Learning With Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16682--16691}
}
Modeling Indirect Illumination for Inverse Rendering: Yuanqing Zhang,

Jiaming Sun,

Xingyi He,

Huan Fu,

Rongfei Jia,

Xiaowei Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Yuanqing and Sun, Jiaming and He, Xingyi and Fu, Huan and Jia, Rongfei and Zhou, Xiaowei},
  title     = {Modeling Indirect Illumination for Inverse Rendering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18643--18652}
}
BACON: Band-Limited Coordinate Networks for Multiscale Scene Representation: David B. Lindell,

Dave Van Veen,

Jeong Joon Park,

Gordon Wetzstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lindell_2022_CVPR,
  author    = {Lindell, David B. and Van Veen, Dave and Park, Jeong Joon and Wetzstein, Gordon},
  title     = {{BACON}: Band-Limited Coordinate Networks for Multiscale Scene Representation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16252--16262}
}
Modeling sRGB Camera Noise With Normalizing Flows: Shayan Kousha,

Ali Maleky,

Michael S. Brown,

Marcus A. Brubaker; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kousha_2022_CVPR,
  author    = {Kousha, Shayan and Maleky, Ali and Brown, Michael S. and Brubaker, Marcus A.},
  title     = {Modeling {sRGB} Camera Noise With Normalizing Flows},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17463--17471}
}
Reference-Based Video Super-Resolution Using Multi-Camera Video Triplets: Junyong Lee,

Myeonghee Lee,

Sunghyun Cho,

Seungyong Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Junyong and Lee, Myeonghee and Cho, Sunghyun and Lee, Seungyong},
  title     = {Reference-Based Video Super-Resolution Using Multi-Camera Video Triplets},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17824--17833}
}
Self-Supervised Image Representation Learning With Geometric Set Consistency: Nenglun Chen,

Lei Chu,

Hao Pan,

Yan Lu,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Nenglun and Chu, Lei and Pan, Hao and Lu, Yan and Wang, Wenping},
  title     = {Self-Supervised Image Representation Learning With Geometric Set Consistency},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19292--19302}
}
GEN-VLKT: Simplify Association and Enhance Interaction Understanding for HOI Detection: Yue Liao,

Aixi Zhang,

Miao Lu,

Yongliang Wang,

Xiaobo Li,

Si Liu; [pdf]
[bibtex]
@InProceedings{Liao_2022_CVPR,
  author    = {Liao, Yue and Zhang, Aixi and Lu, Miao and Wang, Yongliang and Li, Xiaobo and Liu, Si},
  title     = {{GEN-VLKT}: Simplify Association and Enhance Interaction Understanding for {HOI} Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20123--20132}
}
Global Matching With Overlapping Attention for Optical Flow Estimation: Shiyu Zhao,

Long Zhao,

Zhixing Zhang,

Enyu Zhou,

Dimitris Metaxas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2022_CVPR,
  author    = {Zhao, Shiyu and Zhao, Long and Zhang, Zhixing and Zhou, Enyu and Metaxas, Dimitris},
  title     = {Global Matching With Overlapping Attention for Optical Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17592--17601}
}
Rethinking Efficient Lane Detection via Curve Modeling: Zhengyang Feng,

Shaohua Guo,

Xin Tan,

Ke Xu,

Min Wang,

Lizhuang Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Zhengyang and Guo, Shaohua and Tan, Xin and Xu, Ke and Wang, Min and Ma, Lizhuang},
  title     = {Rethinking Efficient Lane Detection via Curve Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17062--17070}
}
Co-Advise: Cross Inductive Bias Distillation: Sucheng Ren,

Zhengqi Gao,

Tianyu Hua,

Zihui Xue,

Yonglong Tian,

Shengfeng He,

Hang Zhao; [pdf]
[bibtex]
@InProceedings{Ren_2022_CVPR,
  author    = {Ren, Sucheng and Gao, Zhengqi and Hua, Tianyu and Xue, Zihui and Tian, Yonglong and He, Shengfeng and Zhao, Hang},
  title     = {{Co-Advise}: Cross Inductive Bias Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16773--16782}
}
DTFD-MIL: Double-Tier Feature Distillation Multiple Instance Learning for Histopathology Whole Slide Image Classification: Hongrun Zhang,

Yanda Meng,

Yitian Zhao,

Yihong Qiao,

Xiaoyun Yang,

Sarah E. Coupland,

Yalin Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Hongrun and Meng, Yanda and Zhao, Yitian and Qiao, Yihong and Yang, Xiaoyun and Coupland, Sarah E. and Zheng, Yalin},
  title     = {{DTFD-MIL}: Double-Tier Feature Distillation Multiple Instance Learning for Histopathology Whole Slide Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18802--18812}
}
Deep Generalized Unfolding Networks for Image Restoration: Chong Mou,

Qian Wang,

Jian Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Mou_2022_CVPR,
  author    = {Mou, Chong and Wang, Qian and Zhang, Jian},
  title     = {Deep Generalized Unfolding Networks for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17399--17410}
}
Robust Cross-Modal Representation Learning With Progressive Self-Distillation: Alex Andonian,

Shixing Chen,

Raffay Hamid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Andonian_2022_CVPR,
  author    = {Andonian, Alex and Chen, Shixing and Hamid, Raffay},
  title     = {Robust Cross-Modal Representation Learning With Progressive Self-Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16430--16441}
}
Compressive Single-Photon 3D Cameras: Felipe Gutierrez-Barragan,

Atul Ingle,

Trevor Seets,

Mohit Gupta,

Andreas Velten; [pdf] [supp]
[bibtex]
@InProceedings{Gutierrez-Barragan_2022_CVPR,
  author    = {Gutierrez-Barragan, Felipe and Ingle, Atul and Seets, Trevor and Gupta, Mohit and Velten, Andreas},
  title     = {Compressive Single-Photon {3D} Cameras},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17854--17864}
}
Rethinking Controllable Variational Autoencoders: Huajie Shao,

Yifei Yang,

Haohong Lin,

Longzhong Lin,

Yizhuo Chen,

Qinmin Yang,

Han Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Shao_2022_CVPR,
  author    = {Shao, Huajie and Yang, Yifei and Lin, Haohong and Lin, Longzhong and Chen, Yizhuo and Yang, Qinmin and Zhao, Han},
  title     = {Rethinking Controllable Variational Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19250--19259}
}
Boosting Crowd Counting via Multifaceted Attention: Hui Lin,

Zhiheng Ma,

Rongrong Ji,

Yaowei Wang,

Xiaopeng Hong; [pdf] [arXiv]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Hui and Ma, Zhiheng and Ji, Rongrong and Wang, Yaowei and Hong, Xiaopeng},
  title     = {Boosting Crowd Counting via Multifaceted Attention},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19628--19637}
}
BigDL 2.0: Seamless Scaling of AI Pipelines From Laptops to Distributed Cluster: Jason (Jinquan) Dai,

Ding Ding,

Dongjie Shi,

Shengsheng Huang,

Jiao Wang,

Xin Qiu,

Kai Huang,

Guoqiong Song,

Yang Wang,

Qiyuan Gong,

Jiaming Song,

Shan Yu,

Le Zheng,

Yina Chen,

Junwei Deng,

Ge Song; [pdf] [supp]
[bibtex]
@InProceedings{Dai_2022_CVPR,
  author    = {Dai, Jason (Jinquan) and Ding, Ding and Shi, Dongjie and Huang, Shengsheng and Wang, Jiao and Qiu, Xin and Huang, Kai and Song, Guoqiong and Wang, Yang and Gong, Qiyuan and Song, Jiaming and Yu, Shan and Zheng, Le and Chen, Yina and Deng, Junwei and Song, Ge},
  title     = {{BigDL} 2.0: Seamless Scaling of {AI} Pipelines From Laptops to Distributed Cluster},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21439--21446}
}
Acquiring a Dynamic Light Field Through a Single-Shot Coded Image: Ryoya Mizuno,

Keita Takahashi,

Michitaka Yoshida,

Chihiro Tsutake,

Toshiaki Fujii,

Hajime Nagahara; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mizuno_2022_CVPR,
  author    = {Mizuno, Ryoya and Takahashi, Keita and Yoshida, Michitaka and Tsutake, Chihiro and Fujii, Toshiaki and Nagahara, Hajime},
  title     = {Acquiring a Dynamic Light Field Through a Single-Shot Coded Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19830--19840}
}
Attentive Fine-Grained Structured Sparsity for Image Restoration: Junghun Oh,

Heewon Kim,

Seungjun Nah,

Cheeun Hong,

Jonghyun Choi,

Kyoung Mu Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Oh_2022_CVPR,
  author    = {Oh, Junghun and Kim, Heewon and Nah, Seungjun and Hong, Cheeun and Choi, Jonghyun and Lee, Kyoung Mu},
  title     = {Attentive Fine-Grained Structured Sparsity for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17673--17682}
}
StylizedNeRF: Consistent 3D Scene Stylization As Stylized NeRF via 2D-3D Mutual Learning: Yi-Hua Huang,

Yue He,

Yu-Jie Yuan,

Yu-Kun Lai,

Lin Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2022_CVPR,
  author    = {Huang, Yi-Hua and He, Yue and Yuan, Yu-Jie and Lai, Yu-Kun and Gao, Lin},
  title     = {{StylizedNeRF}: Consistent {3D} Scene Stylization As Stylized {NeRF} via {2D-3D} Mutual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18342--18352}
}
NightLab: A Dual-Level Architecture With Hardness Detection for Segmentation at Night: Xueqing Deng,

Peng Wang,

Xiaochen Lian,

Shawn Newsam; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2022_CVPR,
  author    = {Deng, Xueqing and Wang, Peng and Lian, Xiaochen and Newsam, Shawn},
  title     = {{NightLab}: A Dual-Level Architecture With Hardness Detection for Segmentation at Night},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16938--16948}
}
InfoGCN: Representation Learning for Human Skeleton-Based Action Recognition: Hyung-gun Chi,

Myoung Hoon Ha,

Seunggeun Chi,

Sang Wan Lee,

Qixing Huang,

Karthik Ramani; [pdf] [supp]
[bibtex]
@InProceedings{Chi_2022_CVPR,
  author    = {Chi, Hyung-gun and Ha, Myoung Hoon and Chi, Seunggeun and Lee, Sang Wan and Huang, Qixing and Ramani, Karthik},
  title     = {{InfoGCN}: Representation Learning for Human Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20186--20196},
}
Sparse to Dense Dynamic 3D Facial Expression Generation: Naima Otberdout,

Claudio Ferrari,

Mohamed Daoudi,

Stefano Berretti,

Alberto Del Bimbo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Otberdout_2022_CVPR,
  author    = {Otberdout, Naima and Ferrari, Claudio and Daoudi, Mohamed and Berretti, Stefano and Del Bimbo, Alberto},
  title     = {Sparse to Dense Dynamic {3D} Facial Expression Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20385--20394},
}
Crafting Better Contrastive Views for Siamese Representation Learning: Xiangyu Peng,

Kai Wang,

Zheng Zhu,

Mang Wang,

Yang You; [pdf] [arXiv]
[bibtex]
@InProceedings{Peng_2022_CVPR,
  author    = {Peng, Xiangyu and Wang, Kai and Zhu, Zheng and Wang, Mang and You, Yang},
  title     = {Crafting Better Contrastive Views for {Siamese} Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16031--16040},
}
Continual Learning for Visual Search With Backward Consistent Feature Embedding: Timmy S. T. Wan,

Jun-Cheng Chen,

Tzer-Yi Wu,

Chu-Song Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wan_2022_CVPR,
  author    = {Wan, Timmy S. T. and Chen, Jun-Cheng and Wu, Tzer-Yi and Chen, Chu-Song},
  title     = {Continual Learning for Visual Search With Backward Consistent Feature Embedding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16702--16711},
}
EyePAD++: A Distillation-Based Approach for Joint Eye Authentication and Presentation Attack Detection Using Periocular Images: Prithviraj Dhar,

Amit Kumar,

Kirsten Kaplan,

Khushi Gupta,

Rakesh Ranjan,

Rama Chellappa; [pdf] [supp]
[bibtex]
@InProceedings{Dhar_2022_CVPR,
  author    = {Dhar, Prithviraj and Kumar, Amit and Kaplan, Kirsten and Gupta, Khushi and Ranjan, Rakesh and Chellappa, Rama},
  title     = {{EyePAD++}: A Distillation-Based Approach for Joint Eye Authentication and Presentation Attack Detection Using Periocular Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20218--20227},
}
Efficient Two-Stage Detection of Human-Object Interactions With a Novel Unary-Pairwise Transformer: Frederic Z. Zhang,

Dylan Campbell,

Stephen Gould; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Frederic Z. and Campbell, Dylan and Gould, Stephen},
  title     = {Efficient Two-Stage Detection of Human-Object Interactions With a Novel Unary-Pairwise Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20104--20112},
}
A Low-Cost & Real-Time Motion Capture System: Anargyros Chatzitofis,

Georgios Albanis,

Nikolaos Zioulis,

Spyridon Thermos; [pdf]
[bibtex]
@InProceedings{Chatzitofis_2022_CVPR,
  author    = {Chatzitofis, Anargyros and Albanis, Georgios and Zioulis, Nikolaos and Thermos, Spyridon},
  title     = {A Low-Cost \& Real-Time Motion Capture System},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21453--21458},
}
Unified Contrastive Learning in Image-Text-Label Space: Jianwei Yang,

Chunyuan Li,

Pengchuan Zhang,

Bin Xiao,

Ce Liu,

Lu Yuan,

Jianfeng Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Jianwei and Li, Chunyuan and Zhang, Pengchuan and Xiao, Bin and Liu, Ce and Yuan, Lu and Gao, Jianfeng},
  title     = {Unified Contrastive Learning in Image-Text-Label Space},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19163--19173},
}
Unifying Motion Deblurring and Frame Interpolation With Events: Xiang Zhang,

Lei Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xiang and Yu, Lei},
  title     = {Unifying Motion Deblurring and Frame Interpolation With Events},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17765--17774},
}
Fast Point Transformer: Chunghyun Park,

Yoonwoo Jeong,

Minsu Cho,

Jaesik Park; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2022_CVPR,
  author    = {Park, Chunghyun and Jeong, Yoonwoo and Cho, Minsu and Park, Jaesik},
  title     = {Fast Point Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16949--16958},
}
Unimodal-Concentrated Loss: Fully Adaptive Label Distribution Learning for Ordinal Regression: Qiang Li,

Jingjing Wang,

Zhaoliang Yao,

Yachun Li,

Pengju Yang,

Jingwei Yan,

Chunmao Wang,

Shiliang Pu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Qiang and Wang, Jingjing and Yao, Zhaoliang and Li, Yachun and Yang, Pengju and Yan, Jingwei and Wang, Chunmao and Pu, Shiliang},
  title     = {Unimodal-Concentrated Loss: Fully Adaptive Label Distribution Learning for Ordinal Regression},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20513--20522},
}
Deep Stereo Image Compression via Bi-Directional Coding: Jianjun Lei,

Xiangrui Liu,

Bo Peng,

Dengchao Jin,

Wanqing Li,

Jingxiao Gu; [pdf]
[bibtex]
@InProceedings{Lei_2022_CVPR,
  author    = {Lei, Jianjun and Liu, Xiangrui and Peng, Bo and Jin, Dengchao and Li, Wanqing and Gu, Jingxiao},
  title     = {Deep Stereo Image Compression via Bi-Directional Coding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19669--19678},
}
How Good Is Aesthetic Ability of a Fashion Model?: Xingxing Zou,

Kaicheng Pang,

Wen Zhang,

Waikeung Wong; [pdf] [supp]
[bibtex]
@InProceedings{Zou_2022_CVPR,
  author    = {Zou, Xingxing and Pang, Kaicheng and Zhang, Wen and Wong, Waikeung},
  title     = {How Good Is Aesthetic Ability of a Fashion Model?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21200--21209},
}
Mining Multi-View Information: A Strong Self-Supervised Framework for Depth-Based 3D Hand Pose and Mesh Estimation: Pengfei Ren,

Haifeng Sun,

Jiachang Hao,

Jingyu Wang,

Qi Qi,

Jianxin Liao; [pdf] [supp]
[bibtex]
@InProceedings{Ren_2022_CVPR,
  author    = {Ren, Pengfei and Sun, Haifeng and Hao, Jiachang and Wang, Jingyu and Qi, Qi and Liao, Jianxin},
  title     = {Mining Multi-View Information: A Strong Self-Supervised Framework for Depth-Based {3D} Hand Pose and Mesh Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20555--20565},
}
BTS: A Bi-Lingual Benchmark for Text Segmentation in the Wild: Xixi Xu,

Zhongang Qi,

Jianqi Ma,

Honglun Zhang,

Ying Shan,

Xiaohu Qie; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Xixi and Qi, Zhongang and Ma, Jianqi and Zhang, Honglun and Shan, Ying and Qie, Xiaohu},
  title     = {{BTS}: A Bi-Lingual Benchmark for Text Segmentation in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19152--19162},
}
Hierarchical Modular Network for Video Captioning: Hanhua Ye,

Guorong Li,

Yuankai Qi,

Shuhui Wang,

Qingming Huang,

Ming-Hsuan Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2022_CVPR,
  author    = {Ye, Hanhua and Li, Guorong and Qi, Yuankai and Wang, Shuhui and Huang, Qingming and Yang, Ming-Hsuan},
  title     = {Hierarchical Modular Network for Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17939--17948},
}
Alignment-Uniformity Aware Representation Learning for Zero-Shot Video Classification: Shi Pu,

Kaili Zhao,

Mao Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pu_2022_CVPR,
  author    = {Pu, Shi and Zhao, Kaili and Zheng, Mao},
  title     = {Alignment-Uniformity Aware Representation Learning for Zero-Shot Video Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19968--19977},
}
LiDARCap: Long-Range Marker-Less 3D Human Motion Capture With LiDAR Point Clouds: Jialian Li,

Jingyi Zhang,

Zhiyong Wang,

Siqi Shen,

Chenglu Wen,

Yuexin Ma,

Lan Xu,

Jingyi Yu,

Cheng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Jialian and Zhang, Jingyi and Wang, Zhiyong and Shen, Siqi and Wen, Chenglu and Ma, Yuexin and Xu, Lan and Yu, Jingyi and Wang, Cheng},
  title     = {{LiDARCap}: Long-Range Marker-Less {3D} Human Motion Capture With {LiDAR} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20502--20512},
}
GeoEngine: A Platform for Production-Ready Geospatial Research: Sagar Verma,

Siddharth Gupta,

Hal Shin,

Akash Panigrahi,

Shubham Goswami,

Shweta Pardeshi,

Natanael Exe,

Ujwal Dutta,

Tanka Raj Joshi,

Nitin Bhojwani; [pdf]
[bibtex]
@InProceedings{Verma_2022_CVPR,
  author    = {Verma, Sagar and Gupta, Siddharth and Shin, Hal and Panigrahi, Akash and Goswami, Shubham and Pardeshi, Shweta and Exe, Natanael and Dutta, Ujwal and Joshi, Tanka Raj and Bhojwani, Nitin},
  title     = {{GeoEngine}: A Platform for Production-Ready Geospatial Research},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21416--21424},
}
GroupViT: Semantic Segmentation Emerges From Text Supervision: Jiarui Xu,

Shalini De Mello,

Sifei Liu,

Wonmin Byeon,

Thomas Breuel,

Jan Kautz,

Xiaolong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Jiarui and De Mello, Shalini and Liu, Sifei and Byeon, Wonmin and Breuel, Thomas and Kautz, Jan and Wang, Xiaolong},
  title     = {{GroupViT}: Semantic Segmentation Emerges From Text Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18134--18144},
}
Occlusion-Aware Cost Constructor for Light Field Depth Estimation: Yingqian Wang,

Longguang Wang,

Zhengyu Liang,

Jungang Yang,

Wei An,

Yulan Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Yingqian and Wang, Longguang and Liang, Zhengyu and Yang, Jungang and An, Wei and Guo, Yulan},
  title     = {Occlusion-Aware Cost Constructor for Light Field Depth Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19809--19818},
}
SmartPortraits: Depth Powered Handheld Smartphone Dataset of Human Portraits for State Estimation, Reconstruction and Synthesis: Anastasiia Kornilova,

Marsel Faizullin,

Konstantin Pakulev,

Andrey Sadkov,

Denis Kukushkin,

Azat Akhmetyanov,

Timur Akhtyamov,

Hekmat Taherinejad,

Gonzalo Ferrer; [pdf] [arXiv]
[bibtex]
@InProceedings{Kornilova_2022_CVPR,
  author    = {Kornilova, Anastasiia and Faizullin, Marsel and Pakulev, Konstantin and Sadkov, Andrey and Kukushkin, Denis and Akhmetyanov, Azat and Akhtyamov, Timur and Taherinejad, Hekmat and Ferrer, Gonzalo},
  title     = {{SmartPortraits}: Depth Powered Handheld Smartphone Dataset of Human Portraits for State Estimation, Reconstruction and Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21318--21329},
}
Stacked Hybrid-Attention and Group Collaborative Learning for Unbiased Scene Graph Generation: Xingning Dong,

Tian Gan,

Xuemeng Song,

Jianlong Wu,

Yuan Cheng,

Liqiang Nie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Xingning and Gan, Tian and Song, Xuemeng and Wu, Jianlong and Cheng, Yuan and Nie, Liqiang},
  title     = {Stacked Hybrid-Attention and Group Collaborative Learning for Unbiased Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19427--19436},
}
Topology-Preserving Shape Reconstruction and Registration via Neural Diffeomorphic Flow: Shanlin Sun,

Kun Han,

Deying Kong,

Hao Tang,

Xiangyi Yan,

Xiaohui Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Shanlin and Han, Kun and Kong, Deying and Tang, Hao and Yan, Xiangyi and Xie, Xiaohui},
  title     = {Topology-Preserving Shape Reconstruction and Registration via Neural Diffeomorphic Flow},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20845--20855},
}
Learning Part Segmentation Through Unsupervised Domain Adaptation From Synthetic Vehicles: Qing Liu,

Adam Kortylewski,

Zhishuai Zhang,

Zizhang Li,

Mengqi Guo,

Qihao Liu,

Xiaoding Yuan,

Jiteng Mu,

Weichao Qiu,

Alan Yuille; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Qing and Kortylewski, Adam and Zhang, Zhishuai and Li, Zizhang and Guo, Mengqi and Liu, Qihao and Yuan, Xiaoding and Mu, Jiteng and Qiu, Weichao and Yuille, Alan},
  title     = {Learning Part Segmentation Through Unsupervised Domain Adaptation From Synthetic Vehicles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19140--19151},
}
Learning Object Context for Novel-View Scene Layout Generation: Xiaotian Qiao,

Gerhard P. Hancke,

Rynson W.H. Lau; [pdf]
[bibtex]
@InProceedings{Qiao_2022_CVPR,
  author    = {Qiao, Xiaotian and Hancke, Gerhard P. and Lau, Rynson W. H.},
  title     = {Learning Object Context for Novel-View Scene Layout Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16990--16999},
}
Neural Fields As Learnable Kernels for 3D Reconstruction: Francis Williams,

Zan Gojcic,

Sameh Khamis,

Denis Zorin,

Joan Bruna,

Sanja Fidler,

Or Litany; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Williams_2022_CVPR,
  author    = {Williams, Francis and Gojcic, Zan and Khamis, Sameh and Zorin, Denis and Bruna, Joan and Fidler, Sanja and Litany, Or},
  title     = {Neural Fields As Learnable Kernels for {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18500--18510},
}
Detector-Free Weakly Supervised Group Activity Recognition: Dongkeun Kim,

Jinsung Lee,

Minsu Cho,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Dongkeun and Lee, Jinsung and Cho, Minsu and Kwak, Suha},
  title     = {Detector-Free Weakly Supervised Group Activity Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20083--20093},
}
HairCLIP: Design Your Hair by Text and Reference Image: Tianyi Wei,

Dongdong Chen,

Wenbo Zhou,

Jing Liao,

Zhentao Tan,

Lu Yuan,

Weiming Zhang,

Nenghai Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2022_CVPR,
  author    = {Wei, Tianyi and Chen, Dongdong and Zhou, Wenbo and Liao, Jing and Tan, Zhentao and Yuan, Lu and Zhang, Weiming and Yu, Nenghai},
  title     = {{HairCLIP}: Design Your Hair by Text and Reference Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18072--18081},
}
OakInk: A Large-Scale Knowledge Repository for Understanding Hand-Object Interaction: Lixin Yang,

Kailin Li,

Xinyu Zhan,

Fei Wu,

Anran Xu,

Liu Liu,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Lixin and Li, Kailin and Zhan, Xinyu and Wu, Fei and Xu, Anran and Liu, Liu and Lu, Cewu},
  title     = {{OakInk}: A Large-Scale Knowledge Repository for Understanding Hand-Object Interaction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20953--20962},
}
SwinBERT: End-to-End Transformers With Sparse Attention for Video Captioning: Kevin Lin,

Linjie Li,

Chung-Ching Lin,

Faisal Ahmed,

Zhe Gan,

Zicheng Liu,

Yumao Lu,

Lijuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Kevin and Li, Linjie and Lin, Chung-Ching and Ahmed, Faisal and Gan, Zhe and Liu, Zicheng and Lu, Yumao and Wang, Lijuan},
  title     = {{SwinBERT}: End-to-End Transformers With Sparse Attention for Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17949--17958},
}
Maximum Spatial Perturbation Consistency for Unpaired Image-to-Image Translation: Yanwu Xu,

Shaoan Xie,

Wenhao Wu,

Kun Zhang,

Mingming Gong,

Kayhan Batmanghelich; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, Yanwu and Xie, Shaoan and Wu, Wenhao and Zhang, Kun and Gong, Mingming and Batmanghelich, Kayhan},
  title     = {Maximum Spatial Perturbation Consistency for Unpaired Image-to-Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18311--18320},
}
Bringing Old Films Back to Life: Ziyu Wan,

Bo Zhang,

Dongdong Chen,

Jing Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wan_2022_CVPR,
  author    = {Wan, Ziyu and Zhang, Bo and Chen, Dongdong and Liao, Jing},
  title     = {Bringing Old Films Back to Life},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17694--17703},
}
E2(GO)MOTION: Motion Augmented Event Stream for Egocentric Action Recognition: Chiara Plizzari,

Mirco Planamente,

Gabriele Goletto,

Marco Cannici,

Emanuele Gusso,

Matteo Matteucci,

Barbara Caputo; [pdf] [supp]
[bibtex]
@InProceedings{Plizzari_2022_CVPR,
  author    = {Plizzari, Chiara and Planamente, Mirco and Goletto, Gabriele and Cannici, Marco and Gusso, Emanuele and Matteucci, Matteo and Caputo, Barbara},
  title     = {{E2(GO)MOTION}: Motion Augmented Event Stream for Egocentric Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19935--19947},
}
An Empirical Study of Training End-to-End Vision-and-Language Transformers: Zi-Yi Dou,

Yichong Xu,

Zhe Gan,

Jianfeng Wang,

Shuohang Wang,

Lijuan Wang,

Chenguang Zhu,

Pengchuan Zhang,

Lu Yuan,

Nanyun Peng,

Zicheng Liu,

Michael Zeng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dou_2022_CVPR,
  author    = {Dou, Zi-Yi and Xu, Yichong and Gan, Zhe and Wang, Jianfeng and Wang, Shuohang and Wang, Lijuan and Zhu, Chenguang and Zhang, Pengchuan and Yuan, Lu and Peng, Nanyun and Liu, Zicheng and Zeng, Michael},
  title     = {An Empirical Study of Training End-to-End Vision-and-Language Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18166--18176},
}
Multimodal Dynamics: Dynamical Fusion for Trustworthy Multimodal Classification: Zongbo Han,

Fan Yang,

Junzhou Huang,

Changqing Zhang,

Jianhua Yao; [pdf] [supp]
[bibtex]
@InProceedings{Han_2022_CVPR,
  author    = {Han, Zongbo and Yang, Fan and Huang, Junzhou and Zhang, Changqing and Yao, Jianhua},
  title     = {Multimodal Dynamics: Dynamical Fusion for Trustworthy Multimodal Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20707--20717},
}
Unsupervised Homography Estimation With Coplanarity-Aware GAN: Mingbo Hong,

Yuhang Lu,

Nianjin Ye,

Chunyu Lin,

Qijun Zhao,

Shuaicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2022_CVPR,
  author    = {Hong, Mingbo and Lu, Yuhang and Ye, Nianjin and Lin, Chunyu and Zhao, Qijun and Liu, Shuaicheng},
  title     = {Unsupervised Homography Estimation With Coplanarity-Aware {GAN}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17663--17672},
}
LIFT: Learning 4D LiDAR Image Fusion Transformer for 3D Object Detection: Yihan Zeng,

Da Zhang,

Chunwei Wang,

Zhenwei Miao,

Ting Liu,

Xin Zhan,

Dayang Hao,

Chao Ma; [pdf] [supp]
[bibtex]
@InProceedings{Zeng_2022_CVPR,
  author    = {Zeng, Yihan and Zhang, Da and Wang, Chunwei and Miao, Zhenwei and Liu, Ting and Zhan, Xin and Hao, Dayang and Ma, Chao},
  title     = {{LIFT}: Learning {4D} {LiDAR} Image Fusion Transformer for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17172--17181},
}
PatchNet: A Simple Face Anti-Spoofing Framework via Fine-Grained Patch Recognition: Chien-Yi Wang,

Yu-Ding Lu,

Shang-Ta Yang,

Shang-Hong Lai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Chien-Yi and Lu, Yu-Ding and Yang, Shang-Ta and Lai, Shang-Hong},
  title     = {{PatchNet}: A Simple Face Anti-Spoofing Framework via Fine-Grained Patch Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20281--20290},
}
Rethinking Minimal Sufficient Representation in Contrastive Learning: Haoqing Wang,

Xun Guo,

Zhi-Hong Deng,

Yan Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Haoqing and Guo, Xun and Deng, Zhi-Hong and Lu, Yan},
  title     = {Rethinking Minimal Sufficient Representation in Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16041--16050},
}
Effective Conditioned and Composed Image Retrieval Combining CLIP-Based Features: Alberto Baldrati,

Marco Bertini,

Tiberio Uricchio,

Alberto Del Bimbo; [pdf]
[bibtex]
@InProceedings{Baldrati_2022_CVPR,
  author    = {Baldrati, Alberto and Bertini, Marco and Uricchio, Tiberio and Del Bimbo, Alberto},
  title     = {Effective Conditioned and Composed Image Retrieval Combining {CLIP}-Based Features},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21466--21474},
}
Practical Stereo Matching via Cascaded Recurrent Network With Adaptive Correlation: Jiankun Li,

Peisen Wang,

Pengfei Xiong,

Tao Cai,

Ziwei Yan,

Lei Yang,

Jiangyu Liu,

Haoqiang Fan,

Shuaicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiankun and Wang, Peisen and Xiong, Pengfei and Cai, Tao and Yan, Ziwei and Yang, Lei and Liu, Jiangyu and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {Practical Stereo Matching via Cascaded Recurrent Network With Adaptive Correlation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16263--16272},
}
D-Grasp: Physically Plausible Dynamic Grasp Synthesis for Hand-Object Interactions: Sammy Christen,

Muhammed Kocabas,

Emre Aksan,

Jemin Hwangbo,

Jie Song,

Otmar Hilliges; [pdf] [supp]
[bibtex]
@InProceedings{Christen_2022_CVPR,
  author    = {Christen, Sammy and Kocabas, Muhammed and Aksan, Emre and Hwangbo, Jemin and Song, Jie and Hilliges, Otmar},
  title     = {{D-Grasp}: Physically Plausible Dynamic Grasp Synthesis for Hand-Object Interactions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20577--20586},
}
Show, Deconfound and Tell: Image Captioning With Causal Inference: Bing Liu,

Dong Wang,

Xu Yang,

Yong Zhou,

Rui Yao,

Zhiwen Shao,

Jiaqi Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Bing and Wang, Dong and Yang, Xu and Zhou, Yong and Yao, Rui and Shao, Zhiwen and Zhao, Jiaqi},
  title     = {Show, Deconfound and Tell: Image Captioning With Causal Inference},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18041--18050},
}
ImFace: A Nonlinear 3D Morphable Face Model With Implicit Neural Representations: Mingwu Zheng,

Hongyu Yang,

Di Huang,

Liming Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2022_CVPR,
  author    = {Zheng, Mingwu and Yang, Hongyu and Huang, Di and Chen, Liming},
  title     = {{ImFace}: A Nonlinear {3D} Morphable Face Model With Implicit Neural Representations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20343--20352},
}
MobRecon: Mobile-Friendly Hand Mesh Reconstruction From Monocular Image: Xingyu Chen,

Yufeng Liu,

Yajiao Dong,

Xiong Zhang,

Chongyang Ma,

Yanmin Xiong,

Yuan Zhang,

Xiaoyan Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Xingyu and Liu, Yufeng and Dong, Yajiao and Zhang, Xiong and Ma, Chongyang and Xiong, Yanmin and Zhang, Yuan and Guo, Xiaoyan},
  title     = {{MobRecon}: Mobile-Friendly Hand Mesh Reconstruction From Monocular Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20544--20554},
}
AlignMixup: Improving Representations by Interpolating Aligned Features: Shashanka Venkataramanan,

Ewa Kijak,

Laurent Amsaleg,

Yannis Avrithis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Venkataramanan_2022_CVPR,
  author    = {Venkataramanan, Shashanka and Kijak, Ewa and Amsaleg, Laurent and Avrithis, Yannis},
  title     = {{AlignMixup}: Improving Representations by Interpolating Aligned Features},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19174--19183},
}
HerosNet: Hyperspectral Explicable Reconstruction and Optimal Sampling Deep Network for Snapshot Compressive Imaging: Xuanyu Zhang,

Yongbing Zhang,

Ruiqin Xiong,

Qilin Sun,

Jian Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Xuanyu and Zhang, Yongbing and Xiong, Ruiqin and Sun, Qilin and Zhang, Jian},
  title     = {{HerosNet}: Hyperspectral Explicable Reconstruction and Optimal Sampling Deep Network for Snapshot Compressive Imaging},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17532--17541},
}
Detecting Deepfakes With Self-Blended Images: Kaede Shiohara,

Toshihiko Yamasaki; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shiohara_2022_CVPR,
  author    = {Shiohara, Kaede and Yamasaki, Toshihiko},
  title     = {Detecting Deepfakes With Self-Blended Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18720--18729},
}
Learnable Irrelevant Modality Dropout for Multimodal Action Recognition on Modality-Specific Annotated Videos: Saghir Alfasly,

Jian Lu,

Chen Xu,

Yuru Zou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alfasly_2022_CVPR,
  author    = {Alfasly, Saghir and Lu, Jian and Xu, Chen and Zou, Yuru},
  title     = {Learnable Irrelevant Modality Dropout for Multimodal Action Recognition on Modality-Specific Annotated Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20208--20217},
}
Bi-Level Doubly Variational Learning for Energy-Based Latent Variable Models: Ge Kan,

Jinhu Lü,

Tian Wang,

Baochang Zhang,

Aichun Zhu,

Lei Huang,

Guodong Guo,

Hichem Snoussi; [pdf] [supp]
[bibtex]
@InProceedings{Kan_2022_CVPR,
  author    = {Kan, Ge and L{\"u}, Jinhu and Wang, Tian and Zhang, Baochang and Zhu, Aichun and Huang, Lei and Guo, Guodong and Snoussi, Hichem},
  title     = {Bi-Level Doubly Variational Learning for Energy-Based Latent Variable Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18460--18469},
}
AxIoU: An Axiomatically Justified Measure for Video Moment Retrieval: Riku Togashi,

Mayu Otani,

Yuta Nakashima,

Esa Rahtu,

Janne Heikkilä,

Tetsuya Sakai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Togashi_2022_CVPR,
  author    = {Togashi, Riku and Otani, Mayu and Nakashima, Yuta and Rahtu, Esa and Heikkil{\"a}, Janne and Sakai, Tetsuya},
  title     = {{AxIoU}: An Axiomatically Justified Measure for Video Moment Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21076--21085},
}
NOC-REK: Novel Object Captioning With Retrieved Vocabulary From External Knowledge: Duc Minh Vo,

Hong Chen,

Akihiro Sugimoto,

Hideki Nakayama; [pdf] [supp]
[bibtex]
@InProceedings{Vo_2022_CVPR,
  author    = {Vo, Duc Minh and Chen, Hong and Sugimoto, Akihiro and Nakayama, Hideki},
  title     = {{NOC-REK}: Novel Object Captioning With Retrieved Vocabulary From External Knowledge},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18000--18008},
}
Speech Driven Tongue Animation: Salvador Medina,

Denis Tome,

Carsten Stoll,

Mark Tiede,

Kevin Munhall,

Alexander G. Hauptmann,

Iain Matthews; [pdf] [supp]
[bibtex]
@InProceedings{Medina_2022_CVPR,
  author    = {Medina, Salvador and Tome, Denis and Stoll, Carsten and Tiede, Mark and Munhall, Kevin and Hauptmann, Alexander G. and Matthews, Iain},
  title     = {Speech Driven Tongue Animation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20406--20416},
}
Hybrid Relation Guided Set Matching for Few-Shot Action Recognition: Xiang Wang,

Shiwei Zhang,

Zhiwu Qing,

Mingqian Tang,

Zhengrong Zuo,

Changxin Gao,

Rong Jin,

Nong Sang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Xiang and Zhang, Shiwei and Qing, Zhiwu and Tang, Mingqian and Zuo, Zhengrong and Gao, Changxin and Jin, Rong and Sang, Nong},
  title     = {Hybrid Relation Guided Set Matching for Few-Shot Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19948--19957},
}
SHIFT: A Synthetic Driving Dataset for Continuous Multi-Task Domain Adaptation: Tao Sun,

Mattia Segu,

Janis Postels,

Yuxuan Wang,

Luc Van Gool,

Bernt Schiele,

Federico Tombari,

Fisher Yu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Tao and Segu, Mattia and Postels, Janis and Wang, Yuxuan and Van Gool, Luc and Schiele, Bernt and Tombari, Federico and Yu, Fisher},
  title     = {{SHIFT}: A Synthetic Driving Dataset for Continuous Multi-Task Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21371--21382},
}
FlexIT: Towards Flexible Semantic Image Translation: Guillaume Couairon,

Asya Grechka,

Jakob Verbeek,

Holger Schwenk,

Matthieu Cord; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Couairon_2022_CVPR,
  author    = {Couairon, Guillaume and Grechka, Asya and Verbeek, Jakob and Schwenk, Holger and Cord, Matthieu},
  title     = {{FlexIT}: Towards Flexible Semantic Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18270--18279},
}
Face2Exp: Combating Data Biases for Facial Expression Recognition: Dan Zeng,

Zhiyuan Lin,

Xiao Yan,

Yuting Liu,

Fei Wang,

Bo Tang; [pdf]
[bibtex]
@InProceedings{Zeng_2022_CVPR,
  author    = {Zeng, Dan and Lin, Zhiyuan and Yan, Xiao and Liu, Yuting and Wang, Fei and Tang, Bo},
  title     = {{Face2Exp}: Combating Data Biases for Facial Expression Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20291--20300},
}
PINA: Learning a Personalized Implicit Neural Avatar From a Single RGB-D Video Sequence: Zijian Dong,

Chen Guo,

Jie Song,

Xu Chen,

Andreas Geiger,

Otmar Hilliges; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Zijian and Guo, Chen and Song, Jie and Chen, Xu and Geiger, Andreas and Hilliges, Otmar},
  title     = {{PINA}: Learning a Personalized Implicit Neural Avatar From a Single {RGB-D} Video Sequence},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20470--20480},
}
Forecasting From LiDAR via Future Object Detection: Neehar Peri,

Jonathon Luiten,

Mengtian Li,

Aljoša Ošep,

Laura Leal-Taixé,

Deva Ramanan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peri_2022_CVPR,
  author    = {Peri, Neehar and Luiten, Jonathon and Li, Mengtian and O{\v{s}}ep, Aljo{\v{s}}a and Leal-Taix{\'e}, Laura and Ramanan, Deva},
  title     = {Forecasting From {LiDAR} via Future Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17202--17211},
}
CRAFT: Cross-Attentional Flow Transformer for Robust Optical Flow: Xiuchao Sui,

Shaohua Li,

Xue Geng,

Yan Wu,

Xinxing Xu,

Yong Liu,

Rick Goh,

Hongyuan Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sui_2022_CVPR,
  author    = {Sui, Xiuchao and Li, Shaohua and Geng, Xue and Wu, Yan and Xu, Xinxing and Liu, Yong and Goh, Rick and Zhu, Hongyuan},
  title     = {{CRAFT}: Cross-Attentional Flow Transformer for Robust Optical Flow},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17602--17611},
}
Privacy Preserving Partial Localization: Marcel Geppert,

Viktor Larsson,

Johannes L. Schönberger,

Marc Pollefeys; [pdf] [supp]
[bibtex]
@InProceedings{Geppert_2022_CVPR,
  author    = {Geppert, Marcel and Larsson, Viktor and Sch{\"o}nberger, Johannes L. and Pollefeys, Marc},
  title     = {Privacy Preserving Partial Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17337--17347},
}
Cross-Modal Background Suppression for Audio-Visual Event Localization: Yan Xia,

Zhou Zhao; [pdf]
[bibtex]
@InProceedings{Xia_2022_CVPR,
  author    = {Xia, Yan and Zhao, Zhou},
  title     = {Cross-Modal Background Suppression for Audio-Visual Event Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19989--19998},
}
Lagrange Motion Analysis and View Embeddings for Improved Gait Recognition: Tianrui Chai,

Annan Li,

Shaoxiong Zhang,

Zilong Li,

Yunhong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Chai_2022_CVPR,
  author    = {Chai, Tianrui and Li, Annan and Zhang, Shaoxiong and Li, Zilong and Wang, Yunhong},
  title     = {{Lagrange} Motion Analysis and View Embeddings for Improved Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20249--20258},
}
Neural Mesh Simplification: Rolandos Alexandros Potamias,

Stylianos Ploumpis,

Stefanos Zafeiriou; [pdf] [supp]
[bibtex]
@InProceedings{Potamias_2022_CVPR,
  author    = {Potamias, Rolandos Alexandros and Ploumpis, Stylianos and Zafeiriou, Stefanos},
  title     = {Neural Mesh Simplification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18583--18592},
}
Deep Hyperspectral-Depth Reconstruction Using Single Color-Dot Projection: Chunyu Li,

Yusuke Monno,

Masatoshi Okutomi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Chunyu and Monno, Yusuke and Okutomi, Masatoshi},
  title     = {Deep Hyperspectral-Depth Reconstruction Using Single Color-Dot Projection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19770--19779},
}
M3T: Three-Dimensional Medical Image Classifier Using Multi-Plane and Multi-Slice Transformer: Jinseong Jang,

Dosik Hwang; [pdf] [supp]
[bibtex]
@InProceedings{Jang_2022_CVPR,
  author    = {Jang, Jinseong and Hwang, Dosik},
  title     = {{M3T}: Three-Dimensional Medical Image Classifier Using Multi-Plane and Multi-Slice Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20718--20729},
}
3MASSIV: Multilingual, Multimodal and Multi-Aspect Dataset of Social Media Short Videos: Vikram Gupta,

Trisha Mittal,

Puneet Mathur,

Vaibhav Mishra,

Mayank Maheshwari,

Aniket Bera,

Debdoot Mukherjee,

Dinesh Manocha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gupta_2022_CVPR,
  author    = {Gupta, Vikram and Mittal, Trisha and Mathur, Puneet and Mishra, Vaibhav and Maheshwari, Mayank and Bera, Aniket and Mukherjee, Debdoot and Manocha, Dinesh},
  title     = {{3MASSIV}: Multilingual, Multimodal and Multi-Aspect Dataset of Social Media Short Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21064--21075},
}
Structured Sparse R-CNN for Direct Scene Graph Generation: Yao Teng,

Limin Wang; [pdf] [supp]
[bibtex]
@InProceedings{Teng_2022_CVPR,
  author    = {Teng, Yao and Wang, Limin},
  title     = {Structured Sparse {R-CNN} for Direct Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19437--19446},
}
Multi-Grained Spatio-Temporal Features Perceived Network for Event-Based Lip-Reading: Ganchao Tan,

Yang Wang,

Han Han,

Yang Cao,

Feng Wu,

Zheng-Jun Zha; [pdf] [supp]
[bibtex]
@InProceedings{Tan_2022_CVPR,
  author    = {Tan, Ganchao and Wang, Yang and Han, Han and Cao, Yang and Wu, Feng and Zha, Zheng-Jun},
  title     = {Multi-Grained Spatio-Temporal Features Perceived Network for Event-Based Lip-Reading},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20094--20103},
}
AnyFace: Free-Style Text-To-Face Synthesis and Manipulation: Jianxin Sun,

Qiyao Deng,

Qi Li,

Muyi Sun,

Min Ren,

Zhenan Sun; [pdf] [arXiv]
[bibtex]
@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Jianxin and Deng, Qiyao and Li, Qi and Sun, Muyi and Ren, Min and Sun, Zhenan},
  title     = {{AnyFace}: Free-Style Text-To-Face Synthesis and Manipulation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18687--18696},
}
HL-Net: Heterophily Learning Network for Scene Graph Generation: Xin Lin,

Changxing Ding,

Yibing Zhan,

Zijian Li,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Xin and Ding, Changxing and Zhan, Yibing and Li, Zijian and Tao, Dacheng},
  title     = {{HL-Net}: Heterophily Learning Network for Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19476--19485},
}
MERLOT Reserve: Neural Script Knowledge Through Vision and Language and Sound: Rowan Zellers,

Jiasen Lu,

Ximing Lu,

Youngjae Yu,

Yanpeng Zhao,

Mohammadreza Salehi,

Aditya Kusupati,

Jack Hessel,

Ali Farhadi,

Yejin Choi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zellers_2022_CVPR,
  author    = {Zellers, Rowan and Lu, Jiasen and Lu, Ximing and Yu, Youngjae and Zhao, Yanpeng and Salehi, Mohammadreza and Kusupati, Aditya and Hessel, Jack and Farhadi, Ali and Choi, Yejin},
  title     = {{MERLOT} {Reserve}: Neural Script Knowledge Through Vision and Language and Sound},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16375--16387},
}
A Conservative Approach for Unbiased Learning on Unknown Biases: Myeongho Jeon,

Daekyung Kim,

Woochul Lee,

Myungjoo Kang,

Joonseok Lee; [pdf] [supp]
[bibtex]
@InProceedings{Jeon_2022_CVPR,
  author    = {Jeon, Myeongho and Kim, Daekyung and Lee, Woochul and Kang, Myungjoo and Lee, Joonseok},
  title     = {A Conservative Approach for Unbiased Learning on Unknown Biases},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16752--16760},
}
Large-Scale Video Panoptic Segmentation in the Wild: A Benchmark: Jiaxu Miao,

Xiaohan Wang,

Yu Wu,

Wei Li,

Xu Zhang,

Yunchao Wei,

Yi Yang; [pdf] [supp]
[bibtex]
@InProceedings{Miao_2022_CVPR,
  author    = {Miao, Jiaxu and Wang, Xiaohan and Wu, Yu and Li, Wei and Zhang, Xu and Wei, Yunchao and Yang, Yi},
  title     = {Large-Scale Video Panoptic Segmentation in the Wild: A Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21033--21043},
}
GrainSpace: A Large-Scale Dataset for Fine-Grained and Domain-Adaptive Recognition of Cereal Grains: Lei Fan,

Yiwen Ding,

Dongdong Fan,

Donglin Di,

Maurice Pagnucco,

Yang Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2022_CVPR,
  author    = {Fan, Lei and Ding, Yiwen and Fan, Dongdong and Di, Donglin and Pagnucco, Maurice and Song, Yang},
  title     = {{GrainSpace}: A Large-Scale Dataset for Fine-Grained and Domain-Adaptive Recognition of Cereal Grains},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21116--21125},
}
BokehMe: When Neural Rendering Meets Classical Rendering: Juewen Peng,

Zhiguo Cao,

Xianrui Luo,

Hao Lu,

Ke Xian,

Jianming Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Peng_2022_CVPR,
  author    = {Peng, Juewen and Cao, Zhiguo and Luo, Xianrui and Lu, Hao and Xian, Ke and Zhang, Jianming},
  title     = {{BokehMe}: When Neural Rendering Meets Classical Rendering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16283--16292},
}
Learning Modal-Invariant and Temporal-Memory for Video-Based Visible-Infrared Person Re-Identification: Xinyu Lin,

Jinxing Li,

Zeyu Ma,

Huafeng Li,

Shuang Li,

Kaixiong Xu,

Guangming Lu,

David Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Xinyu and Li, Jinxing and Ma, Zeyu and Li, Huafeng and Li, Shuang and Xu, Kaixiong and Lu, Guangming and Zhang, David},
  title     = {Learning Modal-Invariant and Temporal-Memory for Video-Based Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20973--20982},
}
BigDatasetGAN: Synthesizing ImageNet With Pixel-Wise Annotations: Daiqing Li,

Huan Ling,

Seung Wook Kim,

Karsten Kreis,

Sanja Fidler,

Antonio Torralba; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Daiqing and Ling, Huan and Kim, Seung Wook and Kreis, Karsten and Fidler, Sanja and Torralba, Antonio},
  title     = {{BigDatasetGAN}: Synthesizing {ImageNet} With Pixel-Wise Annotations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {21330--21340},
}
Align Representations With Base: A New Approach to Self-Supervised Learning: Shaofeng Zhang,

Lyn Qiu,

Feng Zhu,

Junchi Yan,

Hengrui Zhang,

Rui Zhao,

Hongyang Li,

Xiaokang Yang; [pdf]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Shaofeng and Qiu, Lyn and Zhu, Feng and Yan, Junchi and Zhang, Hengrui and Zhao, Rui and Li, Hongyang and Yang, Xiaokang},
  title     = {Align Representations With Base: A New Approach to Self-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16600--16609},
}
Exploring Denoised Cross-Video Contrast for Weakly-Supervised Temporal Action Localization: Jingjing Li,

Tianyu Yang,

Wei Ji,

Jue Wang,

Li Cheng; [pdf]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Jingjing and Yang, Tianyu and Ji, Wei and Wang, Jue and Cheng, Li},
  title     = {Exploring Denoised Cross-Video Contrast for Weakly-Supervised Temporal Action Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19914--19924},
}
SVIP: Sequence VerIfication for Procedures in Videos: Yicheng Qian,

Weixin Luo,

Dongze Lian,

Xu Tang,

Peilin Zhao,

Shenghua Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qian_2022_CVPR,
  author    = {Qian, Yicheng and Luo, Weixin and Lian, Dongze and Tang, Xu and Zhao, Peilin and Gao, Shenghua},
  title     = {{SVIP}: Sequence {VerIfication} for Procedures in Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19890--19902},
}
Low-Resource Adaptation for Personalized Co-Speech Gesture Generation: Chaitanya Ahuja,

Dong Won Lee,

Louis-Philippe Morency; [pdf] [supp]
[bibtex]
@InProceedings{Ahuja_2022_CVPR,
  author    = {Ahuja, Chaitanya and Lee, Dong Won and Morency, Louis-Philippe},
  title     = {Low-Resource Adaptation for Personalized Co-Speech Gesture Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20566--20576},
}
HDR-NeRF: High Dynamic Range Neural Radiance Fields: Xin Huang,

Qi Zhang,

Ying Feng,

Hongdong Li,

Xuan Wang,

Qing Wang; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2022_CVPR,
  author    = {Huang, Xin and Zhang, Qi and Feng, Ying and Li, Hongdong and Wang, Xuan and Wang, Qing},
  title     = {{HDR-NeRF}: High Dynamic Range Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18398--18408},
}
Neural Emotion Director: Speech-Preserving Semantic Control of Facial Expressions in "In-the-Wild" Videos: Foivos Paraperas Papantoniou,

Panagiotis P. Filntisis,

Petros Maragos,

Anastasios Roussos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Papantoniou_2022_CVPR,
  author    = {Papantoniou, Foivos Paraperas and Filntisis, Panagiotis P. and Maragos, Petros and Roussos, Anastasios},
  title     = {Neural Emotion Director: Speech-Preserving Semantic Control of Facial Expressions in ``In-the-Wild'' Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18781--18790},
}
Learning To Listen: Modeling Non-Deterministic Dyadic Facial Motion: Evonne Ng,

Hanbyul Joo,

Liwen Hu,

Hao Li,

Trevor Darrell,

Angjoo Kanazawa,

Shiry Ginosar; [pdf] [arXiv]
[bibtex]
@InProceedings{Ng_2022_CVPR,
  author    = {Ng, Evonne and Joo, Hanbyul and Hu, Liwen and Li, Hao and Darrell, Trevor and Kanazawa, Angjoo and Ginosar, Shiry},
  title     = {Learning To Listen: Modeling Non-Deterministic Dyadic Facial Motion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20395--20405},
}
3PSDF: Three-Pole Signed Distance Function for Learning Surfaces With Arbitrary Topologies: Weikai Chen,

Cheng Lin,

Weiyang Li,

Bo Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Weikai and Lin, Cheng and Li, Weiyang and Yang, Bo},
  title     = {{3PSDF}: Three-Pole Signed Distance Function for Learning Surfaces With Arbitrary Topologies},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18522--18531},
}
GIRAFFE HD: A High-Resolution 3D-Aware Generative Model: Yang Xue,

Yuheng Li,

Krishna Kumar Singh,

Yong Jae Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xue_2022_CVPR,
  author    = {Xue, Yang and Li, Yuheng and Singh, Krishna Kumar and Lee, Yong Jae},
  title     = {{GIRAFFE} {HD}: A High-Resolution {3D}-Aware Generative Model},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18440--18449},
}
Knowledge-Driven Self-Supervised Representation Learning for Facial Action Unit Recognition: Yanan Chang,

Shangfei Wang; [pdf]
[bibtex]
@InProceedings{Chang_2022_CVPR,
  author    = {Chang, Yanan and Wang, Shangfei},
  title     = {Knowledge-Driven Self-Supervised Representation Learning for Facial Action Unit Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20417--20426},
}
Learning Second Order Local Anomaly for General Face Forgery Detection: Jianwei Fei,

Yunshu Dai,

Peipeng Yu,

Tianrun Shen,

Zhihua Xia,

Jian Weng; [pdf]
[bibtex]
@InProceedings{Fei_2022_CVPR,
  author    = {Fei, Jianwei and Dai, Yunshu and Yu, Peipeng and Shen, Tianrun and Xia, Zhihua and Weng, Jian},
  title     = {Learning Second Order Local Anomaly for General Face Forgery Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20270--20280},
}
ADAS: A Direct Adaptation Strategy for Multi-Target Domain Adaptive Semantic Segmentation: Seunghun Lee,

Wonhyeok Choi,

Changjae Kim,

Minwoo Choi,

Sunghoon Im; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Seunghun and Choi, Wonhyeok and Kim, Changjae and Choi, Minwoo and Im, Sunghoon},
  title     = {{ADAS}: A Direct Adaptation Strategy for Multi-Target Domain Adaptive Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19196--19206},
}
The Devil Is in the Labels: Noisy Label Correction for Robust Scene Graph Generation: Lin Li,

Long Chen,

Yifeng Huang,

Zhimeng Zhang,

Songyang Zhang,

Jun Xiao; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Lin and Chen, Long and Huang, Yifeng and Zhang, Zhimeng and Zhang, Songyang and Xiao, Jun},
  title     = {The Devil Is in the Labels: Noisy Label Correction for Robust Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18869--18878},
}
LAVT: Language-Aware Vision Transformer for Referring Image Segmentation: Zhao Yang,

Jiaqi Wang,

Yansong Tang,

Kai Chen,

Hengshuang Zhao,

Philip H.S. Torr; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Zhao and Wang, Jiaqi and Tang, Yansong and Chen, Kai and Zhao, Hengshuang and Torr, Philip H. S.},
  title     = {{LAVT}: Language-Aware Vision Transformer for Referring Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18155--18165},
}
Video Demoireing With Relation-Based Temporal Consistency: Peng Dai,

Xin Yu,

Lan Ma,

Baoheng Zhang,

Jia Li,

Wenbo Li,

Jiajun Shen,

Xiaojuan Qi; [pdf] [arXiv]
[bibtex]
@InProceedings{Dai_2022_CVPR,
  author    = {Dai, Peng and Yu, Xin and Ma, Lan and Zhang, Baoheng and Li, Jia and Li, Wenbo and Shen, Jiajun and Qi, Xiaojuan},
  title     = {Video Demoireing With Relation-Based Temporal Consistency},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17622--17631},
}
GraFormer: Graph-Oriented Transformer for 3D Pose Estimation: Weixi Zhao,

Weiqiang Wang,

Yunjie Tian; [pdf]
[bibtex]
@InProceedings{Zhao_2022_CVPR,
  author    = {Zhao, Weixi and Wang, Weiqiang and Tian, Yunjie},
  title     = {{GraFormer}: Graph-Oriented Transformer for {3D} Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20438--20447},
}
DeepCurrents: Learning Implicit Representations of Shapes With Boundaries: David Palmer,

Dmitriy Smirnov,

Stephanie Wang,

Albert Chern,

Justin Solomon; [pdf] [arXiv]
[bibtex]
@InProceedings{Palmer_2022_CVPR,
  author    = {Palmer, David and Smirnov, Dmitriy and Wang, Stephanie and Chern, Albert and Solomon, Justin},
  title     = {{DeepCurrents}: Learning Implicit Representations of Shapes With Boundaries},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18665--18675},
}
Zero Experience Required: Plug & Play Modular Transfer Learning for Semantic Visual Navigation: Ziad Al-Halah,

Santhosh Kumar Ramakrishnan,

Kristen Grauman; [pdf] [supp]
[bibtex]
@InProceedings{Al-Halah_2022_CVPR,
  author    = {Al-Halah, Ziad and Ramakrishnan, Santhosh Kumar and Grauman, Kristen},
  title     = {Zero Experience Required: Plug \& Play Modular Transfer Learning for Semantic Visual Navigation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17031--17041},
}
The Wanderings of Odysseus in 3D Scenes: Yan Zhang,

Siyu Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Yan and Tang, Siyu},
  title     = {The Wanderings of {Odysseus} in {3D} Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20481--20491},
}
All-in-One Image Restoration for Unknown Corruption: Boyun Li,

Xiao Liu,

Peng Hu,

Zhongqin Wu,

Jiancheng Lv,

Xi Peng; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Boyun and Liu, Xiao and Hu, Peng and Wu, Zhongqin and Lv, Jiancheng and Peng, Xi},
  title     = {All-in-One Image Restoration for Unknown Corruption},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17452--17462},
}
Optimizing Video Prediction via Video Frame Interpolation: Yue Wu,

Qiang Wen,

Qifeng Chen; [pdf]
[bibtex]
@InProceedings{Wu_2022_CVPR,
  author    = {Wu, Yue and Wen, Qiang and Chen, Qifeng},
  title     = {Optimizing Video Prediction via Video Frame Interpolation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17814--17823},
}
Episodic Memory Question Answering: Samyak Datta,

Sameer Dharur,

Vincent Cartillier,

Ruta Desai,

Mukul Khanna,

Dhruv Batra,

Devi Parikh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Datta_2022_CVPR,
  author    = {Datta, Samyak and Dharur, Sameer and Cartillier, Vincent and Desai, Ruta and Khanna, Mukul and Batra, Dhruv and Parikh, Devi},
  title     = {Episodic Memory Question Answering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19119--19128},
}
Continual Stereo Matching of Continuous Driving Scenes With Growing Architecture: Chenghao Zhang,

Kun Tian,

Bin Fan,

Gaofeng Meng,

Zhaoxiang Zhang,

Chunhong Pan; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Chenghao and Tian, Kun and Fan, Bin and Meng, Gaofeng and Zhang, Zhaoxiang and Pan, Chunhong},
  title     = {Continual Stereo Matching of Continuous Driving Scenes With Growing Architecture},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18901--18910},
}
Learning To Zoom Inside Camera Imaging Pipeline: Chengzhou Tang,

Yuqiang Yang,

Bing Zeng,

Ping Tan,

Shuaicheng Liu; [pdf] [supp]
[bibtex]
@InProceedings{Tang_2022_CVPR,
  author    = {Tang, Chengzhou and Yang, Yuqiang and Zeng, Bing and Tan, Ping and Liu, Shuaicheng},
  title     = {Learning To Zoom Inside Camera Imaging Pipeline},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17552--17561},
}
gDNA: Towards Generative Detailed Neural Avatars: Xu Chen,

Tianjian Jiang,

Jie Song,

Jinlong Yang,

Michael J. Black,

Andreas Geiger,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Xu and Jiang, Tianjian and Song, Jie and Yang, Jinlong and Black, Michael J. and Geiger, Andreas and Hilliges, Otmar},
  title     = {{gDNA}: Towards Generative Detailed Neural Avatars},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20427--20437},
}
Degree-of-Linear-Polarization-Based Color Constancy: Taishi Ono,

Yuhi Kondo,

Legong Sun,

Teppei Kurita,

Yusuke Moriuchi; [pdf] [supp]
[bibtex]
@InProceedings{Ono_2022_CVPR,
  author    = {Ono, Taishi and Kondo, Yuhi and Sun, Legong and Kurita, Teppei and Moriuchi, Yusuke},
  title     = {Degree-of-Linear-Polarization-Based Color Constancy},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {19740--19749},
}
On the Importance of Asymmetry for Siamese Representation Learning: Xiao Wang,

Haoqi Fan,

Yuandong Tian,

Daisuke Kihara,

Xinlei Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Xiao and Fan, Haoqi and Tian, Yuandong and Kihara, Daisuke and Chen, Xinlei},
  title     = {On the Importance of Asymmetry for {Siamese} Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16570--16579},
}
Probing Representation Forgetting in Supervised and Unsupervised Continual Learning: MohammadReza Davari,

Nader Asadi,

Sudhir Mudur,

Rahaf Aljundi,

Eugene Belilovsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Davari_2022_CVPR,
  author    = {Davari, MohammadReza and Asadi, Nader and Mudur, Sudhir and Aljundi, Rahaf and Belilovsky, Eugene},
  title     = {Probing Representation Forgetting in Supervised and Unsupervised Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {16712--16721},
}
DenseCLIP: Language-Guided Dense Prediction With Context-Aware Prompting: Yongming Rao,

Wenliang Zhao,

Guangyi Chen,

Yansong Tang,

Zheng Zhu,

Guan Huang,

Jie Zhou,

Jiwen Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rao_2022_CVPR,
  author    = {Rao, Yongming and Zhao, Wenliang and Chen, Guangyi and Tang, Yansong and Zhu, Zheng and Huang, Guan and Zhou, Jie and Lu, Jiwen},
  title     = {{DenseCLIP}: Language-Guided Dense Prediction With Context-Aware Prompting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18082--18091},
}
JRDB-Act: A Large-Scale Dataset for Spatio-Temporal Action, Social Group and Activity Detection: Mahsa Ehsanpour,

Fatemeh Saleh,

Silvio Savarese,

Ian Reid,

Hamid Rezatofighi; [pdf] [supp]
[bibtex]
@InProceedings{Ehsanpour_2022_CVPR,
  author    = {Ehsanpour, Mahsa and Saleh, Fatemeh and Savarese, Silvio and Reid, Ian and Rezatofighi, Hamid},
  title     = {{JRDB-Act}: A Large-Scale Dataset for Spatio-Temporal Action, Social Group and Activity Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20983--20992},
}
AR-NeRF: Unsupervised Learning of Depth and Defocus Effects From Natural Images With Aperture Rendering Neural Radiance Fields: Takuhiro Kaneko; [pdf] [supp]
[bibtex]
@InProceedings{Kaneko_2022_CVPR,
  author    = {Kaneko, Takuhiro},
  title     = {{AR-NeRF}: Unsupervised Learning of Depth and Defocus Effects From Natural Images With Aperture Rendering Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18387--18397},
}
Decoupling and Recoupling Spatiotemporal Representation for RGB-D-Based Motion Recognition: Benjia Zhou,

Pichao Wang,

Jun Wan,

Yanyan Liang,

Fan Wang,

Du Zhang,

Zhen Lei,

Hao Li,

Rong Jin; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2022_CVPR,
  author    = {Zhou, Benjia and Wang, Pichao and Wan, Jun and Liang, Yanyan and Wang, Fan and Zhang, Du and Lei, Zhen and Li, Hao and Jin, Rong},
  title     = {Decoupling and Recoupling Spatiotemporal Representation for {RGB-D}-Based Motion Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {20154--20163},
}
Towards Robust and Adaptive Motion Forecasting: A Causal Representation Perspective: Yuejiang Liu,

Riccardo Cadei,

Jonas Schweizer,

Sherwin Bahmani,

Alexandre Alahi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Yuejiang and Cadei, Riccardo and Schweizer, Jonas and Bahmani, Sherwin and Alahi, Alexandre},
  title     = {Towards Robust and Adaptive Motion Forecasting: A Causal Representation Perspective},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {17081--17092},
}
Escaping Data Scarcity for High-Resolution Heterogeneous Face Hallucination: Yiqun Mei,

Pengfei Guo,

Vishal M. Patel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mei_2022_CVPR,
  author    = {Mei, Yiqun and Guo, Pengfei and Patel, Vishal M.},
  title     = {Escaping Data Scarcity for High-Resolution Heterogeneous Face Hallucination},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18676--18686},
}
Visual Acoustic Matching: Changan Chen,

Ruohan Gao,

Paul Calamia,

Kristen Grauman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Changan and Gao, Ruohan and Calamia, Paul and Grauman, Kristen},
  title     = {Visual Acoustic Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2022},
  pages     = {18858--18868},
}
Unified Multivariate Gaussian Mixture for Efficient Neural Image Compression: Xiaosu Zhu,

Jingkuan Song,

Lianli Gao,

Feng Zheng,

Heng Tao Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2022_CVPR,
  author    = {Zhu, Xiaosu and Song, Jingkuan and Gao, Lianli and Zheng, Feng and Shen, Heng Tao},
  title     = {Unified Multivariate {Gaussian} Mixture for Efficient Neural Image Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17612--17621},
}
3D Photo Stylization: Learning To Generate Stylized Novel Views From a Single Image: Fangzhou Mu,

Jian Wang,

Yicheng Wu,

Yin Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mu_2022_CVPR,
  author    = {Mu, Fangzhou and Wang, Jian and Wu, Yicheng and Li, Yin},
  title     = {{3D} Photo Stylization: Learning To Generate Stylized Novel Views From a Single Image},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16273--16282},
}
SelfD: Self-Learning Large-Scale Driving Policies From the Web: Jimuyang Zhang,

Ruizhao Zhu,

Eshed Ohn-Bar; [pdf]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Jimuyang and Zhu, Ruizhao and Ohn-Bar, Eshed},
  title     = {{SelfD}: Self-Learning Large-Scale Driving Policies From the Web},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17316--17326},
}
"The Pedestrian Next to the Lamppost" Adaptive Object Graphs for Better Instantaneous Mapping: Avishkar Saha,

Oscar Mendez,

Chris Russell,

Richard Bowden; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saha_2022_CVPR,
  author    = {Saha, Avishkar and Mendez, Oscar and Russell, Chris and Bowden, Richard},
  title     = {``{The} Pedestrian Next to the Lamppost'' Adaptive Object Graphs for Better Instantaneous Mapping},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19528--19537},
}
Surpassing the Human Accuracy: Detecting Gallbladder Cancer From USG Images With Curriculum Learning: Soumen Basu,

Mayank Gupta,

Pratyaksha Rana,

Pankaj Gupta,

Chetan Arora; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Basu_2022_CVPR,
  author    = {Basu, Soumen and Gupta, Mayank and Rana, Pratyaksha and Gupta, Pankaj and Arora, Chetan},
  title     = {Surpassing the Human Accuracy: Detecting Gallbladder Cancer From {USG} Images With Curriculum Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20886--20896},
}
Autofocus for Event Cameras: Shijie Lin,

Yinqiang Zhang,

Lei Yu,

Bin Zhou,

Xiaowei Luo,

Jia Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2022_CVPR,
  author    = {Lin, Shijie and Zhang, Yinqiang and Yu, Lei and Zhou, Bin and Luo, Xiaowei and Pan, Jia},
  title     = {Autofocus for Event Cameras},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16344--16353},
}
Learning Multiple Adverse Weather Removal via Two-Stage Knowledge Learning and Multi-Contrastive Regularization: Toward a Unified Model: Wei-Ting Chen,

Zhi-Kai Huang,

Cheng-Che Tsai,

Hao-Hsiang Yang,

Jian-Jiun Ding,

Sy-Yen Kuo; [pdf]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Wei-Ting and Huang, Zhi-Kai and Tsai, Cheng-Che and Yang, Hao-Hsiang and Ding, Jian-Jiun and Kuo, Sy-Yen},
  title     = {Learning Multiple Adverse Weather Removal via Two-Stage Knowledge Learning and Multi-Contrastive Regularization: Toward a Unified Model},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17653--17662},
}
L-Verse: Bidirectional Generation Between Image and Text: Taehoon Kim,

Gwangmo Song,

Sihaeng Lee,

Sangyun Kim,

Yewon Seo,

Soonyoung Lee,

Seung Hwan Kim,

Honglak Lee,

Kyunghoon Bae; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Taehoon and Song, Gwangmo and Lee, Sihaeng and Kim, Sangyun and Seo, Yewon and Lee, Soonyoung and Kim, Seung Hwan and Lee, Honglak and Bae, Kyunghoon},
  title     = {{L-Verse}: Bidirectional Generation Between Image and Text},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16526--16536},
}
Self-Supervised Learning of Adversarial Example: Towards Good Generalizations for Deepfake Detection: Liang Chen,

Yong Zhang,

Yibing Song,

Lingqiao Liu,

Jue Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Liang and Zhang, Yong and Song, Yibing and Liu, Lingqiao and Wang, Jue},
  title     = {Self-Supervised Learning of Adversarial Example: Towards Good Generalizations for Deepfake Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18710--18719},
}
Ego4D: Around the World in 3,000 Hours of Egocentric Video: Kristen Grauman,

Andrew Westbury,

Eugene Byrne,

Zachary Chavis,

Antonino Furnari,

Rohit Girdhar,

Jackson Hamburger,

Hao Jiang,

Miao Liu,

Xingyu Liu,

Miguel Martin,

Tushar Nagarajan,

Ilija Radosavovic,

Santhosh Kumar Ramakrishnan,

Fiona Ryan,

Jayant Sharma,

Michael Wray,

Mengmeng Xu,

Eric Zhongcong Xu,

Chen Zhao,

Siddhant Bansal,

Dhruv Batra,

Vincent Cartillier,

Sean Crane,

Tien Do,

Morrie Doulaty,

Akshay Erapalli,

Christoph Feichtenhofer,

Adriano Fragomeni,

Qichen Fu,

Abrham Gebreselasie,

Cristina González,

James Hillis,

Xuhua Huang,

Yifei Huang,

Wenqi Jia,

Weslie Khoo,

Jáchym Kolář,

Satwik Kottur,

Anurag Kumar,

Federico Landini,

Chao Li,

Yanghao Li,

Zhenqiang Li,

Karttikeya Mangalam,

Raghava Modhugu,

Jonathan Munro,

Tullie Murrell,

Takumi Nishiyasu,

Will Price,

Paola Ruiz,

Merey Ramazanova,

Leda Sari,

Kiran Somasundaram,

Audrey Southerland,

Yusuke Sugano,

Ruijie Tao,

Minh Vo,

Yuchen Wang,

Xindi Wu,

Takuma Yagi,

Ziwei Zhao,

Yunyi Zhu,

Pablo Arbeláez,

David Crandall,

Dima Damen,

Giovanni Maria Farinella,

Christian Fuegen,

Bernard Ghanem,

Vamsi Krishna Ithapu,

C. V. Jawahar,

Hanbyul Joo,

Kris Kitani,

Haizhou Li,

Richard Newcombe,

Aude Oliva,

Hyun Soo Park,

James M. Rehg,

Yoichi Sato,

Jianbo Shi,

Mike Zheng Shou,

Antonio Torralba,

Lorenzo Torresani,

Mingfei Yan,

Jitendra Malik; [pdf] [supp]
[bibtex]
@InProceedings{Grauman_2022_CVPR,
  author    = {Grauman, Kristen and Westbury, Andrew and Byrne, Eugene and Chavis, Zachary and Furnari, Antonino and Girdhar, Rohit and Hamburger, Jackson and Jiang, Hao and Liu, Miao and Liu, Xingyu and Martin, Miguel and Nagarajan, Tushar and Radosavovic, Ilija and Ramakrishnan, Santhosh Kumar and Ryan, Fiona and Sharma, Jayant and Wray, Michael and Xu, Mengmeng and Xu, Eric Zhongcong and Zhao, Chen and Bansal, Siddhant and Batra, Dhruv and Cartillier, Vincent and Crane, Sean and Do, Tien and Doulaty, Morrie and Erapalli, Akshay and Feichtenhofer, Christoph and Fragomeni, Adriano and Fu, Qichen and Gebreselasie, Abrham and Gonz{\'a}lez, Cristina and Hillis, James and Huang, Xuhua and Huang, Yifei and Jia, Wenqi and Khoo, Weslie and Kol{\'a}{\v{r}}, J{\'a}chym and Kottur, Satwik and Kumar, Anurag and Landini, Federico and Li, Chao and Li, Yanghao and Li, Zhenqiang and Mangalam, Karttikeya and Modhugu, Raghava and Munro, Jonathan and Murrell, Tullie and Nishiyasu, Takumi and Price, Will and Ruiz, Paola and Ramazanova, Merey and Sari, Leda and Somasundaram, Kiran and Southerland, Audrey and Sugano, Yusuke and Tao, Ruijie and Vo, Minh and Wang, Yuchen and Wu, Xindi and Yagi, Takuma and Zhao, Ziwei and Zhu, Yunyi and Arbel{\'a}ez, Pablo and Crandall, David and Damen, Dima and Farinella, Giovanni Maria and Fuegen, Christian and Ghanem, Bernard and Ithapu, Vamsi Krishna and Jawahar, C. V. and Joo, Hanbyul and Kitani, Kris and Li, Haizhou and Newcombe, Richard and Oliva, Aude and Park, Hyun Soo and Rehg, James M. and Sato, Yoichi and Shi, Jianbo and Shou, Mike Zheng and Torralba, Antonio and Torresani, Lorenzo and Yan, Mingfei and Malik, Jitendra},
  title     = {{Ego4D}: Around the World in 3,000 Hours of Egocentric Video},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18995--19012},
}
Self-Supervised Pre-Training of Swin Transformers for 3D Medical Image Analysis: Yucheng Tang,

Dong Yang,

Wenqi Li,

Holger R. Roth,

Bennett Landman,

Daguang Xu,

Vishwesh Nath,

Ali Hatamizadeh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2022_CVPR,
  author    = {Tang, Yucheng and Yang, Dong and Li, Wenqi and Roth, Holger R. and Landman, Bennett and Xu, Daguang and Nath, Vishwesh and Hatamizadeh, Ali},
  title     = {Self-Supervised Pre-Training of {Swin} Transformers for {3D} Medical Image Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20730--20740},
}
Camera-Conditioned Stable Feature Generation for Isolated Camera Supervised Person Re-IDentification: Chao Wu,

Wenhang Ge,

Ancong Wu,

Xiaobin Chang; [pdf] [arXiv]
[bibtex]
@InProceedings{Wu_2022_CVPR,
  author    = {Wu, Chao and Ge, Wenhang and Wu, Ancong and Chang, Xiaobin},
  title     = {Camera-Conditioned Stable Feature Generation for Isolated Camera Supervised Person {Re-IDentification}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20238--20248},
}
Weakly Supervised Semantic Segmentation Using Out-of-Distribution Data: Jungbeom Lee,

Seong Joon Oh,

Sangdoo Yun,

Junsuk Choe,

Eunji Kim,

Sungroh Yoon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR,
  author    = {Lee, Jungbeom and Oh, Seong Joon and Yun, Sangdoo and Choe, Junsuk and Kim, Eunji and Yoon, Sungroh},
  title     = {Weakly Supervised Semantic Segmentation Using Out-of-Distribution Data},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16897--16906},
}
Point-Level Region Contrast for Object Detection Pre-Training: Yutong Bai,

Xinlei Chen,

Alexander Kirillov,

Alan Yuille,

Alexander C. Berg; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bai_2022_CVPR,
  author    = {Bai, Yutong and Chen, Xinlei and Kirillov, Alexander and Yuille, Alan and Berg, Alexander C.},
  title     = {Point-Level Region Contrast for Object Detection Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16061--16070},
}
Spatial-Temporal Parallel Transformer for Arm-Hand Dynamic Estimation: Shuying Liu,

Wenbin Wu,

Jiaxian Wu,

Yue Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Shuying and Wu, Wenbin and Wu, Jiaxian and Lin, Yue},
  title     = {Spatial-Temporal Parallel Transformer for Arm-Hand Dynamic Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20523--20532},
}
Failure Modes of Domain Generalization Algorithms: Tigran Galstyan,

Hrayr Harutyunyan,

Hrant Khachatrian,

Greg Ver Steeg,

Aram Galstyan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Galstyan_2022_CVPR,
  author    = {Galstyan, Tigran and Harutyunyan, Hrayr and Khachatrian, Hrant and {Ver Steeg}, Greg and Galstyan, Aram},
  title     = {Failure Modes of Domain Generalization Algorithms},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19077--19086},
}
Class Similarity Weighted Knowledge Distillation for Continual Semantic Segmentation: Minh Hieu Phan,

The-Anh Ta,

Son Lam Phung,

Long Tran-Thanh,

Abdesselam Bouzerdoum; [pdf]
[bibtex]
@InProceedings{Phan_2022_CVPR,
  author    = {Phan, Minh Hieu and Ta, The-Anh and Phung, Son Lam and Tran-Thanh, Long and Bouzerdoum, Abdesselam},
  title     = {Class Similarity Weighted Knowledge Distillation for Continual Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16866--16875},
}
DAD-3DHeads: A Large-Scale Dense, Accurate and Diverse Dataset for 3D Head Alignment From a Single Image: Tetiana Martyniuk,

Orest Kupyn,

Yana Kurlyak,

Igor Krashenyi,

Jiří Matas,

Viktoriia Sharmanska; [pdf] [supp]
[bibtex]
@InProceedings{Martyniuk_2022_CVPR,
  author    = {Martyniuk, Tetiana and Kupyn, Orest and Kurlyak, Yana and Krashenyi, Igor and Matas, Ji{\v{r}}{\'\i} and Sharmanska, Viktoriia},
  title     = {{DAD-3DHeads}: A Large-Scale Dense, Accurate and Diverse Dataset for {3D} Head Alignment From a Single Image},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20942--20952},
}
vCLIMB: A Novel Video Class Incremental Learning Benchmark: Andrés Villa,

Kumail Alhamoud,

Victor Escorcia,

Fabian Caba,

Juan León Alcázar,

Bernard Ghanem; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Villa_2022_CVPR,
  author    = {Villa, Andr{\'e}s and Alhamoud, Kumail and Escorcia, Victor and Caba, Fabian and Le{\'o}n Alc{\'a}zar, Juan and Ghanem, Bernard},
  title     = {{vCLIMB}: A Novel Video Class Incremental Learning Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19035--19044},
}
Bending Reality: Distortion-Aware Transformers for Adapting to Panoramic Semantic Segmentation: Jiaming Zhang,

Kailun Yang,

Chaoxiang Ma,

Simon Reiß,

Kunyu Peng,

Rainer Stiefelhagen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Jiaming and Yang, Kailun and Ma, Chaoxiang and Rei{\ss}, Simon and Peng, Kunyu and Stiefelhagen, Rainer},
  title     = {Bending Reality: Distortion-Aware Transformers for Adapting to Panoramic Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16917--16927},
}
INS-Conv: Incremental Sparse Convolution for Online 3D Segmentation: Leyao Liu,

Tian Zheng,

Yun-Jou Lin,

Kai Ni,

Lu Fang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Leyao and Zheng, Tian and Lin, Yun-Jou and Ni, Kai and Fang, Lu},
  title     = {{INS-Conv}: Incremental Sparse Convolution for Online {3D} Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18975--18984},
}
Visual Vibration Tomography: Estimating Interior Material Properties From Monocular Video: Berthy T. Feng,

Alexander C. Ogren,

Chiara Daraio,

Katherine L. Bouman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Berthy T. and Ogren, Alexander C. and Daraio, Chiara and Bouman, Katherine L.},
  title     = {Visual Vibration Tomography: Estimating Interior Material Properties From Monocular Video},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16231--16240},
}
Rope3D: The Roadside Perception Dataset for Autonomous Driving and Monocular 3D Object Detection Task: Xiaoqing Ye,

Mao Shu,

Hanyu Li,

Yifeng Shi,

Yingying Li,

Guangjie Wang,

Xiao Tan,

Errui Ding; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2022_CVPR,
  author    = {Ye, Xiaoqing and Shu, Mao and Li, Hanyu and Shi, Yifeng and Li, Yingying and Wang, Guangjie and Tan, Xiao and Ding, Errui},
  title     = {{Rope3D}: The Roadside Perception Dataset for Autonomous Driving and Monocular {3D} Object Detection Task},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21341--21350},
}
Noisy Boundaries: Lemon or Lemonade for Semi-Supervised Instance Segmentation?: Zhenyu Wang,

Yali Li,

Shengjin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR,
  author    = {Wang, Zhenyu and Li, Yali and Wang, Shengjin},
  title     = {Noisy Boundaries: Lemon or Lemonade for Semi-Supervised Instance Segmentation?},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16826--16835},
}
Boosting View Synthesis With Residual Transfer: Xuejian Rong,

Jia-Bin Huang,

Ayush Saraf,

Changil Kim,

Johannes Kopf; [pdf]
[bibtex]
@InProceedings{Rong_2022_CVPR,
  author    = {Rong, Xuejian and Huang, Jia-Bin and Saraf, Ayush and Kim, Changil and Kopf, Johannes},
  title     = {Boosting View Synthesis With Residual Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19760--19769},
}
Think Global, Act Local: Dual-Scale Graph Transformer for Vision-and-Language Navigation: Shizhe Chen,

Pierre-Louis Guhur,

Makarand Tapaswi,

Cordelia Schmid,

Ivan Laptev; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Shizhe and Guhur, Pierre-Louis and Tapaswi, Makarand and Schmid, Cordelia and Laptev, Ivan},
  title     = {Think Global, Act Local: Dual-Scale Graph Transformer for Vision-and-Language Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16537--16547},
}
Towards Layer-Wise Image Vectorization: Xu Ma,

Yuqian Zhou,

Xingqian Xu,

Bin Sun,

Valerii Filev,

Nikita Orlov,

Yun Fu,

Humphrey Shi; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2022_CVPR,
  author    = {Ma, Xu and Zhou, Yuqian and Xu, Xingqian and Sun, Bin and Filev, Valerii and Orlov, Nikita and Fu, Yun and Shi, Humphrey},
  title     = {Towards Layer-Wise Image Vectorization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16314--16323},
}
Scenic: A JAX Library for Computer Vision Research and Beyond: Mostafa Dehghani,

Alexey Gritsenko,

Anurag Arnab,

Matthias Minderer,

Yi Tay; [pdf] [arXiv]
[bibtex]
@InProceedings{Dehghani_2022_CVPR,
  author    = {Dehghani, Mostafa and Gritsenko, Alexey and Arnab, Anurag and Minderer, Matthias and Tay, Yi},
  title     = {Scenic: A {JAX} Library for Computer Vision Research and Beyond},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21393--21398},
}
CNN Filter DB: An Empirical Investigation of Trained Convolutional Filters: Paul Gavrikov,

Janis Keuper; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gavrikov_2022_CVPR,
  author    = {Gavrikov, Paul and Keuper, Janis},
  title     = {{CNN} Filter {DB}: An Empirical Investigation of Trained Convolutional Filters},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19066--19076},
}
ScePT: Scene-Consistent, Policy-Based Trajectory Predictions for Planning: Yuxiao Chen,

Boris Ivanovic,

Marco Pavone; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2022_CVPR,
  author    = {Chen, Yuxiao and Ivanovic, Boris and Pavone, Marco},
  title     = {{ScePT}: Scene-Consistent, Policy-Based Trajectory Predictions for Planning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17103--17112},
}
Deep Saliency Prior for Reducing Visual Distraction: Kfir Aberman,

Junfeng He,

Yossi Gandelsman,

Inbar Mosseri,

David E. Jacobs,

Kai Kohlhoff,

Yael Pritch,

Michael Rubinstein; [pdf] [arXiv]
[bibtex]
@InProceedings{Aberman_2022_CVPR,
  author    = {Aberman, Kfir and He, Junfeng and Gandelsman, Yossi and Mosseri, Inbar and Jacobs, David E. and Kohlhoff, Kai and Pritch, Yael and Rubinstein, Michael},
  title     = {Deep Saliency Prior for Reducing Visual Distraction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19851--19860},
}
Efficient Large-Scale Localization by Global Instance Recognition: Fei Xue,

Ignas Budvytis,

Daniel Olmeda Reino,

Roberto Cipolla; [pdf] [supp]
[bibtex]
@InProceedings{Xue_2022_CVPR,
  author    = {Xue, Fei and Budvytis, Ignas and Olmeda Reino, Daniel and Cipolla, Roberto},
  title     = {Efficient Large-Scale Localization by Global Instance Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17348--17357},
}
Spatial Commonsense Graph for Object Localisation in Partial Scenes: Francesco Giuliari,

Geri Skenderi,

Marco Cristani,

Yiming Wang,

Alessio Del Bue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Giuliari_2022_CVPR,
  author    = {Giuliari, Francesco and Skenderi, Geri and Cristani, Marco and Wang, Yiming and Del Bue, Alessio},
  title     = {Spatial Commonsense Graph for Object Localisation in Partial Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19518--19527},
}
Physically-Guided Disentangled Implicit Rendering for 3D Face Modeling: Zhenyu Zhang,

Yanhao Ge,

Ying Tai,

Weijian Cao,

Renwang Chen,

Kunlin Liu,

Hao Tang,

Xiaoming Huang,

Chengjie Wang,

Zhifeng Xie,

Dongjin Huang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Zhenyu and Ge, Yanhao and Tai, Ying and Cao, Weijian and Chen, Renwang and Liu, Kunlin and Tang, Hao and Huang, Xiaoming and Wang, Chengjie and Xie, Zhifeng and Huang, Dongjin},
  title     = {Physically-Guided Disentangled Implicit Rendering for {3D} Face Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20353--20363},
}
M5Product: Self-Harmonized Contrastive Learning for E-Commercial Multi-Modal Pretraining: Xiao Dong,

Xunlin Zhan,

Yangxin Wu,

Yunchao Wei,

Michael C. Kampffmeyer,

Xiaoyong Wei,

Minlong Lu,

Yaowei Wang,

Xiaodan Liang; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Xiao and Zhan, Xunlin and Wu, Yangxin and Wei, Yunchao and Kampffmeyer, Michael C. and Wei, Xiaoyong and Lu, Minlong and Wang, Yaowei and Liang, Xiaodan},
  title     = {{M5Product}: Self-Harmonized Contrastive Learning for E-Commercial Multi-Modal Pretraining},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21252--21262},
}
On Guiding Visual Attention With Language Specification: Suzanne Petryk,

Lisa Dunlap,

Keyan Nasseri,

Joseph Gonzalez,

Trevor Darrell,

Anna Rohrbach; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Petryk_2022_CVPR,
  author    = {Petryk, Suzanne and Dunlap, Lisa and Nasseri, Keyan and Gonzalez, Joseph and Darrell, Trevor and Rohrbach, Anna},
  title     = {On Guiding Visual Attention With Language Specification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18092--18102},
}
ReSTR: Convolution-Free Referring Image Segmentation Using Transformers: Namyup Kim,

Dongwon Kim,

Cuiling Lan,

Wenjun Zeng,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Namyup and Kim, Dongwon and Lan, Cuiling and Zeng, Wenjun and Kwak, Suha},
  title     = {{ReSTR}: Convolution-Free Referring Image Segmentation Using Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18145--18154},
}
Use All the Labels: A Hierarchical Multi-Label Contrastive Learning Framework: Shu Zhang,

Ran Xu,

Caiming Xiong,

Chetan Ramaiah; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Shu and Xu, Ran and Xiong, Caiming and Ramaiah, Chetan},
  title     = {Use All the Labels: A Hierarchical Multi-Label Contrastive Learning Framework},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16660--16669},
}
SGTR: End-to-End Scene Graph Generation With Transformer: Rongjie Li,

Songyang Zhang,

Xuming He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Rongjie and Zhang, Songyang and He, Xuming},
  title     = {{SGTR}: End-to-End Scene Graph Generation With Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19486--19496},
}
Set-Supervised Action Learning in Procedural Task Videos via Pairwise Order Consistency: Zijia Lu,

Ehsan Elhamifar; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2022_CVPR,
  author    = {Lu, Zijia and Elhamifar, Ehsan},
  title     = {Set-Supervised Action Learning in Procedural Task Videos via Pairwise Order Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19903--19913},
}
DeepFusion: Lidar-Camera Deep Fusion for Multi-Modal 3D Object Detection: Yingwei Li,

Adams Wei Yu,

Tianjian Meng,

Ben Caine,

Jiquan Ngiam,

Daiyi Peng,

Junyang Shen,

Yifeng Lu,

Denny Zhou,

Quoc V. Le,

Alan Yuille,

Mingxing Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Yingwei and Yu, Adams Wei and Meng, Tianjian and Caine, Ben and Ngiam, Jiquan and Peng, Daiyi and Shen, Junyang and Lu, Yifeng and Zhou, Denny and Le, Quoc V. and Yuille, Alan and Tan, Mingxing},
  title     = {{DeepFusion}: Lidar-Camera Deep Fusion for Multi-Modal {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17182--17191},
}
DeepFace-EMD: Re-Ranking Using Patch-Wise Earth Mover's Distance Improves Out-of-Distribution Face Identification: Hai Phan,

Anh Nguyen; [pdf] [supp]
[bibtex]
@InProceedings{Phan_2022_CVPR,
  author    = {Phan, Hai and Nguyen, Anh},
  title     = {{DeepFace-EMD}: Re-Ranking Using Patch-Wise Earth Mover's Distance Improves Out-of-Distribution Face Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20259--20269},
}
General Facial Representation Learning in a Visual-Linguistic Manner: Yinglin Zheng,

Hao Yang,

Ting Zhang,

Jianmin Bao,

Dongdong Chen,

Yangyu Huang,

Lu Yuan,

Dong Chen,

Ming Zeng,

Fang Wen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2022_CVPR,
  author    = {Zheng, Yinglin and Yang, Hao and Zhang, Ting and Bao, Jianmin and Chen, Dongdong and Huang, Yangyu and Yuan, Lu and Chen, Dong and Zeng, Ming and Wen, Fang},
  title     = {General Facial Representation Learning in a Visual-Linguistic Manner},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18697--18709},
}
Improving Segmentation of the Inferior Alveolar Nerve Through Deep Label Propagation: Marco Cipriano,

Stefano Allegretti,

Federico Bolelli,

Federico Pollastri,

Costantino Grana; [pdf]
[bibtex]
@InProceedings{Cipriano_2022_CVPR,
  author    = {Cipriano, Marco and Allegretti, Stefano and Bolelli, Federico and Pollastri, Federico and Grana, Costantino},
  title     = {Improving Segmentation of the Inferior Alveolar Nerve Through Deep Label Propagation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21137--21146},
}
Dual-Shutter Optical Vibration Sensing: Mark Sheinin,

Dorian Chan,

Matthew O'Toole,

Srinivasa G. Narasimhan; [pdf] [supp]
[bibtex]
@InProceedings{Sheinin_2022_CVPR,
  author    = {Sheinin, Mark and Chan, Dorian and O'Toole, Matthew and Narasimhan, Srinivasa G.},
  title     = {Dual-Shutter Optical Vibration Sensing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16324--16333},
}
Interactiveness Field in Human-Object Interactions: Xinpeng Liu,

Yong-Lu Li,

Xiaoqian Wu,

Yu-Wing Tai,

Cewu Lu,

Chi-Keung Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Xinpeng and Li, Yong-Lu and Wu, Xiaoqian and Tai, Yu-Wing and Lu, Cewu and Tang, Chi-Keung},
  title     = {Interactiveness Field in Human-Object Interactions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20113--20122},
}
Self-Supervised Dense Consistency Regularization for Image-to-Image Translation: Minsu Ko,

Eunju Cha,

Sungjoo Suh,

Huijin Lee,

Jae-Joon Han,

Jinwoo Shin,

Bohyung Han; [pdf] [supp]
[bibtex]
@InProceedings{Ko_2022_CVPR,
  author    = {Ko, Minsu and Cha, Eunju and Suh, Sungjoo and Lee, Huijin and Han, Jae-Joon and Shin, Jinwoo and Han, Bohyung},
  title     = {Self-Supervised Dense Consistency Regularization for Image-to-Image Translation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18301--18310},
}
The Devil Is in the Details: Window-Based Attention for Image Compression: Renjie Zou,

Chunfeng Song,

Zhaoxiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zou_2022_CVPR,
  author    = {Zou, Renjie and Song, Chunfeng and Zhang, Zhaoxiang},
  title     = {The Devil Is in the Details: Window-Based Attention for Image Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17492--17501},
}
Category-Aware Transformer Network for Better Human-Object Interaction Detection: Leizhen Dong,

Zhimin Li,

Kunlun Xu,

Zhijun Zhang,

Luxin Yan,

Sheng Zhong,

Xu Zou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2022_CVPR,
  author    = {Dong, Leizhen and Li, Zhimin and Xu, Kunlun and Zhang, Zhijun and Yan, Luxin and Zhong, Sheng and Zou, Xu},
  title     = {Category-Aware Transformer Network for Better Human-Object Interaction Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19538--19547},
}
LARGE: Latent-Based Regression Through GAN Semantics: Yotam Nitzan,

Rinon Gal,

Ofir Brenner,

Daniel Cohen-Or; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nitzan_2022_CVPR,
  author    = {Nitzan, Yotam and Gal, Rinon and Brenner, Ofir and Cohen-Or, Daniel},
  title     = {{LARGE}: Latent-Based Regression Through {GAN} Semantics},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19239--19249},
}
Are Multimodal Transformers Robust to Missing Modality?: Mengmeng Ma,

Jian Ren,

Long Zhao,

Davide Testuggine,

Xi Peng; [pdf] [arXiv]
[bibtex]
@InProceedings{Ma_2022_CVPR,
  author    = {Ma, Mengmeng and Ren, Jian and Zhao, Long and Testuggine, Davide and Peng, Xi},
  title     = {Are Multimodal Transformers Robust to Missing Modality?},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {18177--18186},
}
Fisher Information Guidance for Learned Time-of-Flight Imaging: Jiaqu Li,

Tao Yue,

Sijie Zhao,

Xuemei Hu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiaqu and Yue, Tao and Zhao, Sijie and Hu, Xuemei},
  title     = {Fisher Information Guidance for Learned Time-of-Flight Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16334--16343},
}
VRDFormer: End-to-End Video Visual Relation Detection With Transformers: Sipeng Zheng,

Shizhe Chen,

Qin Jin; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2022_CVPR, author = {Zheng, Sipeng and Chen, Shizhe and Jin, Qin}, title = {{VRDFormer}: End-to-End Video Visual Relation Detection With Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18836--18846} }
CLIPstyler: Image Style Transfer With a Single Text Condition: Gihyun Kwon,

Jong Chul Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kwon_2022_CVPR, author = {Kwon, Gihyun and Ye, Jong Chul}, title = {{CLIPstyler}: Image Style Transfer With a Single Text Condition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18062--18071} }
Ray Priors Through Reprojection: Improving Neural Radiance Fields for Novel View Extrapolation: Jian Zhang,

Yuanqing Zhang,

Huan Fu,

Xiaowei Zhou,

Bowen Cai,

Jinchi Huang,

Rongfei Jia,

Binqiang Zhao,

Xing Tang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR, author = {Zhang, Jian and Zhang, Yuanqing and Fu, Huan and Zhou, Xiaowei and Cai, Bowen and Huang, Jinchi and Jia, Rongfei and Zhao, Binqiang and Tang, Xing}, title = {Ray Priors Through Reprojection: Improving Neural Radiance Fields for Novel View Extrapolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18376--18386} }
Spatio-Temporal Relation Modeling for Few-Shot Action Recognition: Anirudh Thatipelli,

Sanath Narayan,

Salman Khan,

Rao Muhammad Anwer,

Fahad Shahbaz Khan,

Bernard Ghanem; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Thatipelli_2022_CVPR, author = {Thatipelli, Anirudh and Narayan, Sanath and Khan, Salman and Anwer, Rao Muhammad and Khan, Fahad Shahbaz and Ghanem, Bernard}, title = {Spatio-Temporal Relation Modeling for Few-Shot Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19958--19967} }
Pop-Out Motion: 3D-Aware Image Deformation via Learning the Shape Laplacian: Jihyun Lee,

Minhyuk Sung,

Hyunjin Kim,

Tae-Kyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2022_CVPR, author = {Lee, Jihyun and Sung, Minhyuk and Kim, Hyunjin and Kim, Tae-Kyun}, title = {Pop-Out Motion: {3D}-Aware Image Deformation via Learning the Shape {Laplacian}}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18532--18541} }
Towards Noiseless Object Contours for Weakly Supervised Semantic Segmentation: Jing Li,

Junsong Fan,

Zhaoxiang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2022_CVPR, author = {Li, Jing and Fan, Junsong and Zhang, Zhaoxiang}, title = {Towards Noiseless Object Contours for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16856--16865} }
Unsupervised Image-to-Image Translation With Generative Prior: Shuai Yang,

Liming Jiang,

Ziwei Liu,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR, author = {Yang, Shuai and Jiang, Liming and Liu, Ziwei and Loy, Chen Change}, title = {Unsupervised Image-to-Image Translation With Generative Prior}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18332--18341} }
Multi-Marginal Contrastive Learning for Multi-Label Subcellular Protein Localization: Ziyi Liu,

Zengmao Wang,

Bo Du; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2022_CVPR, author = {Liu, Ziyi and Wang, Zengmao and Du, Bo}, title = {Multi-Marginal Contrastive Learning for Multi-Label Subcellular Protein Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20626--20635} }
Predict, Prevent, and Evaluate: Disentangled Text-Driven Image Manipulation Empowered by Pre-Trained Vision-Language Model: Zipeng Xu,

Tianwei Lin,

Hao Tang,

Fu Li,

Dongliang He,

Nicu Sebe,

Radu Timofte,

Luc Van Gool,

Errui Ding; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR, author = {Xu, Zipeng and Lin, Tianwei and Tang, Hao and Li, Fu and He, Dongliang and Sebe, Nicu and Timofte, Radu and Van Gool, Luc and Ding, Errui}, title = {Predict, Prevent, and Evaluate: Disentangled Text-Driven Image Manipulation Empowered by Pre-Trained Vision-Language Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18229--18238} }
RU-Net: Regularized Unrolling Network for Scene Graph Generation: Xin Lin,

Changxing Ding,

Jing Zhang,

Yibing Zhan,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2022_CVPR, author = {Lin, Xin and Ding, Changxing and Zhang, Jing and Zhan, Yibing and Tao, Dacheng}, title = {{RU-Net}: Regularized Unrolling Network for Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19457--19466} }
Integrating Language Guidance Into Vision-Based Deep Metric Learning: Karsten Roth,

Oriol Vinyals,

Zeynep Akata; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Roth_2022_CVPR, author = {Roth, Karsten and Vinyals, Oriol and Akata, Zeynep}, title = {Integrating Language Guidance Into Vision-Based Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16177--16189} }
PartGlot: Learning Shape Part Segmentation From Language Reference Games: Juil Koo,

Ian Huang,

Panos Achlioptas,

Leonidas J. Guibas,

Minhyuk Sung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Koo_2022_CVPR, author = {Koo, Juil and Huang, Ian and Achlioptas, Panos and Guibas, Leonidas J. and Sung, Minhyuk}, title = {{PartGlot}: Learning Shape Part Segmentation From Language Reference Games}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16505--16514} }
DIVeR: Real-Time and Accurate Neural Radiance Fields With Deterministic Integration for Volume Rendering: Liwen Wu,

Jae Yong Lee,

Anand Bhattad,

Yu-Xiong Wang,

David Forsyth; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2022_CVPR, author = {Wu, Liwen and Lee, Jae Yong and Bhattad, Anand and Wang, Yu-Xiong and Forsyth, David}, title = {{DIVeR}: Real-Time and Accurate Neural Radiance Fields With Deterministic Integration for Volume Rendering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16200--16209} }
ContIG: Self-Supervised Multimodal Contrastive Learning for Medical Imaging With Genetics: Aiham Taleb,

Matthias Kirchler,

Remo Monti,

Christoph Lippert; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Taleb_2022_CVPR, author = {Taleb, Aiham and Kirchler, Matthias and Monti, Remo and Lippert, Christoph}, title = {{ContIG}: Self-Supervised Multimodal Contrastive Learning for Medical Imaging With Genetics}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20908--20921} }
Disentangling Visual and Written Concepts in CLIP: Joanna Materzyńska,

Antonio Torralba,

David Bau; [pdf]
[bibtex]
@InProceedings{Materzynska_2022_CVPR, author = {Materzy{\'n}ska, Joanna and Torralba, Antonio and Bau, David}, title = {Disentangling Visual and Written Concepts in {CLIP}}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16410--16419} }
Bilateral Video Magnification Filter: Shoichiro Takeda,

Kenta Niwa,

Mariko Isogawa,

Shinya Shimizu,

Kazuki Okami,

Yushi Aono; [pdf] [supp]
[bibtex]
@InProceedings{Takeda_2022_CVPR, author = {Takeda, Shoichiro and Niwa, Kenta and Isogawa, Mariko and Shimizu, Shinya and Okami, Kazuki and Aono, Yushi}, title = {Bilateral Video Magnification Filter}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17369--17378} }
AdaFocus V2: End-to-End Training of Spatial Dynamic Networks for Video Recognition: Yulin Wang,

Yang Yue,

Yuanze Lin,

Haojun Jiang,

Zihang Lai,

Victor Kulikov,

Nikita Orlov,

Humphrey Shi,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR, author = {Wang, Yulin and Yue, Yang and Lin, Yuanze and Jiang, Haojun and Lai, Zihang and Kulikov, Victor and Orlov, Nikita and Shi, Humphrey and Huang, Gao}, title = {{AdaFocus} {V2}: End-to-End Training of Spatial Dynamic Networks for Video Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20062--20072} }
Neural Mean Discrepancy for Efficient Out-of-Distribution Detection: Xin Dong,

Junfeng Guo,

Ang Li,

Wei-Te Ting,

Cong Liu,

H.T. Kung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2022_CVPR, author = {Dong, Xin and Guo, Junfeng and Li, Ang and Ting, Wei-Te and Liu, Cong and Kung, H. T.}, title = {Neural Mean Discrepancy for Efficient Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19217--19227} }
Time Lens++: Event-Based Frame Interpolation With Parametric Non-Linear Flow and Multi-Scale Fusion: Stepan Tulyakov,

Alfredo Bochicchio,

Daniel Gehrig,

Stamatios Georgoulis,

Yuanyou Li,

Davide Scaramuzza; [pdf] [supp]
[bibtex]
@InProceedings{Tulyakov_2022_CVPR, author = {Tulyakov, Stepan and Bochicchio, Alfredo and Gehrig, Daniel and Georgoulis, Stamatios and Li, Yuanyou and Scaramuzza, Davide}, title = {{Time Lens++}: Event-Based Frame Interpolation With Parametric Non-Linear Flow and Multi-Scale Fusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17755--17764} }
It Is Okay To Not Be Okay: Overcoming Emotional Bias in Affective Image Captioning by Contrastive Data Collection: Youssef Mohamed,

Faizan Farooq Khan,

Kilichbek Haydarov,

Mohamed Elhoseiny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mohamed_2022_CVPR, author = {Mohamed, Youssef and Khan, Faizan Farooq and Haydarov, Kilichbek and Elhoseiny, Mohamed}, title = {It Is Okay To Not Be Okay: Overcoming Emotional Bias in Affective Image Captioning by Contrastive Data Collection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21263--21272} }
Neural Global Shutter: Learn To Restore Video From a Rolling Shutter Camera With Global Reset Feature: Zhixiang Wang,

Xiang Ji,

Jia-Bin Huang,

Shin'ichi Satoh,

Xiao Zhou,

Yinqiang Zheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR, author = {Wang, Zhixiang and Ji, Xiang and Huang, Jia-Bin and Satoh, Shin'ichi and Zhou, Xiao and Zheng, Yinqiang}, title = {Neural Global Shutter: Learn To Restore Video From a Rolling Shutter Camera With Global Reset Feature}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17794--17803} }
DiRA: Discriminative, Restorative, and Adversarial Learning for Self-Supervised Medical Image Analysis: Fatemeh Haghighi,

Mohammad Reza Hosseinzadeh Taher,

Michael B. Gotway,

Jianming Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Haghighi_2022_CVPR, author = {Haghighi, Fatemeh and Taher, Mohammad Reza Hosseinzadeh and Gotway, Michael B. and Liang, Jianming}, title = {{DiRA}: Discriminative, Restorative, and Adversarial Learning for Self-Supervised Medical Image Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20824--20834} }
Open Challenges in Deep Stereo: The Booster Dataset: Pierluigi Zama Ramirez,

Fabio Tosi,

Matteo Poggi,

Samuele Salti,

Stefano Mattoccia,

Luigi Di Stefano; [pdf] [supp]
[bibtex]
@InProceedings{Ramirez_2022_CVPR, author = {Ramirez, Pierluigi Zama and Tosi, Fabio and Poggi, Matteo and Salti, Samuele and Mattoccia, Stefano and Di Stefano, Luigi}, title = {Open Challenges in Deep Stereo: The {Booster} Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21168--21178} }
Self-Supervised Bulk Motion Artifact Removal in Optical Coherence Tomography Angiography: Jiaxiang Ren,

Kicheon Park,

Yingtian Pan,

Haibin Ling; [pdf] [arXiv]
[bibtex]
@InProceedings{Ren_2022_CVPR, author = {Ren, Jiaxiang and Park, Kicheon and Pan, Yingtian and Ling, Haibin}, title = {Self-Supervised Bulk Motion Artifact Removal in Optical Coherence Tomography Angiography}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20617--20625} }
PoseTrack21: A Dataset for Person Search, Multi-Object Tracking and Multi-Person Pose Tracking: Andreas Döring,

Di Chen,

Shanshan Zhang,

Bernt Schiele,

Jürgen Gall; [pdf] [supp]
[bibtex]
@InProceedings{Doring_2022_CVPR, author = {D{\"o}ring, Andreas and Chen, Di and Zhang, Shanshan and Schiele, Bernt and Gall, J{\"u}rgen}, title = {{PoseTrack21}: A Dataset for Person Search, Multi-Object Tracking and Multi-Person Pose Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20963--20972} }
Ithaca365: Dataset and Driving Perception Under Repeated and Challenging Weather Conditions: Carlos A. Diaz-Ruiz,

Youya Xia,

Yurong You,

Jose Nino,

Junan Chen,

Josephine Monica,

Xiangyu Chen,

Katie Luo,

Yan Wang,

Marc Emond,

Wei-Lun Chao,

Bharath Hariharan,

Kilian Q. Weinberger,

Mark Campbell; [pdf] [supp]
[bibtex]
@InProceedings{Diaz-Ruiz_2022_CVPR, author = {Diaz-Ruiz, Carlos A. and Xia, Youya and You, Yurong and Nino, Jose and Chen, Junan and Monica, Josephine and Chen, Xiangyu and Luo, Katie and Wang, Yan and Emond, Marc and Chao, Wei-Lun and Hariharan, Bharath and Weinberger, Kilian Q. and Campbell, Mark}, title = {{Ithaca365}: Dataset and Driving Perception Under Repeated and Challenging Weather Conditions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21383--21392} }
YouMVOS: An Actor-Centric Multi-Shot Video Object Segmentation Dataset: Donglai Wei,

Siddhant Kharbanda,

Sarthak Arora,

Roshan Roy,

Nishant Jain,

Akash Palrecha,

Tanav Shah,

Shray Mathur,

Ritik Mathur,

Abhijay Kemkar,

Anirudh Chakravarthy,

Zudi Lin,

Won-Dong Jang,

Yansong Tang,

Song Bai,

James Tompkin,

Philip H.S. Torr,

Hanspeter Pfister; [pdf]
[bibtex]
@InProceedings{Wei_2022_CVPR, author = {Wei, Donglai and Kharbanda, Siddhant and Arora, Sarthak and Roy, Roshan and Jain, Nishant and Palrecha, Akash and Shah, Tanav and Mathur, Shray and Mathur, Ritik and Kemkar, Abhijay and Chakravarthy, Anirudh and Lin, Zudi and Jang, Won-Dong and Tang, Yansong and Bai, Song and Tompkin, James and Torr, Philip H. S. and Pfister, Hanspeter}, title = {{YouMVOS}: An Actor-Centric Multi-Shot Video Object Segmentation Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21044--21053} }
Rethinking Spatial Invariance of Convolutional Networks for Object Counting: Zhi-Qi Cheng,

Qi Dai,

Hong Li,

Jingkuan Song,

Xiao Wu,

Alexander G. Hauptmann; [pdf]
[bibtex]
@InProceedings{Cheng_2022_CVPR, author = {Cheng, Zhi-Qi and Dai, Qi and Li, Hong and Song, Jingkuan and Wu, Xiao and Hauptmann, Alexander G.}, title = {Rethinking Spatial Invariance of Convolutional Networks for Object Counting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19638--19648} }
Geometric Anchor Correspondence Mining With Uncertainty Modeling for Universal Domain Adaptation: Liang Chen,

Yihang Lou,

Jianzhong He,

Tao Bai,

Minghua Deng; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2022_CVPR, author = {Chen, Liang and Lou, Yihang and He, Jianzhong and Bai, Tao and Deng, Minghua}, title = {Geometric Anchor Correspondence Mining With Uncertainty Modeling for Universal Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16134--16143} }
Coopernaut: End-to-End Driving With Cooperative Perception for Networked Vehicles: Jiaxun Cui,

Hang Qiu,

Dian Chen,

Peter Stone,

Yuke Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cui_2022_CVPR, author = {Cui, Jiaxun and Qiu, Hang and Chen, Dian and Stone, Peter and Zhu, Yuke}, title = {Coopernaut: End-to-End Driving With Cooperative Perception for Networked Vehicles}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17252--17262} }
Few-Shot Keypoint Detection With Uncertainty Learning for Unseen Species: Changsheng Lu,

Piotr Koniusz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2022_CVPR, author = {Lu, Changsheng and Koniusz, Piotr}, title = {Few-Shot Keypoint Detection With Uncertainty Learning for Unseen Species}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19416--19426} }
3D-SPS: Single-Stage 3D Visual Grounding via Referred Point Progressive Selection: Junyu Luo,

Jiahui Fu,

Xianghao Kong,

Chen Gao,

Haibing Ren,

Hao Shen,

Huaxia Xia,

Si Liu; [pdf]
[bibtex]
@InProceedings{Luo_2022_CVPR, author = {Luo, Junyu and Fu, Jiahui and Kong, Xianghao and Gao, Chen and Ren, Haibing and Shen, Hao and Xia, Huaxia and Liu, Si}, title = {{3D-SPS}: Single-Stage {3D} Visual Grounding via Referred Point Progressive Selection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16454--16463} }
Learning Multiple Dense Prediction Tasks From Partially Annotated Data: Wei-Hong Li,

Xialei Liu,

Hakan Bilen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2022_CVPR, author = {Li, Wei-Hong and Liu, Xialei and Bilen, Hakan}, title = {Learning Multiple Dense Prediction Tasks From Partially Annotated Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18879--18889} }
Towards Low-Cost and Efficient Malaria Detection: Waqas Sultani,

Wajahat Nawaz,

Syed Javed,

Muhammad Sohail Danish,

Asma Saadia,

Mohsen Ali; [pdf] [arXiv]
[bibtex]
@InProceedings{Sultani_2022_CVPR, author = {Sultani, Waqas and Nawaz, Wajahat and Javed, Syed and Danish, Muhammad Sohail and Saadia, Asma and Ali, Mohsen}, title = {Towards Low-Cost and Efficient Malaria Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20687--20696} }
Learning Neural Light Fields With Ray-Space Embedding: Benjamin Attal,

Jia-Bin Huang,

Michael Zollhöfer,

Johannes Kopf,

Changil Kim; [pdf] [supp]
[bibtex]
@InProceedings{Attal_2022_CVPR, author = {Attal, Benjamin and Huang, Jia-Bin and Zollh{\"o}fer, Michael and Kopf, Johannes and Kim, Changil}, title = {Learning Neural Light Fields With Ray-Space Embedding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19819--19829} }
Clean Implicit 3D Structure From Noisy 2D STEM Images: Hannah Kniesel,

Timo Ropinski,

Tim Bergner,

Kavitha Shaga Devan,

Clarissa Read,

Paul Walther,

Tobias Ritschel,

Pedro Hermosilla; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kniesel_2022_CVPR, author = {Kniesel, Hannah and Ropinski, Timo and Bergner, Tim and Devan, Kavitha Shaga and Read, Clarissa and Walther, Paul and Ritschel, Tobias and Hermosilla, Pedro}, title = {Clean Implicit {3D} Structure From Noisy {2D} {STEM} Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20762--20772} }
UKPGAN: A General Self-Supervised Keypoint Detector: Yang You,

Wenhai Liu,

Yanjie Ze,

Yong-Lu Li,

Weiming Wang,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{You_2022_CVPR, author = {You, Yang and Liu, Wenhai and Ze, Yanjie and Li, Yong-Lu and Wang, Weiming and Lu, Cewu}, title = {{UKPGAN}: A General Self-Supervised Keypoint Detector}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17042--17051} }
Learning Optimal K-Space Acquisition and Reconstruction Using Physics-Informed Neural Networks: Wei Peng,

Li Feng,

Guoying Zhao,

Fang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Peng_2022_CVPR, author = {Peng, Wei and Feng, Li and Zhao, Guoying and Liu, Fang}, title = {Learning Optimal K-Space Acquisition and Reconstruction Using Physics-Informed Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {20794--20803} }
Raw High-Definition Radar for Multi-Task Learning: Julien Rebut,

Arthur Ouaknine,

Waqas Malik,

Patrick Pérez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rebut_2022_CVPR, author = {Rebut, Julien and Ouaknine, Arthur and Malik, Waqas and P{\'e}rez, Patrick}, title = {Raw High-Definition Radar for Multi-Task Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17021--17030} }
Exploring Set Similarity for Dense Self-Supervised Representation Learning: Zhaoqing Wang,

Qiang Li,

Guoxin Zhang,

Pengfei Wan,

Wen Zheng,

Nannan Wang,

Mingming Gong,

Tongliang Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2022_CVPR, author = {Wang, Zhaoqing and Li, Qiang and Zhang, Guoxin and Wan, Pengfei and Zheng, Wen and Wang, Nannan and Gong, Mingming and Liu, Tongliang}, title = {Exploring Set Similarity for Dense Self-Supervised Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16590--16599} }
ONCE-3DLanes: Building Monocular 3D Lane Detection: Fan Yan,

Ming Nie,

Xinyue Cai,

Jianhua Han,

Hang Xu,

Zhen Yang,

Chaoqiang Ye,

Yanwei Fu,

Michael Bi Mi,

Li Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Yan_2022_CVPR, author = {Yan, Fan and Nie, Ming and Cai, Xinyue and Han, Jianhua and Xu, Hang and Yang, Zhen and Ye, Chaoqiang and Fu, Yanwei and Mi, Michael Bi and Zhang, Li}, title = {{ONCE-3DLanes}: Building Monocular {3D} Lane Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17143--17152} }
Weakly but Deeply Supervised Occlusion-Reasoned Parametric Road Layouts: Buyu Liu,

Bingbing Zhuang,

Manmohan Chandraker; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2022_CVPR, author = {Liu, Buyu and Zhuang, Bingbing and Chandraker, Manmohan}, title = {Weakly but Deeply Supervised Occlusion-Reasoned Parametric Road Layouts}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17000--17009} }
Modulated Contrast for Versatile Image Synthesis: Fangneng Zhan,

Jiahui Zhang,

Yingchen Yu,

Rongliang Wu,

Shijian Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhan_2022_CVPR, author = {Zhan, Fangneng and Zhang, Jiahui and Yu, Yingchen and Wu, Rongliang and Lu, Shijian}, title = {Modulated Contrast for Versatile Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18280--18290} }
Identifying Ambiguous Similarity Conditions via Semantic Matching: Han-Jia Ye,

Yi Shi,

De-Chuan Zhan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2022_CVPR, author = {Ye, Han-Jia and Shi, Yi and Zhan, De-Chuan}, title = {Identifying Ambiguous Similarity Conditions via Semantic Matching}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16610--16619} }
MSTR: Multi-Scale Transformer for End-to-End Human-Object Interaction Detection: Bumsoo Kim,

Jonghwan Mun,

Kyoung-Woon On,

Minchul Shin,

Junhyun Lee,

Eun-Sol Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR, author = {Kim, Bumsoo and Mun, Jonghwan and On, Kyoung-Woon and Shin, Minchul and Lee, Junhyun and Kim, Eun-Sol}, title = {{MSTR}: Multi-Scale Transformer for End-to-End Human-Object Interaction Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {19578--19587} }
DetectorDetective: Investigating the Effects of Adversarial Examples on Object Detectors: Sivapriya Vellaichamy,

Matthew Hull,

Zijie J. Wang,

Nilaksh Das,

ShengYun Peng,

Haekyu Park,

Duen Horng (Polo) Chau; [pdf]
[bibtex]
@InProceedings{Vellaichamy_2022_CVPR, author = {Vellaichamy, Sivapriya and Hull, Matthew and Wang, Zijie J. and Das, Nilaksh and Peng, ShengYun and Park, Haekyu and Chau, Duen Horng (Polo)}, title = {{DetectorDetective}: Investigating the Effects of Adversarial Examples on Object Detectors}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21484--21491} }
EMScore: Evaluating Video Captioning via Coarse-Grained and Fine-Grained Embedding Matching: Yaya Shi,

Xu Yang,

Haiyang Xu,

Chunfeng Yuan,

Bing Li,

Weiming Hu,

Zheng-Jun Zha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2022_CVPR, author = {Shi, Yaya and Yang, Xu and Xu, Haiyang and Yuan, Chunfeng and Li, Bing and Hu, Weiming and Zha, Zheng-Jun}, title = {{EMScore}: Evaluating Video Captioning via Coarse-Grained and Fine-Grained Embedding Matching}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17929--17938} }
SNR-Aware Low-Light Image Enhancement: Xiaogang Xu,

Ruixing Wang,

Chi-Wing Fu,

Jiaya Jia; [pdf]
[bibtex]
@InProceedings{Xu_2022_CVPR, author = {Xu, Xiaogang and Wang, Ruixing and Fu, Chi-Wing and Jia, Jiaya}, title = {{SNR}-Aware Low-Light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17714--17724} }
3D Common Corruptions and Data Augmentation: Oğuzhan Fatih Kar,

Teresa Yeo,

Andrei Atanov,

Amir Zamir; [pdf] [arXiv]
[bibtex]
@InProceedings{Kar_2022_CVPR, author = {Kar, O{\u{g}}uzhan Fatih and Yeo, Teresa and Atanov, Andrei and Zamir, Amir}, title = {{3D} Common Corruptions and Data Augmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18963--18974} }
Injecting Semantic Concepts Into End-to-End Image Captioning: Zhiyuan Fang,

Jianfeng Wang,

Xiaowei Hu,

Lin Liang,

Zhe Gan,

Lijuan Wang,

Yezhou Yang,

Zicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2022_CVPR, author = {Fang, Zhiyuan and Wang, Jianfeng and Hu, Xiaowei and Liang, Lin and Gan, Zhe and Wang, Lijuan and Yang, Yezhou and Liu, Zicheng}, title = {Injecting Semantic Concepts Into End-to-End Image Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18009--18019} }
L2G: A Simple Local-to-Global Knowledge Transfer Framework for Weakly Supervised Semantic Segmentation: Peng-Tao Jiang,

Yuqi Yang,

Qibin Hou,

Yunchao Wei; [pdf] [arXiv]
[bibtex]
@InProceedings{Jiang_2022_CVPR, author = {Jiang, Peng-Tao and Yang, Yuqi and Hou, Qibin and Wei, Yunchao}, title = {{L2G}: A Simple Local-to-Global Knowledge Transfer Framework for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16886--16896} }
VL-InterpreT: An Interactive Visualization Tool for Interpreting Vision-Language Transformers: Estelle Aflalo,

Meng Du,

Shao-Yen Tseng,

Yongfei Liu,

Chenfei Wu,

Nan Duan,

Vasudev Lal; [pdf]
[bibtex]
@InProceedings{Aflalo_2022_CVPR, author = {Aflalo, Estelle and Du, Meng and Tseng, Shao-Yen and Liu, Yongfei and Wu, Chenfei and Duan, Nan and Lal, Vasudev}, title = {{VL-InterpreT}: An Interactive Visualization Tool for Interpreting Vision-Language Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {21406--21415} }
LiDAR Snowfall Simulation for Robust 3D Object Detection: Martin Hahner,

Christos Sakaridis,

Mario Bijelic,

Felix Heide,

Fisher Yu,

Dengxin Dai,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hahner_2022_CVPR, author = {Hahner, Martin and Sakaridis, Christos and Bijelic, Mario and Heide, Felix and Yu, Fisher and Dai, Dengxin and Van Gool, Luc}, title = {{LiDAR} Snowfall Simulation for Robust {3D} Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16364--16374} }
Structural and Statistical Texture Knowledge Distillation for Semantic Segmentation: Deyi Ji,

Haoran Wang,

Mingyuan Tao,

Jianqiang Huang,

Xian-Sheng Hua,

Hongtao Lu; [pdf]
[bibtex]
@InProceedings{Ji_2022_CVPR, author = {Ji, Deyi and Wang, Haoran and Tao, Mingyuan and Huang, Jianqiang and Hua, Xian-Sheng and Lu, Hongtao}, title = {Structural and Statistical Texture Knowledge Distillation for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {16876--16885} }
Blended Diffusion for Text-Driven Editing of Natural Images: Omri Avrahami,

Dani Lischinski,

Ohad Fried; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Avrahami_2022_CVPR, author = {Avrahami, Omri and Lischinski, Dani and Fried, Ohad}, title = {Blended Diffusion for Text-Driven Editing of Natural Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {18208--18218} }
BE-STI: Spatial-Temporal Integrated Network for Class-Agnostic Motion Prediction With Bidirectional Enhancement: Yunlong Wang,

Hongyu Pan,

Jun Zhu,

Yu-Huan Wu,

Xin Zhan,

Kun Jiang,

Diange Yang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2022_CVPR, author = {Wang, Yunlong and Pan, Hongyu and Zhu, Jun and Wu, Yu-Huan and Zhan, Xin and Jiang, Kun and Yang, Diange}, title = {{BE-STI}: Spatial-Temporal Integrated Network for Class-Agnostic Motion Prediction With Bidirectional Enhancement}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2022}, pages = {17093--17102} }
A Structured Dictionary Perspective on Implicit Neural Representations: Gizem Yüce,

Guillermo Ortiz-Jiménez,

Beril Besbinar,

Pascal Frossard; [pdf] [supp]
[bibtex]
@InProceedings{Yuce_2022_CVPR,
  author    = {Y{\"u}ce, Gizem and Ortiz-Jim{\'e}nez, Guillermo and Besbinar, Beril and Frossard, Pascal},
  title     = {A Structured Dictionary Perspective on Implicit Neural Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19228--19238},
}
Learning To Answer Questions in Dynamic Audio-Visual Scenarios: Guangyao Li,

Yake Wei,

Yapeng Tian,

Chenliang Xu,

Ji-Rong Wen,

Di Hu; [pdf] [supp] [arXiv]
[bibtex]
@comment{Review note: the key Li_2022_CVPR is shared with at least two other entries in this file (the "CLIP-Event" and "From Representation to Reasoning" papers). Repeated keys are flagged by BibTeX and Biber, so give each entry a unique key when importing.}
@InProceedings{Li_2022_CVPR,
  author    = {Li, Guangyao and Wei, Yake and Tian, Yapeng and Xu, Chenliang and Wen, Ji-Rong and Hu, Di},
  title     = {Learning To Answer Questions in Dynamic Audio-Visual Scenarios},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19108--19118},
}
Synthetic Aperture Imaging With Events and Frames: Wei Liao,

Xiang Zhang,

Lei Yu,

Shijie Lin,

Wen Yang,

Ning Qiao; [pdf] [supp]
[bibtex]
@InProceedings{Liao_2022_CVPR,
  author    = {Liao, Wei and Zhang, Xiang and Yu, Lei and Lin, Shijie and Yang, Wen and Qiao, Ning},
  title     = {Synthetic Aperture Imaging With Events and Frames},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17735--17744},
}
CLIP-Event: Connecting Text and Images With Event Structures: Manling Li,

Ruochen Xu,

Shuohang Wang,

Luowei Zhou,

Xudong Lin,

Chenguang Zhu,

Michael Zeng,

Heng Ji,

Shih-Fu Chang; [pdf] [supp]
[bibtex]
@comment{Review note: the key Li_2022_CVPR is shared with at least two other entries in this file (the "Learning To Answer Questions in Dynamic Audio-Visual Scenarios" and "From Representation to Reasoning" papers). Repeated keys are flagged by BibTeX and Biber, so give each entry a unique key when importing.}
@InProceedings{Li_2022_CVPR,
  author    = {Li, Manling and Xu, Ruochen and Wang, Shuohang and Zhou, Luowei and Lin, Xudong and Zhu, Chenguang and Zeng, Michael and Ji, Heng and Chang, Shih-Fu},
  title     = {{CLIP-Event}: Connecting Text and Images With Event Structures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16420--16429},
}
Scaling Up Vision-Language Pre-Training for Image Captioning: Xiaowei Hu,

Zhe Gan,

Jianfeng Wang,

Zhengyuan Yang,

Zicheng Liu,

Yumao Lu,

Lijuan Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Hu_2022_CVPR,
  author    = {Hu, Xiaowei and Gan, Zhe and Wang, Jianfeng and Yang, Zhengyuan and Liu, Zicheng and Lu, Yumao and Wang, Lijuan},
  title     = {Scaling Up Vision-Language Pre-Training for Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17980--17989},
}
Unsupervised Action Segmentation by Joint Representation Learning and Online Clustering: Sateesh Kumar,

Sanjay Haresh,

Awais Ahmed,

Andrey Konin,

M. Zeeshan Zia,

Quoc-Huy Tran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kumar_2022_CVPR,
  author    = {Kumar, Sateesh and Haresh, Sanjay and Ahmed, Awais and Konin, Andrey and Zia, M. Zeeshan and Tran, Quoc-Huy},
  title     = {Unsupervised Action Segmentation by Joint Representation Learning and Online Clustering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20174--20185},
}
LISA: Learning Implicit Shape and Appearance of Hands: Enric Corona,

Tomas Hodan,

Minh Vo,

Francesc Moreno-Noguer,

Chris Sweeney,

Richard Newcombe,

Lingni Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Corona_2022_CVPR,
  author    = {Corona, Enric and Hodan, Tomas and Vo, Minh and Moreno-Noguer, Francesc and Sweeney, Chris and Newcombe, Richard and Ma, Lingni},
  title     = {{LISA}: Learning Implicit Shape and Appearance of Hands},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20533--20543},
}
DiGS: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds: Yizhak Ben-Shabat,

Chamin Hewa Koneputugodage,

Stephen Gould; [pdf] [supp]
[bibtex]
@InProceedings{Ben-Shabat_2022_CVPR,
  author    = {Ben-Shabat, Yizhak and Koneputugodage, Chamin Hewa and Gould, Stephen},
  title     = {{DiGS}: Divergence Guided Shape Implicit Neural Representation for Unoriented Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19323--19332},
}
Semi-Supervised Learning of Semantic Correspondence With Pseudo-Labels: Jiwon Kim,

Kwangrok Ryoo,

Junyoung Seo,

Gyuseong Lee,

Daehwan Kim,

Hansang Cho,

Seungryong Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2022_CVPR,
  author    = {Kim, Jiwon and Ryoo, Kwangrok and Seo, Junyoung and Lee, Gyuseong and Kim, Daehwan and Cho, Hansang and Kim, Seungryong},
  title     = {Semi-Supervised Learning of Semantic Correspondence With Pseudo-Labels},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19699--19709},
}
HLRTF: Hierarchical Low-Rank Tensor Factorization for Inverse Problems in Multi-Dimensional Imaging: Yisi Luo,

Xi-Le Zhao,

Deyu Meng,

Tai-Xiang Jiang; [pdf] [supp]
[bibtex]
@comment{Review note: the key Luo_2022_CVPR is shared with at least one other entry in this file (the "Deep Constrained Least Squares for Blind Image Super-Resolution" paper). Repeated keys are flagged by BibTeX and Biber, so give each entry a unique key when importing.}
@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Yisi and Zhao, Xi-Le and Meng, Deyu and Jiang, Tai-Xiang},
  title     = {{HLRTF}: Hierarchical Low-Rank Tensor Factorization for Inverse Problems in Multi-Dimensional Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {19303--19312},
}
FIBA: Frequency-Injection Based Backdoor Attack in Medical Image Analysis: Yu Feng,

Benteng Ma,

Jing Zhang,

Shanshan Zhao,

Yong Xia,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2022_CVPR,
  author    = {Feng, Yu and Ma, Benteng and Zhang, Jing and Zhao, Shanshan and Xia, Yong and Tao, Dacheng},
  title     = {{FIBA}: Frequency-Injection Based Backdoor Attack in Medical Image Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20876--20885},
}
Deep Constrained Least Squares for Blind Image Super-Resolution: Ziwei Luo,

Haibin Huang,

Lei Yu,

Youwei Li,

Haoqiang Fan,

Shuaicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@comment{Review note: the key Luo_2022_CVPR is shared with at least one other entry in this file (the "HLRTF" paper). Repeated keys are flagged by BibTeX and Biber, so give each entry a unique key when importing.}
@InProceedings{Luo_2022_CVPR,
  author    = {Luo, Ziwei and Huang, Haibin and Yu, Lei and Li, Youwei and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {Deep Constrained Least Squares for Blind Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17642--17652},
}
Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning: Chia-Wen Kuo,

Zsolt Kira; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kuo_2022_CVPR,
  author    = {Kuo, Chia-Wen and Kira, Zsolt},
  title     = {Beyond a Pre-Trained Object Detector: Cross-Modal Textual and Visual Context for Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17969--17979},
}
Symmetry-Aware Neural Architecture for Embodied Visual Exploration: Shuang Liu,

Takayuki Okatani; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2022_CVPR,
  author    = {Liu, Shuang and Okatani, Takayuki},
  title     = {Symmetry-Aware Neural Architecture for Embodied Visual Exploration},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17242--17251},
}
From Representation to Reasoning: Towards Both Evidence and Commonsense Reasoning for Video Question-Answering: Jiangtong Li,

Li Niu,

Liqing Zhang; [pdf] [supp] [arXiv]
[bibtex]
@comment{Review note: the key Li_2022_CVPR is shared with at least two other entries in this file (the "Learning To Answer Questions in Dynamic Audio-Visual Scenarios" and "CLIP-Event" papers). Repeated keys are flagged by BibTeX and Biber, so give each entry a unique key when importing.}
@InProceedings{Li_2022_CVPR,
  author    = {Li, Jiangtong and Niu, Li and Zhang, Liqing},
  title     = {From Representation to Reasoning: Towards Both Evidence and Commonsense Reasoning for Video Question-Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {21273--21282},
}
DanceTrack: Multi-Object Tracking in Uniform Appearance and Diverse Motion: Peize Sun,

Jinkun Cao,

Yi Jiang,

Zehuan Yuan,

Song Bai,

Kris Kitani,

Ping Luo; [pdf] [arXiv]
[bibtex]
@InProceedings{Sun_2022_CVPR,
  author    = {Sun, Peize and Cao, Jinkun and Jiang, Yi and Yuan, Zehuan and Bai, Song and Kitani, Kris and Luo, Ping},
  title     = {{DanceTrack}: Multi-Object Tracking in Uniform Appearance and Diverse Motion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20993--21002},
}
Unsupervised Learning of Debiased Representations With Pseudo-Attributes: Seonguk Seo,

Joon-Young Lee,

Bohyung Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Seo_2022_CVPR,
  author    = {Seo, Seonguk and Lee, Joon-Young and Han, Bohyung},
  title     = {Unsupervised Learning of Debiased Representations With Pseudo-Attributes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16742--16751},
}
TubeDETR: Spatio-Temporal Video Grounding With Transformers: Antoine Yang,

Antoine Miech,

Josef Sivic,

Ivan Laptev,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2022_CVPR,
  author    = {Yang, Antoine and Miech, Antoine and Sivic, Josef and Laptev, Ivan and Schmid, Cordelia},
  title     = {{TubeDETR}: Spatio-Temporal Video Grounding With Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16442--16453},
}
SLIC: Self-Supervised Learning With Iterative Clustering for Human Action Videos: Salar Hosseini Khorasgani,

Yuxuan Chen,

Florian Shkurti; [pdf] [supp]
[bibtex]
@InProceedings{Khorasgani_2022_CVPR,
  author    = {Khorasgani, Salar Hosseini and Chen, Yuxuan and Shkurti, Florian},
  title     = {{SLIC}: Self-Supervised Learning With Iterative Clustering for Human Action Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16091--16101},
}
UBnormal: New Benchmark for Supervised Open-Set Video Anomaly Detection: Andra Acsintoae,

Andrei Florescu,

Mariana-Iuliana Georgescu,

Tudor Mare,

Paul Sumedrea,

Radu Tudor Ionescu,

Fahad Shahbaz Khan,

Mubarak Shah; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Acsintoae_2022_CVPR,
  author    = {Acsintoae, Andra and Florescu, Andrei and Georgescu, Mariana-Iuliana and Mare, Tudor and Sumedrea, Paul and Ionescu, Radu Tudor and Khan, Fahad Shahbaz and Shah, Mubarak},
  title     = {{UBnormal}: New Benchmark for Supervised Open-Set Video Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20143--20153},
}
Beyond Cross-View Image Retrieval: Highly Accurate Vehicle Localization Using Satellite Image: Yujiao Shi,

Hongdong Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2022_CVPR,
  author    = {Shi, Yujiao and Li, Hongdong},
  title     = {Beyond Cross-View Image Retrieval: Highly Accurate Vehicle Localization Using Satellite Image},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {17010--17020},
}
Closing the Generalization Gap of Cross-Silo Federated Medical Image Segmentation: An Xu,

Wenqi Li,

Pengfei Guo,

Dong Yang,

Holger R. Roth,

Ali Hatamizadeh,

Can Zhao,

Daguang Xu,

Heng Huang,

Ziyue Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2022_CVPR,
  author    = {Xu, An and Li, Wenqi and Guo, Pengfei and Yang, Dong and Roth, Holger R. and Hatamizadeh, Ali and Zhao, Can and Xu, Daguang and Huang, Heng and Xu, Ziyue},
  title     = {Closing the Generalization Gap of Cross-Silo Federated Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20866--20875},
}
Leverage Your Local and Global Representations: A New Self-Supervised Learning Strategy: Tong Zhang,

Congpei Qiu,

Wei Ke,

Sabine Süsstrunk,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2022_CVPR,
  author    = {Zhang, Tong and Qiu, Congpei and Ke, Wei and S{\"u}sstrunk, Sabine and Salzmann, Mathieu},
  title     = {Leverage Your Local and Global Representations: A New Self-Supervised Learning Strategy},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16580--16589},
}
NeRF in the Dark: High Dynamic Range View Synthesis From Noisy Raw Images: Ben Mildenhall,

Peter Hedman,

Ricardo Martin-Brualla,

Pratul P. Srinivasan,

Jonathan T. Barron; [pdf] [supp]
[bibtex]
@InProceedings{Mildenhall_2022_CVPR,
  author    = {Mildenhall, Ben and Hedman, Peter and Martin-Brualla, Ricardo and Srinivasan, Pratul P. and Barron, Jonathan T.},
  title     = {{NeRF} in the Dark: High Dynamic Range View Synthesis From Noisy Raw Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16190--16199},
}
DArch: Dental Arch Prior-Assisted 3D Tooth Instance Segmentation With Weak Annotations: Liangdong Qiu,

Chongjie Ye,

Pei Chen,

Yunbi Liu,

Xiaoguang Han,

Shuguang Cui; [pdf]
[bibtex]
@InProceedings{Qiu_2022_CVPR,
  author    = {Qiu, Liangdong and Ye, Chongjie and Chen, Pei and Liu, Yunbi and Han, Xiaoguang and Cui, Shuguang},
  title     = {{DArch}: Dental Arch Prior-Assisted {3D} Tooth Instance Segmentation With Weak Annotations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {20752--20761},
}
Globetrotter: Connecting Languages by Connecting Images: Dídac Surís,

Dave Epstein,

Carl Vondrick; [pdf] [supp]
[bibtex]
@InProceedings{Suris_2022_CVPR,
  author    = {Sur{\'\i}s, D{\'\i}dac and Epstein, Dave and Vondrick, Carl},
  title     = {Globetrotter: Connecting Languages by Connecting Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2022},
  pages     = {16474--16484},
}; Back