Papers
- Back
Deep Frequency Filtering for Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Shiqi and Zhang, Zhizheng and Huang, Zhipeng and Lu, Yan and Lan, Cuiling and Chu, Peng and You, Quanzeng and Wang, Jiang and Liu, Zicheng and Parulkar, Amey and Navkal, Viraj and Chen, Zhibo}, title = {Deep Frequency Filtering for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11797--11807} }
Frame Flexible Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Yitian and Bai, Yue and Liu, Chang and Wang, Huan and Li, Sheng and Fu, Yun}, title = {Frame Flexible Network}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10504--10513} }
Unsupervised Cumulative Domain Adaptation for Foggy Scene Optical Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Hanyu and Chang, Yi and Yan, Wending and Yan, Luxin}, title = {Unsupervised Cumulative Domain Adaptation for Foggy Scene Optical Flow}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9569--9578} }
MarS3D: A Plug-and-Play Motion-Aware Model for Semantic Segmentation on Multi-Scan 3D Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Jiahui and Chang, Chirui and Liu, Jianhui and Wu, Xiaoyang and Ma, Lan and Qi, Xiaojuan}, title = {{MarS3D}: A Plug-and-Play Motion-Aware Model for Semantic Segmentation on Multi-Scan {3D} Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9372--9381} }
An Image Quality Assessment Dataset for Portraits-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chahine_2023_CVPR, author = {Chahine, Nicolas and Calarasanu, Stefania and Garcia-Civiero, Davide and Cayla, Th{\'e}o and Ferradans, Sira and Ponce, Jean}, title = {An Image Quality Assessment Dataset for Portraits}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9968--9978} }
Painting 3D Nature in 2D: View Synthesis of Natural Scenes From a Single Semantic Mask-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Shangzhan and Peng, Sida and Chen, Tianrun and Mou, Linzhan and Lin, Haotong and Yu, Kaicheng and Liao, Yiyi and Zhou, Xiaowei}, title = {Painting {3D} Nature in {2D}: View Synthesis of Natural Scenes From a Single Semantic Mask}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8518--8528} }
Fast Point Cloud Generation With Straight Flows-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Lemeng and Wang, Dilin and Gong, Chengyue and Liu, Xingchao and Xiong, Yunyang and Ranjan, Rakesh and Krishnamoorthi, Raghuraman and Chandra, Vikas and Liu, Qiang}, title = {Fast Point Cloud Generation With Straight Flows}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9445--9454} }
Achieving a Better Stability-Plasticity Trade-Off via Auxiliary Networks in Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Sanghwan and Noci, Lorenzo and Orvieto, Antonio and Hofmann, Thomas}, title = {Achieving a Better Stability-Plasticity Trade-Off via Auxiliary Networks in Continual Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11930--11939} }
Video Event Restoration Based on Keyframes for Video Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Zhiwei and Liu, Jing and Wu, Zhaoyang and Wu, Peng and Liu, Xiaotao}, title = {Video Event Restoration Based on Keyframes for Video Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14592--14601} }
EcoTTA: Memory-Efficient Continual Test-Time Adaptation via Self-Distilled Regularization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_CVPR, author = {Song, Junha and Lee, Jungsoo and Kweon, In So and Choi, Sungha}, title = {{EcoTTA}: Memory-Efficient Continual Test-Time Adaptation via Self-Distilled Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11920--11929} }
Tri-Perspective View for Vision-Based 3D Semantic Occupancy Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Yuanhui and Zheng, Wenzhao and Zhang, Yunpeng and Zhou, Jie and Lu, Jiwen}, title = {Tri-Perspective View for Vision-Based {3D} Semantic Occupancy Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9223--9232} }
Castling-ViT: Compressing Self-Attention via Switching Towards Linear-Angular Attention at Vision Transformer Inference-
[pdf]
[supp]
[bibtex]@InProceedings{You_2023_CVPR, author = {You, Haoran and Xiong, Yunyang and Dai, Xiaoliang and Wu, Bichen and Zhang, Peizhao and Fan, Haoqi and Vajda, Peter and Lin, Yingyan (Celine)}, title = {{Castling-ViT}: Compressing Self-Attention via Switching Towards Linear-Angular Attention at Vision Transformer Inference}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14431--14442} }
Rethinking Federated Learning With Domain Shift: A Prototype View-
[pdf]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Wenke and Ye, Mang and Shi, Zekun and Li, He and Du, Bo}, title = {Rethinking Federated Learning With Domain Shift: A Prototype View}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16312--16322} }
HGFormer: Hierarchical Grouping Transformer for Domain Generalized Semantic Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ding_2023_CVPR, author = {Ding, Jian and Xue, Nan and Xia, Gui-Song and Schiele, Bernt and Dai, Dengxin}, title = {{HGFormer}: Hierarchical Grouping Transformer for Domain Generalized Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15413--15423} }
Distilling Vision-Language Pre-Training To Collaborate With Weakly-Supervised Temporal Action Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ju_2023_CVPR, author = {Ju, Chen and Zheng, Kunhao and Liu, Jinxiang and Zhao, Peisen and Zhang, Ya and Chang, Jianlong and Tian, Qi and Wang, Yanfeng}, title = {Distilling Vision-Language Pre-Training To Collaborate With Weakly-Supervised Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14751--14762} }
Augmentation Matters: A Simple-Yet-Effective Approach to Semi-Supervised Semantic Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Zhen and Yang, Lihe and Long, Sifan and Pi, Jimin and Zhou, Luping and Wang, Jingdong}, title = {Augmentation Matters: A Simple-Yet-Effective Approach to Semi-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11350--11359} }
Boosting Verified Training for Robust Image Classifications via Abstraction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Zhaodi and Xue, Zhiyi and Chen, Yang and Liu, Si and Zhang, Yueling and Liu, Jing and Zhang, Min}, title = {Boosting Verified Training for Robust Image Classifications via Abstraction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16251--16260} }
3D Shape Reconstruction of Semi-Transparent Worms-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ilett_2023_CVPR, author = {Ilett, Thomas P. and Yuval, Omer and Ranner, Thomas and Cohen, Netta and Hogg, David C.}, title = {{3D} Shape Reconstruction of Semi-Transparent Worms}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12565--12575} }
Mapping Degeneration Meets Label Evolution: Learning Infrared Small Target Detection With Single Point Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ying_2023_CVPR, author = {Ying, Xinyi and Liu, Li and Wang, Yingqian and Li, Ruojing and Chen, Nuo and Lin, Zaiping and Sheng, Weidong and Zhou, Shilin}, title = {Mapping Degeneration Meets Label Evolution: Learning Infrared Small Target Detection With Single Point Supervision}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15528--15538} }
Swept-Angle Synthetic Wavelength Interferometry-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kotwal_2023_CVPR, author = {Kotwal, Alankar and Levin, Anat and Gkioulekas, Ioannis}, title = {Swept-Angle Synthetic Wavelength Interferometry}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8233--8243} }
Adaptive Global Decay Process for Event Cameras-
[pdf]
[supp]
[bibtex]@InProceedings{Nunes_2023_CVPR, author = {Nunes, Urbano Miguel and Benosman, Ryad and Ieng, Sio-Hoi}, title = {Adaptive Global Decay Process for Event Cameras}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9771--9780} }
Multi-Space Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yin_2023_CVPR, author = {Yin, Ze-Xin and Qiu, Jiaxiong and Cheng, Ming-Ming and Ren, Bo}, title = {Multi-Space Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12407--12416} }
Bitstream-Corrupted JPEG Images Are Restorable: Two-Stage Compensation and Alignment Framework for Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Wenyang and Wang, Yi and Yap, Kim-Hui and Chau, Lap-Pui}, title = {Bitstream-Corrupted {JPEG} Images Are Restorable: Two-Stage Compensation and Alignment Framework for Image Restoration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9979--9988} }
Histopathology Whole Slide Image Analysis With Heterogeneous Graph Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Chan_2023_CVPR, author = {Chan, Tsai Hor and Cendra, Fernando Julio and Ma, Lan and Yin, Guosheng and Yu, Lequan}, title = {Histopathology Whole Slide Image Analysis With Heterogeneous Graph Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15661--15670} }
Towards All-in-One Pre-Training via Maximizing Multi-Modal Mutual Information-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_CVPR, author = {Su, Weijie and Zhu, Xizhou and Tao, Chenxin and Lu, Lewei and Li, Bin and Huang, Gao and Qiao, Yu and Wang, Xiaogang and Zhou, Jie and Dai, Jifeng}, title = {Towards All-in-One Pre-Training via Maximizing Multi-Modal Mutual Information}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15888--15899} }
Aligning Bag of Regions for Open-Vocabulary Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Size and Zhang, Wenwei and Jin, Sheng and Liu, Wentao and Loy, Chen Change}, title = {Aligning Bag of Regions for Open-Vocabulary Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15254--15264} }
Two-View Geometry Scoring Without Correspondences-
[pdf]
[supp]
[bibtex]@InProceedings{Barroso-Laguna_2023_CVPR, author = {Barroso-Laguna, Axel and Brachmann, Eric and Prisacariu, Victor Adrian and Brostow, Gabriel J. and Turmukhambetov, Daniyar}, title = {Two-View Geometry Scoring Without Correspondences}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8979--8989} }
Annealing-Based Label-Transfer Learning for Open World Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_CVPR, author = {Ma, Yuqing and Li, Hainan and Zhang, Zhange and Guo, Jinyang and Zhang, Shanghang and Gong, Ruihao and Liu, Xianglong}, title = {Annealing-Based Label-Transfer Learning for Open World Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11454--11463} }
Self-Supervised Video Forensics by Audio-Visual Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Chao and Chen, Ziyang and Owens, Andrew}, title = {Self-Supervised Video Forensics by Audio-Visual Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10491--10503} }
Class Balanced Adaptive Pseudo Labeling for Federated Semi-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Ming and Li, Qingli and Wang, Yan}, title = {Class Balanced Adaptive Pseudo Labeling for Federated Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16292--16301} }
Rethinking Out-of-Distribution (OOD) Detection: Masked Image Modeling Is All You Need-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Jingyao and Chen, Pengguang and He, Zexin and Yu, Shaozuo and Liu, Shu and Jia, Jiaya}, title = {Rethinking Out-of-Distribution ({OOD}) Detection: Masked Image Modeling Is All You Need}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11578--11589} }
Masked Scene Contrast: A Scalable Framework for Unsupervised 3D Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Xiaoyang and Wen, Xin and Liu, Xihui and Zhao, Hengshuang}, title = {Masked Scene Contrast: A Scalable Framework for Unsupervised {3D} Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9415--9424} }
Multi Domain Learning for Motion Magnification-
[pdf]
[supp]
[bibtex]@InProceedings{Singh_2023_CVPR, author = {Singh, Jasdeep and Murala, Subrahmanyam and Kosuru, G. Sankara Raju}, title = {Multi Domain Learning for Motion Magnification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13914--13923} }
A Simple Baseline for Video Restoration With Grouped Spatial-Temporal Shift-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Dasong and Shi, Xiaoyu and Zhang, Yi and Cheung, Ka Chun and See, Simon and Wang, Xiaogang and Qin, Hongwei and Li, Hongsheng}, title = {A Simple Baseline for Video Restoration With Grouped Spatial-Temporal Shift}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9822--9832} }
itKD: Interchange Transfer-Based Knowledge Distillation for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_CVPR, author = {Cho, Hyeon and Choi, Junyong and Baek, Geonwoo and Hwang, Wonjun}, title = {{itKD}: Interchange Transfer-Based Knowledge Distillation for {3D} Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13540--13549} }
2PCNet: Two-Phase Consistency Training for Day-to-Night Unsupervised Domain Adaptive Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kennerley_2023_CVPR, author = {Kennerley, Mikhail and Wang, Jian-Gang and Veeravalli, Bharadwaj and Tan, Robby T.}, title = {{2PCNet}: Two-Phase Consistency Training for Day-to-Night Unsupervised Domain Adaptive Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11484--11493} }
Panoptic Lifting for 3D Scene Understanding With Neural Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Siddiqui_2023_CVPR, author = {Siddiqui, Yawar and Porzi, Lorenzo and Bul{\`o}, Samuel Rota and M{\"u}ller, Norman and Nie{\ss}ner, Matthias and Dai, Angela and Kontschieder, Peter}, title = {Panoptic Lifting for {3D} Scene Understanding With Neural Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9043--9052} }
WeatherStream: Light Transport Automation of Single Image Deweathering-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Howard and Ba, Yunhao and Yang, Ethan and Mehra, Varan and Gella, Blake and Suzuki, Akira and Pfahnl, Arnold and Chandrappa, Chethan Chinder and Wong, Alex and Kadambi, Achuta}, title = {{WeatherStream}: Light Transport Automation of Single Image Deweathering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13499--13509} }
Learning To Detect Mirrors From Videos via Dual Correspondences-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Jiaying and Tan, Xin and Lau, Rynson W. H.}, title = {Learning To Detect Mirrors From Videos via Dual Correspondences}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9109--9118} }
The Devil Is in the Points: Weakly Semi-Supervised Instance Segmentation via Point-Guided Mask Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Beomyoung and Jeong, Joonhyun and Han, Dongyoon and Hwang, Sung Ju}, title = {The Devil Is in the Points: Weakly Semi-Supervised Instance Segmentation via Point-Guided Mask Representation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11360--11370} }
Language-Guided Audio-Visual Source Separation via Trimodal Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tan_2023_CVPR, author = {Tan, Reuben and Ray, Arijit and Burns, Andrea and Plummer, Bryan A. and Salamon, Justin and Nieto, Oriol and Russell, Bryan and Saenko, Kate}, title = {Language-Guided Audio-Visual Source Separation via Trimodal Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10575--10584} }
DynaMask: Dynamic Mask Selection for Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Ruihuang and He, Chenhang and Li, Shuai and Zhang, Yabin and Zhang, Lei}, title = {{DynaMask}: Dynamic Mask Selection for Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11279--11288} }
SAP-DETR: Bridging the Gap Between Salient Points and Queries-Based Transformer Detector for Fast Model Convergency-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Yang and Zhang, Yao and Wang, Yixin and Zhang, Yang and Tian, Jiang and Shi, Zhongchao and Fan, Jianping and He, Zhiqiang}, title = {{SAP-DETR}: Bridging the Gap Between Salient Points and Queries-Based Transformer Detector for Fast Model Convergency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15539--15547} }
GD-MAE: Generative Decoder for MAE Pre-Training on LiDAR Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Honghui and He, Tong and Liu, Jiaheng and Chen, Hua and Wu, Boxi and Lin, Binbin and He, Xiaofei and Ouyang, Wanli}, title = {{GD-MAE}: Generative Decoder for {MAE} Pre-Training on {LiDAR} Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9403--9414} }
Re-Thinking Model Inversion Attacks Against Deep Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2023_CVPR, author = {Nguyen, Ngoc-Bao and Chandrasegaran, Keshigeyan and Abdollahzadeh, Milad and Cheung, Ngai-Man}, title = {Re-Thinking Model Inversion Attacks Against Deep Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16384--16393} }
You Need Multiple Exiting: Dynamic Early Exiting for Accelerating Unified Vision Language Model-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_CVPR, author = {Tang, Shengkun and Wang, Yaqing and Kong, Zhenglun and Zhang, Tianchi and Li, Yao and Ding, Caiwen and Wang, Yanzhi and Liang, Yi and Xu, Dongkuan}, title = {You Need Multiple Exiting: Dynamic Early Exiting for Accelerating Unified Vision Language Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10781--10791} }
PROB: Probabilistic Objectness for Open World Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zohar_2023_CVPR, author = {Zohar, Orr and Wang, Kuan-Chieh and Yeung, Serena}, title = {{PROB}: Probabilistic Objectness for Open World Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11444--11453} }
SparseFusion: Distilling View-Conditioned Diffusion for 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Zhizhuo and Tulsiani, Shubham}, title = {{SparseFusion}: Distilling View-Conditioned Diffusion for {3D} Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12588--12597} }
Dynamic Focus-Aware Positional Queries for Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_CVPR, author = {He, Haoyu and Cai, Jianfei and Pan, Zizheng and Liu, Jing and Zhang, Jing and Tao, Dacheng and Zhuang, Bohan}, title = {Dynamic Focus-Aware Positional Queries for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11299--11308} }
HARP: Personalized Hand Reconstruction From a Monocular RGB Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Karunratanakul_2023_CVPR, author = {Karunratanakul, Korrawe and Prokudin, Sergey and Hilliges, Otmar and Tang, Siyu}, title = {{HARP}: Personalized Hand Reconstruction From a Monocular {RGB} Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12802--12813} }
DART: Diversify-Aggregate-Repeat Training Improves Generalization of Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jain_2023_CVPR, author = {Jain, Samyak and Addepalli, Sravanti and Sahu, Pawan Kumar and Dey, Priyam and Babu, R. Venkatesh}, title = {{DART}: Diversify-Aggregate-Repeat Training Improves Generalization of Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16048--16059} }
EvShutter: Transforming Events for Unconstrained Rolling Shutter Correction-
[pdf]
[supp]
[bibtex]@InProceedings{Erbach_2023_CVPR, author = {Erbach, Julius and Tulyakov, Stepan and Vitoria, Patricia and Bochicchio, Alfredo and Li, Yuanyou}, title = {{EvShutter}: Transforming Events for Unconstrained Rolling Shutter Correction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13904--13913} }
Ambiguity-Resistant Semi-Supervised Learning for Dense Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Chang and Zhang, Weiming and Lin, Xiangru and Zhang, Wei and Tan, Xiao and Han, Junyu and Li, Xiaomao and Ding, Errui and Wang, Jingdong}, title = {Ambiguity-Resistant Semi-Supervised Learning for Dense Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15579--15588} }
Scalable, Detailed and Mask-Free Universal Photometric Stereo-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ikehata_2023_CVPR, author = {Ikehata, Satoshi}, title = {Scalable, Detailed and Mask-Free Universal Photometric Stereo}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13198--13207} }
Towards High-Quality and Efficient Video Super-Resolution via Spatial-Temporal Data Overfitting-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Gen and Ji, Jie and Qin, Minghai and Niu, Wei and Ren, Bin and Afghah, Fatemeh and Guo, Linke and Ma, Xiaolong}, title = {Towards High-Quality and Efficient Video Super-Resolution via Spatial-Temporal Data Overfitting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10259--10269} }
BiFormer: Vision Transformer With Bi-Level Routing Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR, author = {Zhu, Lei and Wang, Xinjiang and Ke, Zhanghan and Zhang, Wayne and Lau, Rynson W. H.}, title = {{BiFormer}: Vision Transformer With Bi-Level Routing Attention}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10323--10333} }
Class-Incremental Exemplar Compression for Class-Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_CVPR, author = {Luo, Zilin and Liu, Yaoyao and Schiele, Bernt and Sun, Qianru}, title = {Class-Incremental Exemplar Compression for Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11371--11380} }
Behind the Scenes: Density Fields for Single View Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wimbauer_2023_CVPR, author = {Wimbauer, Felix and Yang, Nan and Rupprecht, Christian and Cremers, Daniel}, title = {Behind the Scenes: Density Fields for Single View Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9076--9086} }
StyleGAN Salon: Multi-View Latent Optimization for Pose-Invariant Hairstyle Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khwanmuang_2023_CVPR, author = {Khwanmuang, Sasikarn and Phongthawee, Pakkapon and Sangkloy, Patsorn and Suwajanakorn, Supasorn}, title = {{StyleGAN} Salon: Multi-View Latent Optimization for Pose-Invariant Hairstyle Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8609--8618} }
Resource-Efficient RGBD Aerial Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Jinyu and Gao, Shang and Li, Zhe and Zheng, Feng and Leonardis, Ale{\v{s}}}, title = {Resource-Efficient {RGBD} Aerial Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13374--13383} }
Bilateral Memory Consolidation for Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Nie_2023_CVPR, author = {Nie, Xing and Xu, Shixiong and Liu, Xiyan and Meng, Gaofeng and Huo, Chunlei and Xiang, Shiming}, title = {Bilateral Memory Consolidation for Continual Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16026--16035} }
Search-Map-Search: A Frame Selection Paradigm for Action Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Mingjun and Yu, Yakun and Wang, Xiaoli and Yang, Lei and Niu, Di}, title = {Search-Map-Search: A Frame Selection Paradigm for Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10627--10636} }
Uncovering the Missing Pattern: Unified Framework Towards Trajectory Imputation and Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Yi and Bazarjani, Armin and Chi, Hyung-gun and Choi, Chiho and Fu, Yun}, title = {Uncovering the Missing Pattern: Unified Framework Towards Trajectory Imputation and Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9632--9643} }
FlexiViT: One Model for All Patch Sizes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Beyer_2023_CVPR, author = {Beyer, Lucas and Izmailov, Pavel and Kolesnikov, Alexander and Caron, Mathilde and Kornblith, Simon and Zhai, Xiaohua and Minderer, Matthias and Tschannen, Michael and Alabdulmohsin, Ibrahim and Pavetic, Filip}, title = {{FlexiViT}: One Model for All Patch Sizes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14496--14506} }
Structured Kernel Estimation for Photon-Limited Deconvolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sanghvi_2023_CVPR, author = {Sanghvi, Yash and Mao, Zhiyuan and Chan, Stanley H.}, title = {Structured Kernel Estimation for Photon-Limited Deconvolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9863--9872} }
Frame Interpolation Transformer and Uncertainty Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Plack_2023_CVPR, author = {Plack, Markus and Briedis, Karlis Martins and Djelouah, Abdelaziz and Hullin, Matthias B. and Gross, Markus and Schroers, Christopher}, title = {Frame Interpolation Transformer and Uncertainty Guidance}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9811--9821} }
Neural Preset for Color Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ke_2023_CVPR, author = {Ke, Zhanghan and Liu, Yuhao and Zhu, Lei and Zhao, Nanxuan and Lau, Rynson W. H.}, title = {Neural Preset for Color Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14173--14182} }
Wavelet Diffusion Models Are Fast and Scalable Image Generators-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Phung_2023_CVPR, author = {Phung, Hao and Dao, Quan and Tran, Anh}, title = {Wavelet Diffusion Models Are Fast and Scalable Image Generators}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10199-10208} }
PA&DA: Jointly Sampling Path and Data for Consistent NAS-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2023_CVPR, author = {Lu, Shun and Hu, Yu and Yang, Longxing and Sun, Zihao and Mei, Jilin and Tan, Jianchao and Song, Chengru}, title = {PA\&DA: Jointly Sampling Path and Data for Consistent NAS}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11940-11949} }
3D Spatial Multimodal Knowledge Accumulation for Scene Graph Prediction in Point Cloud-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Mingtao and Hou, Haoran and Zhang, Liang and Wu, Zijie and Guo, Yulan and Mian, Ajmal}, title = {3D Spatial Multimodal Knowledge Accumulation for Scene Graph Prediction in Point Cloud}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9182-9191} }
ViTs for SITS: Vision Transformers for Satellite Image Time Series-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tarasiou_2023_CVPR, author = {Tarasiou, Michail and Chavez, Erik and Zafeiriou, Stefanos}, title = {ViTs for SITS: Vision Transformers for Satellite Image Time Series}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10418-10428} }
Prompt, Generate, Then Cache: Cascade of Foundation Models Makes Strong Few-Shot Learners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Renrui and Hu, Xiangfei and Li, Bohao and Huang, Siyuan and Deng, Hanqiu and Qiao, Yu and Gao, Peng and Li, Hongsheng}, title = {Prompt, Generate, Then Cache: Cascade of Foundation Models Makes Strong Few-Shot Learners}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15211-15222} }
VideoMAE V2: Scaling Video Masked Autoencoders With Dual Masking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Limin and Huang, Bingkun and Zhao, Zhiyu and Tong, Zhan and He, Yinan and Wang, Yi and Wang, Yali and Qiao, Yu}, title = {VideoMAE V2: Scaling Video Masked Autoencoders With Dual Masking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14549-14560} }
Perception and Semantic Aware Regularization for Sequential Confidence Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_CVPR, author = {Peng, Zhenghua and Luo, Yu and Chen, Tianshui and Xu, Keke and Huang, Shuangping}, title = {Perception and Semantic Aware Regularization for Sequential Confidence Calibration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10658-10668} }
Vid2Seq: Large-Scale Pretraining of a Visual Language Model for Dense Video Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Antoine and Nagrani, Arsha and Seo, Paul Hongsuck and Miech, Antoine and Pont-Tuset, Jordi and Laptev, Ivan and Sivic, Josef and Schmid, Cordelia}, title = {Vid2Seq: Large-Scale Pretraining of a Visual Language Model for Dense Video Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10714-10726} }
ERNIE-ViLG 2.0: Improving Text-to-Image Diffusion Model With Knowledge-Enhanced Mixture-of-Denoising-Experts-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Zhida and Zhang, Zhenyu and Yu, Xintong and Fang, Yewei and Li, Lanxin and Chen, Xuyi and Lu, Yuxiang and Liu, Jiaxiang and Yin, Weichong and Feng, Shikun and Sun, Yu and Chen, Li and Tian, Hao and Wu, Hua and Wang, Haifeng}, title = {ERNIE-ViLG 2.0: Improving Text-to-Image Diffusion Model With Knowledge-Enhanced Mixture-of-Denoising-Experts}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10135-10145} }
Revisiting the Stack-Based Inverse Tone Mapping-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Ning and Ye, Yuyao and Zhao, Yang and Wang, Ronggang}, title = {Revisiting the Stack-Based Inverse Tone Mapping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9162-9171} }
Exploiting Completeness and Uncertainty of Pseudo Labels for Weakly Supervised Video Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Chen and Li, Guorong and Qi, Yuankai and Wang, Shuhui and Qing, Laiyun and Huang, Qingming and Yang, Ming-Hsuan}, title = {Exploiting Completeness and Uncertainty of Pseudo Labels for Weakly Supervised Video Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16271-16280} }
Full or Weak Annotations? An Adaptive Strategy for Budget-Constrained Annotation Campaigns-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tejero_2023_CVPR, author = {Tejero, Javier Gamazo and Zinkernagel, Martin S. and Wolf, Sebastian and Sznitman, Raphael and M{\'a}rquez-Neila, Pablo}, title = {Full or Weak Annotations? An Adaptive Strategy for Budget-Constrained Annotation Campaigns}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11381-11391} }
Backdoor Defense via Deconfounded Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Zaixi and Liu, Qi and Wang, Zhicai and Lu, Zepu and Hu, Qingyong}, title = {Backdoor Defense via Deconfounded Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12228-12238} }
HairStep: Transfer Synthetic to Real Using Strand and Depth Maps for Single-View 3D Hair Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_CVPR, author = {Zheng, Yujian and Jin, Zirong and Li, Moran and Huang, Haibin and Ma, Chongyang and Cui, Shuguang and Han, Xiaoguang}, title = {HairStep: Transfer Synthetic to Real Using Strand and Depth Maps for Single-View 3D Hair Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12726-12735} }
MoDAR: Using Motion Forecasting for 3D Object Detection in Point Cloud Sequences-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Yingwei and Qi, Charles R. and Zhou, Yin and Liu, Chenxi and Anguelov, Dragomir}, title = {MoDAR: Using Motion Forecasting for 3D Object Detection in Point Cloud Sequences}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9329-9339} }
ALSO: Automotive Lidar Self-Supervision by Occupancy Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Boulch_2023_CVPR, author = {Boulch, Alexandre and Sautier, Corentin and Michele, Bj{\"o}rn and Puy, Gilles and Marlet, Renaud}, title = {ALSO: Automotive Lidar Self-Supervision by Occupancy Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13455-13465} }
Learning Dynamic Style Kernels for Artistic Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Wenju and Long, Chengjiang and Nie, Yongwei}, title = {Learning Dynamic Style Kernels for Artistic Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10083-10092} }
Chat2Map: Efficient Scene Mapping From Multi-Ego Conversations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Majumder_2023_CVPR, author = {Majumder, Sagnik and Jiang, Hao and Moulon, Pierre and Henderson, Ethan and Calamia, Paul and Grauman, Kristen and Ithapu, Vamsi Krishna}, title = {Chat2Map: Efficient Scene Mapping From Multi-Ego Conversations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10554-10564} }
GeoMAE: Masked Geometric Target Prediction for Self-Supervised Point Cloud Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tian_2023_CVPR, author = {Tian, Xiaoyu and Ran, Haoxi and Wang, Yue and Zhao, Hang}, title = {GeoMAE: Masked Geometric Target Prediction for Self-Supervised Point Cloud Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13570-13580} }
Learning Conditional Attributes for Compositional Zero-Shot Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Qingsheng and Liu, Lingqiao and Jing, Chenchen and Chen, Hao and Liang, Guoqiang and Wang, Peng and Shen, Chunhua}, title = {Learning Conditional Attributes for Compositional Zero-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11197-11206} }
Complete 3D Human Reconstruction From a Single Incomplete Image-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Junying and Yoon, Jae Shin and Wang, Tuanfeng Y. and Singh, Krishna Kumar and Neumann, Ulrich}, title = {Complete 3D Human Reconstruction From a Single Incomplete Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8748-8758} }
PVT-SSD: Single-Stage 3D Object Detector With Point-Voxel Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Honghui and Wang, Wenxiao and Chen, Minghao and Lin, Binbin and He, Tong and Chen, Hua and He, Xiaofei and Ouyang, Wanli}, title = {PVT-SSD: Single-Stage 3D Object Detector With Point-Voxel Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13476-13487} }
Adaptive Human Matting for Dynamic Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Chung-Ching and Wang, Jiang and Luo, Kun and Lin, Kevin and Li, Linjie and Wang, Lijuan and Liu, Zicheng}, title = {Adaptive Human Matting for Dynamic Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10229-10238} }
Learning Common Rationale To Improve Self-Supervised Representation for Fine-Grained Visual Recognition Problems-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shu_2023_CVPR, author = {Shu, Yangyang and van den Hengel, Anton and Liu, Lingqiao}, title = {Learning Common Rationale To Improve Self-Supervised Representation for Fine-Grained Visual Recognition Problems}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11392-11401} }
High-Fidelity 3D Human Digitization From Single 2K Resolution Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_CVPR, author = {Han, Sang-Hun and Park, Min-Gyu and Yoon, Ju Hong and Kang, Ju-Mi and Park, Young-Jae and Jeon, Hae-Gon}, title = {High-Fidelity 3D Human Digitization From Single 2K Resolution Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12869-12879} }
Fully Self-Supervised Depth Estimation From Defocus Clue-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Si_2023_CVPR, author = {Si, Haozhe and Zhao, Bin and Wang, Dong and Gao, Yunpeng and Chen, Mulin and Wang, Zhigang and Li, Xuelong}, title = {Fully Self-Supervised Depth Estimation From Defocus Clue}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9140-9149} }
Prompting Large Language Models With Answer Heuristics for Knowledge-Based Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_CVPR, author = {Shao, Zhenwei and Yu, Zhou and Wang, Meng and Yu, Jun}, title = {Prompting Large Language Models With Answer Heuristics for Knowledge-Based Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14974-14983} }
Improving Robustness of Semantic Segmentation to Motion-Blur Using Class-Centric Augmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Aakanksha_2023_CVPR, author = {Aakanksha and Rajagopalan, A. N.}, title = {Improving Robustness of Semantic Segmentation to Motion-Blur Using Class-Centric Augmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10470-10479} }
Progressive Open Space Expansion for Open-Set Model Attribution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Tianyun and Wang, Danding and Tang, Fan and Zhao, Xinying and Cao, Juan and Tang, Sheng}, title = {Progressive Open Space Expansion for Open-Set Model Attribution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15856-15865} }
Backdoor Cleansing With Unlabeled Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pang_2023_CVPR, author = {Pang, Lu and Sun, Tao and Ling, Haibin and Chen, Chao}, title = {Backdoor Cleansing With Unlabeled Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12218-12227} }
Harmonious Feature Learning for Interactive Hand-Object Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Zhifeng and Ding, Changxing and Yao, Huan and Kuang, Zengsheng and Huang, Shaoli}, title = {Harmonious Feature Learning for Interactive Hand-Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12989-12998} }
CLOTH4D: A Dataset for Clothed Human Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Zou_2023_CVPR, author = {Zou, Xingxing and Han, Xintong and Wong, Waikeung}, title = {CLOTH4D: A Dataset for Clothed Human Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12847-12857} }
Generative Bias for Robust Visual Question Answering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cho_2023_CVPR, author = {Cho, Jae Won and Kim, Dong-Jin and Ryu, Hyeonggon and Kweon, In So}, title = {Generative Bias for Robust Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11681-11690} }
Data-Free Sketch-Based Image Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chaudhuri_2023_CVPR, author = {Chaudhuri, Abhra and Bhunia, Ayan Kumar and Song, Yi-Zhe and Dutta, Anjan}, title = {Data-Free Sketch-Based Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12084-12093} }
Multi-Object Manipulation via Object-Centric Neural Scattering Functions-
[pdf]
[supp]
[bibtex]@InProceedings{Tian_2023_CVPR, author = {Tian, Stephen and Cai, Yancheng and Yu, Hong-Xing and Zakharov, Sergey and Liu, Katherine and Gaidon, Adrien and Li, Yunzhu and Wu, Jiajun}, title = {Multi-Object Manipulation via Object-Centric Neural Scattering Functions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9021-9031} }
The Wisdom of Crowds: Temporal Progressive Attention for Early Action Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stergiou_2023_CVPR, author = {Stergiou, Alexandros and Damen, Dima}, title = {The Wisdom of Crowds: Temporal Progressive Attention for Early Action Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14709-14719} }
Invertible Neural Skinning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kant_2023_CVPR, author = {Kant, Yash and Siarohin, Aliaksandr and Guler, Riza Alp and Chai, Menglei and Ren, Jian and Tulyakov, Sergey and Gilitschenski, Igor}, title = {Invertible Neural Skinning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8715-8725} }
Weakly Supervised Semantic Segmentation via Adversarial Learning of Classifier and Reconstructor-
[pdf]
[supp]
[bibtex]@InProceedings{Kweon_2023_CVPR, author = {Kweon, Hyeokjun and Yoon, Sung-Hoon and Yoon, Kuk-Jin}, title = {Weakly Supervised Semantic Segmentation via Adversarial Learning of Classifier and Reconstructor}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11329-11339} }
Distilling Cross-Temporal Contexts for Continuous Sign Language Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_CVPR, author = {Guo, Leming and Xue, Wanli and Guo, Qing and Liu, Bo and Zhang, Kaihua and Yuan, Tiantian and Chen, Shengyong}, title = {Distilling Cross-Temporal Contexts for Continuous Sign Language Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10771-10780} }
Unsupervised Deep Probabilistic Approach for Partial Point Cloud Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mei_2023_CVPR, author = {Mei, Guofeng and Tang, Hao and Huang, Xiaoshui and Wang, Weijie and Liu, Juan and Zhang, Jian and Van Gool, Luc and Wu, Qiang}, title = {Unsupervised Deep Probabilistic Approach for Partial Point Cloud Registration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13611-13620} }
Similarity Metric Learning for RGB-Infrared Group Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Xiong_2023_CVPR, author = {Xiong, Jianghao and Lai, Jianhuang}, title = {Similarity Metric Learning for RGB-Infrared Group Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13662-13671} }
Train/Test-Time Adaptation With Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zancato_2023_CVPR, author = {Zancato, Luca and Achille, Alessandro and Liu, Tian Yu and Trager, Matthew and Perera, Pramuditha and Soatto, Stefano}, title = {Train/Test-Time Adaptation With Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15911-15921} }
ProxyFormer: Proxy Alignment Assisted Point Cloud Completion With Missing Part Sensitive Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Shanshan and Gao, Pan and Tan, Xiaoyang and Wei, Mingqiang}, title = {ProxyFormer: Proxy Alignment Assisted Point Cloud Completion With Missing Part Sensitive Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9466-9475} }
Mod-Squad: Designing Mixtures of Experts As Modular Multi-Task Learners-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Zitian and Shen, Yikang and Ding, Mingyu and Chen, Zhenfang and Zhao, Hengshuang and Learned-Miller, Erik G. and Gan, Chuang}, title = {Mod-Squad: Designing Mixtures of Experts As Modular Multi-Task Learners}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11828-11837} }
Learning Customized Visual Models With Retrieval-Augmented Knowledge-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Haotian and Son, Kilho and Yang, Jianwei and Liu, Ce and Gao, Jianfeng and Lee, Yong Jae and Li, Chunyuan}, title = {Learning Customized Visual Models With Retrieval-Augmented Knowledge}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15148-15158} }
Run, Don't Walk: Chasing Higher FLOPS for Faster Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Jierun and Kao, Shiu-hong and He, Hao and Zhuo, Weipeng and Wen, Song and Lee, Chul-Ho and Chan, S.-H. Gary}, title = {Run, Don't Walk: Chasing Higher FLOPS for Faster Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12021-12031} }
Learning Procedure-Aware Video Representation From Instructional Videos and Their Narrations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2023_CVPR, author = {Zhong, Yiwu and Yu, Licheng and Bai, Yang and Li, Shangwen and Yan, Xueting and Li, Yin}, title = {Learning Procedure-Aware Video Representation From Instructional Videos and Their Narrations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14825-14835} }
Co-Training 2L Submodels for Visual Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Touvron_2023_CVPR, author = {Touvron, Hugo and Cord, Matthieu and Oquab, Maxime and Bojanowski, Piotr and Verbeek, Jakob and J{\'e}gou, Herv{\'e}}, title = {Co-Training 2L Submodels for Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11701-11710} }
K-Planes: Explicit Radiance Fields in Space, Time, and Appearance-
[pdf]
[supp]
[bibtex]@InProceedings{Fridovich-Keil_2023_CVPR, author = {Fridovich-Keil, Sara and Meanti, Giacomo and Warburg, Frederik Rahb{\ae}k and Recht, Benjamin and Kanazawa, Angjoo}, title = {K-Planes: Explicit Radiance Fields in Space, Time, and Appearance}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12479-12488} }
Multi-Mode Online Knowledge Distillation for Self-Supervised Visual Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_CVPR, author = {Song, Kaiyou and Xie, Jin and Zhang, Shan and Luo, Zimeng}, title = {Multi-Mode Online Knowledge Distillation for Self-Supervised Visual Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11848-11857} }
Viewpoint Equivariance for Multi-View 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Dian and Li, Jie and Guizilini, Vitor and Ambrus, Rares Andrei and Gaidon, Adrien}, title = {Viewpoint Equivariance for Multi-View 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9213-9222} }
A Generalized Framework for Video Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Heo_2023_CVPR, author = {Heo, Miran and Hwang, Sukjun and Hyun, Jeongseok and Kim, Hanjung and Oh, Seoung Wug and Lee, Joon-Young and Kim, Seon Joo}, title = {A Generalized Framework for Video Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14623-14632} }
On Distillation of Guided Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meng_2023_CVPR, author = {Meng, Chenlin and Rombach, Robin and Gao, Ruiqi and Kingma, Diederik and Ermon, Stefano and Ho, Jonathan and Salimans, Tim}, title = {On Distillation of Guided Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14297-14306} }
Disentangled Representation Learning for Unsupervised Neural Quantization-
[pdf]
[bibtex]@InProceedings{Noh_2023_CVPR, author = {Noh, Haechan and Hyun, Sangeek and Jeong, Woojin and Lim, Hanshin and Heo, Jae-Pil}, title = {Disentangled Representation Learning for Unsupervised Neural Quantization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12001-12010} }
Zero-Shot Pose Transfer for Unrigged Stylized 3D Characters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Jiashun and Li, Xueting and Liu, Sifei and De Mello, Shalini and Gallo, Orazio and Wang, Xiaolong and Kautz, Jan}, title = {Zero-Shot Pose Transfer for Unrigged Stylized 3D Characters}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8704-8714} }
Listening Human Behavior: 3D Human Pose Estimation With Acoustic Signals-
[pdf]
[supp]
[bibtex]@InProceedings{Shibata_2023_CVPR, author = {Shibata, Yuto and Kawashima, Yutaka and Isogawa, Mariko and Irie, Go and Kimura, Akisato and Aoki, Yoshimitsu}, title = {Listening Human Behavior: 3D Human Pose Estimation With Acoustic Signals}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13323-13332} }
Meta-Learning With a Geometry-Adaptive Preconditioner-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2023_CVPR, author = {Kang, Suhyun and Hwang, Duhun and Eo, Moonjung and Kim, Taesup and Rhee, Wonjong}, title = {Meta-Learning With a Geometry-Adaptive Preconditioner}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16080-16090} }
NeuralDome: A Neural Modeling Pipeline on Multi-View Human-Object Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Juze and Luo, Haimin and Yang, Hongdi and Xu, Xinru and Wu, Qianyang and Shi, Ye and Yu, Jingyi and Xu, Lan and Wang, Jingya}, title = {NeuralDome: A Neural Modeling Pipeline on Multi-View Human-Object Interactions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8834-8845} }
No One Left Behind: Improving the Worst Categories in Long-Tailed Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_2023_CVPR, author = {Du, Yingxiao and Wu, Jianxin}, title = {No One Left Behind: Improving the Worst Categories in Long-Tailed Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15804-15813} }
Target-Referenced Reactive Grasping for Dynamic Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Jirong and Zhang, Ruo and Fang, Hao-Shu and Gou, Minghao and Fang, Hongjie and Wang, Chenxi and Xu, Sheng and Yan, Hengxu and Lu, Cewu}, title = {Target-Referenced Reactive Grasping for Dynamic Objects}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8824-8833} }
Complexity-Guided Slimmable Decoder for Efficient Deep Video Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_CVPR, author = {Hu, Zhihao and Xu, Dong}, title = {Complexity-Guided Slimmable Decoder for Efficient Deep Video Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14358-14367} }
MarginMatch: Improving Semi-Supervised Learning With Pseudo-Margins-
[pdf]
[supp]
[bibtex]@InProceedings{Sosea_2023_CVPR, author = {Sosea, Tiberiu and Caragea, Cornelia}, title = {MarginMatch: Improving Semi-Supervised Learning With Pseudo-Margins}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15773-15782} }
Beyond Appearance: A Semantic Controllable Self-Supervised Learning Framework for Human-Centric Visual Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Weihua and Xu, Xianzhe and Jia, Jian and Luo, Hao and Wang, Yaohua and Wang, Fan and Jin, Rong and Sun, Xiuyu}, title = {Beyond Appearance: A Semantic Controllable Self-Supervised Learning Framework for Human-Centric Visual Tasks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15050-15061} }
Neural Fourier Filter Bank-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Zhijie and Jin, Yuhe and Yi, Kwang Moo}, title = {Neural Fourier Filter Bank}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14153-14163} }
NeRFInvertor: High Fidelity NeRF-GAN Inversion for Single-Shot Real Image Animation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yin_2023_CVPR, author = {Yin, Yu and Ghasedi, Kamran and Wu, HsiangTao and Yang, Jiaolong and Tong, Xin and Fu, Yun}, title = {NeRFInvertor: High Fidelity NeRF-GAN Inversion for Single-Shot Real Image Animation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8539-8548} }
Trace and Pace: Controllable Pedestrian Animation via Guided Trajectory Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rempe_2023_CVPR, author = {Rempe, Davis and Luo, Zhengyi and Peng, Xue Bin and Yuan, Ye and Kitani, Kris and Kreis, Karsten and Fidler, Sanja and Litany, Or}, title = {Trace and Pace: Controllable Pedestrian Animation via Guided Trajectory Diffusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13756-13766} }
Overlooked Factors in Concept-Based Explanations: Dataset Choice, Concept Learnability, and Human Capability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramaswamy_2023_CVPR, author = {Ramaswamy, Vikram V. and Kim, Sunnie S. Y. and Fong, Ruth and Russakovsky, Olga}, title = {Overlooked Factors in Concept-Based Explanations: Dataset Choice, Concept Learnability, and Human Capability}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10932-10941} }
Unsupervised 3D Shape Reconstruction by Part Retrieval and Assembly-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Xianghao and Guerrero, Paul and Fisher, Matthew and Chaudhuri, Siddhartha and Ritchie, Daniel}, title = {Unsupervised 3D Shape Reconstruction by Part Retrieval and Assembly}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8559-8567} }
SeqTrack: Sequence to Sequence Learning for Visual Object Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Xin and Peng, Houwen and Wang, Dong and Lu, Huchuan and Hu, Han},
  title     = {{SeqTrack}: Sequence to Sequence Learning for Visual Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14572--14581},
}
AutoLabel: CLIP-Based Framework for Open-Set Video Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zara_2023_CVPR,
  author    = {Zara, Giacomo and Roy, Subhankar and Rota, Paolo and Ricci, Elisa},
  title     = {{AutoLabel}: {CLIP}-Based Framework for Open-Set Video Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11504--11513},
}
DINER: Depth-Aware Image-Based NEural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Prinzler_2023_CVPR,
  author    = {Prinzler, Malte and Hilliges, Otmar and Thies, Justus},
  title     = {{DINER}: Depth-Aware Image-Based {NEural} Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12449--12459},
}
Reconstructing Signing Avatars From Video Using Linguistic Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Forte_2023_CVPR,
  author    = {Forte, Maria-Paola and Kulits, Peter and Huang, Chun-Hao P. and Choutas, Vasileios and Tzionas, Dimitrios and Kuchenbecker, Katherine J. and Black, Michael J.},
  title     = {Reconstructing Signing Avatars From Video Using Linguistic Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12791--12801},
}
DeepMapping2: Self-Supervised Large-Scale LiDAR Map Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Chao and Liu, Xinhao and Li, Yiming and Ding, Li and Feng, Chen},
  title     = {{DeepMapping2}: Self-Supervised Large-Scale {LiDAR} Map Optimization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9306--9316},
}
DoNet: Deep De-Overlapping Network for Cytology Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Hao and Zhang, Rushan and Zhou, Yanning and Wang, Yumeng and Chen, Hao},
  title     = {{DoNet}: Deep De-Overlapping Network for Cytology Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15641--15650},
}
Instant Domain Augmentation for LiDAR Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ryu_2023_CVPR,
  author    = {Ryu, Kwonyoung and Hwang, Soonmin and Park, Jaesik},
  title     = {Instant Domain Augmentation for {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9350--9360},
}
A Characteristic Function-Based Method for Bottom-Up Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Qu_2023_CVPR,
  author    = {Qu, Haoxuan and Cai, Yujun and Foo, Lin Geng and Kumar, Ajay and Liu, Jun},
  title     = {A Characteristic Function-Based Method for Bottom-Up Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13009--13018},
}
SceneTrilogy: On Human Scene-Sketch and Its Complementarity With Photo and Text-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chowdhury_2023_CVPR,
  author    = {Chowdhury, Pinaki Nath and Bhunia, Ayan Kumar and Sain, Aneeshan and Koley, Subhadeep and Xiang, Tao and Song, Yi-Zhe},
  title     = {{SceneTrilogy}: On Human Scene-Sketch and Its Complementarity With Photo and Text},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10972--10983},
}
RefSR-NeRF: Towards High Fidelity and Super Resolution View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Xudong and Li, Wei and Hu, Jie and Chen, Hanting and Wang, Yunhe},
  title     = {{RefSR-NeRF}: Towards High Fidelity and Super Resolution View Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8244--8253},
}
Polarimetric iToF: Measuring High-Fidelity Depth Through Scattering Media-
[pdf]
[supp]
[bibtex]@InProceedings{Jeon_2023_CVPR,
  author    = {Jeon, Daniel S. and Meuleman, Andr{\'e}as and Baek, Seung-Hwan and Kim, Min H.},
  title     = {Polarimetric {iToF}: Measuring High-Fidelity Depth Through Scattering Media},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12353--12362},
}
Mobile User Interface Element Detection via Adaptively Prompt Tuning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gu_2023_CVPR,
  author    = {Gu, Zhangxuan and Xu, Zhuoer and Chen, Haoxing and Lan, Jun and Meng, Changhua and Wang, Weiqiang},
  title     = {Mobile User Interface Element Detection via Adaptively Prompt Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11155--11164},
}
Sparse Multi-Modal Graph Transformer With Shared-Context Processing for Representation Learning of Giga-Pixel Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakhli_2023_CVPR,
  author    = {Nakhli, Ramin and Moghadam, Puria Azadi and Mi, Haoyang and Farahani, Hossein and Baras, Alexander and Gilks, Blake and Bashashati, Ali},
  title     = {Sparse Multi-Modal Graph Transformer With Shared-Context Processing for Representation Learning of Giga-Pixel Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11547--11557},
}
Generating Human Motion From Textual Descriptions With Discrete Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Jianrong and Zhang, Yangsong and Cun, Xiaodong and Zhang, Yong and Zhao, Hongwei and Lu, Hongtao and Shen, Xi and Shan, Ying},
  title     = {Generating Human Motion From Textual Descriptions With Discrete Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14730--14740},
}
Spatial-Temporal Concept Based Explanation of 3D ConvNets-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ji_2023_CVPR,
  author    = {Ji, Ying and Wang, Yu and Kato, Jien},
  title     = {Spatial-Temporal Concept Based Explanation of {3D} {ConvNets}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15444--15453},
}
Robust Test-Time Adaptation in Dynamic Scenarios-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_CVPR,
  author    = {Yuan, Longhui and Xie, Binhui and Li, Shuang},
  title     = {Robust Test-Time Adaptation in Dynamic Scenarios},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15922--15932},
}
Global and Local Mixture Consistency Cumulative Learning for Long-Tailed Visual Recognitions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_2023_CVPR,
  author    = {Du, Fei and Yang, Peng and Jia, Qi and Nan, Fengtao and Chen, Xiaoting and Yang, Yun},
  title     = {Global and Local Mixture Consistency Cumulative Learning for Long-Tailed Visual Recognitions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15814--15823},
}
NIRVANA: Neural Implicit Representations of Videos With Adaptive Networks and Autoregressive Patch-Wise Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Maiya_2023_CVPR,
  author    = {Maiya, Shishira R. and Girish, Sharath and Ehrlich, Max and Wang, Hanyu and Lee, Kwot Sin and Poirson, Patrick and Wu, Pengxiang and Wang, Chen and Shrivastava, Abhinav},
  title     = {{NIRVANA}: Neural Implicit Representations of Videos With Adaptive Networks and Autoregressive Patch-Wise Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14378--14387},
}
Collaboration Helps Camera Overtake LiDAR in 3D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Yue and Lu, Yifan and Xu, Runsheng and Xie, Weidi and Chen, Siheng and Wang, Yanfeng},
  title     = {Collaboration Helps Camera Overtake {LiDAR} in {3D} Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9243--9252},
}
ReCo: Region-Controlled Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Zhengyuan and Wang, Jianfeng and Gan, Zhe and Li, Linjie and Lin, Kevin and Wu, Chenfei and Duan, Nan and Liu, Zicheng and Liu, Ce and Zeng, Michael and Wang, Lijuan},
  title     = {{ReCo}: Region-Controlled Text-to-Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14246--14255},
}
Fix the Noise: Disentangling Source Feature for Controllable Domain Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Dongyeun and Lee, Jae Young and Kim, Doyeon and Choi, Jaehyun and Yoo, Jaejun and Kim, Junmo},
  title     = {Fix the Noise: Disentangling Source Feature for Controllable Domain Translation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14224--14234},
}
Sparsely Annotated Semantic Segmentation With Adaptive Gaussian Mixtures-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Linshan and Zhong, Zhun and Fang, Leyuan and He, Xingxin and Liu, Qiang and Ma, Jiayi and Chen, Hao},
  title     = {Sparsely Annotated Semantic Segmentation With Adaptive {Gaussian} Mixtures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15454--15464},
}
Diversity-Aware Meta Visual Prompting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Qidong and Dong, Xiaoyi and Chen, Dongdong and Zhang, Weiming and Wang, Feifei and Hua, Gang and Yu, Nenghai},
  title     = {Diversity-Aware Meta Visual Prompting},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10878--10887},
}
FaceLit: Neural 3D Relightable Faces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ranjan_2023_CVPR,
  author    = {Ranjan, Anurag and Yi, Kwang Moo and Chang, Jen-Hao Rick and Tuzel, Oncel},
  title     = {{FaceLit}: Neural {3D} Relightable Faces},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8619--8628},
}
Visual Programming: Compositional Visual Reasoning Without Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2023_CVPR,
  author    = {Gupta, Tanmay and Kembhavi, Aniruddha},
  title     = {Visual Programming: Compositional Visual Reasoning Without Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14953--14962},
}
Real-Time Evaluation in Online Continual Learning: A New Hope-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghunaim_2023_CVPR,
  author    = {Ghunaim, Yasir and Bibi, Adel and Alhamoud, Kumail and Alfarra, Motasem and Al Kader Hammoud, Hasan Abed and Prabhu, Ameya and Torr, Philip H. S. and Ghanem, Bernard},
  title     = {Real-Time Evaluation in Online Continual Learning: A New Hope},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11888--11897},
}
BAAM: Monocular 3D Pose and Shape Reconstruction With Bi-Contextual Attention Module and Attention-Guided Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Hyo-Jun and Kim, Hanul and Choi, Su-Min and Jeong, Seong-Gyun and Koh, Yeong Jun},
  title     = {{BAAM}: Monocular {3D} Pose and Shape Reconstruction With Bi-Contextual Attention Module and Attention-Guided Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9011--9020},
}
Freestyle Layout-to-Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xue_2023_CVPR,
  author    = {Xue, Han and Huang, Zhiwu and Sun, Qianru and Song, Li and Zhang, Wenjun},
  title     = {Freestyle Layout-to-Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14256--14266},
}
Visual Dependency Transformers: Dependency Tree Emerges From Reversed Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_CVPR,
  author    = {Ding, Mingyu and Shen, Yikang and Fan, Lijie and Chen, Zhenfang and Chen, Zitian and Luo, Ping and Tenenbaum, Joshua B. and Gan, Chuang},
  title     = {Visual Dependency Transformers: Dependency Tree Emerges From Reversed Attention},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14528--14539},
}
Differentiable Architecture Search With Random Features-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Xuanyang and Li, Yonggang and Zhang, Xiangyu and Wang, Yongtao and Sun, Jian},
  title     = {Differentiable Architecture Search With Random Features},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16060--16069},
}
Enhanced Stable View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jain_2023_CVPR,
  author    = {Jain, Nishant and Kumar, Suryansh and Van Gool, Luc},
  title     = {Enhanced Stable View Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13208--13217},
}
Breaching FedMD: Image Recovery via Paired-Logits Inversion Attack-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Takahashi_2023_CVPR,
  author    = {Takahashi, Hideaki and Liu, Jingjing and Liu, Yang},
  title     = {Breaching {FedMD}: Image Recovery via Paired-Logits Inversion Attack},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12198--12207},
}
Biomechanics-Guided Facial Action Unit Detection Through Force Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Cui_2023_CVPR,
  author    = {Cui, Zijun and Kuang, Chenyi and Gao, Tian and Talamadupula, Kartik and Ji, Qiang},
  title     = {Biomechanics-Guided Facial Action Unit Detection Through Force Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8694--8703},
}
Equiangular Basis Vectors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2023_CVPR,
  author    = {Shen, Yang and Sun, Xuhao and Wei, Xiu-Shen},
  title     = {Equiangular Basis Vectors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11755--11765},
}
Cross-Guided Optimization of Radiance Fields With Multi-View Image Super-Resolution for High-Resolution Novel View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2023_CVPR,
  author    = {Yoon, Youngho and Yoon, Kuk-Jin},
  title     = {Cross-Guided Optimization of Radiance Fields With Multi-View Image Super-Resolution for High-Resolution Novel View Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12428--12438},
}
Unified Pose Sequence Modeling-
[pdf]
[bibtex]@InProceedings{Foo_2023_CVPR,
  author    = {Foo, Lin Geng and Li, Tianjiao and Rahmani, Hossein and Ke, Qiuhong and Liu, Jun},
  title     = {Unified Pose Sequence Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13019--13030},
}
Probability-Based Global Cross-Modal Upsampling for Pansharpening-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Zeyu and Cao, Xiangyong and Zhou, Man and Huang, Junhao and Meng, Deyu},
  title     = {Probability-Based Global Cross-Modal Upsampling for Pansharpening},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14039--14048},
}
FAC: 3D Representation Learning via Foreground Aware Feature Contrast-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Kangcheng and Xiao, Aoran and Zhang, Xiaoqin and Lu, Shijian and Shao, Ling},
  title     = {{FAC}: {3D} Representation Learning via Foreground Aware Feature Contrast},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9476--9485},
}
Improving Visual Representation Learning Through Perceptual Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tukra_2023_CVPR,
  author    = {Tukra, Samyakh and Hoffman, Frederick and Chatfield, Ken},
  title     = {Improving Visual Representation Learning Through Perceptual Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14486--14495},
}
Learning Bottleneck Concepts in Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Bowen and Li, Liangzhi and Nakashima, Yuta and Nagahara, Hajime},
  title     = {Learning Bottleneck Concepts in Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10962--10971},
}
Inversion-Based Style Transfer With Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Yuxin and Huang, Nisha and Tang, Fan and Huang, Haibin and Ma, Chongyang and Dong, Weiming and Xu, Changsheng},
  title     = {Inversion-Based Style Transfer With Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10146--10156},
}
Learning Imbalanced Data With Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Zhengzhuo and Liu, Ruikang and Yang, Shuo and Chai, Zenghao and Yuan, Chun},
  title     = {Learning Imbalanced Data With Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15793--15803},
}
PHA: Patch-Wise High-Frequency Augmentation for Transformer-Based Person Re-Identification-
[pdf]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Guiwei and Zhang, Yongfei and Zhang, Tianyu and Li, Bo and Pu, Shiliang},
  title     = {{PHA}: Patch-Wise High-Frequency Augmentation for Transformer-Based Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14133--14142},
}
Learning Instance-Level Representation for Large-Scale Multi-Modal Pretraining in E-Commerce-
[pdf]
[supp]
[bibtex]@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Yang and Li, Yongzhi and Yuan, Zehuan and Mu, Yadong},
  title     = {Learning Instance-Level Representation for Large-Scale Multi-Modal Pretraining in E-Commerce},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11060--11069},
}
Conditional Text Image Generation With Diffusion Models-
[pdf]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Yuanzhi and Li, Zhaohai and Wang, Tianwei and He, Mengchao and Yao, Cong},
  title     = {Conditional Text Image Generation With Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14235--14245},
}
AnchorFormer: Point Cloud Completion From Discriminative Nodes-
[pdf]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Zhikai and Long, Fuchen and Qiu, Zhaofan and Yao, Ting and Zhou, Wengang and Luo, Jiebo and Mei, Tao},
  title     = {{AnchorFormer}: Point Cloud Completion From Discriminative Nodes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13581--13590},
}
Co-SLAM: Joint Coordinate and Sparse Parametric Encodings for Neural Real-Time SLAM-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Hengyi and Wang, Jingwen and Agapito, Lourdes},
  title     = {{Co-SLAM}: Joint Coordinate and Sparse Parametric Encodings for Neural Real-Time {SLAM}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13293--13302},
}
Regularization of Polynomial Networks for Image Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chrysos_2023_CVPR,
  author    = {Chrysos, Grigorios G. and Wang, Bohan and Deng, Jiankang and Cevher, Volkan},
  title     = {Regularization of Polynomial Networks for Image Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16123--16132},
}
EfficientViT: Memory Efficient Vision Transformer With Cascaded Group Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xinyu and Peng, Houwen and Zheng, Ningxin and Yang, Yuqing and Hu, Han and Yuan, Yixuan},
  title     = {{EfficientViT}: Memory Efficient Vision Transformer With Cascaded Group Attention},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14420--14430},
}
DiffCollage: Parallel Generation of Large Content With Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Qinsheng and Song, Jiaming and Huang, Xun and Chen, Yongxin and Liu, Ming-Yu},
  title     = {{DiffCollage}: Parallel Generation of Large Content With Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10188--10198},
}
Efficient Second-Order Plane Adjustment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Lipu},
  title     = {Efficient Second-Order Plane Adjustment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13113--13121},
}
Mofusion: A Framework for Denoising-Diffusion-Based Motion Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dabral_2023_CVPR,
  author    = {Dabral, Rishabh and Mughal, Muhammad Hamza and Golyanik, Vladislav and Theobalt, Christian},
  title     = {Mofusion: A Framework for Denoising-Diffusion-Based Motion Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9760--9770},
}
PoseFormerV2: Exploring Frequency Domain for Efficient and Robust 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Qitao and Zheng, Ce and Liu, Mengyuan and Wang, Pichao and Chen, Chen},
  title     = {{PoseFormerV2}: Exploring Frequency Domain for Efficient and Robust {3D} Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8877--8886},
}
Mask3D: Pre-Training 2D Vision Transformers by Learning Masked 3D Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hou_2023_CVPR,
  author    = {Hou, Ji and Dai, Xiaoliang and He, Zijian and Dai, Angela and Nie{\ss}ner, Matthias},
  title     = {{Mask3D}: Pre-Training {2D} Vision Transformers by Learning Masked {3D} Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13510--13519},
}
Physically Adversarial Infrared Patches With Learnable Shapes and Locations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Xingxing and Yu, Jie and Huang, Yao},
  title     = {Physically Adversarial Infrared Patches With Learnable Shapes and Locations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12334--12342},
}
Exemplar-FreeSOLO: Enhancing Unsupervised Instance Segmentation With Exemplars-
[pdf]
[supp]
[bibtex]@InProceedings{Ishtiak_2023_CVPR,
  author    = {Ishtiak, Taoseef and En, Qing and Guo, Yuhong},
  title     = {{Exemplar-FreeSOLO}: Enhancing Unsupervised Instance Segmentation With Exemplars},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15424--15433},
}
Multimodal Prompting With Missing Modalities for Visual Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Yi-Lun and Tsai, Yi-Hsuan and Chiu, Wei-Chen and Lee, Chen-Yu},
  title     = {Multimodal Prompting With Missing Modalities for Visual Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14943--14952},
}
Neural Koopman Pooling: Control-Inspired Temporal Dynamics Encoding for Skeleton-Based Action Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Xinghan and Xu, Xin and Mu, Yadong},
  title     = {Neural {Koopman} Pooling: Control-Inspired Temporal Dynamics Encoding for Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10597--10607},
}
Blind Image Quality Assessment via Vision-Language Correspondence: A Multitask Learning Perspective-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Weixia and Zhai, Guangtao and Wei, Ying and Yang, Xiaokang and Ma, Kede},
  title     = {Blind Image Quality Assessment via Vision-Language Correspondence: A Multitask Learning Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14071--14081},
}
Integral Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Solodskikh_2023_CVPR,
  author    = {Solodskikh, Kirill and Kurbanov, Azim and Aydarkhanov, Ruslan and Zhelavskaya, Irina and Parfenov, Yury and Song, Dehua and Lefkimmiatis, Stamatios},
  title     = {Integral Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16113--16122},
}
EXCALIBUR: Encouraging and Evaluating Embodied Exploration-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Hao and Kapoor, Raghav and Min, So Yeon and Han, Winson and Li, Jiatai and Geng, Kaiwen and Neubig, Graham and Bisk, Yonatan and Kembhavi, Aniruddha and Weihs, Luca},
  title     = {{EXCALIBUR}: Encouraging and Evaluating Embodied Exploration},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14931--14942},
}
Visual DNA: Representing and Comparing Images Using Distributions of Neuron Activations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramtoula_2023_CVPR,
  author    = {Ramtoula, Benjamin and Gadd, Matthew and Newman, Paul and De Martini, Daniele},
  title     = {Visual {DNA}: Representing and Comparing Images Using Distributions of Neuron Activations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11113--11123},
}
Recognizability Embedding Enhancement for Very Low-Resolution Face Recognition and Quality Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chai_2023_CVPR,
  author    = {Chai, Jacky Chen Long and Ng, Tiong-Sik and Low, Cheng-Yaw and Park, Jaewoo and Teoh, Andrew Beng Jin},
  title     = {Recognizability Embedding Enhancement for Very Low-Resolution Face Recognition and Quality Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9957--9967},
}
Accelerating Dataset Distillation via Model Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Lei and Zhang, Jie and Lei, Bowen and Mukherjee, Subhabrata and Pan, Xiang and Zhao, Bo and Ding, Caiwen and Li, Yao and Xu, Dongkuan},
  title     = {Accelerating Dataset Distillation via Model Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11950--11959},
}
Frame-Event Alignment and Fusion Network for High Frame Rate Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Jiqing and Wang, Yuanchen and Liu, Wenxi and Li, Meng and Bai, Jinpeng and Yin, Baocai and Yang, Xin},
  title     = {Frame-Event Alignment and Fusion Network for High Frame Rate Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9781--9790},
}
Shape-Aware Text-Driven Layered Video Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Yao-Chih and Jang, Ji-Ze Genevieve and Chen, Yi-Ting and Qiu, Elizabeth and Huang, Jia-Bin},
  title     = {Shape-Aware Text-Driven Layered Video Editing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14317--14326},
}
Solving Relaxations of MAP-MRF Problems: Combinatorial In-Face Frank-Wolfe Directions-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kolmogorov_2023_CVPR,
  author    = {Kolmogorov, Vladimir},
  title     = {Solving Relaxations of {MAP-MRF} Problems: Combinatorial In-Face {Frank-Wolfe} Directions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11980--11989},
}
MEGANE: Morphable Eyeglass and Avatar Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Junxuan and Saito, Shunsuke and Simon, Tomas and Lombardi, Stephen and Li, Hongdong and Saragih, Jason},
  title     = {{MEGANE}: Morphable Eyeglass and Avatar Network},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12769--12779},
}
Enhancing Multiple Reliability Measures via Nuisance-Extended Information Bottleneck-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeong_2023_CVPR,
  author    = {Jeong, Jongheon and Yu, Sihyun and Lee, Hankook and Shin, Jinwoo},
  title     = {Enhancing Multiple Reliability Measures via Nuisance-Extended Information Bottleneck},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16206--16218},
}
Rethinking the Approximation Error in 3D Surface Fitting for Point Cloud Normal Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_2023_CVPR, author = {Du, Hang and Yan, Xuejun and Wang, Jingjing and Xie, Di and Pu, Shiliang}, title = {Rethinking the Approximation Error in 3D Surface Fitting for Point Cloud Normal Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9486-9495} }
Objaverse: A Universe of Annotated 3D Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deitke_2023_CVPR, author = {Deitke, Matt and Schwenk, Dustin and Salvador, Jordi and Weihs, Luca and Michel, Oscar and VanderBilt, Eli and Schmidt, Ludwig and Ehsani, Kiana and Kembhavi, Aniruddha and Farhadi, Ali}, title = {Objaverse: A Universe of Annotated 3D Objects}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13142-13153} }
A-Cap: Anticipation Captioning With Commonsense Knowledge-
[pdf]
[supp]
[bibtex]@InProceedings{Vo_2023_CVPR, author = {Vo, Duc Minh and Luong, Quoc-An and Sugimoto, Akihiro and Nakayama, Hideki}, title = {A-Cap: Anticipation Captioning With Commonsense Knowledge}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10824-10833} }
Domain Generalized Stereo Matching via Hierarchical Visual Transformation-
[pdf]
[supp]
[bibtex]@InProceedings{Chang_2023_CVPR, author = {Chang, Tianyu and Yang, Xun and Zhang, Tianzhu and Wang, Meng}, title = {Domain Generalized Stereo Matching via Hierarchical Visual Transformation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9559-9568} }
Adapting Shortcut With Normalizing Flow: An Efficient Tuning Framework for Visual Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Yaoming and Shi, Bowen and Zhang, Xiaopeng and Li, Jin and Liu, Yuchen and Dai, Wenrui and Li, Chenglin and Xiong, Hongkai and Tian, Qi}, title = {Adapting Shortcut With Normalizing Flow: An Efficient Tuning Framework for Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15965-15974} }
Unpaired Image-to-Image Translation With Shortest Path Regularization-
[pdf]
[bibtex]@InProceedings{Xie_2023_CVPR, author = {Xie, Shaoan and Xu, Yanwu and Gong, Mingming and Zhang, Kun}, title = {Unpaired Image-to-Image Translation With Shortest Path Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10177-10187} }
MotionDiffuser: Controllable Multi-Agent Motion Prediction Using Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_CVPR, author = {Jiang, Chiyu {\textquotedblleft}Max{\textquotedblright} and Cornman, Andre and Park, Cheolho and Sapp, Benjamin and Zhou, Yin and Anguelov, Dragomir}, title = {MotionDiffuser: Controllable Multi-Agent Motion Prediction Using Diffusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9644-9653} }
ConvNeXt V2: Co-Designing and Scaling ConvNets With Masked Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Woo_2023_CVPR, author = {Woo, Sanghyun and Debnath, Shoubhik and Hu, Ronghang and Chen, Xinlei and Liu, Zhuang and Kweon, In So and Xie, Saining}, title = {ConvNeXt V2: Co-Designing and Scaling ConvNets With Masked Autoencoders}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16133-16142} }
Unsupervised Deep Asymmetric Stereo Matching With Spatially-Adaptive Self-Similarity-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_CVPR, author = {Song, Taeyong and Kim, Sunok and Sohn, Kwanghoon}, title = {Unsupervised Deep Asymmetric Stereo Matching With Spatially-Adaptive Self-Similarity}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13672-13680} }
TWINS: A Fine-Tuning Framework for Improved Transferability of Adversarial Robustness and Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Ziquan and Xu, Yi and Ji, Xiangyang and Chan, Antoni B.}, title = {TWINS: A Fine-Tuning Framework for Improved Transferability of Adversarial Robustness and Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16436-16446} }
Object-Aware Distillation Pyramid for Open-Vocabulary Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Luting and Liu, Yi and Du, Penghui and Ding, Zihan and Liao, Yue and Qi, Qiaosong and Chen, Biaolong and Liu, Si}, title = {Object-Aware Distillation Pyramid for Open-Vocabulary Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11186-11196} }
Evolved Part Masking for Self-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Zhanzhou and Zhang, Shiliang}, title = {Evolved Part Masking for Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10386-10395} }
MV-JAR: Masked Voxel Jigsaw and Reconstruction for LiDAR-Based Self-Supervised Pre-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Runsen and Wang, Tai and Zhang, Wenwei and Chen, Runjian and Cao, Jinkun and Pang, Jiangmiao and Lin, Dahua}, title = {MV-JAR: Masked Voxel Jigsaw and Reconstruction for LiDAR-Based Self-Supervised Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13445-13454} }
Open-Set Semantic Segmentation for Point Clouds via Adversarial Prototype Framework-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Jianan and Dong, Qiulei}, title = {Open-Set Semantic Segmentation for Point Clouds via Adversarial Prototype Framework}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9425-9434} }
Learning Attention As Disentangler for Compositional Zero-Shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hao_2023_CVPR, author = {Hao, Shaozhe and Han, Kai and Wong, Kwan-Yee K.}, title = {Learning Attention As Disentangler for Compositional Zero-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15315-15324} }
MetaViewer: Towards a Unified Multi-View Representation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Ren and Sun, Haoliang and Ma, Yuling and Xi, Xiaoming and Yin, Yilong}, title = {MetaViewer: Towards a Unified Multi-View Representation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11590-11599} }
Natural Language-Assisted Sign Language Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zuo_2023_CVPR, author = {Zuo, Ronglai and Wei, Fangyun and Mak, Brian}, title = {Natural Language-Assisted Sign Language Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14890-14900} }
Learning Semantic Relationship Among Instances for Image-Text Matching-
[pdf]
[bibtex]@InProceedings{Fu_2023_CVPR, author = {Fu, Zheren and Mao, Zhendong and Song, Yan and Zhang, Yongdong}, title = {Learning Semantic Relationship Among Instances for Image-Text Matching}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15159-15168} }
Global-to-Local Modeling for Video-Based 3D Human Pose and Shape Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2023_CVPR, author = {Shen, Xiaolong and Yang, Zongxin and Wang, Xiaohan and Ma, Jianxin and Zhou, Chang and Yang, Yi}, title = {Global-to-Local Modeling for Video-Based 3D Human Pose and Shape Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8887-8896} }
BEDLAM: A Synthetic Dataset of Bodies Exhibiting Detailed Lifelike Animated Motion-
[pdf]
[supp]
[bibtex]@InProceedings{Black_2023_CVPR, author = {Black, Michael J. and Patel, Priyanka and Tesch, Joachim and Yang, Jinlong}, title = {BEDLAM: A Synthetic Dataset of Bodies Exhibiting Detailed Lifelike Animated Motion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8726-8737} }
ProtoCon: Pseudo-Label Refinement via Online Clustering and Prototypical Consistency for Efficient Semi-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nassar_2023_CVPR, author = {Nassar, Islam and Hayat, Munawar and Abbasnejad, Ehsan and Rezatofighi, Hamid and Haffari, Gholamreza}, title = {ProtoCon: Pseudo-Label Refinement via Online Clustering and Prototypical Consistency for Efficient Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11641-11650} }
Image Super-Resolution Using T-Tetromino Pixels-
[pdf]
[bibtex]@InProceedings{Grosche_2023_CVPR, author = {Grosche, Simon and Regensky, Andy and Seiler, J\"urgen and Kaup, Andr\'e}, title = {Image Super-Resolution Using T-Tetromino Pixels}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9989-9998} }
GFIE: A Dataset and Baseline for Gaze-Following From 2D to 3D in Indoor Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_CVPR, author = {Hu, Zhengxi and Yang, Yuxue and Zhai, Xiaolin and Yang, Dingye and Zhou, Bohan and Liu, Jingtai}, title = {GFIE: A Dataset and Baseline for Gaze-Following From 2D to 3D in Indoor Environments}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8907-8916} }
BKinD-3D: Self-Supervised 3D Keypoint Discovery From Multi-View Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_CVPR, author = {Sun, Jennifer J. and Karashchuk, Lili and Dravid, Amil and Ryou, Serim and Fereidooni, Sonia and Tuthill, John C. and Katsaggelos, Aggelos and Brunton, Bingni W. and Gkioxari, Georgia and Kennedy, Ann and Yue, Yisong and Perona, Pietro}, title = {BKinD-3D: Self-Supervised 3D Keypoint Discovery From Multi-View Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9001-9010} }
StyleRF: Zero-Shot 3D Style Transfer of Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Kunhao and Zhan, Fangneng and Chen, Yiwen and Zhang, Jiahui and Yu, Yingchen and El Saddik, Abdulmotaleb and Lu, Shijian and Xing, Eric P.}, title = {StyleRF: Zero-Shot 3D Style Transfer of Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8338-8348} }
Accidental Light Probes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Hong-Xing and Agarwala, Samir and Herrmann, Charles and Szeliski, Richard and Snavely, Noah and Wu, Jiajun and Sun, Deqing}, title = {Accidental Light Probes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12521-12530} }
Iterative Vision-and-Language Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Krantz_2023_CVPR, author = {Krantz, Jacob and Banerjee, Shurjo and Zhu, Wang and Corso, Jason and Anderson, Peter and Lee, Stefan and Thomason, Jesse}, title = {Iterative Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14921-14930} }
Adversarial Counterfactual Visual Explanations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeanneret_2023_CVPR, author = {Jeanneret, Guillaume and Simon, Lo{\"\i}c and Jurie, Fr\'ed\'eric}, title = {Adversarial Counterfactual Visual Explanations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16425-16435} }
MaLP: Manipulation Localization Using a Proactive Scheme-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Asnani_2023_CVPR, author = {Asnani, Vishal and Yin, Xi and Hassner, Tal and Liu, Xiaoming}, title = {MaLP: Manipulation Localization Using a Proactive Scheme}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12343-12352} }
MM-Diffusion: Learning Multi-Modal Diffusion Models for Joint Audio and Video Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Ruan_2023_CVPR, author = {Ruan, Ludan and Ma, Yiyang and Yang, Huan and He, Huiguo and Liu, Bei and Fu, Jianlong and Yuan, Nicholas Jing and Jin, Qin and Guo, Baining}, title = {MM-Diffusion: Learning Multi-Modal Diffusion Models for Joint Audio and Video Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10219-10228} }
Robust Generalization Against Photon-Limited Corruptions via Worst-Case Sharpness Minimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Zhuo and Zhu, Miaoxi and Xia, Xiaobo and Shen, Li and Yu, Jun and Gong, Chen and Han, Bo and Du, Bo and Liu, Tongliang}, title = {Robust Generalization Against Photon-Limited Corruptions via Worst-Case Sharpness Minimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16175-16185} }
Point2Pix: Photo-Realistic Point Cloud Rendering via Neural Radiance Fields-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hu_2023_CVPR, author = {Hu, Tao and Xu, Xiaogang and Liu, Shu and Jia, Jiaya}, title = {Point2Pix: Photo-Realistic Point Cloud Rendering via Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8349-8358} }
NICO++: Towards Better Benchmarking for Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xingxuan and He, Yue and Xu, Renzhe and Yu, Han and Shen, Zheyan and Cui, Peng}, title = {NICO++: Towards Better Benchmarking for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16036-16047} }
CHMATCH: Contrastive Hierarchical Matching and Robust Adaptive Threshold Boosted Semi-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Jianlong and Yang, Haozhe and Gan, Tian and Ding, Ning and Jiang, Feijun and Nie, Liqiang}, title = {CHMATCH: Contrastive Hierarchical Matching and Robust Adaptive Threshold Boosted Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15762-15772} }
Neural Dependencies Emerging From Learning Massive Categories-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Ruili and Zheng, Kecheng and Zhu, Kai and Shen, Yujun and Zhao, Jian and Huang, Yukun and Zhao, Deli and Zhou, Jingren and Jordan, Michael and Zha, Zheng-Jun}, title = {Neural Dependencies Emerging From Learning Massive Categories}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11711-11720} }
ARCTIC: A Dataset for Dexterous Bimanual Hand-Object Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_CVPR, author = {Fan, Zicong and Taheri, Omid and Tzionas, Dimitrios and Kocabas, Muhammed and Kaufmann, Manuel and Black, Michael J. and Hilliges, Otmar}, title = {ARCTIC: A Dataset for Dexterous Bimanual Hand-Object Manipulation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12943-12954} }
MAGVIT: Masked Generative Video Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Lijun and Cheng, Yong and Sohn, Kihyuk and Lezama, Jos\'e and Zhang, Han and Chang, Huiwen and Hauptmann, Alexander G. and Yang, Ming-Hsuan and Hao, Yuan and Essa, Irfan and Jiang, Lu}, title = {MAGVIT: Masked Generative Video Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10459-10469} }
Hidden Gems: 4D Radar Scene Flow Learning Using Cross-Modal Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_CVPR, author = {Ding, Fangqiang and Palffy, Andras and Gavrila, Dariu M. and Lu, Chris Xiaoxuan}, title = {Hidden Gems: 4D Radar Scene Flow Learning Using Cross-Modal Supervision}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9340-9349} }
OmniMAE: Single Model Masked Pretraining on Images and Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Girdhar_2023_CVPR, author = {Girdhar, Rohit and El-Nouby, Alaaeldin and Singh, Mannat and Alwala, Kalyan Vasudev and Joulin, Armand and Misra, Ishan}, title = {OmniMAE: Single Model Masked Pretraining on Images and Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10406-10417} }
Real-Time Neural Light Field on Mobile Devices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_CVPR, author = {Cao, Junli and Wang, Huan and Chemerys, Pavlo and Shakhrai, Vladislav and Hu, Ju and Fu, Yun and Makoviichuk, Denys and Tulyakov, Sergey and Ren, Jian}, title = {Real-Time Neural Light Field on Mobile Devices}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8328-8337} }
End-to-End Video Matting With Trimap Propagation-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Wei-Lun and Lee, Ming-Sui}, title = {End-to-End Video Matting With Trimap Propagation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14337-14347} }
DropMAE: Masked Autoencoders With Spatial-Attention Dropout for Tracking Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Qiangqiang and Yang, Tianyu and Liu, Ziquan and Wu, Baoyuan and Shan, Ying and Chan, Antoni B.}, title = {DropMAE: Masked Autoencoders With Spatial-Attention Dropout for Tracking Tasks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14561-14571} }
High-Fidelity Clothed Avatar Reconstruction From a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2023_CVPR, author = {Liao, Tingting and Zhang, Xiaomei and Xiu, Yuliang and Yi, Hongwei and Liu, Xudong and Qi, Guo-Jun and Zhang, Yong and Wang, Xuan and Zhu, Xiangyu and Lei, Zhen}, title = {High-Fidelity Clothed Avatar Reconstruction From a Single Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8662-8672} }
Zero-Shot Object Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Jingyi and Le, Hieu and Nguyen, Vu and Ranjan, Viresh and Samaras, Dimitris}, title = {Zero-Shot Object Counting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15548-15557} }
Implicit Diffusion Models for Continuous Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_CVPR, author = {Gao, Sicheng and Liu, Xuhui and Zeng, Bohan and Xu, Sheng and Li, Yanjing and Luo, Xiaoyan and Liu, Jianzhuang and Zhen, Xiantong and Zhang, Baochang}, title = {Implicit Diffusion Models for Continuous Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10021-10030} }
Phase-Shifting Coder: Predicting Accurate Orientation in Oriented Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Yi and Da, Feipeng}, title = {Phase-Shifting Coder: Predicting Accurate Orientation in Oriented Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13354-13363} }
Neural Lens Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Xian_2023_CVPR, author = {Xian, Wenqi and Bo\v{z}i\v{c}, Alja\v{z} and Snavely, Noah and Lassner, Christoph}, title = {Neural Lens Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8435-8445} }
CoralStyleCLIP: Co-Optimized Region and Layer Selection for Image Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Revanur_2023_CVPR, author = {Revanur, Ambareesh and Basu, Debraj and Agrawal, Shradha and Agarwal, Dhwanit and Pai, Deepak}, title = {CoralStyleCLIP: Co-Optimized Region and Layer Selection for Image Editing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12695-12704} }
GLeaD: Improving GANs With a Generator-Leading Task-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2023_CVPR, author = {Bai, Qingyan and Yang, Ceyuan and Xu, Yinghao and Liu, Xihui and Yang, Yujiu and Shen, Yujun}, title = {GLeaD: Improving GANs With a Generator-Leading Task}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12094-12104} }
GALIP: Generative Adversarial CLIPs for Text-to-Image Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tao_2023_CVPR, author = {Tao, Ming and Bao, Bing-Kun and Tang, Hao and Xu, Changsheng}, title = {GALIP: Generative Adversarial CLIPs for Text-to-Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14214-14223} }
Indiscernible Object Counting in Underwater Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_CVPR, author = {Sun, Guolei and An, Zhaochong and Liu, Yun and Liu, Ce and Sakaridis, Christos and Fan, Deng-Ping and Van Gool, Luc}, title = {Indiscernible Object Counting in Underwater Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13791-13801} }
Low-Light Image Enhancement via Structure Modeling and Guidance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Xiaogang and Wang, Ruixing and Lu, Jiangbo}, title = {Low-Light Image Enhancement via Structure Modeling and Guidance}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9893-9903} }
Physics-Driven Diffusion Models for Impact Sound Synthesis From Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_CVPR, author = {Su, Kun and Qian, Kaizhi and Shlizerman, Eli and Torralba, Antonio and Gan, Chuang}, title = {Physics-Driven Diffusion Models for Impact Sound Synthesis From Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9749-9759} }
Alias-Free Convnets: Fractional Shift Invariance via Polynomial Activations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Michaeli_2023_CVPR, author = {Michaeli, Hagay and Michaeli, Tomer and Soudry, Daniel}, title = {Alias-Free Convnets: Fractional Shift Invariance via Polynomial Activations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16333-16342} }
Shortcomings of Top-Down Randomization-Based Sanity Checks for Evaluations of Deep Neural Network Explanations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Binder_2023_CVPR, author = {Binder, Alexander and Weber, Leander and Lapuschkin, Sebastian and Montavon, Gr\'egoire and M\"uller, Klaus-Robert and Samek, Wojciech}, title = {Shortcomings of Top-Down Randomization-Based Sanity Checks for Evaluations of Deep Neural Network Explanations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16143-16152} }
Neural Part Priors: Learning To Optimize Part-Based Object Completion in RGB-D Scans-
[pdf]
[supp]
[bibtex]@InProceedings{Bokhovkin_2023_CVPR, author = {Bokhovkin, Aleksei and Dai, Angela}, title = {Neural Part Priors: Learning To Optimize Part-Based Object Completion in RGB-D Scans}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9032-9042} }
Towards Trustable Skin Cancer Diagnosis via Rewriting Model's Decision-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2023_CVPR, author = {Yan, Siyuan and Yu, Zhen and Zhang, Xuelin and Mahapatra, Dwarikanath and Chandra, Shekhar S. and Janda, Monika and Soyer, Peter and Ge, Zongyuan}, title = {Towards Trustable Skin Cancer Diagnosis via Rewriting Model's Decision}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11568-11577} }
FeatER: An Efficient Network for Human Reconstruction via Feature Map-Based TransformER-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_CVPR, author = {Zheng, Ce and Mendieta, Matias and Yang, Taojiannan and Qi, Guo-Jun and Chen, Chen}, title = {FeatER: An Efficient Network for Human Reconstruction via Feature Map-Based TransformER}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13945-13954} }
Visibility Constrained Wide-Band Illumination Spectrum Design for Seeing-in-the-Dark-
[pdf]
[arXiv]
[bibtex]@InProceedings{Niu_2023_CVPR, author = {Niu, Muyao and Li, Zhuoxiao and Zhong, Zhihang and Zheng, Yinqiang}, title = {Visibility Constrained Wide-Band Illumination Spectrum Design for Seeing-in-the-Dark}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13976-13985} }
Learning With Noisy Labels via Self-Supervised Adversarial Noisy Masking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tu_2023_CVPR, author = {Tu, Yuanpeng and Zhang, Boshen and Li, Yuxi and Liu, Liang and Li, Jian and Zhang, Jiangning and Wang, Yabiao and Wang, Chengjie and Zhao, Cai Rong}, title = {Learning With Noisy Labels via Self-Supervised Adversarial Noisy Masking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16186-16195} }
Towards Domain Generalization for Multi-View 3D Object Detection in Bird-Eye-View-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Shuo and Zhao, Xinhai and Xu, Hai-Ming and Chen, Zehui and Yu, Dameng and Chang, Jiahao and Yang, Zhen and Zhao, Feng}, title = {Towards Domain Generalization for Multi-View 3D Object Detection in Bird-Eye-View}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13333-13342} }
Q: How To Specialize Large Vision-Language Models to Data-Scarce VQA Tasks? A: Self-Train on Unlabeled Images!-
[pdf]
[bibtex]@InProceedings{Khan_2023_CVPR, author = {Khan, Zaid and BG, Vijay Kumar and Schulter, Samuel and Yu, Xiang and Fu, Yun and Chandraker, Manmohan}, title = {Q: How To Specialize Large Vision-Language Models to Data-Scarce VQA Tasks? A: Self-Train on Unlabeled Images!}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15005-15015} }
Improving Robust Generalization by Direct PAC-Bayesian Bound Minimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zifan and Ding, Nan and Levinboim, Tomer and Chen, Xi and Soricut, Radu}, title = {Improving Robust Generalization by Direct PAC-Bayesian Bound Minimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16458-16468} }
AssemblyHands: Towards Egocentric Activity Understanding via 3D Hand Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ohkawa_2023_CVPR, author = {Ohkawa, Takehiko and He, Kun and Sener, Fadime and Hodan, Tomas and Tran, Luan and Keskin, Cem}, title = {AssemblyHands: Towards Egocentric Activity Understanding via 3D Hand Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12999-13008} }
Scene-Aware Egocentric 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Jian and Luvizon, Diogo and Xu, Weipeng and Liu, Lingjie and Sarkar, Kripasindhu and Theobalt, Christian}, title = {Scene-Aware Egocentric 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13031-13040} }
NeuralField-LDM: Scene Generation With Hierarchical Latent Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Seung Wook and Brown, Bradley and Yin, Kangxue and Kreis, Karsten and Schwarz, Katja and Li, Daiqing and Rombach, Robin and Torralba, Antonio and Fidler, Sanja}, title = {NeuralField-LDM: Scene Generation With Hierarchical Latent Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8496-8506} }
DPF: Learning Dense Prediction Fields With Weak Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Xiaoxue and Zheng, Yuhang and Zheng, Yupeng and Zhou, Qiang and Zhao, Hao and Zhou, Guyue and Zhang, Ya-Qin}, title = {DPF: Learning Dense Prediction Fields With Weak Supervision}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15347-15357} }
CNVid-3.5M: Build, Filter, and Pre-Train the Large-Scale Public Chinese Video-Text Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Gan_2023_CVPR, author = {Gan, Tian and Wang, Qing and Dong, Xingning and Ren, Xiangyuan and Nie, Liqiang and Guo, Qingpei}, title = {CNVid-3.5M: Build, Filter, and Pre-Train the Large-Scale Public Chinese Video-Text Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14815-14824} }
iQuery: Instruments As Queries for Audio-Visual Sound Separation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Jiaben and Zhang, Renrui and Lian, Dongze and Yang, Jiaqi and Zeng, Ziyao and Shi, Jianbo}, title = {iQuery: Instruments As Queries for Audio-Visual Sound Separation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14675-14686} }
Sampling Is Matter: Point-Guided 3D Human Mesh Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Jeonghwan and Gwon, Mi-Gyeong and Park, Hyunwoo and Kwon, Hyukmin and Um, Gi-Mun and Kim, Wonjun}, title = {Sampling Is Matter: Point-Guided 3D Human Mesh Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12880-12889} }
Look Around for Anomalies: Weakly-Supervised Anomaly Detection via Context-Motion Relational Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Cho_2023_CVPR, author = {Cho, MyeongAh and Kim, Minjung and Hwang, Sangwon and Park, Chaewon and Lee, Kyungjae and Lee, Sangyoun}, title = {Look Around for Anomalies: Weakly-Supervised Anomaly Detection via Context-Motion Relational Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12137-12146} }
Detecting Everything in the Open World: Towards Universal Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zhenyu and Li, Yali and Chen, Xi and Lim, Ser-Nam and Torralba, Antonio and Zhao, Hengshuang and Wang, Shengjin}, title = {Detecting Everything in the Open World: Towards Universal Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11433-11443} }
NUWA-LIP: Language-Guided Image Inpainting With Defect-Free VQGAN-
[pdf]
[supp]
[bibtex]@InProceedings{Ni_2023_CVPR, author = {Ni, Minheng and Li, Xiaoming and Zuo, Wangmeng}, title = {NUWA-LIP: Language-Guided Image Inpainting With Defect-Free VQGAN}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14183-14192} }
Language Adaptive Weight Generation for Multi-Task Visual Grounding-
[pdf]
[supp]
[bibtex]@InProceedings{Su_2023_CVPR, author = {Su, Wei and Miao, Peihan and Dou, Huanzhang and Wang, Gaoang and Qiao, Liang and Li, Zheyang and Li, Xi}, title = {Language Adaptive Weight Generation for Multi-Task Visual Grounding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10857-10866} }
Continuous Intermediate Token Learning With Implicit Motion Manifold for Keyframe Based Motion Interpolation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mo_2023_CVPR, author = {Mo, Clinton A. and Hu, Kun and Long, Chengjiang and Wang, Zhiyong}, title = {Continuous Intermediate Token Learning With Implicit Motion Manifold for Keyframe Based Motion Interpolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13894-13903} }
SGLoc: Scene Geometry Encoding for Outdoor LiDAR Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Wen and Yu, Shangshu and Wang, Cheng and Hu, Guosheng and Shen, Siqi and Wen, Chenglu}, title = {SGLoc: Scene Geometry Encoding for Outdoor LiDAR Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9286-9295} }
Bridging Search Region Interaction With Template for RGB-T Tracking-
[pdf]
[bibtex]@InProceedings{Hui_2023_CVPR, author = {Hui, Tianrui and Xun, Zizheng and Peng, Fengguang and Huang, Junshi and Wei, Xiaoming and Wei, Xiaolin and Dai, Jiao and Han, Jizhong and Liu, Si}, title = {Bridging Search Region Interaction With Template for RGB-T Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13630-13639} }
Indescribable Multi-Modal Spatial Evaluator-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kong_2023_CVPR, author = {Kong, Lingke and Qi, X. Sharon and Shen, Qijin and Wang, Jiacheng and Zhang, Jingyi and Hu, Yanle and Zhou, Qichao}, title = {Indescribable Multi-Modal Spatial Evaluator}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9853-9862} }
ImageBind: One Embedding Space To Bind Them All-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Girdhar_2023_CVPR, author = {Girdhar, Rohit and El-Nouby, Alaaeldin and Liu, Zhuang and Singh, Mannat and Alwala, Kalyan Vasudev and Joulin, Armand and Misra, Ishan}, title = {ImageBind: One Embedding Space To Bind Them All}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15180-15190} }
Three Guidelines You Should Know for Universally Slimmable Self-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_CVPR, author = {Cao, Yun-Hao and Sun, Peiqin and Zhou, Shuchang}, title = {Three Guidelines You Should Know for Universally Slimmable Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15742-15751} }
MetaFusion: Infrared and Visible Image Fusion via Meta-Feature Embedding From Object Detection-
[pdf]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Wenda and Xie, Shigeng and Zhao, Fan and He, You and Lu, Huchuan}, title = {MetaFusion: Infrared and Visible Image Fusion via Meta-Feature Embedding From Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13955-13965} }
End-to-End Vectorized HD-Map Construction With Piecewise Bezier Curve-
[pdf]
[supp]
[bibtex]@InProceedings{Qiao_2023_CVPR, author = {Qiao, Limeng and Ding, Wenjie and Qiu, Xi and Zhang, Chi}, title = {End-to-End Vectorized HD-Map Construction With Piecewise Bezier Curve}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13218-13228} }
On Data Scaling in Masked Image Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_CVPR, author = {Xie, Zhenda and Zhang, Zheng and Cao, Yue and Lin, Yutong and Wei, Yixuan and Dai, Qi and Hu, Han}, title = {On Data Scaling in Masked Image Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10365-10374} }
Balanced Energy Regularization Loss for Out-of-Distribution Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_CVPR, author = {Choi, Hyunjun and Jeong, Hawook and Choi, Jin Young}, title = {Balanced Energy Regularization Loss for Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15691-15700} }
3D-Aware Face Swapping-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Yixuan and Ma, Chao and Yan, Yichao and Zhu, Wenhan and Yang, Xiaokang}, title = {3D-Aware Face Swapping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12705-12714} }
Phone2Proc: Bringing Robust Robots Into Our Chaotic World-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deitke_2023_CVPR, author = {Deitke, Matt and Hendrix, Rose and Farhadi, Ali and Ehsani, Kiana and Kembhavi, Aniruddha}, title = {Phone2Proc: Bringing Robust Robots Into Our Chaotic World}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9665-9675} }
Learning Articulated Shape With Keypoint Pseudo-Labels From Web Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stathopoulos_2023_CVPR, author = {Stathopoulos, Anastasis and Pavlakos, Georgios and Han, Ligong and Metaxas, Dimitris N.}, title = {Learning Articulated Shape With Keypoint Pseudo-Labels From Web Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13092-13101} }
Rethinking Image Super Resolution From Long-Tailed Distribution Learning Perspective-
[pdf]
[supp]
[bibtex]@InProceedings{Gou_2023_CVPR, author = {Gou, Yuanbiao and Hu, Peng and Lv, Jiancheng and Zhu, Hongyuan and Peng, Xi}, title = {Rethinking Image Super Resolution From Long-Tailed Distribution Learning Perspective}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14327-14336} }
SCOTCH and SODA: A Transformer Video Shadow Detection Framework-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Lihao and Prost, Jean and Zhu, Lei and Papadakis, Nicolas and Li{\`o}, Pietro and Sch{\"o}nlieb, Carola-Bibiane and Aviles-Rivero, Angelica I.}, title = {SCOTCH and SODA: A Transformer Video Shadow Detection Framework}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10449-10458} }
CodeTalker: Speech-Driven 3D Facial Animation With Discrete Motion Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xing_2023_CVPR, author = {Xing, Jinbo and Xia, Menghan and Zhang, Yuechen and Cun, Xiaodong and Wang, Jue and Wong, Tien-Tsin}, title = {CodeTalker: Speech-Driven 3D Facial Animation With Discrete Motion Prior}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12780-12790} }
Improving Zero-Shot Generalization and Robustness of Multi-Modal Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ge_2023_CVPR, author = {Ge, Yunhao and Ren, Jie and Gallagher, Andrew and Wang, Yuxiao and Yang, Ming-Hsuan and Adam, Hartwig and Itti, Laurent and Lakshminarayanan, Balaji and Zhao, Jiaping}, title = {Improving Zero-Shot Generalization and Robustness of Multi-Modal Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11093-11101} }
CODA-Prompt: COntinual Decomposed Attention-Based Prompting for Rehearsal-Free Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Smith_2023_CVPR, author = {Smith, James Seale and Karlinsky, Leonid and Gutta, Vyshnavi and Cascante-Bonilla, Paola and Kim, Donghyun and Arbelle, Assaf and Panda, Rameswar and Feris, Rogerio and Kira, Zsolt}, title = {CODA-Prompt: COntinual Decomposed Attention-Based Prompting for Rehearsal-Free Continual Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11909-11919} }
Real-Time Multi-Person Eyeblink Detection in the Wild for Untrimmed Video-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zeng_2023_CVPR, author = {Zeng, Wenzheng and Xiao, Yang and Wei, Sicheng and Gan, Jinfang and Zhang, Xintao and Cao, Zhiguo and Fang, Zhiwen and Zhou, Joey Tianyi}, title = {Real-Time Multi-Person Eyeblink Detection in the Wild for Untrimmed Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13854-13863} }
Category Query Learning for Human-Object Interaction Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_CVPR, author = {Xie, Chi and Zeng, Fangao and Hu, Yue and Liang, Shuang and Wei, Yichen}, title = {Category Query Learning for Human-Object Interaction Classification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15275-15284} }
MDQE: Mining Discriminative Query Embeddings To Segment Occluded Instances on Challenging Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Minghan and Li, Shuai and Xiang, Wangmeng and Zhang, Lei}, title = {MDQE: Mining Discriminative Query Embeddings To Segment Occluded Instances on Challenging Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10524-10533} }
Are We Ready for Vision-Centric Driving Streaming Perception? The ASAP Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Xiaofeng and Zhu, Zheng and Zhang, Yunpeng and Huang, Guan and Ye, Yun and Xu, Wenbo and Chen, Ziwei and Wang, Xingang}, title = {Are We Ready for Vision-Centric Driving Streaming Perception? The ASAP Benchmark}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9600-9610} }
PDPP: Projected Diffusion for Procedure Planning in Instructional Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Hanlin and Wu, Yilu and Guo, Sheng and Wang, Limin}, title = {PDPP: Projected Diffusion for Procedure Planning in Instructional Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14836-14845} }
Efficient Map Sparsification Based on 2D and 3D Discretized Grids-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xiaoyu and Liu, Yun-Hui}, title = {Efficient Map Sparsification Based on 2D and 3D Discretized Grids}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12470-12478} }
Class Attention Transfer Based Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_CVPR, author = {Guo, Ziyao and Yan, Haonan and Li, Hui and Lin, Xiaodong}, title = {Class Attention Transfer Based Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11868-11877} }
Temporally Consistent Online Depth Estimation Using Point-Based Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khan_2023_CVPR, author = {Khan, Numair and Penner, Eric and Lanman, Douglas and Xiao, Lei}, title = {Temporally Consistent Online Depth Estimation Using Point-Based Fusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9119-9129} }
Generalizable Implicit Neural Representations via Instance Pattern Composers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Chiheon and Lee, Doyup and Kim, Saehoon and Cho, Minsu and Han, Wook-Shin}, title = {Generalizable Implicit Neural Representations via Instance Pattern Composers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11808-11817} }
What Can Human Sketches Do for Object Detection?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chowdhury_2023_CVPR, author = {Chowdhury, Pinaki Nath and Bhunia, Ayan Kumar and Sain, Aneeshan and Koley, Subhadeep and Xiang, Tao and Song, Yi-Zhe}, title = {What Can Human Sketches Do for Object Detection?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15083-15094} }
Identity-Preserving Talking Face Generation With Landmark and Appearance Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2023_CVPR, author = {Zhong, Weizhi and Fang, Chaowei and Cai, Yinqi and Wei, Pengxu and Zhao, Gangming and Lin, Liang and Li, Guanbin}, title = {Identity-Preserving Talking Face Generation With Landmark and Appearance Priors}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9729-9738} }
Weakly Supervised Segmentation With Point Annotations for Histopathology Images via Contrast-Based Variational Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Hongrun and Burrows, Liam and Meng, Yanda and Sculthorpe, Declan and Mukherjee, Abhik and Coupland, Sarah E. and Chen, Ke and Zheng, Yalin}, title = {Weakly Supervised Segmentation With Point Annotations for Histopathology Images via Contrast-Based Variational Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15630-15640} }
Zero-Shot Generative Model Adaptation via Image-Specific Prompt Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_CVPR, author = {Guo, Jiayi and Wang, Chaofei and Wu, You and Zhang, Eric and Wang, Kai and Xu, Xingqian and Song, Shiji and Shi, Humphrey and Huang, Gao}, title = {Zero-Shot Generative Model Adaptation via Image-Specific Prompt Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11494-11503} }
CelebV-Text: A Large-Scale Facial Text-Video Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Jianhui and Zhu, Hao and Jiang, Liming and Loy, Chen Change and Cai, Weidong and Wu, Wayne}, title = {CelebV-Text: A Large-Scale Facial Text-Video Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14805-14814} }
Hard Patches Mining for Masked Image Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Haochen and Song, Kaiyou and Fan, Junsong and Wang, Yuxi and Xie, Jin and Zhang, Zhaoxiang}, title = {Hard Patches Mining for Masked Image Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10375-10385} }
Diffusion-SDF: Text-To-Shape via Voxelized Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Muheng and Duan, Yueqi and Zhou, Jie and Lu, Jiwen}, title = {Diffusion-SDF: Text-To-Shape via Voxelized Diffusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12642-12651} }
Compositor: Bottom-Up Clustering and Compositing for Robust Part and Object Segmentation-
[pdf]
[bibtex]@InProceedings{He_2023_CVPR, author = {He, Ju and Chen, Jieneng and Lin, Ming-Xian and Yu, Qihang and Yuille, Alan L.}, title = {Compositor: Bottom-Up Clustering and Compositing for Robust Part and Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11259-11268} }
Boundary-Aware Backward-Compatible Representation via Adversarial Learning in Image Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_CVPR, author = {Pan, Tan and Xu, Furong and Yang, Xudong and He, Sifeng and Jiang, Chen and Guo, Qingpei and Qian, Feng and Zhang, Xiaobo and Cheng, Yuan and Yang, Lei and Chu, Wei}, title = {Boundary-Aware Backward-Compatible Representation via Adversarial Learning in Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15201-15210} }
Super-CLEVR: A Virtual Benchmark To Diagnose Domain Robustness in Visual Reasoning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Zhuowan and Wang, Xingrui and Stengel-Eskin, Elias and Kortylewski, Adam and Ma, Wufei and Van Durme, Benjamin and Yuille, Alan L.}, title = {Super-CLEVR: A Virtual Benchmark To Diagnose Domain Robustness in Visual Reasoning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14963-14973} }
Sliced Optimal Partial Transport-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2023_CVPR, author = {Bai, Yikun and Schmitzer, Bernhard and Thorpe, Matthew and Kolouri, Soheil}, title = {Sliced Optimal Partial Transport}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13681-13690} }
Siamese DETR-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Zeren and Huang, Gengshi and Li, Wei and Teng, Jianing and Wang, Kun and Shao, Jing and Loy, Chen Change and Sheng, Lu}, title = {Siamese DETR}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15722-15731} }
Turning Strengths Into Weaknesses: A Certified Robustness Inspired Attack Framework Against Graph Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Binghui and Pang, Meng and Dong, Yun}, title = {Turning Strengths Into Weaknesses: A Certified Robustness Inspired Attack Framework Against Graph Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16394-16403} }
Demystifying Causal Features on Adversarial Examples and Causal Inoculation for Robust Network by Adversarial Instrumental Variable Regression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Junho and Lee, Byung-Kwan and Ro, Yong Man}, title = {Demystifying Causal Features on Adversarial Examples and Causal Inoculation for Robust Network by Adversarial Instrumental Variable Regression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12302-12312} }
B-Spline Texture Coefficients Estimator for Screen Content Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Pak_2023_CVPR, author = {Pak, Byeonghyun and Lee, Jaewon and Jin, Kyong Hwan}, title = {B-Spline Texture Coefficients Estimator for Screen Content Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10062-10071} }
Domain Expansion of Image Generators-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nitzan_2023_CVPR, author = {Nitzan, Yotam and Gharbi, Micha{\"e}l and Zhang, Richard and Park, Taesung and Zhu, Jun-Yan and Cohen-Or, Daniel and Shechtman, Eli}, title = {Domain Expansion of Image Generators}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15933-15942} }
LVQAC: Lattice Vector Quantization Coupled With Spatially Adaptive Companding for Efficient Learned Image Compression-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xi and Wu, Xiaolin}, title = {LVQAC: Lattice Vector Quantization Coupled With Spatially Adaptive Companding for Efficient Learned Image Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10239-10248} }
Fine-Grained Face Swapping via Regional GAN Inversion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Zhian and Li, Maomao and Zhang, Yong and Wang, Cairong and Zhang, Qi and Wang, Jue and Nie, Yongwei}, title = {Fine-Grained Face Swapping via Regional GAN Inversion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8578-8587} }
Taming Diffusion Models for Audio-Driven Co-Speech Gesture Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR, author = {Zhu, Lingting and Liu, Xian and Liu, Xuanyu and Qian, Rui and Liu, Ziwei and Yu, Lequan}, title = {Taming Diffusion Models for Audio-Driven Co-Speech Gesture Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10544-10553} }
NeRFLix: High-Quality Neural View Synthesis by Learning a Degradation-Driven Inter-Viewpoint MiXer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Kun and Li, Wenbo and Wang, Yi and Hu, Tao and Jiang, Nianjuan and Han, Xiaoguang and Lu, Jiangbo}, title = {NeRFLix: High-Quality Neural View Synthesis by Learning a Degradation-Driven Inter-Viewpoint MiXer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12363-12374} }
STMixer: A One-Stage Sparse Action Detector-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Tao and Cao, Mengqi and Gao, Ziteng and Wu, Gangshan and Wang, Limin}, title = {STMixer: A One-Stage Sparse Action Detector}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14720-14729} }
Genie: Show Me the Data for Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeon_2023_CVPR, author = {Jeon, Yongkweon and Lee, Chungman and Kim, Ho-young}, title = {Genie: Show Me the Data for Quantization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12064-12073} }
Multi-Agent Automated Machine Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zhaozhi and Su, Kefan and Zhang, Jian and Jia, Huizhu and Ye, Qixiang and Xie, Xiaodong and Lu, Zongqing}, title = {Multi-Agent Automated Machine Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11960-11969} }
Robot Structure Prior Guided Temporal Attention for Camera-to-Robot Pose Estimation From Image Sequence-
[pdf]
[bibtex]@InProceedings{Tian_2023_CVPR, author = {Tian, Yang and Zhang, Jiyao and Yin, Zekai and Dong, Hao}, title = {Robot Structure Prior Guided Temporal Attention for Camera-to-Robot Pose Estimation From Image Sequence}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8917-8926} }
HRDFuse: Monocular 360° Depth Estimation by Collaboratively Learning Holistic-With-Regional Depth Distributions-
[pdf]
[supp]
[bibtex]@InProceedings{Ai_2023_CVPR, author = {Ai, Hao and Cao, Zidong and Cao, Yan-Pei and Shan, Ying and Wang, Lin}, title = {HRDFuse: Monocular 360{\textdegree} Depth Estimation by Collaboratively Learning Holistic-With-Regional Depth Distributions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13273-13282} }
StructVPR: Distill Structural Knowledge With Weighting Samples for Visual Place Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2023_CVPR, author = {Shen, Yanqing and Zhou, Sanping and Fu, Jingwen and Wang, Ruotong and Chen, Shitao and Zheng, Nanning}, title = {StructVPR: Distill Structural Knowledge With Weighting Samples for Visual Place Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11217-11226} }
Learning Human-to-Robot Handovers From Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Christen_2023_CVPR, author = {Christen, Sammy and Yang, Wei and P{\'e}rez-D{\textquoteright}Arpino, Claudia and Hilliges, Otmar and Fox, Dieter and Chao, Yu-Wei}, title = {Learning Human-to-Robot Handovers From Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9654-9664} }
Score Jacobian Chaining: Lifting Pretrained 2D Diffusion Models for 3D Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Haochen and Du, Xiaodan and Li, Jiahao and Yeh, Raymond A. and Shakhnarovich, Greg}, title = {Score Jacobian Chaining: Lifting Pretrained 2D Diffusion Models for 3D Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12619-12629} }
Role of Transients in Two-Bounce Non-Line-of-Sight Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Somasundaram_2023_CVPR, author = {Somasundaram, Siddharth and Dave, Akshat and Henley, Connor and Veeraraghavan, Ashok and Raskar, Ramesh}, title = {Role of Transients in Two-Bounce Non-Line-of-Sight Imaging}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9192-9201} }
Elastic Aggregation for Federated Optimization-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Dengsheng and Hu, Jie and Tan, Vince Junkai and Wei, Xiaoming and Wu, Enhua}, title = {Elastic Aggregation for Federated Optimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12187-12197} }
ObjectMatch: Robust Registration Using Canonical Object Correspondences-
[pdf]
[supp]
[bibtex]@InProceedings{Gumeli_2023_CVPR, author = {G{\"u}meli, Can and Dai, Angela and Nie{\ss}ner, Matthias}, title = {ObjectMatch: Robust Registration Using Canonical Object Correspondences}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13082-13091} }
Center Focusing Network for Real-Time LiDAR Panoptic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Xiaoyan and Zhang, Gang and Wang, Boyue and Hu, Yongli and Yin, Baocai}, title = {Center Focusing Network for Real-Time LiDAR Panoptic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13425-13434} }
Restoration of Hand-Drawn Architectural Drawings Using Latent Space Mapping With Degradation Generator-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_CVPR, author = {Choi, Nakkwan and Lee, Seungjae and Lee, Yongsik and Yang, Seungjoon}, title = {Restoration of Hand-Drawn Architectural Drawings Using Latent Space Mapping With Degradation Generator}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14164-14172} }
Few-Shot Class-Incremental Learning via Class-Aware Bilateral Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Linglan and Lu, Jing and Xu, Yunlu and Cheng, Zhanzhan and Guo, Dashan and Niu, Yi and Fang, Xiangzhong}, title = {Few-Shot Class-Incremental Learning via Class-Aware Bilateral Distillation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11838-11847} }
Learning To Dub Movies via Hierarchical Prosody Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cong_2023_CVPR, author = {Cong, Gaoxiang and Li, Liang and Qi, Yuankai and Zha, Zheng-Jun and Wu, Qi and Wang, Wenyu and Jiang, Bin and Yang, Ming-Hsuan and Huang, Qingming}, title = {Learning To Dub Movies via Hierarchical Prosody Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14687-14697} }
DiffusionRig: Learning Personalized Priors for Facial Appearance Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_CVPR, author = {Ding, Zheng and Zhang, Xuaner and Xia, Zhihao and Jebe, Lars and Tu, Zhuowen and Zhang, Xiuming}, title = {DiffusionRig: Learning Personalized Priors for Facial Appearance Editing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12736-12746} }
Delving StyleGAN Inversion for Image Editing: A Foundation Latent Space Viewpoint-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Hongyu and Song, Yibing and Chen, Qifeng}, title = {Delving StyleGAN Inversion for Image Editing: A Foundation Latent Space Viewpoint}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10072-10082} }
Enlarging Instance-Specific and Class-Specific Information for Open-Set Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cen_2023_CVPR, author = {Cen, Jun and Zhang, Shiwei and Wang, Xiang and Pei, Yixuan and Qing, Zhiwu and Zhang, Yingya and Chen, Qifeng}, title = {Enlarging Instance-Specific and Class-Specific Information for Open-Set Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15295-15304} }
Decoupled Semantic Prototypes Enable Learning From Diverse Annotation Types for Semi-Weakly Segmentation in Expert-Driven Domains-
[pdf]
[supp]
[bibtex]@InProceedings{Reiss_2023_CVPR, author = {Rei{\ss}, Simon and Seibold, Constantin and Freytag, Alexander and Rodner, Erik and Stiefelhagen, Rainer}, title = {Decoupled Semantic Prototypes Enable Learning From Diverse Annotation Types for Semi-Weakly Segmentation in Expert-Driven Domains}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15495-15506} }
Iterative Next Boundary Detection for Instance Segmentation of Tree Rings in Microscopy Images of Shrub Cross Sections-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gillert_2023_CVPR, author = {Gillert, Alexander and Resente, Giulia and Anadon-Rosell, Alba and Wilmking, Martin and von Lukas, Uwe Freiherr}, title = {Iterative Next Boundary Detection for Instance Segmentation of Tree Rings in Microscopy Images of Shrub Cross Sections}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14540-14548} }
Learning and Aggregating Lane Graphs for Urban Automated Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Buchner_2023_CVPR, author = {B\"uchner, Martin and Z\"urn, Jannik and Todoran, Ion-George and Valada, Abhinav and Burgard, Wolfram}, title = {Learning and Aggregating Lane Graphs for Urban Automated Driving}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13415-13424} }
Universal Instance Perception As Object Discovery and Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2023_CVPR, author = {Yan, Bin and Jiang, Yi and Wu, Jiannan and Wang, Dong and Luo, Ping and Yuan, Zehuan and Lu, Huchuan}, title = {Universal Instance Perception As Object Discovery and Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15325-15336} }
Transferable Adversarial Attacks on Vision Transformers With Token Gradient Regularization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Jianping and Huang, Yizhan and Wu, Weibin and Lyu, Michael R.}, title = {Transferable Adversarial Attacks on Vision Transformers With Token Gradient Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16415-16424} }
MCF: Mutual Correction Framework for Semi-Supervised Medical Image Segmentation-
[pdf]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Yongchao and Xiao, Bin and Bi, Xiuli and Li, Weisheng and Gao, Xinbo}, title = {MCF: Mutual Correction Framework for Semi-Supervised Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15651-15660} }
Parametric Implicit Face Representation for Audio-Driven Facial Reenactment-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Ricong and Lai, Peiwen and Qin, Yipeng and Li, Guanbin}, title = {Parametric Implicit Face Representation for Audio-Driven Facial Reenactment}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12759-12768} }
VILA: Learning Image Aesthetics From User Comments With Vision-Language Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ke_2023_CVPR, author = {Ke, Junjie and Ye, Keren and Yu, Jiahui and Wu, Yonghui and Milanfar, Peyman and Yang, Feng}, title = {VILA: Learning Image Aesthetics From User Comments With Vision-Language Pretraining}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10041-10051} }
Procedure-Aware Pretraining for Instructional Video Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Honglu and Mart{\'\i}n-Mart{\'\i}n, Roberto and Kapadia, Mubbasir and Savarese, Silvio and Niebles, Juan Carlos}, title = {Procedure-Aware Pretraining for Instructional Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10727-10738} }
Fine-Grained Audible Video Description-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2023_CVPR, author = {Shen, Xuyang and Li, Dong and Zhou, Jinxing and Qin, Zhen and He, Bowen and Han, Xiaodong and Li, Aixuan and Dai, Yuchao and Kong, Lingpeng and Wang, Meng and Qiao, Yu and Zhong, Yiran}, title = {Fine-Grained Audible Video Description}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10585-10596} }
3D Semantic Segmentation in the Wild: Learning Generalized Models for Adverse-Condition Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiao_2023_CVPR, author = {Xiao, Aoran and Huang, Jiaxing and Xuan, Weihao and Ren, Ruijie and Liu, Kangcheng and Guan, Dayan and El Saddik, Abdulmotaleb and Lu, Shijian and Xing, Eric P.}, title = {3D Semantic Segmentation in the Wild: Learning Generalized Models for Adverse-Condition Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9382-9392} }
RaBit: Parametric Modeling of 3D Biped Cartoon Characters With a Topological-Consistent Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_CVPR, author = {Luo, Zhongjin and Cai, Shengcai and Dong, Jinguo and Ming, Ruibo and Qiu, Liangdong and Zhan, Xiaohang and Han, Xiaoguang}, title = {RaBit: Parametric Modeling of 3D Biped Cartoon Characters With a Topological-Consistent Dataset}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12825-12835} }
Uni3D: A Unified Baseline for Multi-Dataset 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Bo and Yuan, Jiakang and Shi, Botian and Chen, Tao and Li, Yikang and Qiao, Yu}, title = {Uni3D: A Unified Baseline for Multi-Dataset 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9253-9262} }
ACR: Attention Collaboration-Based Regressor for Arbitrary Two-Hand Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Zhengdi and Huang, Shaoli and Fang, Chen and Breckon, Toby P. and Wang, Jue}, title = {ACR: Attention Collaboration-Based Regressor for Arbitrary Two-Hand Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12955-12964} }
Improving Table Structure Recognition With Visual-Alignment Sequential Coordinate Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Yongshuai and Lu, Ning and Chen, Dapeng and Li, Yibo and Xie, Zecheng and Zhu, Shenggao and Gao, Liangcai and Peng, Wei}, title = {Improving Table Structure Recognition With Visual-Alignment Sequential Coordinate Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11134-11143} }
HumanGen: Generating Human Radiance Fields With Explicit Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_CVPR, author = {Jiang, Suyi and Jiang, Haoran and Wang, Ziyu and Luo, Haimin and Chen, Wenzheng and Xu, Lan}, title = {HumanGen: Generating Human Radiance Fields With Explicit Priors}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12543-12554} }
Local Connectivity-Based Density Estimation for Face Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2023_CVPR, author = {Shin, Junho and Lee, Hyo-Jun and Kim, Hyunseop and Baek, Jong-Hyeon and Kim, Daehyun and Koh, Yeong Jun}, title = {Local Connectivity-Based Density Estimation for Face Clustering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13621-13629} }
Adaptive Zone-Aware Hierarchical Planner for Vision-Language Navigation-
[pdf]
[bibtex]@InProceedings{Gao_2023_CVPR, author = {Gao, Chen and Peng, Xingyu and Yan, Mi and Wang, He and Yang, Lirong and Ren, Haibing and Li, Hongsheng and Liu, Si}, title = {Adaptive Zone-Aware Hierarchical Planner for Vision-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14911-14920} }
Memory-Friendly Scalable Super-Resolution via Rewinding Lottery Ticket Hypothesis-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Jin and Luo, Xiaotong and Hong, Ming and Qu, Yanyun and Xie, Yuan and Wu, Zongze}, title = {Memory-Friendly Scalable Super-Resolution via Rewinding Lottery Ticket Hypothesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14398-14407} }
Therbligs in Action: Video Understanding Through Motion Primitives-
[pdf]
[bibtex]@InProceedings{Dessalene_2023_CVPR, author = {Dessalene, Eadom and Maynord, Michael and Ferm\"uller, Cornelia and Aloimonos, Yiannis}, title = {Therbligs in Action: Video Understanding Through Motion Primitives}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10618-10626} }
SadTalker: Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Wenxuan and Cun, Xiaodong and Wang, Xuan and Zhang, Yong and Shen, Xi and Guo, Yu and Shan, Ying and Wang, Fei}, title = {SadTalker: Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8652-8661} }
HAAV: Hierarchical Aggregation of Augmented Views for Image Captioning-
[pdf]
[supp]
[bibtex]@InProceedings{Kuo_2023_CVPR, author = {Kuo, Chia-Wen and Kira, Zsolt}, title = {HAAV: Hierarchical Aggregation of Augmented Views for Image Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11039-11049} }
Learning Sample Relationship for Exposure Correction-
[pdf]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Jie and Zhao, Feng and Zhou, Man and Xiao, Jie and Zheng, Naishan and Zheng, Kaiwen and Xiong, Zhiwei}, title = {Learning Sample Relationship for Exposure Correction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9904-9913} }
TRACE: 5D Temporal Regression of Avatars With Dynamic Cameras in 3D Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_CVPR, author = {Sun, Yu and Bao, Qian and Liu, Wu and Mei, Tao and Black, Michael J.}, title = {TRACE: 5D Temporal Regression of Avatars With Dynamic Cameras in 3D Environments}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8856-8866} }
End-to-End 3D Dense Captioning With Vote2Cap-DETR-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Sijin and Zhu, Hongyuan and Chen, Xin and Lei, Yinjie and Yu, Gang and Chen, Tao}, title = {End-to-End 3D Dense Captioning With Vote2Cap-DETR}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11124-11133} }
Learned Two-Plane Perspective Prior Based Image Resampling for Efficient Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghosh_2023_CVPR, author = {Ghosh, Anurag and Reddy, N. Dinesh and Mertz, Christoph and Narasimhan, Srinivasa G.}, title = {Learned Two-Plane Perspective Prior Based Image Resampling for Efficient Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13364-13373} }
Tell Me What Happened: Unifying Text-Guided Video Completion via Multimodal Masked Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2023_CVPR, author = {Fu, Tsu-Jui and Yu, Licheng and Zhang, Ning and Fu, Cheng-Yang and Su, Jong-Chyi and Wang, William Yang and Bell, Sean}, title = {Tell Me What Happened: Unifying Text-Guided Video Completion via Multimodal Masked Video Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10681-10692} }
Tracking Through Containers and Occluders in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Van_Hoorick_2023_CVPR, author = {Van Hoorick, Basile and Tokmakov, Pavel and Stent, Simon and Li, Jie and Vondrick, Carl}, title = {Tracking Through Containers and Occluders in the Wild}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13802-13812} }
Decompose, Adjust, Compose: Effective Normalization by Playing With Frequency for Domain Generalization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lee_2023_CVPR, author = {Lee, Sangrok and Bae, Jongseong and Kim, Ha Young}, title = {Decompose, Adjust, Compose: Effective Normalization by Playing With Frequency for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11776-11785} }
Novel Class Discovery for 3D Point Cloud Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Riz_2023_CVPR, author = {Riz, Luigi and Saltori, Cristiano and Ricci, Elisa and Poiesi, Fabio}, title = {Novel Class Discovery for 3D Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9393-9402} }
Learning 3D-Aware Image Synthesis With Unknown Pose Distribution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2023_CVPR, author = {Shi, Zifan and Shen, Yujun and Xu, Yinghao and Peng, Sida and Liao, Yiyi and Guo, Sheng and Chen, Qifeng and Yeung, Dit-Yan}, title = {Learning 3D-Aware Image Synthesis With Unknown Pose Distribution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13062-13071} }
Train-Once-for-All Personalization-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Hong-You and Li, Yandong and Cui, Yin and Zhang, Mingda and Chao, Wei-Lun and Zhang, Li}, title = {Train-Once-for-All Personalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11818-11827} }
DIFu: Depth-Guided Implicit Function for Clothed Human Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_CVPR, author = {Song, Dae-Young and Lee, HeeKyung and Seo, Jeongil and Cho, Donghyeon}, title = {DIFu: Depth-Guided Implicit Function for Clothed Human Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8738-8747} }
Bi-LRFusion: Bi-Directional LiDAR-Radar Fusion for 3D Dynamic Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Yingjie and Deng, Jiajun and Li, Yao and Hu, Jinshui and Liu, Cong and Zhang, Yu and Ji, Jianmin and Ouyang, Wanli and Zhang, Yanyong}, title = {Bi-LRFusion: Bi-Directional LiDAR-Radar Fusion for 3D Dynamic Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13394-13403} }
LOCATE: Localize and Transfer Object Parts for Weakly Supervised Affordance Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Gen and Jampani, Varun and Sun, Deqing and Sevilla-Lara, Laura}, title = {LOCATE: Localize and Transfer Object Parts for Weakly Supervised Affordance Grounding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10922-10931} }
TokenHPE: Learning Orientation Tokens for Efficient Head Pose Estimation via Transformers-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Cheng and Liu, Hai and Deng, Yongjian and Xie, Bochen and Li, Youfu}, title = {TokenHPE: Learning Orientation Tokens for Efficient Head Pose Estimation via Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8897-8906} }
BioNet: A Biologically-Inspired Network for Face Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Pengyu}, title = {BioNet: A Biologically-Inspired Network for Face Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10344-10354} }
Scaling Up GANs for Text-to-Image Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kang_2023_CVPR, author = {Kang, Minguk and Zhu, Jun-Yan and Zhang, Richard and Park, Jaesik and Shechtman, Eli and Paris, Sylvain and Park, Taesung}, title = {Scaling Up GANs for Text-to-Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10124-10134} }
DepGraph: Towards Any Structural Pruning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Fang_2023_CVPR, author = {Fang, Gongfan and Ma, Xinyin and Song, Mingli and Mi, Michael Bi and Wang, Xinchao}, title = {DepGraph: Towards Any Structural Pruning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16091-16101} }
Exploring Discontinuity for Video Frame Interpolation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_CVPR, author = {Lee, Sangjin and Lee, Hyeongmin and Shin, Chajin and Son, Hanbin and Lee, Sangyoun}, title = {Exploring Discontinuity for Video Frame Interpolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9791-9800} }
DynamicStereo: Consistent Dynamic Depth From Stereo Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Karaev_2023_CVPR, author = {Karaev, Nikita and Rocco, Ignacio and Graham, Benjamin and Neverova, Natalia and Vedaldi, Andrea and Rupprecht, Christian}, title = {DynamicStereo: Consistent Dynamic Depth From Stereo Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13229-13239} }
Vid2Avatar: 3D Avatar Reconstruction From Videos in the Wild via Self-Supervised Scene Decomposition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_CVPR, author = {Guo, Chen and Jiang, Tianjian and Chen, Xu and Song, Jie and Hilliges, Otmar}, title = {Vid2Avatar: 3D Avatar Reconstruction From Videos in the Wild via Self-Supervised Scene Decomposition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12858-12868} }
Task Residual for Tuning Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Tao and Lu, Zhihe and Jin, Xin and Chen, Zhibo and Wang, Xinchao}, title = {Task Residual for Tuning Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10899-10909} }
Hierarchical Prompt Learning for Multi-Task Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Yajing and Lu, Yuning and Liu, Hao and An, Yaozu and Xu, Zhuoran and Yao, Zhuokun and Zhang, Baofeng and Xiong, Zhiwei and Gui, Chenguang}, title = {Hierarchical Prompt Learning for Multi-Task Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10888-10898} }
RIFormer: Keep Your Vision Backbone Effective but Removing Token Mixer-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Jiahao and Zhang, Songyang and Liu, Yong and Wu, Taiqiang and Yang, Yujiu and Liu, Xihui and Chen, Kai and Luo, Ping and Lin, Dahua}, title = {RIFormer: Keep Your Vision Backbone Effective but Removing Token Mixer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14443-14452} }
Context-Based Trit-Plane Coding for Progressive Image Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeon_2023_CVPR, author = {Jeon, Seungmin and Choi, Kwang Pyo and Park, Youngo and Kim, Chang-Su}, title = {Context-Based Trit-Plane Coding for Progressive Image Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14348-14357} }
Recurrent Vision Transformers for Object Detection With Event Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gehrig_2023_CVPR, author = {Gehrig, Mathias and Scaramuzza, Davide}, title = {Recurrent Vision Transformers for Object Detection With Event Cameras}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13884-13893} }
METransformer: Radiology Report Generation by Transformer With Multiple Learnable Expert Tokens-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zhanyu and Liu, Lingqiao and Wang, Lei and Zhou, Luping}, title = {METransformer: Radiology Report Generation by Transformer With Multiple Learnable Expert Tokens}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11558-11567} }
Revealing the Dark Secrets of Masked Image Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_CVPR, author = {Xie, Zhenda and Geng, Zigang and Hu, Jingcheng and Zhang, Zheng and Hu, Han and Cao, Yue}, title = {Revealing the Dark Secrets of Masked Image Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14475-14485} }
Fine-Grained Classification With Noisy Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_CVPR, author = {Wei, Qi and Feng, Lei and Sun, Haoliang and Wang, Ren and Guo, Chenhui and Yin, Yilong}, title = {Fine-Grained Classification With Noisy Labels}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11651-11660} }
CAP: Robust Point Cloud Classification via Semantic and Structural Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Ding_2023_CVPR, author = {Ding, Daizong and Jiang, Erling and Huang, Yuanmin and Zhang, Mi and Li, Wenxuan and Yang, Min}, title = {CAP: Robust Point Cloud Classification via Semantic and Structural Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12260-12270} }
Visual-Tactile Sensing for In-Hand Object Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Wenqiang and Yu, Zhenjun and Xue, Han and Ye, Ruolin and Yao, Siqiong and Lu, Cewu}, title = {Visual-Tactile Sensing for In-Hand Object Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8803-8812} }
Local-to-Global Registration for Bundle-Adjusting Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Yue and Chen, Xingyu and Wang, Xuan and Zhang, Qi and Guo, Yu and Shan, Ying and Wang, Fei}, title = {Local-to-Global Registration for Bundle-Adjusting Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8264-8273} }
FJMP: Factorized Joint Multi-Agent Motion Prediction Over Learned Directed Acyclic Interaction Graphs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rowe_2023_CVPR, author = {Rowe, Luke and Ethier, Martin and Dykhne, Eli-Henry and Czarnecki, Krzysztof}, title = {FJMP: Factorized Joint Multi-Agent Motion Prediction Over Learned Directed Acyclic Interaction Graphs}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13745-13755} }
Correlational Image Modeling for Self-Supervised Visual Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Wei and Xie, Jiahao and Loy, Chen Change}, title = {Correlational Image Modeling for Self-Supervised Visual Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15105-15115} }
Self-Supervised Implicit Glyph Attention for Text Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guan_2023_CVPR, author = {Guan, Tongkun and Gu, Chaochen and Tu, Jingzheng and Yang, Xue and Feng, Qi and Zhao, Yudi and Shen, Wei}, title = {Self-Supervised Implicit Glyph Attention for Text Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15285-15294} }
ACL-SPC: Adaptive Closed-Loop System for Self-Supervised Point Cloud Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Hong_2023_CVPR, author = {Hong, Sangmin and Yavartanoo, Mohsen and Neshatavar, Reyhaneh and Lee, Kyoung Mu}, title = {ACL-SPC: Adaptive Closed-Loop System for Self-Supervised Point Cloud Completion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9435-9444} }
Focus on Details: Online Multi-Object Tracking With Diverse Fine-Grained Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_CVPR, author = {Ren, Hao and Han, Shoudong and Ding, Huilin and Zhang, Ziwen and Wang, Hongwei and Wang, Faquan}, title = {Focus on Details: Online Multi-Object Tracking With Diverse Fine-Grained Representation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11289-11298} }
DiffPose: Toward More Reliable 3D Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gong_2023_CVPR, author = {Gong, Jia and Foo, Lin Geng and Fan, Zhipeng and Ke, Qiuhong and Rahmani, Hossein and Liu, Jun}, title = {DiffPose: Toward More Reliable 3D Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13041-13051} }
Learning Analytical Posterior Probability for Human Mesh Recovery-
[pdf]
[supp]
[bibtex]@InProceedings{Fang_2023_CVPR, author = {Fang, Qi and Chen, Kang and Fan, Yinghui and Shuai, Qing and Li, Jiefeng and Zhang, Weidong}, title = {Learning Analytical Posterior Probability for Human Mesh Recovery}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8781-8791} }
Non-Contrastive Unsupervised Learning of Physiological Signals From Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Speth_2023_CVPR, author = {Speth, Jeremy and Vance, Nathan and Flynn, Patrick and Czajka, Adam}, title = {Non-Contrastive Unsupervised Learning of Physiological Signals From Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14464-14474} }
FashionSAP: Symbols and Attributes Prompt for Fine-Grained Fashion Vision-Language Pre-Training-
[pdf]
[arXiv]
[bibtex]@InProceedings{Han_2023_CVPR, author = {Han, Yunpeng and Zhang, Lisai and Chen, Qingcai and Chen, Zhijian and Li, Zhonghua and Yang, Jianxin and Cao, Zhao}, title = {FashionSAP: Symbols and Attributes Prompt for Fine-Grained Fashion Vision-Language Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15028-15038} }
Structure Aggregation for Cross-Spectral Stereo Image Guided Denoising-
[pdf]
[supp]
[bibtex]@InProceedings{Sheng_2023_CVPR, author = {Sheng, Zehua and Yu, Zhu and Liu, Xiongwei and Cao, Si-Yuan and Liu, Yuqi and Shen, Hui-Liang and Zhang, Huaqi}, title = {Structure Aggregation for Cross-Spectral Stereo Image Guided Denoising}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13997-14006} }
RONO: Robust Discriminative Learning With Noisy Labels for 2D-3D Cross-Modal Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Yanglin and Zhu, Hongyuan and Peng, Dezhong and Peng, Xi and Hu, Peng}, title = {RONO: Robust Discriminative Learning With Noisy Labels for 2D-3D Cross-Modal Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11610-11619} }
ConQueR: Query Contrast Voxel-DETR for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR, author = {Zhu, Benjin and Wang, Zhe and Shi, Shaoshuai and Xu, Hang and Hong, Lanqing and Li, Hongsheng}, title = {ConQueR: Query Contrast Voxel-DETR for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9296-9305} }
Robust Multiview Point Cloud Registration With Reliable Pose Graph Initialization and History Reweighting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Haiping and Liu, Yuan and Dong, Zhen and Guo, Yulan and Liu, Yu-Shen and Wang, Wenping and Yang, Bisheng}, title = {Robust Multiview Point Cloud Registration With Reliable Pose Graph Initialization and History Reweighting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9506-9515} }
OSRT: Omnidirectional Image Super-Resolution With Distortion-Aware Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Fanghua and Wang, Xintao and Cao, Mingdeng and Li, Gen and Shan, Ying and Dong, Chao}, title = {OSRT: Omnidirectional Image Super-Resolution With Distortion-Aware Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13283-13292} }
BEV@DC: Bird's-Eye View Assisted Training for Depth Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Wending and Yan, Xu and Liao, Yinghong and Lin, Yuankai and Huang, Jin and Zhao, Gangming and Cui, Shuguang and Li, Zhen}, title = {BEV@DC: Bird's-Eye View Assisted Training for Depth Completion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9233-9242} }
Large-Scale Training Data Search for Object Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yao_2023_CVPR, author = {Yao, Yue and Gedeon, Tom and Zheng, Liang}, title = {Large-Scale Training Data Search for Object Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15568-15578} }
SelfME: Self-Supervised Motion Learning for Micro-Expression Recognition-
[pdf]
[bibtex]@InProceedings{Fan_2023_CVPR, author = {Fan, Xinqi and Chen, Xueli and Jiang, Mingjie and Shahid, Ali Raza and Yan, Hong}, title = {SelfME: Self-Supervised Motion Learning for Micro-Expression Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13834-13843} }
NewsNet: A Novel Dataset for Hierarchical Temporal Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Haoqian and Chen, Keyu and Liu, Haozhe and Zhuge, Mingchen and Li, Bing and Qiao, Ruizhi and Shu, Xiujun and Gan, Bei and Xu, Liangsheng and Ren, Bo and Xu, Mengmeng and Zhang, Wentian and Ramachandra, Raghavendra and Lin, Chia-Wen and Ghanem, Bernard}, title = {NewsNet: A Novel Dataset for Hierarchical Temporal Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10669-10680} }
Uncertainty-Aware Unsupervised Image Deblurring With Deep Residual Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_CVPR, author = {Tang, Xiaole and Zhao, Xile and Liu, Jun and Wang, Jianli and Miao, Yuchun and Zeng, Tieyong}, title = {Uncertainty-Aware Unsupervised Image Deblurring With Deep Residual Prior}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9883-9892} }
FedDM: Iterative Distribution Matching for Communication-Efficient Federated Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiong_2023_CVPR, author = {Xiong, Yuanhao and Wang, Ruochen and Cheng, Minhao and Yu, Felix and Hsieh, Cho-Jui}, title = {FedDM: Iterative Distribution Matching for Communication-Efficient Federated Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16323-16332} }
Bit-Shrinking: Limiting Instantaneous Sharpness for Improving Post-Training Quantization-
[pdf]
[bibtex]@InProceedings{Lin_2023_CVPR, author = {Lin, Chen and Peng, Bo and Li, Zheyang and Tan, Wenming and Ren, Ye and Xiao, Jun and Pu, Shiliang}, title = {Bit-Shrinking: Limiting Instantaneous Sharpness for Improving Post-Training Quantization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16196-16205} }
LSTFE-Net: Long Short-Term Feature Enhancement Network for Video Small Object Detection-
[pdf]
[bibtex]@InProceedings{Xiao_2023_CVPR, author = {Xiao, Jinsheng and Wu, Yuanxu and Chen, Yunhua and Wang, Shurui and Wang, Zhongyuan and Ma, Jiayi}, title = {LSTFE-Net: Long Short-Term Feature Enhancement Network for Video Small Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14613-14622} }
MIC: Masked Image Consistency for Context-Enhanced Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hoyer_2023_CVPR, author = {Hoyer, Lukas and Dai, Dengxin and Wang, Haoran and Van Gool, Luc}, title = {MIC: Masked Image Consistency for Context-Enhanced Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11721-11732} }
SkyEye: Self-Supervised Bird's-Eye-View Semantic Mapping Using Monocular Frontal View Images-
[pdf]
[supp]
[bibtex]@InProceedings{Gosala_2023_CVPR, author = {Gosala, Nikhil and Petek, K\"ursat and Drews-Jr, Paulo L. J. and Burgard, Wolfram and Valada, Abhinav}, title = {SkyEye: Self-Supervised Bird's-Eye-View Semantic Mapping Using Monocular Frontal View Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14901-14910} }
VoxFormer: Sparse Voxel Transformer for Camera-Based 3D Semantic Scene Completion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Yiming and Yu, Zhiding and Choy, Christopher and Xiao, Chaowei and Alvarez, Jose M. and Fidler, Sanja and Feng, Chen and Anandkumar, Anima}, title = {VoxFormer: Sparse Voxel Transformer for Camera-Based 3D Semantic Scene Completion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9087-9098} }
Joint Video Multi-Frame Interpolation and Deblurring Under Unknown Exposure Time-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shang_2023_CVPR, author = {Shang, Wei and Ren, Dongwei and Yang, Yi and Zhang, Hongzhi and Ma, Kede and Zuo, Wangmeng}, title = {Joint Video Multi-Frame Interpolation and Deblurring Under Unknown Exposure Time}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13935-13944} }
Dual-Bridging With Adversarial Noise Generation for Domain Adaptive rPPG Estimation-
[pdf]
[bibtex]@InProceedings{Du_2023_CVPR, author = {Du, Jingda and Liu, Si-Qi and Zhang, Bochao and Yuen, Pong C.}, title = {Dual-Bridging With Adversarial Noise Generation for Domain Adaptive rPPG Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10355-10364} }
NeuDA: Neural Deformable Anchor for High-Fidelity Implicit Surface Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cai_2023_CVPR, author = {Cai, Bowen and Huang, Jinchi and Jia, Rongfei and Lv, Chengfei and Fu, Huan}, title = {NeuDA: Neural Deformable Anchor for High-Fidelity Implicit Surface Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8476-8485} }
Boosting Weakly-Supervised Temporal Action Localization With Text Information-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Guozhang and Cheng, De and Ding, Xinpeng and Wang, Nannan and Wang, Xiaoyu and Gao, Xinbo}, title = {Boosting Weakly-Supervised Temporal Action Localization With Text Information}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10648-10657} }
OpenMix: Exploring Outlier Samples for Misclassification Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR, author = {Zhu, Fei and Cheng, Zhen and Zhang, Xu-Yao and Liu, Cheng-Lin}, title = {OpenMix: Exploring Outlier Samples for Misclassification Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12074-12083} }
Multivariate, Multi-Frequency and Multimodal: Rethinking Graph Neural Networks for Emotion Recognition in Conversation-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Feiyu and Shao, Jie and Zhu, Shuyuan and Shen, Heng Tao}, title = {Multivariate, Multi-Frequency and Multimodal: Rethinking Graph Neural Networks for Emotion Recognition in Conversation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10761-10770} }
Bridging Precision and Confidence: A Train-Time Loss for Calibrating Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Munir_2023_CVPR, author = {Munir, Muhammad Akhtar and Khan, Muhammad Haris and Khan, Salman and Khan, Fahad Shahbaz}, title = {Bridging Precision and Confidence: A Train-Time Loss for Calibrating Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11474-11483} }
DyLiN: Making Light Field Networks Dynamic-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Heng and Julin, Joel and Milacski, Zolt\'an \'A. and Niinuma, Koichiro and Jeni, L\'aszl\'o A.}, title = {DyLiN: Making Light Field Networks Dynamic}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12397-12406} }
Human Guided Ground-Truth Generation for Realistic Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Du and Liang, Jie and Zhang, Xindong and Liu, Ming and Zeng, Hui and Zhang, Lei}, title = {Human Guided Ground-Truth Generation for Realistic Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14082-14091} }
Align and Attend: Multimodal Summarization With Dual Contrastive Losses-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_CVPR, author = {He, Bo and Wang, Jun and Qiu, Jielin and Bui, Trung and Shrivastava, Abhinav and Wang, Zhaowen}, title = {Align and Attend: Multimodal Summarization With Dual Contrastive Losses}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14867-14878} }
SinGRAF: Learning a 3D Generative Radiance Field for a Single Scene-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Son_2023_CVPR, author = {Son, Minjung and Park, Jeong Joon and Guibas, Leonidas and Wetzstein, Gordon}, title = {SinGRAF: Learning a 3D Generative Radiance Field for a Single Scene}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8507-8517} }
Self-Supervised AutoFlow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Hsin-Ping and Herrmann, Charles and Hur, Junhwa and Lu, Erika and Sargent, Kyle and Stone, Austin and Yang, Ming-Hsuan and Sun, Deqing}, title = {Self-Supervised AutoFlow}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11412-11421} }
Neuralangelo: High-Fidelity Neural Surface Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Zhaoshuo and M\"uller, Thomas and Evans, Alex and Taylor, Russell H. and Unberath, Mathias and Liu, Ming-Yu and Lin, Chen-Hsuan}, title = {Neuralangelo: High-Fidelity Neural Surface Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8456-8465} }
Re-GAN: Data-Efficient GANs Training via Architectural Reconfiguration-
[pdf]
[supp]
[bibtex]@InProceedings{Saxena_2023_CVPR, author = {Saxena, Divya and Cao, Jiannong and Xu, Jiahao and Kulshrestha, Tarun}, title = {Re-GAN: Data-Efficient GANs Training via Architectural Reconfiguration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16230-16240} }
Dimensionality-Varying Diffusion Process-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Han and Feng, Ruili and Yang, Zhantao and Huang, Lianghua and Liu, Yu and Zhang, Yifei and Shen, Yujun and Zhao, Deli and Zhou, Jingren and Cheng, Fan}, title = {Dimensionality-Varying Diffusion Process}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14307-14316} }
RenderDiffusion: Image Diffusion for 3D Reconstruction, Inpainting and Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Anciukevicius_2023_CVPR, author = {Anciukevi\v{c}ius, Titas and Xu, Zexiang and Fisher, Matthew and Henderson, Paul and Bilen, Hakan and Mitra, Niloy J. and Guerrero, Paul}, title = {RenderDiffusion: Image Diffusion for 3D Reconstruction, Inpainting and Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12608-12618} }
Latent-NeRF for Shape-Guided Generation of 3D Shapes and Textures-
[pdf]
[arXiv]
[bibtex]@InProceedings{Metzer_2023_CVPR, author = {Metzer, Gal and Richardson, Elad and Patashnik, Or and Giryes, Raja and Cohen-Or, Daniel}, title = {Latent-NeRF for Shape-Guided Generation of 3D Shapes and Textures}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12663-12673} }
Learning Generative Structure Prior for Blind Text Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Xiaoming and Zuo, Wangmeng and Loy, Chen Change}, title = {Learning Generative Structure Prior for Blind Text Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10103-10113} }
PEFAT: Boosting Semi-Supervised Medical Image Classification via Pseudo-Loss Estimation and Feature Adversarial Training-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2023_CVPR, author = {Zeng, Qingjie and Xie, Yutong and Lu, Zilin and Xia, Yong}, title = {PEFAT: Boosting Semi-Supervised Medical Image Classification via Pseudo-Loss Estimation and Feature Adversarial Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15671-15680} }
Ground-Truth Free Meta-Learning for Deep Compressive Sampling-
[pdf]
[supp]
[bibtex]@InProceedings{Qin_2023_CVPR, author = {Qin, Xinran and Quan, Yuhui and Pang, Tongyao and Ji, Hui}, title = {Ground-Truth Free Meta-Learning for Deep Compressive Sampling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9947-9956} }
SHS-Net: Learning Signed Hyper Surfaces for Oriented Normal Estimation of Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Qing and Feng, Huifang and Shi, Kanle and Gao, Yue and Fang, Yi and Liu, Yu-Shen and Han, Zhizhong}, title = {SHS-Net: Learning Signed Hyper Surfaces for Oriented Normal Estimation of Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13591-13600} }
DistractFlow: Improving Optical Flow Estimation via Realistic Distractions and Pseudo-Labeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeong_2023_CVPR, author = {Jeong, Jisoo and Cai, Hong and Garrepalli, Risheek and Porikli, Fatih}, title = {DistractFlow: Improving Optical Flow Estimation via Realistic Distractions and Pseudo-Labeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13691-13700} }
DSVT: Dynamic Sparse Voxel Transformer With Rotated Sets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Haiyang and Shi, Chen and Shi, Shaoshuai and Lei, Meng and Wang, Sen and He, Di and Schiele, Bernt and Wang, Liwei}, title = {DSVT: Dynamic Sparse Voxel Transformer With Rotated Sets}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13520-13529} }
Enhancing the Self-Universality for Transferable Targeted Attacks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_CVPR, author = {Wei, Zhipeng and Chen, Jingjing and Wu, Zuxuan and Jiang, Yu-Gang}, title = {Enhancing the Self-Universality for Transferable Targeted Attacks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12281-12290} }
EditableNeRF: Editing Topologically Varying Neural Radiance Fields by Key Points-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_CVPR, author = {Zheng, Chengwei and Lin, Wenbin and Xu, Feng}, title = {EditableNeRF: Editing Topologically Varying Neural Radiance Fields by Key Points}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8317-8327} }
NeuralEditor: Editing Neural Radiance Fields via Manipulating Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Jun-Kun and Lyu, Jipeng and Wang, Yu-Xiong}, title = {NeuralEditor: Editing Neural Radiance Fields via Manipulating Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12439-12448} }
NIKI: Neural Inverse Kinematics With Invertible Neural Networks for 3D Human Pose and Shape Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Jiefeng and Bian, Siyuan and Liu, Qi and Tang, Jiasheng and Wang, Fan and Lu, Cewu}, title = {NIKI: Neural Inverse Kinematics With Invertible Neural Networks for 3D Human Pose and Shape Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12933-12942} }
Transfer4D: A Framework for Frugal Motion Capture and Deformation Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Maheshwari_2023_CVPR, author = {Maheshwari, Shubh and Narain, Rahul and Hebbalaguppe, Ramya}, title = {Transfer4D: A Framework for Frugal Motion Capture and Deformation Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12836-12846} }
Randomized Adversarial Training via Taylor Expansion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2023_CVPR, author = {Jin, Gaojie and Yi, Xinping and Wu, Dengyu and Mu, Ronghui and Huang, Xiaowei}, title = {Randomized Adversarial Training via Taylor Expansion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16447-16457} }
Learning To Measure the Point Cloud Reconstruction Loss in a Representation Space-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Tianxin and Ding, Zhonggan and Zhang, Jiangning and Tai, Ying and Zhang, Zhenyu and Chen, Mingang and Wang, Chengjie and Liu, Yong}, title = {Learning To Measure the Point Cloud Reconstruction Loss in a Representation Space}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12208-12217} }
Progressive Neighbor Consistency Mining for Correspondence Pruning-
[pdf]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Xin and Yang, Jufeng}, title = {Progressive Neighbor Consistency Mining for Correspondence Pruning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9527-9537} }
Bootstrapping Objectness From Videos by Relaxed Common Fate and Visual Grouping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lian_2023_CVPR, author = {Lian, Long and Wu, Zhirong and Yu, Stella X.}, title = {Bootstrapping Objectness From Videos by Relaxed Common Fate and Visual Grouping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14582-14591} }
Semi-Supervised Hand Appearance Recovery via Structure Disentanglement and Dual Adversarial Discrimination-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Zimeng and Zuo, Binghui and Long, Zhiyu and Wang, Yangang}, title = {Semi-Supervised Hand Appearance Recovery via Structure Disentanglement and Dual Adversarial Discrimination}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12125-12136} }
Back to the Source: Diffusion-Driven Adaptation To Test-Time Corruption-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2023_CVPR, author = {Gao, Jin and Zhang, Jialing and Liu, Xihui and Darrell, Trevor and Shelhamer, Evan and Wang, Dequan}, title = {Back to the Source: Diffusion-Driven Adaptation To Test-Time Corruption}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11786-11796} }
LayoutDM: Discrete Diffusion Model for Controllable Layout Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Inoue_2023_CVPR, author = {Inoue, Naoto and Kikuchi, Kotaro and Simo-Serra, Edgar and Otani, Mayu and Yamaguchi, Kota}, title = {LayoutDM: Discrete Diffusion Model for Controllable Layout Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10167-10176} }
ShapeTalk: A Language Dataset and Framework for 3D Shape Edits and Deformations-
[pdf]
[bibtex]@InProceedings{Achlioptas_2023_CVPR, author = {Achlioptas, Panos and Huang, Ian and Sung, Minhyuk and Tulyakov, Sergey and Guibas, Leonidas}, title = {ShapeTalk: A Language Dataset and Framework for 3D Shape Edits and Deformations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12685-12694} }
RGBD2: Generative Scene Synthesis via Incremental View Inpainting Using RGBD Diffusion Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lei_2023_CVPR, author = {Lei, Jiabao and Tang, Jiapeng and Jia, Kui}, title = {RGBD2: Generative Scene Synthesis via Incremental View Inpainting Using RGBD Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8422-8434} }
System-Status-Aware Adaptive Network for Online Streaming Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Foo_2023_CVPR, author = {Foo, Lin Geng and Gong, Jia and Fan, Zhipeng and Liu, Jun}, title = {System-Status-Aware Adaptive Network for Online Streaming Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10514-10523} }
Local-Guided Global: Paired Similarity Representation for Visual Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_CVPR, author = {Choi, Hyesong and Lee, Hunsang and Song, Wonil and Jeon, Sangryul and Sohn, Kwanghoon and Min, Dongbo}, title = {Local-Guided Global: Paired Similarity Representation for Visual Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15072-15082} }
FFCV: Accelerating Training by Removing Data Bottlenecks-
[pdf]
[supp]
[bibtex]@InProceedings{Leclerc_2023_CVPR, author = {Leclerc, Guillaume and Ilyas, Andrew and Engstrom, Logan and Park, Sung Min and Salman, Hadi and M\k{a}dry, Aleksander}, title = {FFCV: Accelerating Training by Removing Data Bottlenecks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12011-12020} }
Region-Aware Pretraining for Open-Vocabulary Object Detection With Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Dahun and Angelova, Anelia and Kuo, Weicheng}, title = {Region-Aware Pretraining for Open-Vocabulary Object Detection With Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11144-11154} }
Towards Unsupervised Object Detection From LiDAR Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Lunjun and Yang, Anqi Joyce and Xiong, Yuwen and Casas, Sergio and Yang, Bin and Ren, Mengye and Urtasun, Raquel}, title = {Towards Unsupervised Object Detection From LiDAR Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9317-9328} }
NeRF-DS: Neural Radiance Fields for Dynamic Specular Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2023_CVPR, author = {Yan, Zhiwen and Li, Chen and Lee, Gim Hee}, title = {NeRF-DS: Neural Radiance Fields for Dynamic Specular Objects}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8285-8295} }
M6Doc: A Large-Scale Multi-Format, Multi-Type, Multi-Layout, Multi-Language, Multi-Annotation Category Dataset for Modern Document Layout Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{Cheng_2023_CVPR, author = {Cheng, Hiuyi and Zhang, Peirong and Wu, Sihang and Zhang, Jiaxin and Zhu, Qiyuan and Xie, Zecheng and Li, Jing and Ding, Kai and Jin, Lianwen}, title = {M6Doc: A Large-Scale Multi-Format, Multi-Type, Multi-Layout, Multi-Language, Multi-Annotation Category Dataset for Modern Document Layout Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15138-15147} }
RealFusion: 360° Reconstruction of Any Object From a Single Image-
[pdf]
[supp]
[bibtex]@InProceedings{Melas-Kyriazi_2023_CVPR, author = {Melas-Kyriazi, Luke and Laina, Iro and Rupprecht, Christian and Vedaldi, Andrea}, title = {RealFusion: 360{\textdegree} Reconstruction of Any Object From a Single Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8446-8455} }
LargeKernel3D: Scaling Up Kernels in 3D Sparse CNNs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Yukang and Liu, Jianhui and Zhang, Xiangyu and Qi, Xiaojuan and Jia, Jiaya}, title = {LargeKernel3D: Scaling Up Kernels in 3D Sparse CNNs}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13488-13498} }
3D Concept Learning and Reasoning From Multi-View Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_CVPR, author = {Hong, Yining and Lin, Chunru and Du, Yilun and Chen, Zhenfang and Tenenbaum, Joshua B. and Gan, Chuang}, title = {3D Concept Learning and Reasoning From Multi-View Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9202-9212} }
Soft Augmentation for Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Yang and Yan, Shen and Leal-Taix\'e, Laura and Hays, James and Ramanan, Deva}, title = {Soft Augmentation for Image Classification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16241-16250} }
PREIM3D: 3D Consistent Precise Image Attribute Editing From a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Jianhui and Li, Jianmin and Zhang, Haoji and Liu, Shilong and Wang, Zhengyi and Xiao, Zihao and Zheng, Kaiwen and Zhu, Jun}, title = {PREIM3D: 3D Consistent Precise Image Attribute Editing From a Single Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8549-8558} }
Detecting Backdoors in Pre-Trained Encoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Shiwei and Tao, Guanhong and Cheng, Siyuan and Shen, Guangyu and Xu, Xiangzhe and Liu, Yingqi and Zhang, Kaiyuan and Ma, Shiqing and Zhang, Xiangyu}, title = {Detecting Backdoors in Pre-Trained Encoders}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16352-16362} }
Primitive Generation and Semantic-Related Alignment for Universal Zero-Shot Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_CVPR, author = {He, Shuting and Ding, Henghui and Jiang, Wei}, title = {Primitive Generation and Semantic-Related Alignment for Universal Zero-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11238-11247} }
Long Range Pooling for 3D Large-Scale Scene Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Xiang-Li and Guo, Meng-Hao and Mu, Tai-Jiang and Martin, Ralph R. and Hu, Shi-Min}, title = {Long Range Pooling for 3D Large-Scale Scene Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10300-10311} }
Causally-Aware Intraoperative Imputation for Overall Survival Time Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Xiang and Qian, Xuelin and Liang, Litian and Kong, Lingjie and Dong, Qiaole and Chen, Jiejun and Liu, Dingxia and Yao, Xiuzhong and Fu, Yanwei},
  title     = {Causally-Aware Intraoperative Imputation for Overall Survival Time Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15681--15690}
}
Twin Contrastive Learning With Noisy Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Zhizhong and Zhang, Junping and Shan, Hongming},
  title     = {Twin Contrastive Learning With Noisy Labels},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11661--11670}
}
Asymmetric Feature Fusion for Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Hui and Wang, Min and Zhou, Wengang and Lu, Zhenbo and Li, Houqiang},
  title     = {Asymmetric Feature Fusion for Image Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11082--11092}
}
CREPE: Can Vision-Language Foundation Models Reason Compositionally?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Zixian and Hong, Jerry and Gul, Mustafa Omer and Gandhi, Mona and Gao, Irena and Krishna, Ranjay},
  title     = {{CREPE}: Can Vision-Language Foundation Models Reason Compositionally?},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10910--10921}
}
PyramidFlow: High-Resolution Defect Contrastive Localization Using Pyramid Normalizing Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lei_2023_CVPR,
  author    = {Lei, Jiarui and Hu, Xiaobo and Wang, Yue and Liu, Dong},
  title     = {{PyramidFlow}: High-Resolution Defect Contrastive Localization Using Pyramid Normalizing Flow},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14143--14152}
}
On-the-Fly Category Discovery-
[pdf]
[bibtex]@InProceedings{Du_2023_CVPR,
  author    = {Du, Ruoyi and Chang, Dongliang and Liang, Kongming and Hospedales, Timothy and Song, Yi-Zhe and Ma, Zhanyu},
  title     = {On-the-Fly Category Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11691--11700}
}
MAIR: Multi-View Attention Inverse Rendering With 3D Spatially-Varying Lighting Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2023_CVPR,
  author    = {Choi, JunYong and Lee, SeokYeong and Park, Haesol and Jung, Seung-Won and Kim, Ig-Jae and Cho, Junghyun},
  title     = {{MAIR}: Multi-View Attention Inverse Rendering With {3D} Spatially-Varying Lighting Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8392--8401}
}
DF-Platter: Multi-Face Heterogeneous Deepfake Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Narayan_2023_CVPR,
  author    = {Narayan, Kartik and Agarwal, Harsh and Thakral, Kartik and Mittal, Surbhi and Vatsa, Mayank and Singh, Richa},
  title     = {{DF-Platter}: Multi-Face Heterogeneous Deepfake Dataset},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9739--9748}
}
Shifted Diffusion for Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Yufan and Liu, Bingchen and Zhu, Yizhe and Yang, Xiao and Chen, Changyou and Xu, Jinhui},
  title     = {Shifted Diffusion for Text-to-Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10157--10166}
}
Boosting Detection in Crowd Analysis via Underutilized Output Features-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Shaokai and Yang, Fengyu},
  title     = {Boosting Detection in Crowd Analysis via Underutilized Output Features},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15609--15618}
}
K3DN: Disparity-Aware Kernel Estimation for Dual-Pixel Defocus Deblurring-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Yan and Pan, Liyuan and Liu, Liu and Liu, Miaomiao},
  title     = {{K3DN}: Disparity-Aware Kernel Estimation for Dual-Pixel Defocus Deblurring},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13263--13272}
}
DartBlur: Privacy Preservation With Detection Artifact Suppression-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Baowei and Bai, Bing and Lin, Haozhe and Wang, Yu and Guo, Yuchen and Fang, Lu},
  title     = {{DartBlur}: Privacy Preservation With Detection Artifact Suppression},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16479--16488}
}
LipFormer: High-Fidelity and Generalizable Talking Face Generation With a Pre-Learned Facial Codebook-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Jiayu and Zhao, Kang and Zhang, Shiwei and Zhang, Yingya and Shen, Yujun and Zhao, Deli and Zhou, Jingren},
  title     = {{LipFormer}: High-Fidelity and Generalizable Talking Face Generation With a Pre-Learned Facial Codebook},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13844--13853}
}
Generalizable Local Feature Pre-Training for Deformable Shape Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Attaiki_2023_CVPR,
  author    = {Attaiki, Souhaib and Li, Lei and Ovsjanikov, Maks},
  title     = {Generalizable Local Feature Pre-Training for Deformable Shape Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13650--13661}
}
Progressive Random Convolutions for Single Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2023_CVPR,
  author    = {Choi, Seokeon and Das, Debasmit and Choi, Sungha and Yang, Seunghan and Park, Hyunsin and Yun, Sungrack},
  title     = {Progressive Random Convolutions for Single Domain Generalization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10312--10322}
}
OPE-SR: Orthogonal Position Encoding for Designing a Parameter-Free Upsampling Module in Arbitrary-Scale Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_CVPR,
  author    = {Song, Gaochao and Sun, Qian and Zhang, Luo and Su, Ran and Shi, Jianfeng and He, Ying},
  title     = {{OPE-SR}: Orthogonal Position Encoding for Designing a Parameter-Free Upsampling Module in Arbitrary-Scale Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10009--10020}
}
I2MVFormer: Large Language Model Generated Multi-View Document Supervision for Zero-Shot Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Naeem_2023_CVPR,
  author    = {Naeem, Muhammad Ferjad and Khan, Muhammad Gul Zain Ali and Xian, Yongqin and Afzal, Muhammad Zeshan and Stricker, Didier and Van Gool, Luc and Tombari, Federico},
  title     = {{I2MVFormer}: Large Language Model Generated Multi-View Document Supervision for Zero-Shot Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15169--15179}
}
MixSim: A Hierarchical Framework for Mixed Reality Traffic Simulation-
[pdf]
[supp]
[bibtex]@InProceedings{Suo_2023_CVPR,
  author    = {Suo, Simon and Wong, Kelvin and Xu, Justin and Tu, James and Cui, Alexander and Casas, Sergio and Urtasun, Raquel},
  title     = {{MixSim}: A Hierarchical Framework for Mixed Reality Traffic Simulation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9622--9631}
}
Context-Aware Alignment and Mutual Masking for 3D-Language Pre-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Zhao and Hayat, Munawar and Yang, Yuwei and Guo, Yulan and Lei, Yinjie},
  title     = {Context-Aware Alignment and Mutual Masking for {3D}-Language Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10984--10994}
}
Generalized Decoding for Pixel, Image, and Language-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zou_2023_CVPR,
  author    = {Zou, Xueyan and Dou, Zi-Yi and Yang, Jianwei and Gan, Zhe and Li, Linjie and Li, Chunyuan and Dai, Xiyang and Behl, Harkirat and Wang, Jianfeng and Yuan, Lu and Peng, Nanyun and Wang, Lijuan and Lee, Yong Jae and Gao, Jianfeng},
  title     = {Generalized Decoding for Pixel, Image, and Language},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15116--15127}
}
Towards Unified Scene Text Spotting Based on Sequence Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kil_2023_CVPR,
  author    = {Kil, Taeho and Kim, Seonghyeon and Seo, Sukmin and Kim, Yoonsik and Kim, Daehee},
  title     = {Towards Unified Scene Text Spotting Based on Sequence Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15223--15232}
}
X3KD: Knowledge Distillation Across Modalities, Tasks and Stages for Multi-Camera 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Klingner_2023_CVPR,
  author    = {Klingner, Marvin and Borse, Shubhankar and Kumar, Varun Ravi and Rezaei, Behnaz and Narayanan, Venkatraman and Yogamani, Senthil and Porikli, Fatih},
  title     = {{X3KD}: Knowledge Distillation Across Modalities, Tasks and Stages for Multi-Camera {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13343--13353}
}
Rawgment: Noise-Accounted RAW Augmentation Enables Recognition in a Wide Variety of Environments-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yoshimura_2023_CVPR,
  author    = {Yoshimura, Masakazu and Otsuka, Junji and Irie, Atsushi and Ohashi, Takeshi},
  title     = {{Rawgment}: Noise-Accounted {RAW} Augmentation Enables Recognition in a Wide Variety of Environments},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14007--14017}
}
BITE: Beyond Priors for Improved Three-D Dog Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Ruegg_2023_CVPR,
  author    = {R{\"u}egg, Nadine and Tripathi, Shashank and Schindler, Konrad and Black, Michael J. and Zuffi, Silvia},
  title     = {{BITE}: Beyond Priors for Improved {Three-D} Dog Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8867--8876}
}
Equivalent Transformation and Dual Stream Network Construction for Mobile Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Chao_2023_CVPR,
  author    = {Chao, Jiahao and Zhou, Zhou and Gao, Hongfan and Gong, Jiali and Yang, Zhengfeng and Zeng, Zhenbing and Dehbi, Lydia},
  title     = {Equivalent Transformation and Dual Stream Network Construction for Mobile Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14102--14111}
}
High-Resolution Image Reconstruction With Latent Diffusion Models From Human Brain Activity-
[pdf]
[supp]
[bibtex]@InProceedings{Takagi_2023_CVPR,
  author    = {Takagi, Yu and Nishimoto, Shinji},
  title     = {High-Resolution Image Reconstruction With Latent Diffusion Models From Human Brain Activity},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14453--14463}
}
DARE-GRAM: Unsupervised Domain Adaptation Regression by Aligning Inverse Gram Matrices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nejjar_2023_CVPR,
  author    = {Nejjar, Ismail and Wang, Qin and Fink, Olga},
  title     = {{DARE-GRAM}: Unsupervised Domain Adaptation Regression by Aligning Inverse {Gram} Matrices},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11744--11754}
}
Bidirectional Copy-Paste for Semi-Supervised Medical Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2023_CVPR,
  author    = {Bai, Yunhao and Chen, Duowen and Li, Qingli and Shen, Wei and Wang, Yan},
  title     = {Bidirectional Copy-Paste for Semi-Supervised Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11514--11524}
}
Learning Discriminative Representations for Skeleton Based Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Huanyu and Liu, Qingjie and Wang, Yunhong},
  title     = {Learning Discriminative Representations for Skeleton Based Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10608--10617}
}
Few-Shot Non-Line-of-Sight Imaging With Signal-Surface Collaborative Regularization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xintong and Wang, Jianyu and Xiao, Leping and Fu, Xing and Qiu, Lingyun and Shi, Zuoqiang},
  title     = {Few-Shot Non-Line-of-Sight Imaging With Signal-Surface Collaborative Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13303--13312}
}
Probabilistic Debiasing of Scene Graphs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Biswas_2023_CVPR,
  author    = {Biswas, Bashirul Azam and Ji, Qiang},
  title     = {Probabilistic Debiasing of Scene Graphs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10429--10438}
}
Depth Estimation From Camera Image and mmWave Radar Point Cloud-
[pdf]
[supp]
[bibtex]@InProceedings{Singh_2023_CVPR,
  author    = {Singh, Akash Deep and Ba, Yunhao and Sarker, Ankur and Zhang, Howard and Kadambi, Achuta and Soatto, Stefano and Srivastava, Mani and Wong, Alex},
  title     = {Depth Estimation From Camera Image and {mmWave} Radar Point Cloud},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9275--9285}
}
Learning Event Guided High Dynamic Range Video Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Yixin and Han, Jin and Liang, Jinxiu and Sato, Imari and Shi, Boxin},
  title     = {Learning Event Guided High Dynamic Range Video Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13924--13934}
}
Prototypical Residual Networks for Anomaly Detection and Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Hui and Wu, Zuxuan and Wang, Zheng and Chen, Zhineng and Jiang, Yu-Gang},
  title     = {Prototypical Residual Networks for Anomaly Detection and Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16281--16291}
}
Ultrahigh Resolution Image/Video Matting With Spatio-Temporal Sparsity-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Yanan and Tang, Chi-Keung and Tai, Yu-Wing},
  title     = {Ultrahigh Resolution Image/Video Matting With Spatio-Temporal Sparsity},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14112--14121}
}
Zero-Shot Noise2Noise: Efficient Image Denoising Without Any Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mansour_2023_CVPR,
  author    = {Mansour, Youssef and Heckel, Reinhard},
  title     = {Zero-Shot {Noise2Noise}: Efficient Image Denoising Without Any Data},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14018--14027}
}
FIANCEE: Faster Inference of Adversarial Networks via Conditional Early Exits-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Karpikova_2023_CVPR,
  author    = {Karpikova, Polina and Radionova, Ekaterina and Yaschenko, Anastasia and Spiridonov, Andrei and Kostyushko, Leonid and Fabbricatore, Riccardo and Ivakhnenko, Aleksei},
  title     = {{FIANCEE}: Faster Inference of Adversarial Networks via Conditional Early Exits},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12032--12043}
}
Simultaneously Short- and Long-Term Temporal Modeling for Semi-Supervised Video Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Lao_2023_CVPR,
  author    = {Lao, Jiangwei and Hong, Weixiang and Guo, Xin and Zhang, Yingying and Wang, Jian and Chen, Jingdong and Chu, Wei},
  title     = {Simultaneously Short- and Long-Term Temporal Modeling for Semi-Supervised Video Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14763--14772}
}
Learning To Generate Text-Grounded Mask for Open-World Semantic Segmentation From Only Image-Text Pairs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cha_2023_CVPR,
  author    = {Cha, Junbum and Mun, Jonghwan and Roh, Byungseok},
  title     = {Learning To Generate Text-Grounded Mask for Open-World Semantic Segmentation From Only Image-Text Pairs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11165--11174}
}
Shakes on a Plane: Unsupervised Depth Estimation From Unstabilized Photography-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chugunov_2023_CVPR,
  author    = {Chugunov, Ilya and Zhang, Yuxuan and Heide, Felix},
  title     = {Shakes on a Plane: Unsupervised Depth Estimation From Unstabilized Photography},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13240--13251}
}
Learning Correspondence Uncertainty via Differentiable Nonlinear Least Squares-
[pdf]
[supp]
[bibtex]@InProceedings{Muhle_2023_CVPR,
  author    = {Muhle, Dominik and Koestler, Lukas and Jatavallabhula, Krishna Murthy and Cremers, Daniel},
  title     = {Learning Correspondence Uncertainty via Differentiable Nonlinear Least Squares},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13102--13112}
}
Towards Effective Visual Representations for Partial-Label Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xia_2023_CVPR,
  author    = {Xia, Shiyu and Lv, Jiaqi and Xu, Ning and Niu, Gang and Geng, Xin},
  title     = {Towards Effective Visual Representations for Partial-Label Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15589--15598}
}
MaskCLIP: Masked Self-Distillation Advances Contrastive Language-Image Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_CVPR,
  author    = {Dong, Xiaoyi and Bao, Jianmin and Zheng, Yinglin and Zhang, Ting and Chen, Dongdong and Yang, Hao and Zeng, Ming and Zhang, Weiming and Yuan, Lu and Chen, Dong and Wen, Fang and Yu, Nenghai},
  title     = {{MaskCLIP}: Masked Self-Distillation Advances Contrastive Language-Image Pretraining},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10995--11005}
}
Inferring and Leveraging Parts From Object Shape for Improving Semantic Image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Yuxiang and Ji, Zhilong and Wu, Xiaohe and Bai, Jinfeng and Zhang, Lei and Zuo, Wangmeng},
  title     = {Inferring and Leveraging Parts From Object Shape for Improving Semantic Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11248--11258}
}
MIME: Human-Aware 3D Scene Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yi_2023_CVPR,
  author    = {Yi, Hongwei and Huang, Chun-Hao P. and Tripathi, Shashank and Hering, Lea and Thies, Justus and Black, Michael J.},
  title     = {{MIME}: Human-Aware {3D} Scene Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12965--12976}
}
NerVE: Neural Volumetric Edges for Parametric Curve Extraction From Point Cloud-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Xiangyu and Du, Dong and Chen, Weikai and Zhao, Zhiyou and Nie, Yinyu and Han, Xiaoguang},
  title     = {{NerVE}: Neural Volumetric Edges for Parametric Curve Extraction From Point Cloud},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13601--13610}
}
ShapeClipper: Scalable 3D Shape Learning From Single-View Images via Geometric and CLIP-Based Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Zixuan and Jampani, Varun and Thai, Anh and Li, Yuanzhen and Stojanov, Stefan and Rehg, James M.},
  title     = {{ShapeClipper}: Scalable {3D} Shape Learning From Single-View Images via Geometric and {CLIP}-Based Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12912--12922}
}
Backdoor Attacks Against Deep Image Compression via Adaptive Frequency Trigger-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Yi and Wang, Yufei and Yang, Wenhan and Lu, Shijian and Tan, Yap-Peng and Kot, Alex C.},
  title     = {Backdoor Attacks Against Deep Image Compression via Adaptive Frequency Trigger},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12250--12259}
}
A New Path: Scaling Vision-and-Language Navigation With Synthetic Instructions and Imitation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kamath_2023_CVPR,
  author    = {Kamath, Aishwarya and Anderson, Peter and Wang, Su and Koh, Jing Yu and Ku, Alexander and Waters, Austin and Yang, Yinfei and Baldridge, Jason and Parekh, Zarana},
  title     = {A New Path: Scaling Vision-and-Language Navigation With Synthetic Instructions and Imitation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10813--10823}
}
Layout-Based Causal Inference for Object Navigation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Sixian and Song, Xinhang and Li, Weijie and Bai, Yubing and Yu, Xinyao and Jiang, Shuqiang},
  title     = {Layout-Based Causal Inference for Object Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10792--10802}
}
Pose-Disentangled Contrastive Learning for Self-Supervised Facial Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Yuanyuan and Wang, Wenbin and Zhan, Yibing and Feng, Shaoze and Liu, Kejun and Chen, Zhe},
  title     = {Pose-Disentangled Contrastive Learning for Self-Supervised Facial Representation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9717--9728}
}
Inverse Rendering of Translucent Objects Using Physical and Neural Renderers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Chenhao and Ngo, Trung Thanh and Nagahara, Hajime},
  title     = {Inverse Rendering of Translucent Objects Using Physical and Neural Renderers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {12510--12520}
}
Towards Building Self-Aware Object Detectors via Reliable Uncertainty Quantification and Calibration-
[pdf]
[supp]
[bibtex]@InProceedings{Oksuz_2023_CVPR,
  author    = {Oksuz, Kemal and Joy, Tom and Dokania, Puneet K.},
  title     = {Towards Building Self-Aware Object Detectors via Reliable Uncertainty Quantification and Calibration},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {9263--9274}
}
Source-Free Video Domain Adaptation With Spatial-Temporal-Historical Consistency Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Kai and Patel, Deep and Kruus, Erik and Min, Martin Renqiang},
  title     = {Source-Free Video Domain Adaptation With Spatial-Temporal-Historical Consistency Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14643--14652}
}
Fusing Pre-Trained Language Models With Multimodal Prompts Through Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Youngjae and Chung, Jiwan and Yun, Heeseung and Hessel, Jack and Park, Jae Sung and Lu, Ximing and Zellers, Rowan and Ammanabrolu, Prithviraj and Le Bras, Ronan and Kim, Gunhee and Choi, Yejin},
  title     = {Fusing Pre-Trained Language Models With Multimodal Prompts Through Reinforcement Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10845--10856}
}
Dense Network Expansion for Class Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Zhiyuan and Li, Yunsheng and Lyu, Jiancheng and Gao, Dashan and Vasconcelos, Nuno},
  title     = {Dense Network Expansion for Class Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11858--11867}
}
Regularize Implicit Neural Representation by Itself-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Zhemin and Wang, Hongxia and Meng, Deyu},
  title     = {Regularize Implicit Neural Representation by Itself},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {10280--10288}
}
Ambiguous Medical Image Segmentation Using Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rahman_2023_CVPR,
  author    = {Rahman, Aimon and Valanarasu, Jeya Maria Jose and Hacihaliloglu, Ilker and Patel, Vishal M.},
  title     = {Ambiguous Medical Image Segmentation Using Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11536--11546}
}
DANI-Net: Uncalibrated Photometric Stereo by Differentiable Shadow Handling, Anisotropic Reflectance Modeling, and Neural Inverse Rendering-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Zongrui and Zheng, Qian and Shi, Boxin and Pan, Gang and Jiang, Xudong},
  title     = {{DANI-Net}: Uncalibrated Photometric Stereo by Differentiable Shadow Handling, Anisotropic Reflectance Modeling, and Neural Inverse Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {8381--8391}
}
Towards Better Stability and Adaptability: Improve Online Self-Training for Model Adaptation in Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Dong and Wang, Shuang and Zang, Qi and Quan, Dou and Ye, Xiutiao and Jiao, Licheng},
  title     = {Towards Better Stability and Adaptability: Improve Online Self-Training for Model Adaptation in Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {11733--11743}
}
Ranking Regularization for Critical Rare Classes: Minimizing False Positives at a High True Positive Rate-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mohammadi_2023_CVPR,
  author    = {Mohammadi, Kiarash and Zhao, He and Zhai, Mengyao and Tung, Frederick},
  title     = {Ranking Regularization for Critical Rare Classes: Minimizing False Positives at a High True Positive Rate},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {15783--15792}
}
Joint HDR Denoising and Fusion: A Real-World Mobile HDR Image Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Shuaizheng and Zhang, Xindong and Sun, Lingchen and Liang, Zhetong and Zeng, Hui and Zhang, Lei},
  title     = {Joint {HDR} Denoising and Fusion: A Real-World Mobile {HDR} Image Dataset},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13966--13975}
}
MIST: Multi-Modal Iterative Spatial-Temporal Transformer for Long-Form Video Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_CVPR,
  author    = {Gao, Difei and Zhou, Luowei and Ji, Lei and Zhu, Linchao and Yang, Yi and Shou, Mike Zheng},
  title     = {{MIST}: Multi-Modal Iterative Spatial-Temporal Transformer for Long-Form Video Question Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {14773--14783}
}
Privacy-Preserving Representations Are Not Enough: Recovering Scene Content From Camera Poses-
[pdf]
[supp]
[bibtex]@InProceedings{Chelani_2023_CVPR,
  author    = {Chelani, Kunal and Sattler, Torsten and Kahl, Fredrik and Kukelova, Zuzana},
  title     = {Privacy-Preserving Representations Are Not Enough: Recovering Scene Content From Camera Poses},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {13132--13141}
}
A New Dataset Based on Images Taken by Blind People for Testing the Robustness of Image Classification Models Trained for ImageNet Categories-
[pdf]
[supp]
[bibtex]@InProceedings{Bafghi_2023_CVPR,
  author    = {Bafghi, Reza Akbarian and Gurari, Danna},
  title     = {A New Dataset Based on Images Taken by Blind People for Testing the Robustness of Image Classification Models Trained for {ImageNet} Categories},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16261--16270}
}
Detecting Backdoors During the Inference Stage Based on Corruption Robustness Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xiaogeng and Li, Minghui and Wang, Haoyu and Hu, Shengshan and Ye, Dengpan and Jin, Hai and Wu, Libing and Xiao, Chaowei},
  title     = {Detecting Backdoors During the Inference Stage Based on Corruption Robustness Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16363--16372}
}
Black-Box Sparse Adversarial Attack via Multi-Objective Optimisation-
[pdf]
[supp]
[bibtex]@InProceedings{Williams_2023_CVPR,
  author    = {Williams, Phoenix Neale and Li, Ke},
  title     = {Black-Box Sparse Adversarial Attack via Multi-Objective Optimisation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12291--12301}
}
Renderable Neural Radiance Map for Visual Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kwon_2023_CVPR,
  author    = {Kwon, Obin and Park, Jeongho and Oh, Songhwai},
  title     = {Renderable Neural Radiance Map for Visual Navigation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9099--9108}
}
Learning Orthogonal Prototypes for Generalized Few-Shot Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Sun-Ao and Zhang, Yiheng and Qiu, Zhaofan and Xie, Hongtao and Zhang, Yongdong and Yao, Ting},
  title     = {Learning Orthogonal Prototypes for Generalized Few-Shot Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11319--11328}
}
Are Deep Neural Networks SMARTer Than Second Graders?-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cherian_2023_CVPR,
  author    = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin A. and Tenenbaum, Joshua B.},
  title     = {Are Deep Neural Networks {SMARTer} Than Second Graders?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10834--10844}
}
Bi-Level Meta-Learning for Few-Shot Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Qin_2023_CVPR,
  author    = {Qin, Xiaorong and Song, Xinhang and Jiang, Shuqiang},
  title     = {Bi-Level Meta-Learning for Few-Shot Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15900--15910}
}
Multi-Modal Learning With Missing Modality via Shared-Specific Feature Modelling-
[pdf]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Hu and Chen, Yuanhong and Ma, Congbo and Avery, Jodie and Hull, Louise and Carneiro, Gustavo},
  title     = {Multi-Modal Learning With Missing Modality via Shared-Specific Feature Modelling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15878--15887}
}
DisWOT: Student Architecture Search for Distillation WithOut Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_CVPR,
  author    = {Dong, Peijie and Li, Lujun and Wei, Zimian},
  title     = {{DisWOT}: Student Architecture Search for Distillation {WithOut} Training},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11898--11908}
}
Logical Consistency and Greater Descriptive Power for Facial Hair Attribute Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Haiyu and Bezold, Grace and Bhatta, Aman and Bowyer, Kevin W.},
  title     = {Logical Consistency and Greater Descriptive Power for Facial Hair Attribute Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8588--8597}
}
Spatio-Temporal Pixel-Level Contrastive Learning-Based Source-Free Domain Adaptation for Video Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lo_2023_CVPR,
  author    = {Lo, Shao-Yuan and Oza, Poojan and Chennupati, Sumanth and Galindo, Alejandro and Patel, Vishal M.},
  title     = {Spatio-Temporal Pixel-Level Contrastive Learning-Based Source-Free Domain Adaptation for Video Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10534--10543}
}
InternImage: Exploring Large-Scale Vision Foundation Models With Deformable Convolutions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Wenhai and Dai, Jifeng and Chen, Zhe and Huang, Zhenhang and Li, Zhiqi and Zhu, Xizhou and Hu, Xiaowei and Lu, Tong and Lu, Lewei and Li, Hongsheng and Wang, Xiaogang and Qiao, Yu},
  title     = {{InternImage}: Exploring Large-Scale Vision Foundation Models With Deformable Convolutions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14408--14419}
}
DAA: A Delta Age AdaIN Operation for Age Estimation via Binary Code Transformer-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Ping and Zhang, Xingpeng and Li, Ye and Tao, Ju and Xiao, Bin and Wang, Bing and Jiang, Zongjie},
  title     = {{DAA}: A Delta Age {AdaIN} Operation for Age Estimation via Binary Code Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15836--15845}
}
Mind the Label Shift of Augmentation-Based Graph OOD Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Junchi and Liang, Jian and He, Ran},
  title     = {Mind the Label Shift of Augmentation-Based Graph {OOD} Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11620--11630}
}
Unsupervised Intrinsic Image Decomposition With LiDAR Intensity-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sato_2023_CVPR,
  author    = {Sato, Shogo and Yao, Yasuhiro and Yoshida, Taiga and Kaneko, Takuhiro and Ando, Shingo and Shimamura, Jun},
  title     = {Unsupervised Intrinsic Image Decomposition With {LiDAR} Intensity},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13466--13475}
}
PET-NeuS: Positional Encoding Tri-Planes for Neural Surfaces-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yiqun and Skorokhodov, Ivan and Wonka, Peter},
  title     = {{PET-NeuS}: Positional Encoding Tri-Planes for Neural Surfaces},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12598--12607}
}
ZegCLIP: Towards Adapting CLIP for Zero-Shot Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Ziqin and Lei, Yinjie and Zhang, Bowen and Liu, Lingqiao and Liu, Yifan},
  title     = {{ZegCLIP}: Towards Adapting {CLIP} for Zero-Shot Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11175--11185}
}
AdaptiveMix: Improving GAN Training via Feature Space Shrinkage-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Haozhe and Zhang, Wentian and Li, Bing and Wu, Haoqian and He, Nanjun and Huang, Yawen and Li, Yuexiang and Ghanem, Bernard and Zheng, Yefeng},
  title     = {{AdaptiveMix}: Improving {GAN} Training via Feature Space Shrinkage},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16219--16229}
}
Specialist Diffusion: Plug-and-Play Sample-Efficient Fine-Tuning of Text-to-Image Diffusion Models To Learn Any Unseen Style-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Haoming and Tunanyan, Hazarapet and Wang, Kai and Navasardyan, Shant and Wang, Zhangyang and Shi, Humphrey},
  title     = {Specialist Diffusion: Plug-and-Play Sample-Efficient Fine-Tuning of Text-to-Image Diffusion Models To Learn Any Unseen Style},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14267--14276}
}
HyperCUT: Video Sequence From a Single Blurry Image Using Unsupervised Ordering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pham_2023_CVPR,
  author    = {Pham, Bang-Dang and Tran, Phong and Tran, Anh and Pham, Cuong and Nguyen, Rang and Hoai, Minh},
  title     = {{HyperCUT}: Video Sequence From a Single Blurry Image Using Unsupervised Ordering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9843--9852}
}
Can't Steal? Cont-Steal! Contrastive Stealing Attacks Against Image Encoders-
[pdf]
[supp]
[bibtex]@InProceedings{Sha_2023_CVPR,
  author    = {Sha, Zeyang and He, Xinlei and Yu, Ning and Backes, Michael and Zhang, Yang},
  title     = {Can't Steal? {Cont-Steal}! Contrastive Stealing Attacks Against Image Encoders},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16373--16383}
}
Nerflets: Local Radiance Fields for Efficient Structure-Aware 3D Scene Representation From 2D Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Xiaoshuai and Kundu, Abhijit and Funkhouser, Thomas and Guibas, Leonidas and Su, Hao and Genova, Kyle},
  title     = {Nerflets: Local Radiance Fields for Efficient Structure-Aware {3D} Scene Representation From {2D} Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8274--8284}
}
CLIP Is Also an Efficient Segmenter: A Text-Driven Approach for Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Yuqi and Chen, Minghao and Wang, Wenxiao and Wu, Boxi and Li, Ke and Lin, Binbin and Liu, Haifeng and He, Xiaofei},
  title     = {{CLIP} Is Also an Efficient Segmenter: A Text-Driven Approach for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15305--15314}
}
Spatially Adaptive Self-Supervised Learning for Real-World Image Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Junyi and Zhang, Zhilu and Liu, Xiaoyu and Feng, Chaoyu and Wang, Xiaotao and Lei, Lei and Zuo, Wangmeng},
  title     = {Spatially Adaptive Self-Supervised Learning for Real-World Image Denoising},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9914--9924}
}
From Images to Textual Prompts: Zero-Shot Visual Question Answering With Frozen Large Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Jiaxian and Li, Junnan and Li, Dongxu and Tiong, Anthony Meng Huat and Li, Boyang and Tao, Dacheng and Hoi, Steven},
  title     = {From Images to Textual Prompts: Zero-Shot Visual Question Answering With Frozen Large Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10867--10877}
}
Observation-Centric SORT: Rethinking SORT for Robust Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_CVPR,
  author    = {Cao, Jinkun and Pang, Jiangmiao and Weng, Xinshuo and Khirodkar, Rawal and Kitani, Kris},
  title     = {Observation-Centric {SORT}: Rethinking {SORT} for Robust Multi-Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9686--9696}
}
Transformer-Based Learned Optimization-
[pdf]
[supp]
[bibtex]@InProceedings{Gartner_2023_CVPR,
  author    = {G{\"a}rtner, Erik and Metz, Luke and Andriluka, Mykhaylo and Freeman, C. Daniel and Sminchisescu, Cristian},
  title     = {Transformer-Based Learned Optimization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11970--11979}
}
Quantum-Inspired Spectral-Spatial Pyramid Network for Hyperspectral Image Classification-
[pdf]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Jie and Zhang, Yongshan and Zhou, Yicong},
  title     = {Quantum-Inspired Spectral-Spatial Pyramid Network for Hyperspectral Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9925--9934}
}
Towards Benchmarking and Assessing Visual Naturalness of Physical World Adversarial Attacks-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Simin and Zhang, Shuning and Chen, Gujun and Wang, Dong and Feng, Pu and Wang, Jiakai and Liu, Aishan and Yi, Xin and Liu, Xianglong},
  title     = {Towards Benchmarking and Assessing Visual Naturalness of Physical World Adversarial Attacks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12324--12333}
}
Visual Prompt Multi-Modal Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Jiawen and Lai, Simiao and Chen, Xin and Wang, Dong and Lu, Huchuan},
  title     = {Visual Prompt Multi-Modal Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9516--9526}
}
Dealing With Cross-Task Class Discrimination in Online Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Yiduo and Liu, Bing and Zhao, Dongyan},
  title     = {Dealing With Cross-Task Class Discrimination in Online Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11878--11887}
}
GIVL: Improving Geographical Inclusivity of Vision-Language Models With Pre-Training Methods-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yin_2023_CVPR,
  author    = {Yin, Da and Gao, Feng and Thattai, Govind and Johnston, Michael and Chang, Kai-Wei},
  title     = {{GIVL}: Improving Geographical Inclusivity of Vision-Language Models With Pre-Training Methods},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10951--10961}
}
Bi3D: Bi-Domain Active Learning for Cross-Domain 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_CVPR,
  author    = {Yuan, Jiakang and Zhang, Bo and Yan, Xiangchao and Chen, Tao and Shi, Botian and Li, Yikang and Qiao, Yu},
  title     = {{Bi3D}: Bi-Domain Active Learning for Cross-Domain {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15599--15608}
}
Towards Fast Adaptation of Pretrained Contrastive Models for Multi-Channel Video-Language Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Xudong and Tiwari, Simran and Huang, Shiyuan and Li, Manling and Shou, Mike Zheng and Ji, Heng and Chang, Shih-Fu},
  title     = {Towards Fast Adaptation of Pretrained Contrastive Models for Multi-Channel Video-Language Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14846--14855}
}
Crowd3D: Towards Hundreds of People Reconstruction From a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wen_2023_CVPR,
  author    = {Wen, Hao and Huang, Jing and Cui, Huili and Lin, Haozhe and Lai, Yu-Kun and Fang, Lu and Li, Kun},
  title     = {{Crowd3D}: Towards Hundreds of People Reconstruction From a Single Image},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8937--8946}
}
Highly Confident Local Structure Based Consensus Graph Learning for Incomplete Multi-View Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{Wen_2023_CVPR,
  author    = {Wen, Jie and Liu, Chengliang and Xu, Gehui and Wu, Zhihao and Huang, Chao and Fei, Lunke and Xu, Yong},
  title     = {Highly Confident Local Structure Based Consensus Graph Learning for Incomplete Multi-View Clustering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15712--15721}
}
Humans As Light Bulbs: 3D Human Reconstruction From Thermal Reflection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Ruoshi and Vondrick, Carl},
  title     = {Humans As Light Bulbs: {3D} Human Reconstruction From Thermal Reflection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12531--12542}
}
CafeBoost: Causal Feature Boost To Eliminate Task-Induced Bias for Class Incremental Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Qiu_2023_CVPR,
  author    = {Qiu, Benliu and Li, Hongliang and Wen, Haitao and Qiu, Heqian and Wang, Lanxiao and Meng, Fanman and Wu, Qingbo and Pan, Lili},
  title     = {{CafeBoost}: Causal Feature Boost To Eliminate Task-Induced Bias for Class Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16016--16025}
}
A-La-Carte Prompt Tuning (APT): Combining Distinct Data via Composable Prompting-
[pdf]
[supp]
[bibtex]@InProceedings{Bowman_2023_CVPR,
  author    = {Bowman, Benjamin and Achille, Alessandro and Zancato, Luca and Trager, Matthew and Perera, Pramuditha and Paolini, Giovanni and Soatto, Stefano},
  title     = {A-La-Carte Prompt Tuning ({APT}): Combining Distinct Data via Composable Prompting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14984--14993}
}
ViLEM: Visual-Language Error Modeling for Image-Text Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yuxin and Ma, Zongyang and Zhang, Ziqi and Qi, Zhongang and Yuan, Chunfeng and Shan, Ying and Li, Bing and Hu, Weiming and Qie, Xiaohu and Wu, Jianping},
  title     = {{ViLEM}: Visual-Language Error Modeling for Image-Text Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11018--11027}
}
Egocentric Auditory Attention Localization in Conversations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ryan_2023_CVPR,
  author    = {Ryan, Fiona and Jiang, Hao and Shukla, Abhinav and Rehg, James M. and Ithapu, Vamsi Krishna},
  title     = {Egocentric Auditory Attention Localization in Conversations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14663--14674}
}
Open-World Multi-Task Control Through Goal-Aware Representation Learning and Adaptive Horizon Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cai_2023_CVPR,
  author    = {Cai, Shaofei and Wang, Zihao and Ma, Xiaojian and Liu, Anji and Liang, Yitao},
  title     = {Open-World Multi-Task Control Through Goal-Aware Representation Learning and Adaptive Horizon Prediction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13734--13744}
}
MoDi: Unconditional Motion Synthesis From Diverse Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Raab_2023_CVPR,
  author    = {Raab, Sigal and Leibovitch, Inbal and Li, Peizhuo and Aberman, Kfir and Sorkine-Hornung, Olga and Cohen-Or, Daniel},
  title     = {{MoDi}: Unconditional Motion Synthesis From Diverse Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13873--13883}
}
Visual Localization Using Imperfect 3D Models From the Internet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Panek_2023_CVPR,
  author    = {Panek, Vojtech and Kukelova, Zuzana and Sattler, Torsten},
  title     = {Visual Localization Using Imperfect {3D} Models From the Internet},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13175--13186}
}
PVO: Panoptic Visual Odometry-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_CVPR,
  author    = {Ye, Weicai and Lan, Xinyue and Chen, Shuo and Ming, Yuhang and Yu, Xingyuan and Bao, Hujun and Cui, Zhaopeng and Zhang, Guofeng},
  title     = {{PVO}: Panoptic Visual Odometry},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9579--9589}
}
Generative Diffusion Prior for Unified Image Restoration and Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fei_2023_CVPR,
  author    = {Fei, Ben and Lyu, Zhaoyang and Pan, Liang and Zhang, Junzhe and Yang, Weidong and Luo, Tianyue and Zhang, Bo and Dai, Bo},
  title     = {Generative Diffusion Prior for Unified Image Restoration and Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9935--9946}
}
Real-Time Controllable Denoising for Image and Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zhaoyang and Jiang, Yitong and Shao, Wenqi and Wang, Xiaogang and Luo, Ping and Lin, Kaimo and Gu, Jinwei},
  title     = {Real-Time Controllable Denoising for Image and Video},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14028--14038}
}
ISBNet: A 3D Point Cloud Instance Segmentation Network With Instance-Aware Sampling and Box-Aware Dynamic Convolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ngo_2023_CVPR,
  author    = {Ngo, Tuan Duc and Hua, Binh-Son and Nguyen, Khoi},
  title     = {{ISBNet}: A {3D} Point Cloud Instance Segmentation Network With Instance-Aware Sampling and Box-Aware Dynamic Convolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13550--13559}
}
IterativePFN: True Iterative Point Cloud Filtering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{de_Silva_Edirimuni_2023_CVPR,
  author    = {de Silva Edirimuni, Dasith and Lu, Xuequan and Shao, Zhiwen and Li, Gang and Robles-Kelly, Antonio and He, Ying},
  title     = {{IterativePFN}: True Iterative Point Cloud Filtering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13530--13539}
}
CLIP-S4: Language-Guided Self-Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_CVPR,
  author    = {He, Wenbin and Jamonnak, Suphanut and Gou, Liang and Ren, Liu},
  title     = {{CLIP-S4}: Language-Guided Self-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11207--11216}
}
Deep Incomplete Multi-View Clustering With Cross-View Partial Sample and Prototype Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Jiaqi and Wang, Siwei and Dong, Zhibin and Liu, Xinwang and Zhu, En},
  title     = {Deep Incomplete Multi-View Clustering With Cross-View Partial Sample and Prototype Alignment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {11600--11609}
}
Revisiting Multimodal Representation in Contrastive Learning: From Patch and Token Embeddings to Finite Discrete Tokens-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yuxiao and Yuan, Jianbo and Tian, Yu and Geng, Shijie and Li, Xinyu and Zhou, Ding and Metaxas, Dimitris N. and Yang, Hongxia},
  title     = {Revisiting Multimodal Representation in Contrastive Learning: From Patch and Token Embeddings to Finite Discrete Tokens},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15095--15104}
}
Heterogeneous Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Madaan_2023_CVPR,
  author    = {Madaan, Divyam and Yin, Hongxu and Byeon, Wonmin and Kautz, Jan and Molchanov, Pavlo},
  title     = {Heterogeneous Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15985--15995}
}
Object Pose Estimation With Statistical Guarantees: Conformal Keypoint Detection and Geometric Uncertainty Propagation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Heng and Pavone, Marco},
  title     = {Object Pose Estimation With Statistical Guarantees: Conformal Keypoint Detection and Geometric Uncertainty Propagation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8947--8958}
}
3D-Aware Multi-Class Image-to-Image Translation With NeRFs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Senmao and van de Weijer, Joost and Wang, Yaxing and Khan, Fahad Shahbaz and Liu, Meiqin and Yang, Jian},
  title     = {{3D}-Aware Multi-Class Image-to-Image Translation With {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12652--12662}
}
Unsupervised Visible-Infrared Person Re-Identification via Progressive Graph Matching and Alternate Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Zesen and Ye, Mang},
  title     = {Unsupervised Visible-Infrared Person Re-Identification via Progressive Graph Matching and Alternate Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9548--9558}
}
Hierarchical B-Frame Video Coding Using Two-Layer CANF Without Motion Coding-
[pdf]
[supp]
[bibtex]@InProceedings{Alexandre_2023_CVPR,
  author    = {Alexandre, David and Hang, Hsueh-Ming and Peng, Wen-Hsiao},
  title     = {Hierarchical {B}-Frame Video Coding Using Two-Layer {CANF} Without Motion Coding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10249--10258}
}
Seeing Through the Glass: Neural 3D Reconstruction of Object Inside a Transparent Container-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tong_2023_CVPR,
  author    = {Tong, Jinguang and Muthu, Sundaram and Maken, Fahira Afzal and Nguyen, Chuong and Li, Hongdong},
  title     = {Seeing Through the Glass: Neural {3D} Reconstruction of Object Inside a Transparent Container},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {12555--12564}
}
Neural Voting Field for Camera-Space 3D Hand Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Lin and Lin, Chung-Ching and Lin, Kevin and Liang, Lin and Wang, Lijuan and Yuan, Junsong and Liu, Zicheng},
  title     = {Neural Voting Field for Camera-Space {3D} Hand Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8969--8978}
}
Visual Recognition-Driven Image Restoration for Multiple Degradation With Intrinsic Semantics Recovery-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Zizheng and Huang, Jie and Chang, Jiahao and Zhou, Man and Yu, Hu and Zhang, Jinghao and Zhao, Feng},
  title     = {Visual Recognition-Driven Image Restoration for Multiple Degradation With Intrinsic Semantics Recovery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {14059--14070}
}
Knowledge Combination To Learn Rotated Detection Without Rotated Annotation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Tianyu and Ferenczi, Bryce and Purkait, Pulak and Drummond, Tom and Rezatofighi, Hamid and van den Hengel, Anton},
  title     = {Knowledge Combination To Learn Rotated Detection Without Rotated Annotation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {15518--15527}
}
Pointersect: Neural Rendering With Cloud-Ray Intersection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chang_2023_CVPR,
  author    = {Chang, Jen-Hao Rick and Chen, Wei-Yu and Ranjan, Anurag and Yi, Kwang Moo and Tuzel, Oncel},
  title     = {Pointersect: Neural Rendering With Cloud-Ray Intersection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8359--8369}
}
Beyond Attentive Tokens: Incorporating Token Importance and Diversity for Efficient Vision Transformers-
[pdf]
[arXiv]
[bibtex]@InProceedings{Long_2023_CVPR,
  author    = {Long, Sifan and Zhao, Zhen and Pi, Jimin and Wang, Shengsheng and Wang, Jingdong},
  title     = {Beyond Attentive Tokens: Incorporating Token Importance and Diversity for Efficient Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {10334--10343}
}
STDLens: Model Hijacking-Resilient Federated Learning for Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chow_2023_CVPR,
  author    = {Chow, Ka-Ho and Liu, Ling and Wei, Wenqi and Ilhan, Fatih and Wu, Yanzhao},
  title     = {{STDLens}: Model Hijacking-Resilient Federated Learning for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16343--16351}
}
MagicPony: Learning Articulated 3D Animals in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Shangzhe and Li, Ruining and Jakab, Tomas and Rupprecht, Christian and Vedaldi, Andrea},
  title     = {{MagicPony}: Learning Articulated {3D} Animals in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {8792--8802}
}
Affordances From Human Videos as a Versatile Representation for Robotics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bahl_2023_CVPR,
  author    = {Bahl, Shikhar and Mendonca, Russell and Chen, Lili and Jain, Unnat and Pathak, Deepak},
  title     = {Affordances From Human Videos as a Versatile Representation for Robotics},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13778--13790}
}
AMT: All-Pairs Multi-Field Transforms for Efficient Frame Interpolation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR,
  author    = {Li, Zhen and Zhu, Zuo-Liang and Han, Ling-Hao and Hou, Qibin and Guo, Chun-Le and Cheng, Ming-Ming},
  title     = {{AMT}: All-Pairs Multi-Field Transforms for Efficient Frame Interpolation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {9801--9810}
}
Toward RAW Object Detection: A New Benchmark and a New Model-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Ruikang and Chen, Chang and Peng, Jingyang and Li, Cheng and Huang, Yibin and Song, Fenglong and Yan, Youliang and Xiong, Zhiwei},
  title     = {Toward {RAW} Object Detection: A New Benchmark and a New Model},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {13384--13393}
}
Music-Driven Group Choreography-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_2023_CVPR, author = {Le, Nhat and Pham, Thang and Do, Tuong and Tjiputra, Erman and Tran, Quang D. and Nguyen, Anh}, title = {Music-Driven Group Choreography}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8673-8682} }
Cascade Evidential Learning for Open-World Weakly-Supervised Temporal Action Localization-
[pdf]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Mengyuan and Gao, Junyu and Xu, Changsheng}, title = {Cascade Evidential Learning for Open-World Weakly-Supervised Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14741-14750} }
STAR Loss: Reducing Semantic Ambiguity in Facial Landmark Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Zhenglin and Li, Huaxia and Liu, Hong and Wang, Nanyang and Yu, Gang and Ji, Rongrong}, title = {STAR Loss: Reducing Semantic Ambiguity in Facial Landmark Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15475-15484} }
Seeing What You Said: Talking Face Generation Guided by a Lip Reading Expert-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Jiadong and Qian, Xinyuan and Zhang, Malu and Tan, Robby T. and Li, Haizhou}, title = {Seeing What You Said: Talking Face Generation Guided by a Lip Reading Expert}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14653-14662} }
SimpSON: Simplifying Photo Cleanup With Single-Click Distracting Object Segmentation Network-
[pdf]
[supp]
[bibtex]@InProceedings{Huynh_2023_CVPR, author = {Huynh, Chuong and Zhou, Yuqian and Lin, Zhe and Barnes, Connelly and Shechtman, Eli and Amirghodsi, Sohrab and Shrivastava, Abhinav}, title = {SimpSON: Simplifying Photo Cleanup With Single-Click Distracting Object Segmentation Network}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14518-14527} }
Learning Neural Duplex Radiance Fields for Real-Time View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Wan_2023_CVPR, author = {Wan, Ziyu and Richardt, Christian and Bo\v{z}i\v{c}, Alja\v{z} and Li, Chao and Rengarajan, Vijay and Nam, Seonghyeon and Xiang, Xiaoyu and Li, Tuotuo and Zhu, Bo and Ranjan, Rakesh and Liao, Jing}, title = {Learning Neural Duplex Radiance Fields for Real-Time View Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8307-8316} }
Towards Modality-Agnostic Person Re-Identification With Descriptive Query-
[pdf]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Cuiqun and Ye, Mang and Jiang, Ding}, title = {Towards Modality-Agnostic Person Re-Identification With Descriptive Query}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15128-15137} }
An In-Depth Exploration of Person Re-Identification and Gait Recognition in Cloth-Changing Conditions-
[pdf]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Weijia and Hou, Saihui and Zhang, Chunjie and Cao, Chunshui and Liu, Xu and Huang, Yongzhen and Zhao, Yao}, title = {An In-Depth Exploration of Person Re-Identification and Gait Recognition in Cloth-Changing Conditions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13824-13833} }
Visual Exemplar Driven Task-Prompting for Unified Perception in Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_CVPR, author = {Liang, Xiwen and Niu, Minzhe and Han, Jianhua and Xu, Hang and Xu, Chunjing and Liang, Xiaodan}, title = {Visual Exemplar Driven Task-Prompting for Unified Perception in Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9611-9621} }
Toward Verifiable and Reproducible Human Evaluation for Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Otani_2023_CVPR, author = {Otani, Mayu and Togashi, Riku and Sawai, Yu and Ishigami, Ryosuke and Nakashima, Yuta and Rahtu, Esa and Heikkil\"a, Janne and Satoh, Shin{\textquoteright}ichi}, title = {Toward Verifiable and Reproducible Human Evaluation for Text-to-Image Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14277-14286} }
Learning a 3D Morphable Face Reflectance Model From Low-Cost Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_CVPR, author = {Han, Yuxuan and Wang, Zhibo and Xu, Feng}, title = {Learning a 3D Morphable Face Reflectance Model From Low-Cost Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8598-8608} }
Recurrent Homography Estimation Using Homography-Guided Image Warping and Focus Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Cao_2023_CVPR, author = {Cao, Si-Yuan and Zhang, Runmin and Luo, Lun and Yu, Beinan and Sheng, Zehua and Li, Junwei and Shen, Hui-Liang}, title = {Recurrent Homography Estimation Using Homography-Guided Image Warping and Focus Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9833-9842} }
I2-SDF: Intrinsic Indoor Scene Reconstruction and Editing via Raytracing in Neural SDFs-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_CVPR, author = {Zhu, Jingsen and Huo, Yuchi and Ye, Qi and Luan, Fujun and Li, Jifan and Xi, Dianbing and Wang, Lisha and Tang, Rui and Hua, Wei and Bao, Hujun and Wang, Rui}, title = {I2-SDF: Intrinsic Indoor Scene Reconstruction and Editing via Raytracing in Neural SDFs}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12489-12498} }
DLBD: A Self-Supervised Direct-Learned Binary Descriptor-
[pdf]
[bibtex]@InProceedings{Xiao_2023_CVPR, author = {Xiao, Bin and Hu, Yang and Liu, Bo and Bi, Xiuli and Li, Weisheng and Gao, Xinbo}, title = {DLBD: A Self-Supervised Direct-Learned Binary Descriptor}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15846-15855} }
Fuzzy Positive Learning for Semi-Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qiao_2023_CVPR, author = {Qiao, Pengchong and Wei, Zhidan and Wang, Yu and Wang, Zhennan and Song, Guoli and Xu, Fan and Ji, Xiangyang and Liu, Chang and Chen, Jie}, title = {Fuzzy Positive Learning for Semi-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15465-15474} }
Multi-View Inverse Rendering for Large-Scale Real-World Indoor Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Zhen and Wang, Lingli and Cheng, Mofang and Pan, Cihui and Yang, Jiaqi}, title = {Multi-View Inverse Rendering for Large-Scale Real-World Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12499-12509} }
Boosting Transductive Few-Shot Fine-Tuning With Margin-Based Uncertainty Weighting and Probability Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Tao_2023_CVPR, author = {Tao, Ran and Chen, Hao and Savvides, Marios}, title = {Boosting Transductive Few-Shot Fine-Tuning With Margin-Based Uncertainty Weighting and Probability Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15752-15761} }
SMPConv: Self-Moving Point Representations for Continuous Convolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Sanghyeon and Park, Eunbyung}, title = {SMPConv: Self-Moving Point Representations for Continuous Convolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10289-10299} }
PRISE: Demystifying Deep Lucas-Kanade With Strongly Star-Convex Constraints for Multimodel Image Alignment-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Yiqing and Huang, Xinming and Zhang, Ziming}, title = {PRISE: Demystifying Deep Lucas-Kanade With Strongly Star-Convex Constraints for Multimodel Image Alignment}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13187-13197} }
Learning To Exploit Temporal Structure for Biomedical Vision-Language Processing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bannur_2023_CVPR, author = {Bannur, Shruthi and Hyland, Stephanie and Liu, Qianchu and P\'erez-Garc{\'\i}a, Fernando and Ilse, Maximilian and Castro, Daniel C. and Boecking, Benedikt and Sharma, Harshita and Bouzid, Kenza and Thieme, Anja and Schwaighofer, Anton and Wetscherek, Maria and Lungren, Matthew P. and Nori, Aditya and Alvarez-Valle, Javier and Oktay, Ozan}, title = {Learning To Exploit Temporal Structure for Biomedical Vision-Language Processing}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15016-15027} }
Simple Cues Lead to a Strong Multi-Object Tracker-
[pdf]
[supp]
[bibtex]@InProceedings{Seidenschwarz_2023_CVPR, author = {Seidenschwarz, Jenny and Bras\'o, Guillem and Serrano, V{\'\i}ctor Castro and Elezi, Ismail and Leal-Taix\'e, Laura}, title = {Simple Cues Lead to a Strong Multi-Object Tracker}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13813-13823} }
Marching-Primitives: Shape Abstraction From Signed Distance Function-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Weixiao and Wu, Yuwei and Ruan, Sipu and Chirikjian, Gregory S.}, title = {Marching-Primitives: Shape Abstraction From Signed Distance Function}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8771-8780} }
PointVector: A Vector Representation in Point Cloud Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deng_2023_CVPR, author = {Deng, Xin and Zhang, WenYu and Ding, Qing and Zhang, XinMing}, title = {PointVector: A Vector Representation in Point Cloud Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9455-9465} }
BAEFormer: Bi-Directional and Early Interaction Transformers for Bird's Eye View Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Pan_2023_CVPR, author = {Pan, Cong and He, Yonghao and Peng, Junran and Zhang, Qian and Sui, Wei and Zhang, Zhaoxiang}, title = {BAEFormer: Bi-Directional and Early Interaction Transformers for Bird's Eye View Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9590-9599} }
Generic-to-Specific Distillation of Masked Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Wei and Peng, Zhiliang and Dong, Li and Wei, Furu and Jiao, Jianbin and Ye, Qixiang}, title = {Generic-to-Specific Distillation of Masked Autoencoders}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15996-16005} }
Combining Implicit-Explicit View Correlation for Light Field Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Cong_2023_CVPR, author = {Cong, Ruixuan and Yang, Da and Chen, Rongshan and Wang, Sizhe and Cui, Zhenglong and Sheng, Hao}, title = {Combining Implicit-Explicit View Correlation for Light Field Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9172-9181} }
SOOD: Towards Semi-Supervised Oriented Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hua_2023_CVPR, author = {Hua, Wei and Liang, Dingkang and Li, Jingyu and Liu, Xiaolong and Zou, Zhikang and Ye, Xiaoqing and Bai, Xiang}, title = {SOOD: Towards Semi-Supervised Oriented Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15558-15567} }
Beyond mAP: Towards Better Evaluation of Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jena_2023_CVPR, author = {Jena, Rohit and Zhornyak, Lukas and Doiphode, Nehal and Chaudhari, Pratik and Buch, Vivek and Gee, James and Shi, Jianbo}, title = {Beyond mAP: Towards Better Evaluation of Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11309-11318} }
BASiS: Batch Aligned Spectral Embedding Space-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Streicher_2023_CVPR, author = {Streicher, Or and Cohen, Ido and Gilboa, Guy}, title = {BASiS: Batch Aligned Spectral Embedding Space}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10396-10405} }
DCFace: Synthetic Face Generation With Dual Condition Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Minchul and Liu, Feng and Jain, Anil and Liu, Xiaoming}, title = {DCFace: Synthetic Face Generation With Dual Condition Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12715-12725} }
Infinite Photorealistic Worlds Using Procedural Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Raistrick_2023_CVPR, author = {Raistrick, Alexander and Lipson, Lahav and Ma, Zeyu and Mei, Lingjie and Wang, Mingzhe and Zuo, Yiming and Kayan, Karhan and Wen, Hongyu and Han, Beining and Wang, Yihan and Newell, Alejandro and Law, Hei and Goyal, Ankit and Yang, Kaiyu and Deng, Jia}, title = {Infinite Photorealistic Worlds Using Procedural Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12630-12641} }
Diversity-Measurable Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Wenrui and Chang, Hong and Ma, Bingpeng and Shan, Shiguang and Chen, Xilin}, title = {Diversity-Measurable Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12147-12156} }
A Large-Scale Robustness Analysis of Video Action Recognition Models-
[pdf]
[supp]
[bibtex]@InProceedings{Schiappa_2023_CVPR, author = {Schiappa, Madeline Chantry and Biyani, Naman and Kamtam, Prudvi and Vyas, Shruti and Palangi, Hamid and Vineet, Vibhav and Rawat, Yogesh S.}, title = {A Large-Scale Robustness Analysis of Video Action Recognition Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14698-14708} }
Blind Video Deflickering by Neural Filtering With a Flawed Atlas-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lei_2023_CVPR, author = {Lei, Chenyang and Ren, Xuanchi and Zhang, Zhaoxiang and Chen, Qifeng}, title = {Blind Video Deflickering by Neural Filtering With a Flawed Atlas}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10439-10448} }
Grid-Guided Neural Radiance Fields for Large Urban Scenes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Linning and Xiangli, Yuanbo and Peng, Sida and Pan, Xingang and Zhao, Nanxuan and Theobalt, Christian and Dai, Bo and Lin, Dahua}, title = {Grid-Guided Neural Radiance Fields for Large Urban Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8296-8306} }
FreeNeRF: Improving Few-Shot Neural Rendering With Free Frequency Regularization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Jiawei and Pavone, Marco and Wang, Yue}, title = {FreeNeRF: Improving Few-Shot Neural Rendering With Free Frequency Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8254-8263} }
NeuWigs: A Neural Dynamic Model for Volumetric Hair Capture and Animation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Ziyan and Nam, Giljoo and Stuyck, Tuur and Lombardi, Stephen and Cao, Chen and Saragih, Jason and Zollh\"ofer, Michael and Hodgins, Jessica and Lassner, Christoph}, title = {NeuWigs: A Neural Dynamic Model for Volumetric Hair Capture and Animation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8641-8651} }
CLIP2: Contrastive Language-Image-Point Pretraining From Real-World Point Cloud Data-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2023_CVPR, author = {Zeng, Yihan and Jiang, Chenhan and Mao, Jiageng and Han, Jianhua and Ye, Chaoqiang and Huang, Qingqiu and Yeung, Dit-Yan and Yang, Zhen and Liang, Xiaodan and Xu, Hang}, title = {CLIP2: Contrastive Language-Image-Point Pretraining From Real-World Point Cloud Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15244-15253} }
HNeRV: A Hybrid Neural Representation for Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Hao and Gwilliam, Matthew and Lim, Ser-Nam and Shrivastava, Abhinav}, title = {HNeRV: A Hybrid Neural Representation for Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10270-10279} }
Model-Agnostic Gender Debiased Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hirota_2023_CVPR, author = {Hirota, Yusuke and Nakashima, Yuta and Garcia, Noa}, title = {Model-Agnostic Gender Debiased Image Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15191-15200} }
FitMe: Deep Photorealistic 3D Morphable Model Avatars-
[pdf]
[supp]
[bibtex]@InProceedings{Lattas_2023_CVPR, author = {Lattas, Alexandros and Moschoglou, Stylianos and Ploumpis, Stylianos and Gecer, Baris and Deng, Jiankang and Zafeiriou, Stefanos}, title = {FitMe: Deep Photorealistic 3D Morphable Model Avatars}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8629-8640} }
CLIPPO: Image-and-Language Understanding From Pixels Only-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tschannen_2023_CVPR, author = {Tschannen, Michael and Mustafa, Basil and Houlsby, Neil}, title = {CLIPPO: Image-and-Language Understanding From Pixels Only}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11006-11017} }
DETR With Additional Global Aggregation for Cross-Domain Weakly Supervised Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_CVPR, author = {Tang, Zongheng and Sun, Yifan and Liu, Si and Yang, Yi}, title = {DETR With Additional Global Aggregation for Cross-Domain Weakly Supervised Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11422-11432} }
Towards Bridging the Performance Gaps of Joint Energy-Based Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Xiulong and Su, Qing and Ji, Shihao}, title = {Towards Bridging the Performance Gaps of Joint Energy-Based Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15732-15741} }
expOSE: Accurate Initialization-Free Projective Factorization Using Exponential Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Iglesias_2023_CVPR, author = {Iglesias, Jos\'e Pedro and Nilsson, Amanda and Olsson, Carl}, title = {expOSE: Accurate Initialization-Free Projective Factorization Using Exponential Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8959-8968} }
OpenGait: Revisiting Gait Recognition Towards Better Practicality-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_CVPR, author = {Fan, Chao and Liang, Junhao and Shen, Chuanfu and Hou, Saihui and Huang, Yongzhen and Yu, Shiqi}, title = {OpenGait: Revisiting Gait Recognition Towards Better Practicality}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9707-9716} }
DATID-3D: Diversity-Preserved Domain Adaptation Using Text-to-Image Diffusion for 3D Generative Model-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Gwanghyun and Chun, Se Young}, title = {DATID-3D: Diversity-Preserved Domain Adaptation Using Text-to-Image Diffusion for 3D Generative Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14203-14213} }
Learning Neural Volumetric Representations of Dynamic Humans in Minutes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Geng_2023_CVPR, author = {Geng, Chen and Peng, Sida and Xu, Zhen and Bao, Hujun and Zhou, Xiaowei}, title = {Learning Neural Volumetric Representations of Dynamic Humans in Minutes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8759-8770} }
Streaming Video Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Yucheng and Luo, Chong and Tang, Chuanxin and Chen, Dongdong and Codella, Noel and Zha, Zheng-Jun}, title = {Streaming Video Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14602-14612} }
CapDet: Unifying Dense Captioning and Open-World Detection Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Long_2023_CVPR, author = {Long, Yanxin and Wen, Youpeng and Han, Jianhua and Xu, Hang and Ren, Pengzhen and Zhang, Wei and Zhao, Shen and Liang, Xiaodan}, title = {CapDet: Unifying Dense Captioning and Open-World Detection Pretraining}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15233-15243} }
Bayesian Posterior Approximation With Stochastic Ensembles-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Balabanov_2023_CVPR, author = {Balabanov, Oleksandr and Mehlig, Bernhard and Linander, Hampus}, title = {Bayesian Posterior Approximation With Stochastic Ensembles}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13701-13711} }
Symmetric Shape-Preserving Autoencoder for Unsupervised Real Scene Point Cloud Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_CVPR, author = {Ma, Changfeng and Chen, Yinuo and Guo, Pengxiao and Guo, Jie and Wang, Chongjun and Guo, Yanwen}, title = {Symmetric Shape-Preserving Autoencoder for Unsupervised Real Scene Point Cloud Completion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13560-13569} }
Comprehensive and Delicate: An Efficient Transformer for Image Restoration-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Haiyu and Gou, Yuanbiao and Li, Boyun and Peng, Dezhong and Lv, Jiancheng and Peng, Xi}, title = {Comprehensive and Delicate: An Efficient Transformer for Image Restoration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14122-14132} }
Zero-Shot Model Diagnosis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_CVPR, author = {Luo, Jinqi and Wang, Zhaoning and Wu, Chen Henry and Huang, Dong and De la Torre, Fernando}, title = {Zero-Shot Model Diagnosis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11631-11640} }
ShadowDiffusion: When Degradation Prior Meets Diffusion Model for Shadow Removal-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_CVPR, author = {Guo, Lanqing and Wang, Chong and Yang, Wenhan and Huang, Siyu and Wang, Yufei and Pfister, Hanspeter and Wen, Bihan}, title = {ShadowDiffusion: When Degradation Prior Meets Diffusion Model for Shadow Removal}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14049-14058} }
Pruning Parameterization With Bi-Level Optimization for Efficient Semantic Segmentation on the Edge-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Changdi and Zhao, Pu and Li, Yanyu and Niu, Wei and Guan, Jiexiong and Tang, Hao and Qin, Minghai and Ren, Bin and Lin, Xue and Wang, Yanzhi}, title = {Pruning Parameterization With Bi-Level Optimization for Efficient Semantic Segmentation on the Edge}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15402-15412} }
NLOST: Non-Line-of-Sight Imaging With Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Yue and Peng, Jiayong and Ye, Juntian and Zhang, Yueyi and Xu, Feihu and Xiong, Zhiwei}, title = {NLOST: Non-Line-of-Sight Imaging With Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13313-13322} }
Text-Visual Prompting for Efficient 2D Temporal Video Grounding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Yimeng and Chen, Xin and Jia, Jinghan and Liu, Sijia and Ding, Ke}, title = {Text-Visual Prompting for Efficient 2D Temporal Video Grounding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14794-14804} }
NEF: Neural Edge Fields for 3D Parametric Curve Reconstruction From Multi-View Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_CVPR, author = {Ye, Yunfan and Yi, Renjiao and Gao, Zhirui and Zhu, Chenyang and Cai, Zhiping and Xu, Kai}, title = {NEF: Neural Edge Fields for 3D Parametric Curve Reconstruction From Multi-View Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8486-8495} }
Geometric Visual Similarity Learning in 3D Medical Image Self-Supervised Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_CVPR, author = {He, Yuting and Yang, Guanyu and Ge, Rongjun and Chen, Yang and Coatrieux, Jean-Louis and Wang, Boyu and Li, Shuo}, title = {Geometric Visual Similarity Learning in 3D Medical Image Self-Supervised Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9538-9547} }
Less Is More: Reducing Task and Model Complexity for 3D Point Cloud Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Li and Shum, Hubert P. H. and Breckon, Toby P.}, title = {Less Is More: Reducing Task and Model Complexity for 3D Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9361-9371} }
AdaMAE: Adaptive Masking for Efficient Spatiotemporal Learning With Masked Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bandara_2023_CVPR, author = {Bandara, Wele Gedara Chaminda and Patel, Naman and Gholami, Ali and Nikkhah, Mehdi and Agrawal, Motilal and Patel, Vishal M.}, title = {AdaMAE: Adaptive Masking for Efficient Spatiotemporal Learning With Masked Autoencoders}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14507-14517} }
Directional Connectivity-Based Segmentation of Medical Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Ziyun and Farsiu, Sina}, title = {Directional Connectivity-Based Segmentation of Medical Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11525-11535} }
Towards Flexible Multi-Modal Document Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Inoue_2023_CVPR, author = {Inoue, Naoto and Kikuchi, Kotaro and Simo-Serra, Edgar and Otani, Mayu and Yamaguchi, Kota}, title = {Towards Flexible Multi-Modal Document Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14287-14296} }
LiDAR-in-the-Loop Hyperparameter Optimization-
[pdf]
[supp]
[bibtex]@InProceedings{Goudreault_2023_CVPR, author = {Goudreault, F\'elix and Scheuble, Dominik and Bijelic, Mario and Robidoux, Nicolas and Heide, Felix}, title = {LiDAR-in-the-Loop Hyperparameter Optimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13404-13414} }
Local 3D Editing via 3D Distillation of CLIP Knowledge-
[pdf]
[supp]
[bibtex]@InProceedings{Hyung_2023_CVPR, author = {Hyung, Junha and Hwang, Sungwon and Kim, Daejin and Lee, Hyunji and Choo, Jaegul}, title = {Local 3D Editing via 3D Distillation of CLIP Knowledge}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12674-12684} }
Human Body Shape Completion With Implicit Shape and Flow Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Boyao and Meng, Di and Franco, Jean-S\'ebastien and Boyer, Edmond}, title = {Human Body Shape Completion With Implicit Shape and Flow Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12901-12911} }
Modular Memorability: Tiered Representations for Video Memorability Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Dumont_2023_CVPR, author = {Dumont, Th\'eo and Hevia, Juan Segundo and Fosco, Camilo L.}, title = {Modular Memorability: Tiered Representations for Video Memorability Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10751-10760} }
Weakly-Supervised Domain Adaptive Semantic Segmentation With Prototypical Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Das_2023_CVPR, author = {Das, Anurag and Xian, Yongqin and Dai, Dengxin and Schiele, Bernt}, title = {Weakly-Supervised Domain Adaptive Semantic Segmentation With Prototypical Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15434-15443} }
Language-Guided Music Recommendation for Video via Prompt Analogies-
[pdf]
[supp]
[bibtex]@InProceedings{McKee_2023_CVPR, author = {McKee, Daniel and Salamon, Justin and Sivic, Josef and Russell, Bryan}, title = {Language-Guided Music Recommendation for Video via Prompt Analogies}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14784-14793} }
Re2TAL: Rewiring Pretrained Video Backbones for Reversible Temporal Action Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Chen and Liu, Shuming and Mangalam, Karttikeya and Ghanem, Bernard}, title = {Re2TAL: Rewiring Pretrained Video Backbones for Reversible Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10637-10647} }
NeRFLight: Fast and Light Neural Radiance Fields Using a Shared Feature Grid-
[pdf]
[supp]
[bibtex]@InProceedings{Rivas-Manzaneque_2023_CVPR, author = {Rivas-Manzaneque, Fernando and Sierra-Acosta, Jorge and Penate-Sanchez, Adrian and Moreno-Noguer, Francesc and Ribeiro, Angela}, title = {NeRFLight: Fast and Light Neural Radiance Fields Using a Shared Feature Grid}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12417-12427} }
MVImgNet: A Large-Scale Dataset of Multi-View Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Xianggang and Xu, Mutian and Zhang, Yidan and Liu, Haolin and Ye, Chongjie and Wu, Yushuang and Yan, Zizheng and Zhu, Chenming and Xiong, Zhangyang and Liang, Tianyou and Chen, Guanying and Cui, Shuguang and Han, Xiaoguang}, title = {MVImgNet: A Large-Scale Dataset of Multi-View Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9150-9161} }
A New Benchmark: On the Utility of Synthetic Data With Blender for Bare Supervised Learning and Downstream Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_CVPR, author = {Tang, Hui and Jia, Kui}, title = {A New Benchmark: On the Utility of Synthetic Data With Blender for Bare Supervised Learning and Downstream Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15954-15964} }
Autoregressive Visual Tracking-
[pdf]
[bibtex]@InProceedings{Wei_2023_CVPR, author = {Wei, Xing and Bai, Yifan and Zheng, Yongchao and Shi, Dahu and Gong, Yihong}, title = {Autoregressive Visual Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9697-9706} }
Unsupervised Domain Adaption With Pixel-Level Discriminator for Image-Aware Layout Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Chenchen and Zhou, Min and Ge, Tiezheng and Jiang, Yuning and Xu, Weiwei}, title = {Unsupervised Domain Adaption With Pixel-Level Discriminator for Image-Aware Layout Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10114-10123} }
Real-Time 6K Image Rescaling With Rate-Distortion Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qi_2023_CVPR, author = {Qi, Chenyang and Yang, Xin and Cheng, Ka Leong and Chen, Ying-Cong and Chen, Qifeng}, title = {Real-Time 6K Image Rescaling With Rate-Distortion Optimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14092-14101} }
Gated Stereo: Joint Depth Estimation From Gated and Wide-Baseline Active Stereo Cues-
[pdf]
[supp]
[bibtex]@InProceedings{Walz_2023_CVPR, author = {Walz, Stefanie and Bijelic, Mario and Ramazzina, Andrea and Walia, Amanpreet and Mannan, Fahim and Heide, Felix}, title = {Gated Stereo: Joint Depth Estimation From Gated and Wide-Baseline Active Stereo Cues}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13252-13262} }
MammalNet: A Large-Scale Video Benchmark for Mammal Recognition and Behavior Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Jun and Hu, Ming and Coker, Darren J. and Berumen, Michael L. and Costelloe, Blair and Beery, Sara and Rohrbach, Anna and Elhoseiny, Mohamed}, title = {MammalNet: A Large-Scale Video Benchmark for Mammal Recognition and Behavior Understanding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13052-13061} }
Hand Avatar: Free-Pose Hand Animation and Rendering From Monocular Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Xingyu and Wang, Baoyuan and Shum, Heung-Yeung}, title = {Hand Avatar: Free-Pose Hand Animation and Rendering From Monocular Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8683-8693} }
VindLU: A Recipe for Effective Video-and-Language Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_CVPR, author = {Cheng, Feng and Wang, Xizi and Lei, Jie and Crandall, David and Bansal, Mohit and Bertasius, Gedas}, title = {VindLU: A Recipe for Effective Video-and-Language Pretraining}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10739-10750} }
OmniAvatar: Geometry-Guided Controllable 3D Head Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Hongyi and Song, Guoxian and Jiang, Zihang and Zhang, Jianfeng and Shi, Yichun and Liu, Jing and Ma, Wanchun and Feng, Jiashi and Luo, Linjie}, title = {OmniAvatar: Geometry-Guided Controllable 3D Head Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12814-12824} }
SUDS: Scalable Urban Dynamic Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Turki_2023_CVPR, author = {Turki, Haithem and Zhang, Jason Y. and Ferroni, Francesco and Ramanan, Deva}, title = {SUDS: Scalable Urban Dynamic Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12375-12385} }
Cloud-Device Collaborative Adaptation to Continual Changing Environments in the Real-World-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gan_2023_CVPR, author = {Gan, Yulu and Pan, Mingjie and Zhang, Rongyu and Ling, Zijian and Zhao, Lingran and Liu, Jiaming and Zhang, Shanghang}, title = {Cloud-Device Collaborative Adaptation to Continual Changing Environments in the Real-World}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12157-12166} }
Seasoning Model Soups for Robustness to Adversarial and Natural Distribution Shifts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Croce_2023_CVPR, author = {Croce, Francesco and Rebuffi, Sylvestre-Alvise and Shelhamer, Evan and Gowal, Sven}, title = {Seasoning Model Soups for Robustness to Adversarial and Natural Distribution Shifts}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12313-12323} }
How To Prevent the Continuous Damage of Noises To Model Training?-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Xiaotian and Jiang, Yang and Shi, Tianqi and Feng, Zunlei and Wang, Yuexuan and Song, Mingli and Sun, Li}, title = {How To Prevent the Continuous Damage of Noises To Model Training?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12054-12063} }
Skinned Motion Retargeting With Residual Perception of Motion Semantics & Geometry-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Jiaxu and Weng, Junwu and Kang, Di and Zhao, Fang and Huang, Shaoli and Zhe, Xuefei and Bao, Linchao and Shan, Ying and Wang, Jue and Tu, Zhigang}, title = {Skinned Motion Retargeting With Residual Perception of Motion Semantics \& Geometry}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13864-13872} }
Weakly-Supervised Single-View Image Relighting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yi_2023_CVPR, author = {Yi, Renjiao and Zhu, Chenyang and Xu, Kai}, title = {Weakly-Supervised Single-View Image Relighting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8402-8411} }
DualVector: Unsupervised Vector Font Synthesis With Dual-Part Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Ying-Tian and Zhang, Zhifei and Guo, Yuan-Chen and Fisher, Matthew and Wang, Zhaowen and Zhang, Song-Hai}, title = {DualVector: Unsupervised Vector Font Synthesis With Dual-Part Representation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14193-14202} }
ReasonNet: End-to-End Driving With Temporal and Global Reasoning-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2023_CVPR, author = {Shao, Hao and Wang, Letian and Chen, Ruobing and Waslander, Steven L. and Li, Hongsheng and Liu, Yu}, title = {ReasonNet: End-to-End Driving With Temporal and Global Reasoning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13723-13733} }
Learning Situation Hyper-Graphs for Video Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Urooj_2023_CVPR, author = {Urooj, Aisha and Kuehne, Hilde and Wu, Bo and Chheu, Kim and Bousselham, Walid and Gan, Chuang and Lobo, Niels and Shah, Mubarak}, title = {Learning Situation Hyper-Graphs for Video Question Answering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14879-14889} }
GazeNeRF: 3D-Aware Gaze Redirection With Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ruzzi_2023_CVPR, author = {Ruzzi, Alessandro and Shi, Xiangwei and Wang, Xi and Li, Gengyan and De Mello, Shalini and Chang, Hyung Jin and Zhang, Xucong and Hilliges, Otmar}, title = {GazeNeRF: 3D-Aware Gaze Redirection With Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9676-9685} }
SegLoc: Learning Segmentation-Based Representations for Privacy-Preserving Visual Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Pietrantoni_2023_CVPR, author = {Pietrantoni, Maxime and Humenberger, Martin and Sattler, Torsten and Csurka, Gabriela}, title = {SegLoc: Learning Segmentation-Based Representations for Privacy-Preserving Visual Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15380-15391} }
Efficient Hierarchical Entropy Model for Learned Point Cloud Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_CVPR, author = {Song, Rui and Fu, Chunyang and Liu, Shan and Li, Ge}, title = {Efficient Hierarchical Entropy Model for Learned Point Cloud Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14368-14377} }
Image Cropping With Spatial-Aware Feature and Rank Consistency-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Chao and Niu, Li and Zhang, Bo and Zhang, Liqing}, title = {Image Cropping With Spatial-Aware Feature and Rank Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10052-10061} }
SVGformer: Representation Learning for Continuous Vector Graphics Using Transformers-
[pdf]
[supp]
[bibtex]@InProceedings{Cao_2023_CVPR, author = {Cao, Defu and Wang, Zhaowen and Echevarria, Jose and Liu, Yan}, title = {SVGformer: Representation Learning for Continuous Vector Graphics Using Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10093-10102} }
Learning Attribute and Class-Specific Representation Duet for Fine-Grained Fashion Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{Jiao_2023_CVPR, author = {Jiao, Yang and Gao, Yan and Meng, Jingjing and Shang, Jin and Sun, Yi}, title = {Learning Attribute and Class-Specific Representation Duet for Fine-Grained Fashion Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11050-11059} }
Pixels, Regions, and Objects: Multiple Enhancement for Salient Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Yi and Wang, Ruili and Fan, Xin and Wang, Tianzhu and He, Xiangjian}, title = {Pixels, Regions, and Objects: Multiple Enhancement for Salient Object Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10031-10040} }
Leveraging Temporal Context in Low Representational Power Regimes-
[pdf]
[supp]
[bibtex]@InProceedings{Fosco_2023_CVPR, author = {Fosco, Camilo L. and Jin, SouYoung and Josephs, Emilie and Oliva, Aude}, title = {Leveraging Temporal Context in Low Representational Power Regimes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10693-10703} }
Omni3D: A Large Benchmark and Model for 3D Object Detection in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Brazil_2023_CVPR, author = {Brazil, Garrick and Kumar, Abhinav and Straub, Julian and Ravi, Nikhila and Johnson, Justin and Gkioxari, Georgia}, title = {Omni3D: A Large Benchmark and Model for 3D Object Detection in the Wild}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13154-13164} }
OT-Filter: An Optimal Transport Filter for Learning With Noisy Labels-
[pdf]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Chuanwen and Ren, Yilong and Xie, Xike}, title = {OT-Filter: An Optimal Transport Filter for Learning With Noisy Labels}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16164-16174} }
Rigidity-Aware Detection for 6D Object Pose Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hai_2023_CVPR, author = {Hai, Yang and Song, Rui and Li, Jiaojiao and Salzmann, Mathieu and Hu, Yinlin}, title = {Rigidity-Aware Detection for 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8927-8936} }
Clover: Towards a Unified Video-Language Alignment and Fusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Jingjia and Li, Yinan and Feng, Jiashi and Wu, Xinglong and Sun, Xiaoshuai and Ji, Rongrong}, title = {Clover: Towards a Unified Video-Language Alignment and Fusion Model}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {14856-14866} }
Self-Supervised Learning From Images With a Joint-Embedding Predictive Architecture-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Assran_2023_CVPR, author = {Assran, Mahmoud and Duval, Quentin and Misra, Ishan and Bojanowski, Piotr and Vincent, Pascal and Rabbat, Michael and LeCun, Yann and Ballas, Nicolas}, title = {Self-Supervised Learning From Images With a Joint-Embedding Predictive Architecture}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15619-15629} }
A2J-Transformer: Anchor-to-Joint Transformer Network for 3D Interacting Hand Pose Estimation From a Single RGB Image-
[pdf]
[bibtex]@InProceedings{Jiang_2023_CVPR, author = {Jiang, Changlong and Xiao, Yang and Wu, Cunlin and Zhang, Mingyang and Zheng, Jinghong and Cao, Zhiguo and Zhou, Joey Tianyi}, title = {A2J-Transformer: Anchor-to-Joint Transformer Network for 3D Interacting Hand Pose Estimation From a Single RGB Image}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8846-8855} }
The Treasure Beneath Multiple Annotations: An Uncertainty-Aware Edge Detector-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Caixia and Huang, Yaping and Pu, Mengyang and Guan, Qingji and Huang, Li and Ling, Haibin}, title = {The Treasure Beneath Multiple Annotations: An Uncertainty-Aware Edge Detector}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15507-15517} }
DP-NeRF: Deblurred Neural Radiance Field With Physical Scene Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_CVPR, author = {Lee, Dogyoon and Lee, Minhyeok and Shin, Chajin and Lee, Sangyoun}, title = {DP-NeRF: Deblurred Neural Radiance Field With Physical Scene Priors}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12386-12396} }
Self-Supervised Blind Motion Deblurring With Deep Expectation Maximization-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Ji and Wang, Weixi and Nan, Yuesong and Ji, Hui}, title = {Self-Supervised Blind Motion Deblurring With Deep Expectation Maximization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13986-13996} }
Grounding Counterfactual Explanation of Image Classifiers to Textual Concept Space-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_CVPR, author = {Kim, Siwon and Oh, Jinoh and Lee, Sungjin and Yu, Seunghak and Do, Jaeyoung and Taghavi, Tara}, title = {Grounding Counterfactual Explanation of Image Classifiers to Textual Concept Space}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10942-10950} }
SemiCVT: Semi-Supervised Convolutional Vision Transformer for Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Huang_2023_CVPR, author = {Huang, Huimin and Xie, Shiao and Lin, Lanfen and Tong, Ruofeng and Chen, Yen-Wei and Li, Yuexiang and Wang, Hong and Huang, Yawen and Zheng, Yefeng}, title = {SemiCVT: Semi-Supervised Convolutional Vision Transformer for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11340-11349} }
Towards Open-World Segmentation of Parts-
[pdf]
[supp]
[bibtex]@InProceedings{Pan_2023_CVPR, author = {Pan, Tai-Yu and Liu, Qing and Chao, Wei-Lun and Price, Brian}, title = {Towards Open-World Segmentation of Parts}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15392-15401} }
Stitchable Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_CVPR, author = {Pan, Zizheng and Cai, Jianfei and Zhuang, Bohan}, title = {Stitchable Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16102-16112} }
Audio-Visual Grouping Network for Sound Localization From Mixtures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mo_2023_CVPR, author = {Mo, Shentong and Tian, Yapeng}, title = {Audio-Visual Grouping Network for Sound Localization From Mixtures}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10565-10574} }
Fair Federated Medical Image Segmentation via Client Contribution Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_CVPR, author = {Jiang, Meirui and Roth, Holger R. and Li, Wenqi and Yang, Dong and Zhao, Can and Nath, Vishwesh and Xu, Daguang and Dou, Qi and Xu, Ziyue}, title = {Fair Federated Medical Image Segmentation via Client Contribution Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16302-16311} }
Dynamic Generative Targeted Attacks With Pattern Injection-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2023_CVPR, author = {Feng, Weiwei and Xu, Nanqing and Zhang, Tianzhu and Zhang, Yongdong}, title = {Dynamic Generative Targeted Attacks With Pattern Injection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16404-16414} }
Visual Recognition by Request-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_CVPR, author = {Tang, Chufeng and Xie, Lingxi and Zhang, Xiaopeng and Hu, Xiaolin and Tian, Qi}, title = {Visual Recognition by Request}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15265-15274} }
PointCert: Point Cloud Classification With Deterministic Certified Robustness Guarantees-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Jinghuai and Jia, Jinyuan and Liu, Hongbin and Gong, Neil Zhenqiang}, title = {PointCert: Point Cloud Classification With Deterministic Certified Robustness Guarantees}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9496-9505} }
Cap4Video: What Can Auxiliary Captions Do for Text-Video Retrieval?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Wenhao and Luo, Haipeng and Fang, Bo and Wang, Jingdong and Ouyang, Wanli}, title = {Cap4Video: What Can Auxiliary Captions Do for Text-Video Retrieval?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10704-10713} }
Progressive Semantic-Visual Mutual Adaption for Generalized Zero-Shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Man and Li, Feng and Zhang, Chunjie and Wei, Yunchao and Bai, Huihui and Zhao, Yao}, title = {Progressive Semantic-Visual Mutual Adaption for Generalized Zero-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15337-15346} }
Block Selection Method for Using Feature Norm in Out-of-Distribution Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Yeonguk and Shin, Sungho and Lee, Seongju and Jun, Changhyun and Lee, Kyoobin}, title = {Block Selection Method for Using Feature Norm in Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15701-15711} }
Four-View Geometry With Unknown Radial Distortion-
[pdf]
[supp]
[bibtex]@InProceedings{Hruby_2023_CVPR, author = {Hruby, Petr and Korotynskiy, Viktor and Duff, Timothy and Oeding, Luke and Pollefeys, Marc and Pajdla, Tomas and Larsson, Viktor}, title = {Four-View Geometry With Unknown Radial Distortion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8990-9000} }
How To Prevent the Poor Performance Clients for Personalized Federated Learning?-
[pdf]
[supp]
[bibtex]@InProceedings{Qu_2023_CVPR, author = {Qu, Zhe and Li, Xingyu and Han, Xiao and Duan, Rui and Shen, Chengchao and Chen, Lixing}, title = {How To Prevent the Poor Performance Clients for Personalized Federated Learning?}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12167-12176} }
Galactic: Scaling End-to-End Reinforcement Learning for Rearrangement at 100k Steps-per-Second-
[pdf]
[supp]
[bibtex]@InProceedings{Berges_2023_CVPR, author = {Berges, Vincent-Pierre and Szot, Andrew and Chaplot, Devendra Singh and Gokaslan, Aaron and Mottaghi, Roozbeh and Batra, Dhruv and Undersander, Eric}, title = {Galactic: Scaling End-to-End Reinforcement Learning for Rearrangement at 100k Steps-per-Second}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13767-13777} }
Learning on Gradients: Generalized Artifacts Representation for GAN-Generated Images Detection-
[pdf]
[bibtex]@InProceedings{Tan_2023_CVPR, author = {Tan, Chuangchuang and Zhao, Yao and Wei, Shikui and Gu, Guanghua and Wei, Yunchao}, title = {Learning on Gradients: Generalized Artifacts Representation for GAN-Generated Images Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12105-12114} }
Don't Lie to Me! Robust and Efficient Explainability With Verified Perturbation Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{Fel_2023_CVPR, author = {Fel, Thomas and Ducoffe, Melanie and Vigouroux, David and Cad\`ene, R\'emi and Capelle, Mika\"el and Nicod\`eme, Claire and Serre, Thomas}, title = {Don't Lie to Me! Robust and Efficient Explainability With Verified Perturbation Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {16153-16163} }
Defending Against Patch-Based Backdoor Attacks on Self-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tejankar_2023_CVPR, author = {Tejankar, Ajinkya and Sanjabi, Maziar and Wang, Qifan and Wang, Sinong and Firooz, Hamed and Pirsiavash, Hamed and Tan, Liang}, title = {Defending Against Patch-Based Backdoor Attacks on Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12239-12249} }
GeoNet: Benchmarking Unsupervised Adaptation Across Geographies-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kalluri_2023_CVPR, author = {Kalluri, Tarun and Xu, Wangdong and Chandraker, Manmohan}, title = {GeoNet: Benchmarking Unsupervised Adaptation Across Geographies}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15368-15379} }
Learning Transformation-Predictive Representations for Detection and Description of Local Features-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zihao and Wu, Chunxu and Yang, Yifei and Li, Zhen}, title = {Learning Transformation-Predictive Representations for Detection and Description of Local Features}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {11464-11473} }
Dionysus: Recovering Scene Structures by Dividing Into Semantic Pieces-
[pdf]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Likang and Chen, Lei}, title = {Dionysus: Recovering Scene Structures by Dividing Into Semantic Pieces}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {12576-12587} }
Advancing Visual Grounding With Scene Knowledge: Benchmark and Method-
[pdf]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Zhihong and Zhang, Ruifei and Song, Yibing and Wan, Xiang and Li, Guanbin}, title = {Advancing Visual Grounding With Scene Knowledge: Benchmark and Method}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15039-15049} }
Multiview Compressive Coding for 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Chao-Yuan and Johnson, Justin and Malik, Jitendra and Feichtenhofer, Christoph and Gkioxari, Georgia}, title = {Multiview Compressive Coding for 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {9065-9075} }
Modeling Entities As Semantic Points for Visual Information Extraction in the Wild-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Zhibo and Long, Rujiao and Wang, Pengfei and Song, Sibo and Zhong, Humen and Cheng, Wenqing and Bai, Xiang and Yao, Cong}, title = {Modeling Entities As Semantic Points for Visual Information Extraction in the Wild}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15358-15367} }
MobileVOS: Real-Time Video Object Segmentation Contrastive Learning Meets Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Miles_2023_CVPR, author = {Miles, Roy and Yucel, Mehmet Kerim and Manganelli, Bruno and Sa\`a-Garriga, Albert}, title = {MobileVOS: Real-Time Video Object Segmentation Contrastive Learning Meets Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {10480-10490} }
Pose Synchronization Under Multiple Pair-Wise Relative Poses-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_CVPR, author = {Sun, Yifan and Huang, Qixing}, title = {Pose Synchronization Under Multiple Pair-Wise Relative Poses}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {13072-13081} }
Controllable Light Diffusion for Portraits-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Futschik_2023_CVPR, author = {Futschik, David and Ritland, Kelvin and Vecore, James and Fanello, Sean and Orts-Escolano, Sergio and Curless, Brian and S\'ykora, Daniel and Pandey, Rohit}, title = {Controllable Light Diffusion for Portraits}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {8412-8421} }
Boosting Low-Data Instance Segmentation by Unsupervised Pre-Training With Saliency Prompt-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Hao and Zhang, Dingwen and Liu, Nian and Cheng, Lechao and Dai, Yalun and Zhang, Chao and Wang, Xinggang and Han, Junwei}, title = {Boosting Low-Data Instance Segmentation by Unsupervised Pre-Training With Saliency Prompt}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = {June}, year = {2023}, pages = {15485-15494} }
Virtual Occlusions Through Implicit Depth-
[pdf]
[arXiv]
[bibtex]@InProceedings{Watson_2023_CVPR, author = {Watson, Jamie and Sayed, Mohamed and Qureshi, Zawar and Brostow, Gabriel J. and Vicente, Sara and Mac Aodha, Oisin and Firman, Michael}, title = {Virtual Occlusions Through Implicit Depth}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9053--9064} }
DiGA: Distil To Generalize and Then Adapt for Domain Adaptive Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2023_CVPR, author = {Shen, Fengyi and Gurram, Akhil and Liu, Ziyuan and Wang, He and Knoll, Alois}, title = {{DiGA}: Distil To Generalize and Then Adapt for Domain Adaptive Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15866--15877} }
DiffSwap: High-Fidelity and Controllable Face Swapping via 3D-Aware Masked Diffusion-
[pdf]
[bibtex]@InProceedings{Zhao_2023_CVPR, author = {Zhao, Wenliang and Rao, Yongming and Shi, Weikang and Liu, Zuyan and Zhou, Jie and Lu, Jiwen}, title = {{DiffSwap}: High-Fidelity and Controllable Face Swapping via {3D}-Aware Masked Diffusion}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8568--8577} }
Learned Image Compression With Mixed Transformer-CNN Architectures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Jinming and Sun, Heming and Katto, Jiro}, title = {Learned Image Compression With Mixed Transformer-{CNN} Architectures}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14388--14397} }
Quantum Multi-Model Fitting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Farina_2023_CVPR, author = {Farina, Matteo and Magri, Luca and Menapace, Willi and Ricci, Elisa and Golyanik, Vladislav and Arrigoni, Federica}, title = {Quantum Multi-Model Fitting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13640--13649} }
PermutoSDF: Fast Multi-View Reconstruction With Implicit Surfaces Using Permutohedral Lattices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rosu_2023_CVPR, author = {Rosu, Radu Alexandru and Behnke, Sven}, title = {{PermutoSDF}: Fast Multi-View Reconstruction With Implicit Surfaces Using Permutohedral Lattices}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8466--8475} }
Detection Hub: Unifying Object Detection Datasets via Query Adaptation on Language Embedding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Meng_2023_CVPR, author = {Meng, Lingchen and Dai, Xiyang and Chen, Yinpeng and Zhang, Pengchuan and Chen, Dongdong and Liu, Mengchen and Wang, Jianfeng and Wu, Zuxuan and Yuan, Lu and Jiang, Yu-Gang}, title = {{Detection Hub}: Unifying Object Detection Datasets via Query Adaptation on Language Embedding}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11402--11411} }
Adversarial Normalization: I Can Visualize Everything (ICE)-
[pdf]
[bibtex]@InProceedings{Choi_2023_CVPR, author = {Choi, Hoyoung and Jin, Seungwan and Han, Kyungsik}, title = {Adversarial Normalization: {I} Can Visualize Everything ({ICE})}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12115--12124} }
Referring Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Dongming and Han, Wencheng and Wang, Tiancai and Dong, Xingping and Zhang, Xiangyu and Shen, Jianbing}, title = {Referring Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14633--14642} }
Hint-Aug: Drawing Hints From Foundation Vision Transformers Towards Boosted Few-Shot Parameter-Efficient Tuning-
[pdf]
[bibtex]@InProceedings{Yu_2023_CVPR, author = {Yu, Zhongzhi and Wu, Shang and Fu, Yonggan and Zhang, Shunyao and Lin, Yingyan (Celine)}, title = {{Hint-Aug}: Drawing Hints From Foundation Vision Transformers Towards Boosted Few-Shot Parameter-Efficient Tuning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11102--11112} }
A Strong Baseline for Generalized Few-Shot Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hajimiri_2023_CVPR, author = {Hajimiri, Sina and Boudiaf, Malik and Ben Ayed, Ismail and Dolz, Jose}, title = {A Strong Baseline for Generalized Few-Shot Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11269--11278} }
DynaFed: Tackling Client Data Heterogeneity With Global Dynamics-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pi_2023_CVPR, author = {Pi, Renjie and Zhang, Weizhong and Xie, Yueqi and Gao, Jiahui and Wang, Xiaoyu and Kim, Sunghun and Chen, Qifeng}, title = {{DynaFed}: Tackling Client Data Heterogeneity With Global Dynamics}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12177--12186} }
CUF: Continuous Upsampling Filters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vasconcelos_2023_CVPR, author = {Vasconcelos, Cristina N. and Oztireli, Cengiz and Matthews, Mark and Hashemi, Milad and Swersky, Kevin and Tagliasacchi, Andrea}, title = {{CUF}: Continuous Upsampling Filters}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9999--10008} }
Quantitative Manipulation of Custom Attributes on 3D-Aware Image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Do_2023_CVPR, author = {Do, Hoseok and Yoo, EunKyung and Kim, Taehyeong and Lee, Chul and Choi, Jin Young}, title = {Quantitative Manipulation of Custom Attributes on {3D}-Aware Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8529--8538} }
HOTNAS: Hierarchical Optimal Transport for Neural Architecture Search-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_CVPR, author = {Yang, Jiechao and Liu, Yong and Xu, Hongteng}, title = {{HOTNAS}: Hierarchical Optimal Transport for Neural Architecture Search}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11990--12000} }
Neural Fields Meet Explicit Geometric Representations for Inverse Rendering of Urban Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Zian and Shen, Tianchang and Gao, Jun and Huang, Shengyu and Munkberg, Jacob and Hasselgren, Jon and Gojcic, Zan and Chen, Wenzheng and Fidler, Sanja}, title = {Neural Fields Meet Explicit Geometric Representations for Inverse Rendering of Urban Scenes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8370--8380} }
Cross-Image-Attention for Conditional Embeddings in Deep Metric Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Kotovenko_2023_CVPR, author = {Kotovenko, Dmytro and Ma, Pingchuan and Milbich, Timo and Ommer, Bj{\"o}rn}, title = {Cross-Image-Attention for Conditional Embeddings in Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11070--11081} }
Enhanced Multimodal Representation Learning With Cross-Modal KD-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Mengxi and Xing, Linyu and Wang, Yu and Zhang, Ya}, title = {Enhanced Multimodal Representation Learning With Cross-Modal {KD}}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11766--11775} }
Learning a Depth Covariance Function-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dexheimer_2023_CVPR, author = {Dexheimer, Eric and Davison, Andrew J.}, title = {Learning a Depth Covariance Function}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13122--13131} }
Evading DeepFake Detectors via Adversarial Statistical Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hou_2023_CVPR, author = {Hou, Yang and Guo, Qing and Huang, Yihao and Xie, Xiaofei and Ma, Lei and Zhao, Jianjun}, title = {Evading {DeepFake} Detectors via Adversarial Statistical Consistency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12271--12280} }
V2V4Real: A Real-World Large-Scale Dataset for Vehicle-to-Vehicle Cooperative Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Runsheng and Xia, Xin and Li, Jinlong and Li, Hanzhao and Zhang, Shuo and Tu, Zhengzhong and Meng, Zonglin and Xiang, Hao and Dong, Xiaoyu and Song, Rui and Yu, Hongkai and Zhou, Bolei and Ma, Jiaqi}, title = {{V2V4Real}: A Real-World Large-Scale Dataset for Vehicle-to-Vehicle Cooperative Perception}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13712--13722} }
RMLVQA: A Margin Loss Approach for Visual Question Answering With Language Biases-
[pdf]
[supp]
[bibtex]@InProceedings{Basu_2023_CVPR, author = {Basu, Abhipsa and Addepalli, Sravanti and Babu, R. Venkatesh}, title = {{RMLVQA}: A Margin Loss Approach for Visual Question Answering With Language Biases}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11671--11680} }
Adaptive Sparse Convolutional Networks With Global Context Enhancement for Faster Object Detection on Drone Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_2023_CVPR, author = {Du, Bowei and Huang, Yecheng and Chen, Jiaxin and Huang, Di}, title = {Adaptive Sparse Convolutional Networks With Global Context Enhancement for Faster Object Detection on Drone Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13435--13444} }
Command-Driven Articulated Object Understanding and Manipulation-
[pdf]
[supp]
[bibtex]@InProceedings{Chu_2023_CVPR, author = {Chu, Ruihang and Liu, Zhengzhe and Ye, Xiaoqing and Tan, Xiao and Qi, Xiaojuan and Fu, Chi-Wing and Jia, Jiaya}, title = {Command-Driven Articulated Object Understanding and Manipulation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {8813--8823} }
ConStruct-VL: Data-Free Continual Structured VL Concepts Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Smith_2023_CVPR, author = {Smith, James Seale and Cascante-Bonilla, Paola and Arbelle, Assaf and Kim, Donghyun and Panda, Rameswar and Cox, David and Yang, Diyi and Kira, Zsolt and Feris, Rogerio and Karlinsky, Leonid}, title = {{ConStruct-VL}: Data-Free Continual Structured {VL} Concepts Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {14994--15004} }
HelixSurf: A Robust and Efficient Neural Implicit Surface Learning of Indoor Scenes With Iterative Intertwined Regularization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_CVPR, author = {Liang, Zhihao and Huang, Zhangjin and Ding, Changxing and Jia, Kui}, title = {{HelixSurf}: A Robust and Efficient Neural Implicit Surface Learning of Indoor Scenes With Iterative Intertwined Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {13165--13174} }
Towards a Smaller Student: Capacity Dynamic Distillation for Efficient Image Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_CVPR, author = {Xie, Yi and Zhang, Huaidong and Xu, Xuemiao and Zhu, Jianqing and He, Shengfeng}, title = {Towards a Smaller Student: Capacity Dynamic Distillation for Efficient Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16006--16015} }
3D-Aware Facial Landmark Detection via Multi-View Consistent Training on Synthetic Data-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2023_CVPR, author = {Zeng, Libing and Chen, Lele and Bao, Wentao and Li, Zhong and Xu, Yi and Yuan, Junsong and Kalantari, Nima Khademi}, title = {{3D}-Aware Facial Landmark Detection via Multi-View Consistent Training on Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12747--12758} }
PC2: Projection-Conditioned Point Cloud Diffusion for Single-Image 3D Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Melas-Kyriazi_2023_CVPR, author = {Melas-Kyriazi, Luke and Rupprecht, Christian and Vedaldi, Andrea}, title = {{PC2}: Projection-Conditioned Point Cloud Diffusion for Single-Image {3D} Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12923--12932} }
Gradient-Based Uncertainty Attribution for Explainable Bayesian Deep Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_CVPR, author = {Wang, Hanjing and Joshi, Dhiraj and Wang, Shiqiang and Ji, Qiang}, title = {Gradient-Based Uncertainty Attribution for Explainable {Bayesian} Deep Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12044--12053} }
Manipulating Transfer Learning for Property Inference-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tian_2023_CVPR, author = {Tian, Yulong and Suya, Fnu and Suri, Anshuman and Xu, Fengyuan and Evans, David}, title = {Manipulating Transfer Learning for Property Inference}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15975--15984} }
Class Adaptive Network Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_CVPR, author = {Liu, Bingyuan and Rony, J{\'e}r{\^o}me and Galdran, Adrian and Dolz, Jose and Ben Ayed, Ismail}, title = {Class Adaptive Network Calibration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16070--16079} }
Evading Forensic Classifiers With Attribute-Conditioned Adversarial Faces-
[pdf]
[supp]
[bibtex]@InProceedings{Shamshad_2023_CVPR, author = {Shamshad, Fahad and Srivatsan, Koushik and Nandakumar, Karthik}, title = {Evading Forensic Classifiers With Attribute-Conditioned Adversarial Faces}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16469--16478} }
OCTET: Object-Aware Counterfactual Explanations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zemni_2023_CVPR, author = {Zemni, Mehdi and Chen, Micka{\"e}l and Zablocki, {\'E}loi and Ben-Younes, H{\'e}di and P{\'e}rez, Patrick and Cord, Matthieu}, title = {{OCTET}: Object-Aware Counterfactual Explanations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15062--15071} }
Polarized Color Image Denoising-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Zhuoxiao and Jiang, Haiyang and Cao, Mingdeng and Zheng, Yinqiang}, title = {Polarized Color Image Denoising}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9873--9882} }
UniDAformer: Unified Domain Adaptive Panoptic Segmentation Transformer via Hierarchical Mask Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_CVPR, author = {Zhang, Jingyi and Huang, Jiaxing and Zhang, Xiaoqin and Lu, Shijian}, title = {{UniDAformer}: Unified Domain Adaptive Panoptic Segmentation Transformer via Hierarchical Mask Calibration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11227--11237} }
Non-Contrastive Learning Meets Language-Image Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_CVPR, author = {Zhou, Jinghao and Dong, Li and Gan, Zhe and Wang, Lijuan and Wei, Furu}, title = {Non-Contrastive Learning Meets Language-Image Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {11028--11038} }
Switchable Representation Learning Framework With Self-Compatibility-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wu_2023_CVPR, author = {Wu, Shengsen and Bai, Yan and Lou, Yihang and Linghu, Xiongkun and He, Jianzhong and Duan, Ling-Yu}, title = {Switchable Representation Learning Framework With Self-Compatibility}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15943--15953} }
Zero-Shot Dual-Lens Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_CVPR, author = {Xu, Ruikang and Yao, Mingde and Xiong, Zhiwei}, title = {Zero-Shot Dual-Lens Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {9130--9139} }
Improving Vision-and-Language Navigation by Generating Future-View Image Semantics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_CVPR, author = {Li, Jialu and Bansal, Mohit}, title = {Improving Vision-and-Language Navigation by Generating Future-View Image Semantics}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {10803--10812} }
gSDF: Geometry-Driven Signed Distance Functions for 3D Hand-Object Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_CVPR, author = {Chen, Zerui and Chen, Shizhe and Schmid, Cordelia and Laptev, Ivan}, title = {{gSDF}: Geometry-Driven Signed Distance Functions for {3D} Hand-Object Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12890--12900} }
CIMI4D: A Large Multimodal Climbing Motion Dataset Under Human-Scene Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2023_CVPR, author = {Yan, Ming and Wang, Xin and Dai, Yudi and Shen, Siqi and Wen, Chenglu and Xu, Lan and Ma, Yuexin and Wang, Cheng}, title = {{CIMI4D}: A Large Multimodal Climbing Motion Dataset Under Human-Scene Interactions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12977--12988} }
Modernizing Old Photos Using Multiple References via Photorealistic Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gunawan_2023_CVPR, author = {Gunawan, Agus and Kim, Soo Ye and Sim, Hyeonjun and Lee, Jae-Ho and Kim, Munchurl}, title = {Modernizing Old Photos Using Multiple References via Photorealistic Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {12460--12469} }
Curvature-Balanced Feature Manifold Learning for Long-Tailed Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_CVPR, author = {Ma, Yanbiao and Jiao, Licheng and Liu, Fang and Yang, Shuyuan and Liu, Xu and Li, Lingling}, title = {Curvature-Balanced Feature Manifold Learning for Long-Tailed Classification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {15824--15835} }
Back