CVPR 2023 Open Access Repository

Papers

Back
Revisiting Self-Similarity: Structural Embedding for Image Retrieval: Seongwon Lee,

Suhyeon Lee,

Hongje Seong,

Euntai Kim; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Seongwon and Lee, Suhyeon and Seong, Hongje and Kim, Euntai},
  title     = {Revisiting Self-Similarity: Structural Embedding for Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23412--23421}
}
Decoupling-and-Aggregating for Image Exposure Correction: Yang Wang,

Long Peng,

Liang Li,

Yang Cao,

Zheng-Jun Zha; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yang and Peng, Long and Li, Liang and Cao, Yang and Zha, Zheng-Jun},
  title     = {Decoupling-and-Aggregating for Image Exposure Correction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18115--18124}
}
MSeg3D: Multi-Modal 3D Semantic Segmentation for Autonomous Driving: Jiale Li,

Hang Dai,

Hao Han,

Yong Ding; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jiale and Dai, Hang and Han, Hao and Ding, Yong},
  title     = {{MSeg3D}: Multi-Modal {3D} Semantic Segmentation for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21694--21704}
}
Dynamically Instance-Guided Adaptation: A Backward-Free Approach for Test-Time Domain Adaptive Semantic Segmentation: Wei Wang,

Zhun Zhong,

Weijie Wang,

Xi Chen,

Charles Ling,

Boyu Wang,

Nicu Sebe; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Wei and Zhong, Zhun and Wang, Weijie and Chen, Xi and Ling, Charles and Wang, Boyu and Sebe, Nicu},
  title     = {Dynamically Instance-Guided Adaptation: A Backward-Free Approach for Test-Time Domain Adaptive Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24090--24099}
}
LANIT: Language-Driven Image-to-Image Translation for Unlabeled Data: Jihye Park,

Sunwoo Kim,

Soohyun Kim,

Seokju Cho,

Jaejun Yoo,

Youngjung Uh,

Seungryong Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_CVPR,
  author    = {Park, Jihye and Kim, Sunwoo and Kim, Soohyun and Cho, Seokju and Yoo, Jaejun and Uh, Youngjung and Kim, Seungryong},
  title     = {{LANIT}: Language-Driven Image-to-Image Translation for Unlabeled Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23401--23411}
}
MoLo: Motion-Augmented Long-Short Contrastive Learning for Few-Shot Action Recognition: Xiang Wang,

Shiwei Zhang,

Zhiwu Qing,

Changxin Gao,

Yingya Zhang,

Deli Zhao,

Nong Sang; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Xiang and Zhang, Shiwei and Qing, Zhiwu and Gao, Changxin and Zhang, Yingya and Zhao, Deli and Sang, Nong},
  title     = {{MoLo}: Motion-Augmented Long-Short Contrastive Learning for Few-Shot Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18011--18021}
}
Text-Guided Unsupervised Latent Transformation for Multi-Attribute Image Manipulation: Xiwen Wei,

Zhen Xu,

Cheng Liu,

Si Wu,

Zhiwen Yu,

Hau San Wong; [pdf]
[bibtex]
@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Xiwen and Xu, Zhen and Liu, Cheng and Wu, Si and Yu, Zhiwen and Wong, Hau San},
  title     = {Text-Guided Unsupervised Latent Transformation for Multi-Attribute Image Manipulation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19285--19294}
}
Contrastive Semi-Supervised Learning for Underwater Image Restoration via Reliable Bank: Shirui Huang,

Keyan Wang,

Huan Liu,

Jun Chen,

Yunsong Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Shirui and Wang, Keyan and Liu, Huan and Chen, Jun and Li, Yunsong},
  title     = {Contrastive Semi-Supervised Learning for Underwater Image Restoration via Reliable Bank},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18145--18155}
}
Multiclass Confidence and Localization Calibration for Object Detection: Bimsara Pathiraja,

Malitha Gunawardhana,

Muhammad Haris Khan; [pdf] [supp]
[bibtex]
@InProceedings{Pathiraja_2023_CVPR,
  author    = {Pathiraja, Bimsara and Gunawardhana, Malitha and Khan, Muhammad Haris},
  title     = {Multiclass Confidence and Localization Calibration for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19734--19743}
}
Query-Dependent Video Representation for Moment Retrieval and Highlight Detection: WonJun Moon,

Sangeek Hyun,

SangUk Park,

Dongchan Park,

Jae-Pil Heo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moon_2023_CVPR,
  author    = {Moon, WonJun and Hyun, Sangeek and Park, SangUk and Park, Dongchan and Heo, Jae-Pil},
  title     = {Query-Dependent Video Representation for Moment Retrieval and Highlight Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23023--23033}
}
Instance-Specific and Model-Adaptive Supervision for Semi-Supervised Semantic Segmentation: Zhen Zhao,

Sifan Long,

Jimin Pi,

Jingdong Wang,

Luping Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Zhen and Long, Sifan and Pi, Jimin and Wang, Jingdong and Zhou, Luping},
  title     = {Instance-Specific and Model-Adaptive Supervision for Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23705--23714}
}
X-Pruner: eXplainable Pruning for Vision Transformers: Lu Yu,

Wei Xiang; [pdf]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Lu and Xiang, Wei},
  title     = {{X-Pruner}: {eXplainable} Pruning for Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24355--24363}
}
Hard Sample Matters a Lot in Zero-Shot Quantization: Huantong Li,

Xiangmiao Wu,

Fanbing Lv,

Daihai Liao,

Thomas H. Li,

Yonggang Zhang,

Bo Han,

Mingkui Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Huantong and Wu, Xiangmiao and Lv, Fanbing and Liao, Daihai and Li, Thomas H. and Zhang, Yonggang and Han, Bo and Tan, Mingkui},
  title     = {Hard Sample Matters a Lot in Zero-Shot Quantization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24417--24426}
}
Meta Compositional Referring Expression Segmentation: Li Xu,

Mark He Huang,

Xindi Shang,

Zehuan Yuan,

Ying Sun,

Jun Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Li and Huang, Mark He and Shang, Xindi and Yuan, Zehuan and Sun, Ying and Liu, Jun},
  title     = {Meta Compositional Referring Expression Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19478--19487}
}
A Light Weight Model for Active Speaker Detection: Junhua Liao,

Haihan Duan,

Kanghui Feng,

Wanbing Zhao,

Yanbing Yang,

Liangyin Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Liao_2023_CVPR,
  author    = {Liao, Junhua and Duan, Haihan and Feng, Kanghui and Zhao, Wanbing and Yang, Yanbing and Chen, Liangyin},
  title     = {A Light Weight Model for Active Speaker Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22932--22941}
}
GCFAgg: Global and Cross-View Feature Aggregation for Multi-View Clustering: Weiqing Yan,

Yuanyang Zhang,

Chenlei Lv,

Chang Tang,

Guanghui Yue,

Liang Liao,

Weisi Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2023_CVPR,
  author    = {Yan, Weiqing and Zhang, Yuanyang and Lv, Chenlei and Tang, Chang and Yue, Guanghui and Liao, Liang and Lin, Weisi},
  title     = {{GCFAgg}: Global and Cross-View Feature Aggregation for Multi-View Clustering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19863--19872}
}
DeGPR: Deep Guided Posterior Regularization for Multi-Class Cell Detection and Counting: Aayush Kumar Tyagi,

Chirag Mohapatra,

Prasenjit Das,

Govind Makharia,

Lalita Mehra,

Prathosh AP,

Mausam; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tyagi_2023_CVPR,
  author    = {Tyagi, Aayush Kumar and Mohapatra, Chirag and Das, Prasenjit and Makharia, Govind and Mehra, Lalita and AP, Prathosh and Mausam},
  title     = {{DeGPR}: Deep Guided Posterior Regularization for Multi-Class Cell Detection and Counting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23913--23923}
}
SliceMatch: Geometry-Guided Aggregation for Cross-View Pose Estimation: Ted Lentsch,

Zimin Xia,

Holger Caesar,

Julian F. P. Kooij; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lentsch_2023_CVPR,
  author    = {Lentsch, Ted and Xia, Zimin and Caesar, Holger and Kooij, Julian F. P.},
  title     = {{SliceMatch}: Geometry-Guided Aggregation for Cross-View Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17225--17234}
}
Single View Scene Scale Estimation Using Scale Field: Byeong-Uk Lee,

Jianming Zhang,

Yannick Hold-Geoffroy,

In So Kweon; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Byeong-Uk and Zhang, Jianming and Hold-Geoffroy, Yannick and Kweon, In So},
  title     = {Single View Scene Scale Estimation Using Scale Field},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21435--21444}
}
Learning Semantic-Aware Disentangled Representation for Flexible 3D Human Body Editing: Xiaokun Sun,

Qiao Feng,

Xiongzheng Li,

Jinsong Zhang,

Yu-Kun Lai,

Jingyu Yang,

Kun Li; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Xiaokun and Feng, Qiao and Li, Xiongzheng and Zhang, Jinsong and Lai, Yu-Kun and Yang, Jingyu and Li, Kun},
  title     = {Learning Semantic-Aware Disentangled Representation for Flexible {3D} Human Body Editing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16985--16994}
}
Generating Features With Increased Crop-Related Diversity for Few-Shot Object Detection: Jingyi Xu,

Hieu Le,

Dimitris Samaras; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Jingyi and Le, Hieu and Samaras, Dimitris},
  title     = {Generating Features With Increased Crop-Related Diversity for Few-Shot Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19713--19722}
}
Towards Compositional Adversarial Robustness: Generalizing Adversarial Training to Composite Semantic Perturbations: Lei Hsiung,

Yun-Yun Tsai,

Pin-Yu Chen,

Tsung-Yi Ho; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hsiung_2023_CVPR,
  author    = {Hsiung, Lei and Tsai, Yun-Yun and Chen, Pin-Yu and Ho, Tsung-Yi},
  title     = {Towards Compositional Adversarial Robustness: Generalizing Adversarial Training to Composite Semantic Perturbations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24658--24667}
}
CVT-SLR: Contrastive Visual-Textual Transformation for Sign Language Recognition With Variational Alignment: Jiangbin Zheng,

Yile Wang,

Cheng Tan,

Siyuan Li,

Ge Wang,

Jun Xia,

Yidong Chen,

Stan Z. Li; [pdf]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Jiangbin and Wang, Yile and Tan, Cheng and Li, Siyuan and Wang, Ge and Xia, Jun and Chen, Yidong and Li, Stan Z.},
  title     = {{CVT-SLR}: Contrastive Visual-Textual Transformation for Sign Language Recognition With Variational Alignment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23141--23150}
}
Paint by Example: Exemplar-Based Image Editing With Diffusion Models: Binxin Yang,

Shuyang Gu,

Bo Zhang,

Ting Zhang,

Xuejin Chen,

Xiaoyan Sun,

Dong Chen,

Fang Wen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Binxin and Gu, Shuyang and Zhang, Bo and Zhang, Ting and Chen, Xuejin and Sun, Xiaoyan and Chen, Dong and Wen, Fang},
  title     = {Paint by Example: Exemplar-Based Image Editing With Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18381--18391}
}
Ego-Body Pose Estimation via Ego-Head Pose Estimation: Jiaman Li,

Karen Liu,

Jiajun Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jiaman and Liu, Karen and Wu, Jiajun},
  title     = {Ego-Body Pose Estimation via Ego-Head Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17142--17151}
}
Learning Rotation-Equivariant Features for Visual Correspondence: Jongmin Lee,

Byungjin Kim,

Seungwook Kim,

Minsu Cho; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Jongmin and Kim, Byungjin and Kim, Seungwook and Cho, Minsu},
  title     = {Learning Rotation-Equivariant Features for Visual Correspondence},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21887--21897}
}
DexArt: Benchmarking Generalizable Dexterous Manipulation With Articulated Objects: Chen Bao,

Helin Xu,

Yuzhe Qin,

Xiaolong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2023_CVPR,
  author    = {Bao, Chen and Xu, Helin and Qin, Yuzhe and Wang, Xiaolong},
  title     = {{DexArt}: Benchmarking Generalizable Dexterous Manipulation With Articulated Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21190--21200}
}
You Do Not Need Additional Priors or Regularizers in Retinex-Based Low-Light Image Enhancement: Huiyuan Fu,

Wenkai Zheng,

Xiangyu Meng,

Xin Wang,

Chuanming Wang,

Huadong Ma; [pdf]
[bibtex]
@InProceedings{Fu_2023_CVPR,
  author    = {Fu, Huiyuan and Zheng, Wenkai and Meng, Xiangyu and Wang, Xin and Wang, Chuanming and Ma, Huadong},
  title     = {You Do Not Need Additional Priors or Regularizers in {Retinex}-Based Low-Light Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18125--18134}
}
SCADE: NeRFs from Space Carving With Ambiguity-Aware Depth Estimates: Mikaela Angelina Uy,

Ricardo Martin-Brualla,

Leonidas Guibas,

Ke Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Uy_2023_CVPR,
  author    = {Uy, Mikaela Angelina and Martin-Brualla, Ricardo and Guibas, Leonidas and Li, Ke},
  title     = {{SCADE}: {NeRFs} from Space Carving With Ambiguity-Aware Depth Estimates},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16518--16527}
}
1% VS 100%: Parameter-Efficient Low Rank Adapter for Dense Predictions: Dongshuo Yin,

Yiran Yang,

Zhechao Wang,

Hongfeng Yu,

Kaiwen Wei,

Xian Sun; [pdf]
[bibtex]
@InProceedings{Yin_2023_CVPR,
  author    = {Yin, Dongshuo and Yang, Yiran and Wang, Zhechao and Yu, Hongfeng and Wei, Kaiwen and Sun, Xian},
  title     = {1\% {VS} 100\%: Parameter-Efficient Low Rank Adapter for Dense Predictions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20116--20126}
}
ResFormer: Scaling ViTs With Multi-Resolution Training: Rui Tian,

Zuxuan Wu,

Qi Dai,

Han Hu,

Yu Qiao,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tian_2023_CVPR,
  author    = {Tian, Rui and Wu, Zuxuan and Dai, Qi and Hu, Han and Qiao, Yu and Jiang, Yu-Gang},
  title     = {{ResFormer}: Scaling {ViTs} With Multi-Resolution Training},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22721--22731}
}
Hierarchical Video-Moment Retrieval and Step-Captioning: Abhay Zala,

Jaemin Cho,

Satwik Kottur,

Xilun Chen,

Barlas Oguz,

Yashar Mehdad,

Mohit Bansal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zala_2023_CVPR,
  author    = {Zala, Abhay and Cho, Jaemin and Kottur, Satwik and Chen, Xilun and Oguz, Barlas and Mehdad, Yashar and Bansal, Mohit},
  title     = {Hierarchical Video-Moment Retrieval and Step-Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23056--23065}
}
PD-Quant: Post-Training Quantization Based on Prediction Difference Metric: Jiawei Liu,

Lin Niu,

Zhihang Yuan,

Dawei Yang,

Xinggang Wang,

Wenyu Liu; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Jiawei and Niu, Lin and Yuan, Zhihang and Yang, Dawei and Wang, Xinggang and Liu, Wenyu},
  title     = {{PD-Quant}: Post-Training Quantization Based on Prediction Difference Metric},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24427--24437}
}
AUNet: Learning Relations Between Action Units for Face Forgery Detection: Weiming Bai,

Yufan Liu,

Zhipeng Zhang,

Bing Li,

Weiming Hu; [pdf] [supp]
[bibtex]
@InProceedings{Bai_2023_CVPR,
  author    = {Bai, Weiming and Liu, Yufan and Zhang, Zhipeng and Li, Bing and Hu, Weiming},
  title     = {{AUNet}: Learning Relations Between Action Units for Face Forgery Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24709--24719}
}
PolyFormer: Referring Image Segmentation As Sequential Polygon Generation: Jiang Liu,

Hui Ding,

Zhaowei Cai,

Yuting Zhang,

Ravi Kumar Satzoda,

Vijay Mahadevan,

R. Manmatha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Jiang and Ding, Hui and Cai, Zhaowei and Zhang, Yuting and Satzoda, Ravi Kumar and Mahadevan, Vijay and Manmatha, R.},
  title     = {{PolyFormer}: Referring Image Segmentation As Sequential Polygon Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18653--18663}
}
Interactive Segmentation As Gaussion Process Classification: Minghao Zhou,

Hong Wang,

Qian Zhao,

Yuexiang Li,

Yawen Huang,

Deyu Meng,

Yefeng Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Minghao and Wang, Hong and Zhao, Qian and Li, Yuexiang and Huang, Yawen and Meng, Deyu and Zheng, Yefeng},
  title     = {Interactive Segmentation As {Gaussion} Process Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19488--19497}
}
A Practical Stereo Depth System for Smart Glasses: Jialiang Wang,

Daniel Scharstein,

Akash Bapat,

Kevin Blackburn-Matzen,

Matthew Yu,

Jonathan Lehman,

Suhib Alsisan,

Yanghan Wang,

Sam Tsai,

Jan-Michael Frahm,

Zijian He,

Peter Vajda,

Michael F. Cohen,

Matt Uyttendaele; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Jialiang and Scharstein, Daniel and Bapat, Akash and Blackburn-Matzen, Kevin and Yu, Matthew and Lehman, Jonathan and Alsisan, Suhib and Wang, Yanghan and Tsai, Sam and Frahm, Jan-Michael and He, Zijian and Vajda, Peter and Cohen, Michael F. and Uyttendaele, Matt},
  title     = {A Practical Stereo Depth System for Smart Glasses},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21498--21507}
}
PointConvFormer: Revenge of the Point-Based Convolution: Wenxuan Wu,

Li Fuxin,

Qi Shan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Wenxuan and Fuxin, Li and Shan, Qi},
  title     = {{PointConvFormer}: Revenge of the Point-Based Convolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21802--21813}
}
Variational Distribution Learning for Unsupervised Text-to-Image Generation: Minsoo Kang,

Doyup Lee,

Jiseob Kim,

Saehoon Kim,

Bohyung Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2023_CVPR,
  author    = {Kang, Minsoo and Lee, Doyup and Kim, Jiseob and Kim, Saehoon and Han, Bohyung},
  title     = {Variational Distribution Learning for Unsupervised Text-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23380--23389}
}
MetaMix: Towards Corruption-Robust Continual Learning With Temporally Self-Adaptive Data Transformation: Zhenyi Wang,

Li Shen,

Donglin Zhan,

Qiuling Suo,

Yanjun Zhu,

Tiehang Duan,

Mingchen Gao; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Zhenyi and Shen, Li and Zhan, Donglin and Suo, Qiuling and Zhu, Yanjun and Duan, Tiehang and Gao, Mingchen},
  title     = {{MetaMix}: Towards Corruption-Robust Continual Learning With Temporally Self-Adaptive Data Transformation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24521--24531}
}
Ultra-High Resolution Segmentation With Ultra-Rich Context: A Novel Benchmark: Deyi Ji,

Feng Zhao,

Hongtao Lu,

Mingyuan Tao,

Jieping Ye; [pdf] [arXiv]
[bibtex]
@InProceedings{Ji_2023_CVPR,
  author    = {Ji, Deyi and Zhao, Feng and Lu, Hongtao and Tao, Mingyuan and Ye, Jieping},
  title     = {Ultra-High Resolution Segmentation With Ultra-Rich Context: A Novel Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23621--23630}
}
Accelerating Vision-Language Pretraining With Free Language Modeling: Teng Wang,

Yixiao Ge,

Feng Zheng,

Ran Cheng,

Ying Shan,

Xiaohu Qie,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Teng and Ge, Yixiao and Zheng, Feng and Cheng, Ran and Shan, Ying and Qie, Xiaohu and Luo, Ping},
  title     = {Accelerating Vision-Language Pretraining With Free Language Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23161--23170}
}
Efficient Mask Correction for Click-Based Interactive Image Segmentation: Fei Du,

Jianlong Yuan,

Zhibin Wang,

Fan Wang; [pdf] [supp]
[bibtex]
@InProceedings{Du_2023_CVPR,
  author    = {Du, Fei and Yuan, Jianlong and Wang, Zhibin and Wang, Fan},
  title     = {Efficient Mask Correction for Click-Based Interactive Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22773--22782}
}
Graphics Capsule: Learning Hierarchical 3D Face Representations From 2D Images: Chang Yu,

Xiangyu Zhu,

Xiaomei Zhang,

Zhaoxiang Zhang,

Zhen Lei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Chang and Zhu, Xiangyu and Zhang, Xiaomei and Zhang, Zhaoxiang and Lei, Zhen},
  title     = {Graphics Capsule: Learning Hierarchical {3D} Face Representations From {2D} Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20981--20990}
}
Masked Autoencoders Enable Efficient Knowledge Distillers: Yutong Bai,

Zeyu Wang,

Junfei Xiao,

Chen Wei,

Huiyu Wang,

Alan L. Yuille,

Yuyin Zhou,

Cihang Xie; [pdf] [arXiv]
[bibtex]
@InProceedings{Bai_2023_CVPR,
  author    = {Bai, Yutong and Wang, Zeyu and Xiao, Junfei and Wei, Chen and Wang, Huiyu and Yuille, Alan L. and Zhou, Yuyin and Xie, Cihang},
  title     = {Masked Autoencoders Enable Efficient Knowledge Distillers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24256--24265}
}
Persistent Nature: A Generative Model of Unbounded 3D Worlds: Lucy Chai,

Richard Tucker,

Zhengqi Li,

Phillip Isola,

Noah Snavely; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chai_2023_CVPR,
  author    = {Chai, Lucy and Tucker, Richard and Li, Zhengqi and Isola, Phillip and Snavely, Noah},
  title     = {Persistent Nature: A Generative Model of Unbounded {3D} Worlds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20863--20874}
}
Hierarchical Neural Memory Network for Low Latency Event Processing: Ryuhei Hamaguchi,

Yasutaka Furukawa,

Masaki Onishi,

Ken Sakurada; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hamaguchi_2023_CVPR,
  author    = {Hamaguchi, Ryuhei and Furukawa, Yasutaka and Onishi, Masaki and Sakurada, Ken},
  title     = {Hierarchical Neural Memory Network for Low Latency Event Processing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22867--22876}
}
DaFKD: Domain-Aware Federated Knowledge Distillation: Haozhao Wang,

Yichen Li,

Wenchao Xu,

Ruixuan Li,

Yufeng Zhan,

Zhigang Zeng; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Haozhao and Li, Yichen and Xu, Wenchao and Li, Ruixuan and Zhan, Yufeng and Zeng, Zhigang},
  title     = {{DaFKD}: Domain-Aware Federated Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20412--20421}
}
Boost Vision Transformer With GPU-Friendly Sparsity and Quantization: Chong Yu,

Tao Chen,

Zhongxue Gan,

Jiayuan Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Chong and Chen, Tao and Gan, Zhongxue and Fan, Jiayuan},
  title     = {Boost Vision Transformer With {GPU}-Friendly Sparsity and Quantization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22658--22668}
}
Spectral Bayesian Uncertainty for Image Super-Resolution: Tao Liu,

Jun Cheng,

Shan Tan; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Tao and Cheng, Jun and Tan, Shan},
  title     = {Spectral {Bayesian} Uncertainty for Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18166--18175}
}
Mutual Information-Based Temporal Difference Learning for Human Pose Estimation in Video: Runyang Feng,

Yixing Gao,

Xueqing Ma,

Tze Ho Elden Tse,

Hyung Jin Chang; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2023_CVPR,
  author    = {Feng, Runyang and Gao, Yixing and Ma, Xueqing and Tse, Tze Ho Elden and Chang, Hyung Jin},
  title     = {Mutual Information-Based Temporal Difference Learning for Human Pose Estimation in Video},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17131--17141}
}
SynthVSR: Scaling Up Visual Speech Recognition With Synthetic Supervision: Xubo Liu,

Egor Lakomkin,

Konstantinos Vougioukas,

Pingchuan Ma,

Honglie Chen,

Ruiming Xie,

Morrie Doulaty,

Niko Moritz,

Jachym Kolar,

Stavros Petridis,

Maja Pantic,

Christian Fuegen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xubo and Lakomkin, Egor and Vougioukas, Konstantinos and Ma, Pingchuan and Chen, Honglie and Xie, Ruiming and Doulaty, Morrie and Moritz, Niko and Kolar, Jachym and Petridis, Stavros and Pantic, Maja and Fuegen, Christian},
  title     = {{SynthVSR}: Scaling Up Visual Speech Recognition With Synthetic Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18806--18815}
}
BiasBed - Rigorous Texture Bias Evaluation: Nikolai Kalischek,

Rodrigo Caye Daudt,

Torben Peters,

Reinhard Furrer,

Jan D. Wegner,

Konrad Schindler; [pdf] [supp]
[bibtex]
@InProceedings{Kalischek_2023_CVPR,
  author    = {Kalischek, Nikolai and Daudt, Rodrigo Caye and Peters, Torben and Furrer, Reinhard and Wegner, Jan D. and Schindler, Konrad},
  title     = {{BiasBed} - Rigorous Texture Bias Evaluation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22221--22230}
}
Open-Category Human-Object Interaction Pre-Training via Language Modeling Framework: Sipeng Zheng,

Boshen Xu,

Qin Jin; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Sipeng and Xu, Boshen and Jin, Qin},
  title     = {Open-Category Human-Object Interaction Pre-Training via Language Modeling Framework},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19392--19402}
}
Explicit Boundary Guided Semi-Push-Pull Contrastive Learning for Supervised Anomaly Detection: Xincheng Yao,

Ruoqi Li,

Jing Zhang,

Jun Sun,

Chongyang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yao_2023_CVPR,
  author    = {Yao, Xincheng and Li, Ruoqi and Zhang, Jing and Sun, Jun and Zhang, Chongyang},
  title     = {Explicit Boundary Guided Semi-Push-Pull Contrastive Learning for Supervised Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24490--24499}
}
DeCo: Decomposition and Reconstruction for Compositional Temporal Grounding via Coarse-To-Fine Contrastive Ranking: Lijin Yang,

Quan Kong,

Hsuan-Kung Yang,

Wadim Kehl,

Yoichi Sato,

Norimasa Kobori; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Lijin and Kong, Quan and Yang, Hsuan-Kung and Kehl, Wadim and Sato, Yoichi and Kobori, Norimasa},
  title     = {{DeCo}: Decomposition and Reconstruction for Compositional Temporal Grounding via Coarse-To-Fine Contrastive Ranking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23130--23140}
}
Dynamic Aggregated Network for Gait Recognition: Kang Ma,

Ying Fu,

Dezhi Zheng,

Chunshui Cao,

Xuecai Hu,

Yongzhen Huang; [pdf]
[bibtex]
@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Kang and Fu, Ying and Zheng, Dezhi and Cao, Chunshui and Hu, Xuecai and Huang, Yongzhen},
  title     = {Dynamic Aggregated Network for Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22076--22085}
}
Sphere-Guided Training of Neural Implicit Surfaces: Andreea Dogaru,

Andrei-Timotei Ardelean,

Savva Ignatyev,

Egor Zakharov,

Evgeny Burnaev; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dogaru_2023_CVPR,
    author    = {Dogaru, Andreea and Ardelean, Andrei-Timotei and Ignatyev, Savva and Zakharov, Egor and Burnaev, Evgeny},
    title     = {Sphere-Guided Training of Neural Implicit Surfaces},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20844--20853}
}
Bias Mimicking: A Simple Sampling Approach for Bias Mitigation: Maan Qraitem,

Kate Saenko,

Bryan A. Plummer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qraitem_2023_CVPR,
    author    = {Qraitem, Maan and Saenko, Kate and Plummer, Bryan A.},
    title     = {Bias Mimicking: A Simple Sampling Approach for Bias Mitigation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20311--20320}
}
NoisyQuant: Noisy Bias-Enhanced Post-Training Activation Quantization for Vision Transformers: Yijiang Liu,

Huanrui Yang,

Zhen Dong,

Kurt Keutzer,

Li Du,

Shanghang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
    author    = {Liu, Yijiang and Yang, Huanrui and Dong, Zhen and Keutzer, Kurt and Du, Li and Zhang, Shanghang},
    title     = {{NoisyQuant}: Noisy Bias-Enhanced Post-Training Activation Quantization for Vision Transformers},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20321--20330}
}
Semi-Supervised Stereo-Based 3D Object Detection via Cross-View Consensus: Wenhao Wu,

Hau San Wong,

Si Wu; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_CVPR,
    author    = {Wu, Wenhao and Wong, Hau San and Wu, Si},
    title     = {Semi-Supervised Stereo-Based {3D} Object Detection via Cross-View Consensus},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17471--17481}
}
Video Compression With Entropy-Constrained Neural Representations: Carlos Gomes,

Roberto Azevedo,

Christopher Schroers; [pdf] [supp]
[bibtex]
@InProceedings{Gomes_2023_CVPR,
    author    = {Gomes, Carlos and Azevedo, Roberto and Schroers, Christopher},
    title     = {Video Compression With Entropy-Constrained Neural Representations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18497--18506}
}
Deep Random Projector: Accelerated Deep Image Prior: Taihui Li,

Hengkang Wang,

Zhong Zhuang,

Ju Sun; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
    author    = {Li, Taihui and Wang, Hengkang and Zhuang, Zhong and Sun, Ju},
    title     = {Deep Random Projector: Accelerated Deep Image Prior},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18176--18185}
}
SCPNet: Semantic Scene Completion on Point Cloud: Zhaoyang Xia,

Youquan Liu,

Xin Li,

Xinge Zhu,

Yuexin Ma,

Yikang Li,

Yuenan Hou,

Yu Qiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_CVPR,
    author    = {Xia, Zhaoyang and Liu, Youquan and Li, Xin and Zhu, Xinge and Ma, Yuexin and Li, Yikang and Hou, Yuenan and Qiao, Yu},
    title     = {{SCPNet}: Semantic Scene Completion on Point Cloud},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17642--17651}
}
Revisiting Prototypical Network for Cross Domain Few-Shot Learning: Fei Zhou,

Peng Wang,

Lei Zhang,

Wei Wei,

Yanning Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
    author    = {Zhou, Fei and Wang, Peng and Zhang, Lei and Wei, Wei and Zhang, Yanning},
    title     = {Revisiting Prototypical Network for Cross Domain Few-Shot Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20061--20070}
}
Learning Accurate 3D Shape Based on Stereo Polarimetric Imaging: Tianyu Huang,

Haoang Li,

Kejing He,

Congying Sui,

Bin Li,

Yun-Hui Liu; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_CVPR,
    author    = {Huang, Tianyu and Li, Haoang and He, Kejing and Sui, Congying and Li, Bin and Liu, Yun-Hui},
    title     = {Learning Accurate {3D} Shape Based on Stereo Polarimetric Imaging},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17287--17296}
}
RA-CLIP: Retrieval Augmented Contrastive Language-Image Pre-Training: Chen-Wei Xie,

Siyang Sun,

Xiong Xiong,

Yun Zheng,

Deli Zhao,

Jingren Zhou; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_CVPR,
    author    = {Xie, Chen-Wei and Sun, Siyang and Xiong, Xiong and Zheng, Yun and Zhao, Deli and Zhou, Jingren},
    title     = {{RA-CLIP}: Retrieval Augmented Contrastive Language-Image Pre-Training},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19265--19274}
}
A Practical Upper Bound for the Worst-Case Attribution Deviations: Fan Wang,

Adams Wai-Kin Kong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
    author    = {Wang, Fan and Kong, Adams Wai-Kin},
    title     = {A Practical Upper Bound for the Worst-Case Attribution Deviations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {24616--24625}
}
Teacher-Generated Spatial-Attention Labels Boost Robustness and Accuracy of Contrastive Models: Yushi Yao,

Chang Ye,

Junfeng He,

Gamaleldin F. Elsayed; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_CVPR,
    author    = {Yao, Yushi and Ye, Chang and He, Junfeng and Elsayed, Gamaleldin F.},
    title     = {Teacher-Generated Spatial-Attention Labels Boost Robustness and Accuracy of Contrastive Models},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {23282--23291}
}
Exploring and Exploiting Uncertainty for Incomplete Multi-View Classification: Mengyao Xie,

Zongbo Han,

Changqing Zhang,

Yichen Bai,

Qinghua Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_CVPR,
    author    = {Xie, Mengyao and Han, Zongbo and Zhang, Changqing and Bai, Yichen and Hu, Qinghua},
    title     = {Exploring and Exploiting Uncertainty for Incomplete Multi-View Classification},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19873--19882}
}
Discovering the Real Association: Multimodal Causal Reasoning in Video Question Answering: Chuanqi Zang,

Hanqing Wang,

Mingtao Pei,

Wei Liang; [pdf] [supp]
[bibtex]
@InProceedings{Zang_2023_CVPR,
    author    = {Zang, Chuanqi and Wang, Hanqing and Pei, Mingtao and Liang, Wei},
    title     = {Discovering the Real Association: Multimodal Causal Reasoning in Video Question Answering},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19027--19036}
}
Learning Transformations To Reduce the Geometric Shift in Object Detection: Vidit Vidit,

Martin Engilberge,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vidit_2023_CVPR,
    author    = {Vidit, Vidit and Engilberge, Martin and Salzmann, Mathieu},
    title     = {Learning Transformations To Reduce the Geometric Shift in Object Detection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17441--17450}
}
OReX: Object Reconstruction From Planar Cross-Sections Using Neural Fields: Haim Sawdayee,

Amir Vaxman,

Amit H. Bermano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sawdayee_2023_CVPR,
    author    = {Sawdayee, Haim and Vaxman, Amir and Bermano, Amit H.},
    title     = {{OReX}: Object Reconstruction From Planar Cross-Sections Using Neural Fields},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20854--20862}
}
SPIn-NeRF: Multiview Segmentation and Perceptual Inpainting With Neural Radiance Fields: Ashkan Mirzaei,

Tristan Aumentado-Armstrong,

Konstantinos G. Derpanis,

Jonathan Kelly,

Marcus A. Brubaker,

Igor Gilitschenski,

Alex Levinshtein; [pdf] [supp]
[bibtex]
@InProceedings{Mirzaei_2023_CVPR,
    author    = {Mirzaei, Ashkan and Aumentado-Armstrong, Tristan and Derpanis, Konstantinos G. and Kelly, Jonathan and Brubaker, Marcus A. and Gilitschenski, Igor and Levinshtein, Alex},
    title     = {{SPIn-NeRF}: Multiview Segmentation and Perceptual Inpainting With Neural Radiance Fields},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20669--20679}
}
Revisiting Rotation Averaging: Uncertainties and Robust Losses: Ganlin Zhang,

Viktor Larsson,

Daniel Barath; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
    author    = {Zhang, Ganlin and Larsson, Viktor and Barath, Daniel},
    title     = {Revisiting Rotation Averaging: Uncertainties and Robust Losses},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17215--17224}
}
Patch-Based 3D Natural Scene Generation From a Single Example: Weiyu Li,

Xuelin Chen,

Jue Wang,

Baoquan Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
    author    = {Li, Weiyu and Chen, Xuelin and Wang, Jue and Chen, Baoquan},
    title     = {Patch-Based {3D} Natural Scene Generation From a Single Example},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {16762--16772}
}
Leveraging Hidden Positives for Unsupervised Semantic Segmentation: Hyun Seok Seong,

WonJun Moon,

SuBeen Lee,

Jae-Pil Heo; [pdf] [arXiv]
[bibtex]
@InProceedings{Seong_2023_CVPR,
    author    = {Seong, Hyun Seok and Moon, WonJun and Lee, SuBeen and Heo, Jae-Pil},
    title     = {Leveraging Hidden Positives for Unsupervised Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19540--19549}
}
LG-BPN: Local and Global Blind-Patch Network for Self-Supervised Real-World Denoising: Zichun Wang,

Ying Fu,

Ji Liu,

Yulun Zhang; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR,
    author    = {Wang, Zichun and Fu, Ying and Liu, Ji and Zhang, Yulun},
    title     = {{LG-BPN}: Local and Global Blind-Patch Network for Self-Supervised Real-World Denoising},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18156--18165}
}
Efficient View Synthesis and 3D-Based Multi-Frame Denoising With Multiplane Feature Representations: Thomas Tanay,

Aleš Leonardis,

Matteo Maggioni; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tanay_2023_CVPR,
    author    = {Tanay, Thomas and Leonardis, Ale{\v{s}} and Maggioni, Matteo},
    title     = {Efficient View Synthesis and {3D}-Based Multi-Frame Denoising With Multiplane Feature Representations},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20898--20907}
}
Model Barrier: A Compact Un-Transferable Isolation Domain for Model Intellectual Property Protection: Lianyu Wang,

Meng Wang,

Daoqiang Zhang,

Huazhu Fu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
    author    = {Wang, Lianyu and Wang, Meng and Zhang, Daoqiang and Fu, Huazhu},
    title     = {Model Barrier: A Compact Un-Transferable Isolation Domain for Model Intellectual Property Protection},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20475--20484}
}
Object Detection With Self-Supervised Scene Adaptation: Zekun Zhang,

Minh Hoai; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
    author    = {Zhang, Zekun and Hoai, Minh},
    title     = {Object Detection With Self-Supervised Scene Adaptation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21589--21599}
}
Self-Positioning Point-Based Transformer for Point Cloud Understanding: Jinyoung Park,

Sanghyeok Lee,

Sihyeon Kim,

Yunyang Xiong,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_CVPR,
    author    = {Park, Jinyoung and Lee, Sanghyeok and Kim, Sihyeon and Xiong, Yunyang and Kim, Hyunwoo J.},
    title     = {Self-Positioning Point-Based Transformer for Point Cloud Understanding},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21814--21823}
}
DeepLSD: Line Segment Detection and Refinement With Deep Image Gradients: Rémi Pautrat,

Daniel Barath,

Viktor Larsson,

Martin R. Oswald,

Marc Pollefeys; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pautrat_2023_CVPR,
    author    = {Pautrat, R{\'e}mi and Barath, Daniel and Larsson, Viktor and Oswald, Martin R. and Pollefeys, Marc},
    title     = {{DeepLSD}: Line Segment Detection and Refinement With Deep Image Gradients},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17327--17336}
}
Executing Your Commands via Motion Diffusion in Latent Space: Xin Chen,

Biao Jiang,

Wen Liu,

Zilong Huang,

Bin Fu,

Tao Chen,

Gang Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
    author    = {Chen, Xin and Jiang, Biao and Liu, Wen and Huang, Zilong and Fu, Bin and Chen, Tao and Yu, Gang},
    title     = {Executing Your Commands via Motion Diffusion in Latent Space},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18000--18010}
}
Reconstructing Animatable Categories From Videos: Gengshan Yang,

Chaoyang Wang,

N. Dinesh Reddy,

Deva Ramanan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
    author    = {Yang, Gengshan and Wang, Chaoyang and Reddy, N. Dinesh and Ramanan, Deva},
    title     = {Reconstructing Animatable Categories From Videos},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {16995--17005}
}
Co-Salient Object Detection With Uncertainty-Aware Group Exchange-Masking: Yang Wu,

Huihui Song,

Bo Liu,

Kaihua Zhang,

Dong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_CVPR,
    author    = {Wu, Yang and Song, Huihui and Liu, Bo and Zhang, Kaihua and Liu, Dong},
    title     = {Co-Salient Object Detection With Uncertainty-Aware Group Exchange-Masking},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19639--19648}
}
Tangentially Elongated Gaussian Belief Propagation for Event-Based Incremental Optical Flow Estimation: Jun Nagata,

Yusuke Sekikawa; [pdf] [supp]
[bibtex]
@InProceedings{Nagata_2023_CVPR,
    author    = {Nagata, Jun and Sekikawa, Yusuke},
    title     = {Tangentially Elongated {Gaussian} Belief Propagation for Event-Based Incremental Optical Flow Estimation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21940--21949}
}
Adaptive Sparse Pairwise Loss for Object Re-Identification: Xiao Zhou,

Yujie Zhong,

Zhen Cheng,

Fan Liang,

Lin Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
    author    = {Zhou, Xiao and Zhong, Yujie and Cheng, Zhen and Liang, Fan and Ma, Lin},
    title     = {Adaptive Sparse Pairwise Loss for Object Re-Identification},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19691--19701}
}
Semi-Weakly Supervised Object Kinematic Motion Prediction: Gengxin Liu,

Qian Sun,

Haibin Huang,

Chongyang Ma,

Yulan Guo,

Li Yi,

Hui Huang,

Ruizhen Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
    author    = {Liu, Gengxin and Sun, Qian and Huang, Haibin and Ma, Chongyang and Guo, Yulan and Yi, Li and Huang, Hui and Hu, Ruizhen},
    title     = {Semi-Weakly Supervised Object Kinematic Motion Prediction},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21726--21735}
}
Learning a Simple Low-Light Image Enhancer From Paired Low-Light Instances: Zhenqi Fu,

Yan Yang,

Xiaotong Tu,

Yue Huang,

Xinghao Ding,

Kai-Kuang Ma; [pdf]
[bibtex]
@InProceedings{Fu_2023_CVPR,
    author    = {Fu, Zhenqi and Yang, Yan and Tu, Xiaotong and Huang, Yue and Ding, Xinghao and Ma, Kai-Kuang},
    title     = {Learning a Simple Low-Light Image Enhancer From Paired Low-Light Instances},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {22252--22261}
}
PivoTAL: Prior-Driven Supervision for Weakly-Supervised Temporal Action Localization: Mamshad Nayeem Rizve,

Gaurav Mittal,

Ye Yu,

Matthew Hall,

Sandra Sajeev,

Mubarak Shah,

Mei Chen; [pdf] [supp]
[bibtex]
@InProceedings{Rizve_2023_CVPR,
    author    = {Rizve, Mamshad Nayeem and Mittal, Gaurav and Yu, Ye and Hall, Matthew and Sajeev, Sandra and Shah, Mubarak and Chen, Mei},
    title     = {{PivoTAL}: Prior-Driven Supervision for Weakly-Supervised Temporal Action Localization},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {22992--23002}
}
Improving Generalization With Domain Convex Game: Fangrui Lv,

Jian Liang,

Shuang Li,

Jinming Zhang,

Di Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lv_2023_CVPR,
    author    = {Lv, Fangrui and Liang, Jian and Li, Shuang and Zhang, Jinming and Liu, Di},
    title     = {Improving Generalization With Domain Convex Game},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {24315--24324}
}
Fair Scratch Tickets: Finding Fair Sparse Networks Without Weight Training: Pengwei Tang,

Wei Yao,

Zhicong Li,

Yong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Tang_2023_CVPR,
    author    = {Tang, Pengwei and Yao, Wei and Li, Zhicong and Liu, Yong},
    title     = {Fair Scratch Tickets: Finding Fair Sparse Networks Without Weight Training},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {24406--24416}
}
Intrinsic Physical Concepts Discovery With Object-Centric Predictive Models: Qu Tang,

Xiangyu Zhu,

Zhen Lei,

Zhaoxiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR,
    author    = {Tang, Qu and Zhu, Xiangyu and Lei, Zhen and Zhang, Zhaoxiang},
    title     = {Intrinsic Physical Concepts Discovery With Object-Centric Predictive Models},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {23252--23261}
}
Towards Generalisable Video Moment Retrieval: Visual-Dynamic Injection to Image-Text Pre-Training: Dezhao Luo,

Jiabo Huang,

Shaogang Gong,

Hailin Jin,

Yang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_CVPR,
    author    = {Luo, Dezhao and Huang, Jiabo and Gong, Shaogang and Jin, Hailin and Liu, Yang},
    title     = {Towards Generalisable Video Moment Retrieval: Visual-Dynamic Injection to Image-Text Pre-Training},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {23045--23055}
}
Learning Adaptive Dense Event Stereo From the Image Domain: Hoonhee Cho,

Jegyeong Cho,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Cho_2023_CVPR,
    author    = {Cho, Hoonhee and Cho, Jegyeong and Yoon, Kuk-Jin},
    title     = {Learning Adaptive Dense Event Stereo From the Image Domain},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17797--17807}
}
Foundation Model Drives Weakly Incremental Learning for Semantic Segmentation: Chaohui Yu,

Qiang Zhou,

Jingliang Li,

Jianlong Yuan,

Zhibin Wang,

Fan Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
    author    = {Yu, Chaohui and Zhou, Qiang and Li, Jingliang and Yuan, Jianlong and Wang, Zhibin and Wang, Fan},
    title     = {Foundation Model Drives Weakly Incremental Learning for Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {23685--23694}
}
NeRFVS: Neural Radiance Fields for Free View Synthesis via Geometry Scaffolds: Chen Yang,

Peihao Li,

Zanwei Zhou,

Shanxin Yuan,

Bingbing Liu,

Xiaokang Yang,

Weichao Qiu,

Wei Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
    author    = {Yang, Chen and Li, Peihao and Zhou, Zanwei and Yuan, Shanxin and Liu, Bingbing and Yang, Xiaokang and Qiu, Weichao and Shen, Wei},
    title     = {{NeRFVS}: Neural Radiance Fields for Free View Synthesis via Geometry Scaffolds},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {16549--16558}
}
Auto-CARD: Efficient and Robust Codec Avatar Driving for Real-Time Mobile Telepresence: Yonggan Fu,

Yuecheng Li,

Chenghui Li,

Jason Saragih,

Peizhao Zhang,

Xiaoliang Dai,

Yingyan (Celine) Lin; [pdf] [supp]
[bibtex]
@InProceedings{Fu_2023_CVPR,
    author    = {Fu, Yonggan and Li, Yuecheng and Li, Chenghui and Saragih, Jason and Zhang, Peizhao and Dai, Xiaoliang and Lin, Yingyan (Celine)},
    title     = {{Auto-CARD}: Efficient and Robust Codec Avatar Driving for Real-Time Mobile Telepresence},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21036--21045}
}
Conjugate Product Graphs for Globally Optimal 2D-3D Shape Matching: Paul Roetzer,

Zorah Lähner,

Florian Bernard; [pdf] [supp]
[bibtex]
@InProceedings{Roetzer_2023_CVPR,
    author    = {Roetzer, Paul and L{\"a}hner, Zorah and Bernard, Florian},
    title     = {Conjugate Product Graphs for Globally Optimal {2D-3D} Shape Matching},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {21866--21875}
}
Multi-Realism Image Compression With a Conditional Generator: Eirikur Agustsson,

David Minnen,

George Toderici,

Fabian Mentzer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Agustsson_2023_CVPR,
    author    = {Agustsson, Eirikur and Minnen, David and Toderici, George and Mentzer, Fabian},
    title     = {Multi-Realism Image Compression With a Conditional Generator},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {22324--22333}
}
Best of Both Worlds: Multimodal Contrastive Learning With Tabular and Imaging Data: Paul Hager,

Martin J. Menten,

Daniel Rueckert; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hager_2023_CVPR,
    author    = {Hager, Paul and Menten, Martin J. and Rueckert, Daniel},
    title     = {Best of Both Worlds: Multimodal Contrastive Learning With Tabular and Imaging Data},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {23924--23935}
}
Masked Images Are Counterfactual Samples for Robust Fine-Tuning: Yao Xiao,

Ziyi Tang,

Pengxu Wei,

Cong Liu,

Liang Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiao_2023_CVPR,
    author    = {Xiao, Yao and Tang, Ziyi and Wei, Pengxu and Liu, Cong and Lin, Liang},
    title     = {Masked Images Are Counterfactual Samples for Robust Fine-Tuning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20301--20310}
}
StepFormer: Self-Supervised Step Discovery and Localization in Instructional Videos: Nikita Dvornik,

Isma Hadji,

Ran Zhang,

Konstantinos G. Derpanis,

Richard P. Wildes,

Allan D. Jepson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dvornik_2023_CVPR,
    author    = {Dvornik, Nikita and Hadji, Isma and Zhang, Ran and Derpanis, Konstantinos G. and Wildes, Richard P. and Jepson, Allan D.},
    title     = {{StepFormer}: Self-Supervised Step Discovery and Localization in Instructional Videos},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18952--18961}
}
Open Vocabulary Semantic Segmentation With Patch Aligned Contrastive Learning: Jishnu Mukhoti,

Tsung-Yu Lin,

Omid Poursaeed,

Rui Wang,

Ashish Shah,

Philip H.S. Torr,

Ser-Nam Lim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mukhoti_2023_CVPR,
    author    = {Mukhoti, Jishnu and Lin, Tsung-Yu and Poursaeed, Omid and Wang, Rui and Shah, Ashish and Torr, Philip H. S. and Lim, Ser-Nam},
    title     = {Open Vocabulary Semantic Segmentation With Patch Aligned Contrastive Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19413--19423}
}
Camouflaged Instance Segmentation via Explicit De-Camouflaging: Naisong Luo,

Yuwen Pan,

Rui Sun,

Tianzhu Zhang,

Zhiwei Xiong,

Feng Wu; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_CVPR,
    author    = {Luo, Naisong and Pan, Yuwen and Sun, Rui and Zhang, Tianzhu and Xiong, Zhiwei and Wu, Feng},
    title     = {Camouflaged Instance Segmentation via Explicit De-Camouflaging},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17918--17927}
}
Pic2Word: Mapping Pictures to Words for Zero-Shot Composed Image Retrieval: Kuniaki Saito,

Kihyuk Sohn,

Xiang Zhang,

Chun-Liang Li,

Chen-Yu Lee,

Kate Saenko,

Tomas Pfister; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saito_2023_CVPR,
    author    = {Saito, Kuniaki and Sohn, Kihyuk and Zhang, Xiang and Li, Chun-Liang and Lee, Chen-Yu and Saenko, Kate and Pfister, Tomas},
    title     = {{Pic2Word}: Mapping Pictures to Words for Zero-Shot Composed Image Retrieval},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19305--19314}
}
MMANet: Margin-Aware Distillation and Modality-Aware Regularization for Incomplete Multimodal Learning: Shicai Wei,

Chunbo Luo,

Yang Luo; [pdf] [arXiv]
[bibtex]
@InProceedings{Wei_2023_CVPR,
    author    = {Wei, Shicai and Luo, Chunbo and Luo, Yang},
    title     = {{MMANet}: Margin-Aware Distillation and Modality-Aware Regularization for Incomplete Multimodal Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20039--20049}
}
Putting People in Their Place: Affordance-Aware Human Insertion Into Scenes: Sumith Kulal,

Tim Brooks,

Alex Aiken,

Jiajun Wu,

Jimei Yang,

Jingwan Lu,

Alexei A. Efros,

Krishna Kumar Singh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kulal_2023_CVPR,
    author    = {Kulal, Sumith and Brooks, Tim and Aiken, Alex and Wu, Jiajun and Yang, Jimei and Lu, Jingwan and Efros, Alexei A. and Singh, Krishna Kumar},
    title     = {Putting People in Their Place: Affordance-Aware Human Insertion Into Scenes},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {17089--17099}
}
3D Neural Field Generation Using Triplane Diffusion: J. Ryan Shue,

Eric Ryan Chan,

Ryan Po,

Zachary Ankner,

Jiajun Wu,

Gordon Wetzstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shue_2023_CVPR,
    author    = {Shue, J. Ryan and Chan, Eric Ryan and Po, Ryan and Ankner, Zachary and Wu, Jiajun and Wetzstein, Gordon},
    title     = {{3D} Neural Field Generation Using Triplane Diffusion},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {20875--20886}
}
Regularized Vector Quantization for Tokenized Image Synthesis: Jiahui Zhang,

Fangneng Zhan,

Christian Theobalt,

Shijian Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
    author    = {Zhang, Jiahui and Zhan, Fangneng and Theobalt, Christian and Lu, Shijian},
    title     = {Regularized Vector Quantization for Tokenized Image Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18467--18476}
}
Improving Image Recognition by Retrieving From Web-Scale Image-Text Data: Ahmet Iscen,

Alireza Fathi,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Iscen_2023_CVPR,
    author    = {Iscen, Ahmet and Fathi, Alireza and Schmid, Cordelia},
    title     = {Improving Image Recognition by Retrieving From Web-Scale Image-Text Data},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19295--19304}
}
Multi-Level Logit Distillation: Ying Jin,

Jiaqi Wang,

Dahua Lin; [pdf] [supp]
[bibtex]
@InProceedings{Jin_2023_CVPR,
    author    = {Jin, Ying and Wang, Jiaqi and Lin, Dahua},
    title     = {Multi-Level Logit Distillation},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {24276--24285}
}
DA Wand: Distortion-Aware Selection Using Neural Mesh Parameterization: Richard Liu,

Noam Aigerman,

Vladimir G. Kim,

Rana Hanocka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
    author    = {Liu, Richard and Aigerman, Noam and Kim, Vladimir G. and Hanocka, Rana},
    title     = {{DA Wand}: Distortion-Aware Selection Using Neural Mesh Parameterization},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {16739--16749}
}
Hierarchical Semantic Correspondence Networks for Video Paragraph Grounding: Chaolei Tan,

Zihang Lin,

Jian-Fang Hu,

Wei-Shi Zheng,

Jianhuang Lai; [pdf] [supp]
[bibtex]
@InProceedings{Tan_2023_CVPR,
    author    = {Tan, Chaolei and Lin, Zihang and Hu, Jian-Fang and Zheng, Wei-Shi and Lai, Jianhuang},
    title     = {Hierarchical Semantic Correspondence Networks for Video Paragraph Grounding},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18973--18982}
}
Temporal Attention Unit: Towards Efficient Spatiotemporal Predictive Learning: Cheng Tan,

Zhangyang Gao,

Lirong Wu,

Yongjie Xu,

Jun Xia,

Siyuan Li,

Stan Z. Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Tan_2023_CVPR,
    author    = {Tan, Cheng and Gao, Zhangyang and Wu, Lirong and Xu, Yongjie and Xia, Jun and Li, Siyuan and Li, Stan Z.},
    title     = {Temporal Attention Unit: Towards Efficient Spatiotemporal Predictive Learning},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {18770--18782}
}
BiCro: Noisy Correspondence Rectification for Multi-Modality Data via Bi-Directional Cross-Modal Similarity Consistency: Shuo Yang,

Zhaopan Xu,

Kai Wang,

Yang You,

Hongxun Yao,

Tongliang Liu,

Min Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
    author    = {Yang, Shuo and Xu, Zhaopan and Wang, Kai and You, Yang and Yao, Hongxun and Liu, Tongliang and Xu, Min},
    title     = {{BiCro}: Noisy Correspondence Rectification for Multi-Modality Data via Bi-Directional Cross-Modal Similarity Consistency},
    booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    month     = jun,
    year      = {2023},
    pages     = {19883--19892}
}
Transfer Knowledge From Head to Tail: Uncertainty Calibration Under Long-Tailed Distribution: Jiahao Chen,

Bing Su; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Jiahao and Su, Bing},
  title     = {Transfer Knowledge From Head to Tail: Uncertainty Calibration Under Long-Tailed Distribution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19978--19987},
}
Global Vision Transformer Pruning With Hessian-Aware Saliency: Huanrui Yang,

Hongxu Yin,

Maying Shen,

Pavlo Molchanov,

Hai Li,

Jan Kautz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Huanrui and Yin, Hongxu and Shen, Maying and Molchanov, Pavlo and Li, Hai and Kautz, Jan},
  title     = {Global Vision Transformer Pruning With {Hessian}-Aware Saliency},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18547--18557},
}
ScarceNet: Animal Pose Estimation With Scarce Annotations: Chen Li,

Gim Hee Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Chen and Lee, Gim Hee},
  title     = {{ScarceNet}: Animal Pose Estimation With Scarce Annotations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17174--17183},
}
OmniCity: Omnipotent City Understanding With Multi-Level and Multi-View Images: Weijia Li,

Yawen Lai,

Linning Xu,

Yuanbo Xiangli,

Jinhua Yu,

Conghui He,

Gui-Song Xia,

Dahua Lin; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Weijia and Lai, Yawen and Xu, Linning and Xiangli, Yuanbo and Yu, Jinhua and He, Conghui and Xia, Gui-Song and Lin, Dahua},
  title     = {{OmniCity}: Omnipotent City Understanding With Multi-Level and Multi-View Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17397--17407},
}
SViTT: Temporal Learning of Sparse Video-Text Transformers: Yi Li,

Kyle Min,

Subarna Tripathi,

Nuno Vasconcelos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yi and Min, Kyle and Tripathi, Subarna and Vasconcelos, Nuno},
  title     = {{SViTT}: Temporal Learning of Sparse Video-Text Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18919--18929},
}
Deep Fair Clustering via Maximizing and Minimizing Mutual Information: Theory, Algorithm and Metric: Pengxin Zeng,

Yunfan Li,

Peng Hu,

Dezhong Peng,

Jiancheng Lv,

Xi Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zeng_2023_CVPR,
  author    = {Zeng, Pengxin and Li, Yunfan and Hu, Peng and Peng, Dezhong and Lv, Jiancheng and Peng, Xi},
  title     = {Deep Fair Clustering via Maximizing and Minimizing Mutual Information: Theory, Algorithm and Metric},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23986--23995},
}
High Fidelity 3D Hand Shape Reconstruction via Scalable Graph Frequency Decomposition: Tianyu Luan,

Yuanhao Zhai,

Jingjing Meng,

Zhong Li,

Zhang Chen,

Yi Xu,

Junsong Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Luan_2023_CVPR,
  author    = {Luan, Tianyu and Zhai, Yuanhao and Meng, Jingjing and Li, Zhong and Chen, Zhang and Xu, Yi and Yuan, Junsong},
  title     = {High Fidelity {3D} Hand Shape Reconstruction via Scalable Graph Frequency Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16795--16804},
}
COT: Unsupervised Domain Adaptation With Clustering and Optimal Transport: Yang Liu,

Zhipeng Zhou,

Baigui Sun; [pdf]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Yang and Zhou, Zhipeng and Sun, Baigui},
  title     = {{COT}: Unsupervised Domain Adaptation With Clustering and Optimal Transport},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19998--20007},
}
Learning To Exploit the Sequence-Specific Prior Knowledge for Image Processing Pipelines Optimization: Haina Qin,

Longfei Han,

Weihua Xiong,

Juan Wang,

Wentao Ma,

Bing Li,

Weiming Hu; [pdf] [supp]
[bibtex]
@InProceedings{Qin_2023_CVPR,
  author    = {Qin, Haina and Han, Longfei and Xiong, Weihua and Wang, Juan and Ma, Wentao and Li, Bing and Hu, Weiming},
  title     = {Learning To Exploit the Sequence-Specific Prior Knowledge for Image Processing Pipelines Optimization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22314--22323},
}
Lite-Mono: A Lightweight CNN and Transformer Architecture for Self-Supervised Monocular Depth Estimation: Ning Zhang,

Francesco Nex,

George Vosselman,

Norman Kerle; [pdf]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Ning and Nex, Francesco and Vosselman, George and Kerle, Norman},
  title     = {{Lite-Mono}: A Lightweight {CNN} and Transformer Architecture for Self-Supervised Monocular Depth Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18537--18546},
}
Neural Scene Chronology: Haotong Lin,

Qianqian Wang,

Ruojin Cai,

Sida Peng,

Hadar Averbuch-Elor,

Xiaowei Zhou,

Noah Snavely; [pdf]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Haotong and Wang, Qianqian and Cai, Ruojin and Peng, Sida and Averbuch-Elor, Hadar and Zhou, Xiaowei and Snavely, Noah},
  title     = {Neural Scene Chronology},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20752--20761},
}
TIPI: Test Time Adaptation With Transformation Invariance: A. Tuan Nguyen,

Thanh Nguyen-Tang,

Ser-Nam Lim,

Philip H.S. Torr; [pdf] [supp]
[bibtex]
@InProceedings{Nguyen_2023_CVPR,
  author    = {Nguyen, A. Tuan and Nguyen-Tang, Thanh and Lim, Ser-Nam and Torr, Philip H. S.},
  title     = {{TIPI}: Test Time Adaptation With Transformation Invariance},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24162--24171},
}
OTAvatar: One-Shot Talking Face Avatar With Controllable Tri-Plane Rendering: Zhiyuan Ma,

Xiangyu Zhu,

Guo-Jun Qi,

Zhen Lei,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Zhiyuan and Zhu, Xiangyu and Qi, Guo-Jun and Lei, Zhen and Zhang, Lei},
  title     = {{OTAvatar}: One-Shot Talking Face Avatar With Controllable Tri-Plane Rendering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16901--16910},
}
Large-Capacity and Flexible Video Steganography via Invertible Neural Network: Chong Mou,

Youmin Xu,

Jiechong Song,

Chen Zhao,

Bernard Ghanem,

Jian Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Mou_2023_CVPR,
  author    = {Mou, Chong and Xu, Youmin and Song, Jiechong and Zhao, Chen and Ghanem, Bernard and Zhang, Jian},
  title     = {Large-Capacity and Flexible Video Steganography via Invertible Neural Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22606--22615},
}
EVAL: Explainable Video Anomaly Localization: Ashish Singh,

Michael J. Jones,

Erik G. Learned-Miller; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Singh_2023_CVPR,
  author    = {Singh, Ashish and Jones, Michael J. and Learned-Miller, Erik G.},
  title     = {{EVAL}: Explainable Video Anomaly Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18717--18726},
}
Position-Guided Text Prompt for Vision-Language Pre-Training: Jinpeng Wang,

Pan Zhou,

Mike Zheng Shou,

Shuicheng Yan; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Jinpeng and Zhou, Pan and Shou, Mike Zheng and Yan, Shuicheng},
  title     = {Position-Guided Text Prompt for Vision-Language Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23242--23251},
}
HOLODIFFUSION: Training a 3D Diffusion Model Using 2D Images: Animesh Karnewar,

Andrea Vedaldi,

David Novotny,

Niloy J. Mitra; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Karnewar_2023_CVPR,
  author    = {Karnewar, Animesh and Vedaldi, Andrea and Novotny, David and Mitra, Niloy J.},
  title     = {{HOLODIFFUSION}: Training a {3D} Diffusion Model Using {2D} Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18423--18433},
}
Stimulus Verification Is a Universal and Effective Sampler in Multi-Modal Human Trajectory Prediction: Jianhua Sun,

Yuxuan Li,

Liang Chai,

Cewu Lu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Jianhua and Li, Yuxuan and Chai, Liang and Lu, Cewu},
  title     = {Stimulus Verification Is a Universal and Effective Sampler in Multi-Modal Human Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22014--22023},
}
LoGoNet: Towards Accurate 3D Object Detection With Local-to-Global Cross-Modal Fusion: Xin Li,

Tao Ma,

Yuenan Hou,

Botian Shi,

Yuchen Yang,

Youquan Liu,

Xingjiao Wu,

Qin Chen,

Yikang Li,

Yu Qiao,

Liang He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Xin and Ma, Tao and Hou, Yuenan and Shi, Botian and Yang, Yuchen and Liu, Youquan and Wu, Xingjiao and Chen, Qin and Li, Yikang and Qiao, Yu and He, Liang},
  title     = {{LoGoNet}: Towards Accurate {3D} Object Detection With Local-to-Global Cross-Modal Fusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17524--17534},
}
ScaleKD: Distilling Scale-Aware Knowledge in Small Object Detector: Yichen Zhu,

Qiqi Zhou,

Ning Liu,

Zhiyuan Xu,

Zhicai Ou,

Xiaofeng Mou,

Jian Tang; [pdf]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Yichen and Zhou, Qiqi and Liu, Ning and Xu, Zhiyuan and Ou, Zhicai and Mou, Xiaofeng and Tang, Jian},
  title     = {{ScaleKD}: Distilling Scale-Aware Knowledge in Small Object Detector},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19723--19733},
}
An Empirical Study of End-to-End Video-Language Transformers With Masked Visual Modeling: Tsu-Jui Fu,

Linjie Li,

Zhe Gan,

Kevin Lin,

William Yang Wang,

Lijuan Wang,

Zicheng Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_CVPR,
  author    = {Fu, Tsu-Jui and Li, Linjie and Gan, Zhe and Lin, Kevin and Wang, William Yang and Wang, Lijuan and Liu, Zicheng},
  title     = {An Empirical Study of End-to-End Video-Language Transformers With Masked Visual Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22898--22909},
}
MethaneMapper: Spectral Absorption Aware Hyperspectral Transformer for Methane Detection: Satish Kumar,

Ivan Arevalo,

ASM Iftekhar,

B S Manjunath; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kumar_2023_CVPR,
  author    = {Kumar, Satish and Arevalo, Ivan and Iftekhar, ASM and Manjunath, B S},
  title     = {{MethaneMapper}: Spectral Absorption Aware Hyperspectral Transformer for Methane Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17609--17618},
}
Autonomous Manipulation Learning for Similar Deformable Objects via Only One Demonstration: Yu Ren,

Ronghan Chen,

Yang Cong; [pdf]
[bibtex]
@InProceedings{Ren_2023_CVPR,
  author    = {Ren, Yu and Chen, Ronghan and Cong, Yang},
  title     = {Autonomous Manipulation Learning for Similar Deformable Objects via Only One Demonstration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17069--17078},
}
Representation Learning for Visual Object Tracking by Masked Appearance Transfer: Haojie Zhao,

Dong Wang,

Huchuan Lu; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Haojie and Wang, Dong and Lu, Huchuan},
  title     = {Representation Learning for Visual Object Tracking by Masked Appearance Transfer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18696--18705},
}
Learning To Name Classes for Vision and Language Models: Sarah Parisot,

Yongxin Yang,

Steven McDonagh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Parisot_2023_CVPR,
  author    = {Parisot, Sarah and Yang, Yongxin and McDonagh, Steven},
  title     = {Learning To Name Classes for Vision and Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23477--23486},
}
Nighttime Smartphone Reflective Flare Removal Using Optical Center Symmetry Prior: Yuekun Dai,

Yihang Luo,

Shangchen Zhou,

Chongyi Li,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dai_2023_CVPR,
  author    = {Dai, Yuekun and Luo, Yihang and Zhou, Shangchen and Li, Chongyi and Loy, Chen Change},
  title     = {Nighttime Smartphone Reflective Flare Removal Using Optical Center Symmetry Prior},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20783--20791},
}
Balanced Spherical Grid for Egocentric View Synthesis: Changwoon Choi,

Sang Min Kim,

Young Min Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Choi_2023_CVPR,
  author    = {Choi, Changwoon and Kim, Sang Min and Kim, Young Min},
  title     = {Balanced Spherical Grid for Egocentric View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16590--16599},
}
Box-Level Active Detection: Mengyao Lyu,

Jundong Zhou,

Hui Chen,

Yijie Huang,

Dongdong Yu,

Yaqian Li,

Yandong Guo,

Yuchen Guo,

Liuyu Xiang,

Guiguang Ding; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lyu_2023_CVPR,
  author    = {Lyu, Mengyao and Zhou, Jundong and Chen, Hui and Huang, Yijie and Yu, Dongdong and Li, Yaqian and Guo, Yandong and Guo, Yuchen and Xiang, Liuyu and Ding, Guiguang},
  title     = {Box-Level Active Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23766--23775},
}
Self-Supervised Non-Uniform Kernel Estimation With Flow-Based Motion Prior for Blind Image Deblurring: Zhenxuan Fang,

Fangfang Wu,

Weisheng Dong,

Xin Li,

Jinjian Wu,

Guangming Shi; [pdf] [supp]
[bibtex]
@InProceedings{Fang_2023_CVPR,
  author    = {Fang, Zhenxuan and Wu, Fangfang and Dong, Weisheng and Li, Xin and Wu, Jinjian and Shi, Guangming},
  title     = {Self-Supervised Non-Uniform Kernel Estimation With Flow-Based Motion Prior for Blind Image Deblurring},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18105--18114},
}
Collecting Cross-Modal Presence-Absence Evidence for Weakly-Supervised Audio-Visual Event Perception: Junyu Gao,

Mengyuan Chen,

Changsheng Xu; [pdf]
[bibtex]
@InProceedings{Gao_2023_CVPR,
  author    = {Gao, Junyu and Chen, Mengyuan and Xu, Changsheng},
  title     = {Collecting Cross-Modal Presence-Absence Evidence for Weakly-Supervised Audio-Visual Event Perception},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18827--18836},
}
AVFace: Towards Detailed Audio-Visual 4D Face Reconstruction: Aggelina Chatziagapi,

Dimitris Samaras; [pdf] [arXiv]
[bibtex]
@InProceedings{Chatziagapi_2023_CVPR,
  author    = {Chatziagapi, Aggelina and Samaras, Dimitris},
  title     = {{AVFace}: Towards Detailed Audio-Visual {4D} Face Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16878--16889},
}
ERM-KTP: Knowledge-Level Machine Unlearning via Knowledge Transfer: Shen Lin,

Xiaoyu Zhang,

Chenyang Chen,

Xiaofeng Chen,

Willy Susilo; [pdf]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Shen and Zhang, Xiaoyu and Chen, Chenyang and Chen, Xiaofeng and Susilo, Willy},
  title     = {{ERM-KTP}: Knowledge-Level Machine Unlearning via Knowledge Transfer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20147--20155},
}
DATE: Domain Adaptive Product Seeker for E-Commerce: Haoyuan Li,

Hao Jiang,

Tao Jin,

Mengyan Li,

Yan Chen,

Zhijie Lin,

Yang Zhao,

Zhou Zhao; [pdf]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Haoyuan and Jiang, Hao and Jin, Tao and Li, Mengyan and Chen, Yan and Lin, Zhijie and Zhao, Yang and Zhao, Zhou},
  title     = {{DATE}: Domain Adaptive Product Seeker for E-Commerce},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19315--19324},
}
Self-Supervised Super-Plane for Neural 3D Reconstruction: Botao Ye,

Sifei Liu,

Xueting Li,

Ming-Hsuan Yang; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_CVPR,
  author    = {Ye, Botao and Liu, Sifei and Li, Xueting and Yang, Ming-Hsuan},
  title     = {Self-Supervised Super-Plane for Neural {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21415--21424},
}
DisCo-CLIP: A Distributed Contrastive Loss for Memory Efficient CLIP Training: Yihao Chen,

Xianbiao Qi,

Jianan Wang,

Lei Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yihao and Qi, Xianbiao and Wang, Jianan and Zhang, Lei},
  title     = {{DisCo-CLIP}: A Distributed Contrastive Loss for Memory Efficient {CLIP} Training},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22648--22657},
}
GM-NeRF: Learning Generalizable Model-Based Neural Radiance Fields From Multi-View Images: Jianchuan Chen,

Wentao Yi,

Liqian Ma,

Xu Jia,

Huchuan Lu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Jianchuan and Yi, Wentao and Ma, Liqian and Jia, Xu and Lu, Huchuan},
  title     = {{GM-NeRF}: Learning Generalizable Model-Based Neural Radiance Fields From Multi-View Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20648--20658},
}
Perspective Fields for Single Image Camera Calibration: Linyi Jin,

Jianming Zhang,

Yannick Hold-Geoffroy,

Oliver Wang,

Kevin Blackburn-Matzen,

Matthew Sticha,

David F. Fouhey; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Linyi and Zhang, Jianming and Hold-Geoffroy, Yannick and Wang, Oliver and Blackburn-Matzen, Kevin and Sticha, Matthew and Fouhey, David F.},
  title     = {Perspective Fields for Single Image Camera Calibration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17307--17316},
}
Towards Accurate Image Coding: Improved Autoregressive Image Generation With Dynamic Vector Quantization: Mengqi Huang,

Zhendong Mao,

Zhuowei Chen,

Yongdong Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Mengqi and Mao, Zhendong and Chen, Zhuowei and Zhang, Yongdong},
  title     = {Towards Accurate Image Coding: Improved Autoregressive Image Generation With Dynamic Vector Quantization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22596--22605},
}
WINNER: Weakly-Supervised hIerarchical decompositioN and aligNment for Spatio-tEmporal Video gRounding: Mengze Li,

Han Wang,

Wenqiao Zhang,

Jiaxu Miao,

Zhou Zhao,

Shengyu Zhang,

Wei Ji,

Fei Wu; [pdf]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Mengze and Wang, Han and Zhang, Wenqiao and Miao, Jiaxu and Zhao, Zhou and Zhang, Shengyu and Ji, Wei and Wu, Fei},
  title     = {{WINNER}: Weakly-Supervised {hIerarchical} {decompositioN} and {aligNment} for {Spatio-tEmporal} Video {gRounding}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23090--23099},
}
Preserving Linear Separability in Continual Learning by Backward Feature Projection: Qiao Gu,

Dongsub Shim,

Florian Shkurti; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gu_2023_CVPR,
  author    = {Gu, Qiao and Shim, Dongsub and Shkurti, Florian},
  title     = {Preserving Linear Separability in Continual Learning by Backward Feature Projection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24286--24295},
}
MHPL: Minimum Happy Points Learning for Active Source Free Domain Adaptation: Fan Wang,

Zhongyi Han,

Zhiyan Zhang,

Rundong He,

Yilong Yin; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Fan and Han, Zhongyi and Zhang, Zhiyan and He, Rundong and Yin, Yilong},
  title     = {{MHPL}: Minimum Happy Points Learning for Active Source Free Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20008--20018},
}
Metadata-Based RAW Reconstruction via Implicit Neural Functions: Leyi Li,

Huijie Qiao,

Qi Ye,

Qinmin Yang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Leyi and Qiao, Huijie and Ye, Qi and Yang, Qinmin},
  title     = {Metadata-Based {RAW} Reconstruction via Implicit Neural Functions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18196--18205},
}
Multimodality Helps Unimodality: Cross-Modal Few-Shot Learning With Multimodal Models: Zhiqiu Lin,

Samuel Yu,

Zhiyi Kuang,

Deepak Pathak,

Deva Ramanan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Zhiqiu and Yu, Samuel and Kuang, Zhiyi and Pathak, Deepak and Ramanan, Deva},
  title     = {Multimodality Helps Unimodality: Cross-Modal Few-Shot Learning With Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19325--19337},
}
3D Highlighter: Localizing Regions on 3D Shapes via Text Descriptions: Dale Decatur,

Itai Lang,

Rana Hanocka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Decatur_2023_CVPR,
  author    = {Decatur, Dale and Lang, Itai and Hanocka, Rana},
  title     = {{3D Highlighter}: Localizing Regions on {3D} Shapes via Text Descriptions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20930--20939},
}
Iterative Geometry Encoding Volume for Stereo Matching: Gangwei Xu,

Xianqi Wang,

Xiaohuan Ding,

Xin Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Gangwei and Wang, Xianqi and Ding, Xiaohuan and Yang, Xin},
  title     = {Iterative Geometry Encoding Volume for Stereo Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21919--21928},
}
GRES: Generalized Referring Expression Segmentation: Chang Liu,

Henghui Ding,

Xudong Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Chang and Ding, Henghui and Jiang, Xudong},
  title     = {{GRES}: Generalized Referring Expression Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23592--23601},
}
Open-Set Fine-Grained Retrieval via Prompting Vision-Language Evaluator: Shijie Wang,

Jianlong Chang,

Haojie Li,

Zhihui Wang,

Wanli Ouyang,

Qi Tian; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Shijie and Chang, Jianlong and Li, Haojie and Wang, Zhihui and Ouyang, Wanli and Tian, Qi},
  title     = {Open-Set Fine-Grained Retrieval via Prompting Vision-Language Evaluator},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19381--19391},
}
Sibling-Attack: Rethinking Transferable Adversarial Attacks Against Face Recognition: Zexin Li,

Bangjie Yin,

Taiping Yao,

Junfeng Guo,

Shouhong Ding,

Simin Chen,

Cong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Zexin and Yin, Bangjie and Yao, Taiping and Guo, Junfeng and Ding, Shouhong and Chen, Simin and Liu, Cong},
  title     = {{Sibling-Attack}: Rethinking Transferable Adversarial Attacks Against Face Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24626--24637},
}
PIRLNav: Pretraining With Imitation and RL Finetuning for ObjectNav: Ram Ramrakhya,

Dhruv Batra,

Erik Wijmans,

Abhishek Das; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ramrakhya_2023_CVPR,
  author    = {Ramrakhya, Ram and Batra, Dhruv and Wijmans, Erik and Das, Abhishek},
  title     = {{PIRLNav}: Pretraining With Imitation and {RL} Finetuning for {ObjectNav}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17896--17906},
}
StyleGene: Crossover and Mutation of Region-Level Facial Genes for Kinship Face Synthesis: Hao Li,

Xianxu Hou,

Zepeng Huang,

Linlin Shen; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Hao and Hou, Xianxu and Huang, Zepeng and Shen, Linlin},
  title     = {{StyleGene}: Crossover and Mutation of Region-Level Facial Genes for Kinship Face Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20960--20969},
}
Clothed Human Performance Capture With a Double-Layer Neural Radiance Fields: Kangkan Wang,

Guofeng Zhang,

Suxu Cong,

Jian Yang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Kangkan and Zhang, Guofeng and Cong, Suxu and Yang, Jian},
  title     = {Clothed Human Performance Capture With a Double-Layer Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21098--21107},
}
NeuFace: Realistic 3D Neural Face Rendering From Multi-View Images: Mingwu Zheng,

Haiyu Zhang,

Hongyu Yang,

Di Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Mingwu and Zhang, Haiyu and Yang, Hongyu and Huang, Di},
  title     = {{NeuFace}: Realistic {3D} Neural Face Rendering From Multi-View Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16868--16877},
}
Rethinking Domain Generalization for Face Anti-Spoofing: Separability and Alignment: Yiyou Sun,

Yaojie Liu,

Xiaoming Liu,

Yixuan Li,

Wen-Sheng Chu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Yiyou and Liu, Yaojie and Liu, Xiaoming and Li, Yixuan and Chu, Wen-Sheng},
  title     = {Rethinking Domain Generalization for Face Anti-Spoofing: Separability and Alignment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24563--24574},
}
SMOC-Net: Leveraging Camera Pose for Self-Supervised Monocular Object Pose Estimation: Tao Tan,

Qiulei Dong; [pdf]
[bibtex]
@InProceedings{Tan_2023_CVPR,
  author    = {Tan, Tao and Dong, Qiulei},
  title     = {{SMOC-Net}: Leveraging Camera Pose for Self-Supervised Monocular Object Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21307--21316},
}
Learning Human Mesh Recovery in 3D Scenes: Zehong Shen,

Zhi Cen,

Sida Peng,

Qing Shuai,

Hujun Bao,

Xiaowei Zhou; [pdf]
[bibtex]
@InProceedings{Shen_2023_CVPR,
  author    = {Shen, Zehong and Cen, Zhi and Peng, Sida and Shuai, Qing and Bao, Hujun and Zhou, Xiaowei},
  title     = {Learning Human Mesh Recovery in {3D} Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17038--17047},
}
Learning Locally Editable Virtual Humans: Hsuan-I Ho,

Lixin Xue,

Jie Song,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ho_2023_CVPR,
  author    = {Ho, Hsuan-I and Xue, Lixin and Song, Jie and Hilliges, Otmar},
  title     = {Learning Locally Editable Virtual Humans},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21024--21035},
}
PillarNeXt: Rethinking Network Designs for 3D Object Detection in LiDAR Point Clouds: Jinyu Li,

Chenxu Luo,

Xiaodong Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jinyu and Luo, Chenxu and Yang, Xiaodong},
  title     = {{PillarNeXt}: Rethinking Network Designs for {3D} Object Detection in {LiDAR} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17567--17576},
}
LINe: Out-of-Distribution Detection by Leveraging Important Neurons: Yong Hyun Ahn,

Gyeong-Moon Park,

Seong Tae Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ahn_2023_CVPR,
  author    = {Ahn, Yong Hyun and Park, Gyeong-Moon and Kim, Seong Tae},
  title     = {{LINe}: Out-of-Distribution Detection by Leveraging Important Neurons},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19852--19862},
}
Transforming Radiance Field With Lipschitz Network for Photorealistic 3D Scene Stylization: Zicheng Zhang,

Yinglu Liu,

Congying Han,

Yingwei Pan,

Tiande Guo,

Ting Yao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zicheng and Liu, Yinglu and Han, Congying and Pan, Yingwei and Guo, Tiande and Yao, Ting},
  title     = {Transforming Radiance Field With {Lipschitz} Network for Photorealistic {3D} Scene Stylization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20712--20721},
}
Guided Depth Super-Resolution by Deep Anisotropic Diffusion: Nando Metzger,

Rodrigo Caye Daudt,

Konrad Schindler; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Metzger_2023_CVPR,
  author    = {Metzger, Nando and Daudt, Rodrigo Caye and Schindler, Konrad},
  title     = {Guided Depth Super-Resolution by Deep Anisotropic Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18237--18246},
}
Fresnel Microfacet BRDF: Unification of Polari-Radiometric Surface-Body Reflection: Tomoki Ichikawa,

Yoshiki Fukao,

Shohei Nobuhara,

Ko Nishino; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ichikawa_2023_CVPR,
  author    = {Ichikawa, Tomoki and Fukao, Yoshiki and Nobuhara, Shohei and Nishino, Ko},
  title     = {{Fresnel} Microfacet {BRDF}: Unification of Polari-Radiometric Surface-Body Reflection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16489--16497}
}
Simulated Annealing in Early Layers Leads to Better Generalization: Amir M. Sarfi,

Zahra Karimpour,

Muawiz Chaudhary,

Nasir M. Khalid,

Mirco Ravanelli,

Sudhir Mudur,

Eugene Belilovsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sarfi_2023_CVPR,
  author    = {Sarfi, Amir M. and Karimpour, Zahra and Chaudhary, Muawiz and Khalid, Nasir M. and Ravanelli, Mirco and Mudur, Sudhir and Belilovsky, Eugene},
  title     = {Simulated Annealing in Early Layers Leads to Better Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20205--20214}
}
Exploring Data Geometry for Continual Learning: Zhi Gao,

Chen Xu,

Feng Li,

Yunde Jia,

Mehrtash Harandi,

Yuwei Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_CVPR,
  author    = {Gao, Zhi and Xu, Chen and Li, Feng and Jia, Yunde and Harandi, Mehrtash and Wu, Yuwei},
  title     = {Exploring Data Geometry for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24325--24334}
}
Learning Neural Parametric Head Models: Simon Giebenhain,

Tobias Kirschstein,

Markos Georgopoulos,

Martin Rünz,

Lourdes Agapito,

Matthias Nießner; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Giebenhain_2023_CVPR,
  author    = {Giebenhain, Simon and Kirschstein, Tobias and Georgopoulos, Markos and R{\"u}nz, Martin and Agapito, Lourdes and Nie{\ss}ner, Matthias},
  title     = {Learning Neural Parametric Head Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21003--21012}
}
Removing Objects From Neural Radiance Fields: Silvan Weder,

Guillermo Garcia-Hernando,

Áron Monszpart,

Marc Pollefeys,

Gabriel J. Brostow,

Michael Firman,

Sara Vicente; [pdf] [arXiv]
[bibtex]
@InProceedings{Weder_2023_CVPR,
  author    = {Weder, Silvan and Garcia-Hernando, Guillermo and Monszpart, {\'A}ron and Pollefeys, Marc and Brostow, Gabriel J. and Firman, Michael and Vicente, Sara},
  title     = {Removing Objects From Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16528--16538}
}
Structural Multiplane Image: Bridging Neural View Synthesis and 3D Reconstruction: Mingfang Zhang,

Jinglu Wang,

Xiao Li,

Yifei Huang,

Yoichi Sato,

Yan Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Mingfang and Wang, Jinglu and Li, Xiao and Huang, Yifei and Sato, Yoichi and Lu, Yan},
  title     = {Structural Multiplane Image: Bridging Neural View Synthesis and {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16707--16716}
}
Harmonious Teacher for Cross-Domain Object Detection: Jinhong Deng,

Dongli Xu,

Wen Li,

Lixin Duan; [pdf] [supp]
[bibtex]
@InProceedings{Deng_2023_CVPR,
  author    = {Deng, Jinhong and Xu, Dongli and Li, Wen and Duan, Lixin},
  title     = {Harmonious Teacher for Cross-Domain Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23829--23838}
}
Learning To Predict Scene-Level Implicit 3D From Posed RGBD Data: Nilesh Kulkarni,

Linyi Jin,

Justin Johnson,

David F. Fouhey; [pdf] [supp]
[bibtex]
@InProceedings{Kulkarni_2023_CVPR,
  author    = {Kulkarni, Nilesh and Jin, Linyi and Johnson, Justin and Fouhey, David F.},
  title     = {Learning To Predict Scene-Level Implicit {3D} From Posed {RGBD} Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17256--17265}
}
Physical-World Optical Adversarial Attacks on 3D Face Recognition: Yanjie Li,

Yiquan Li,

Xuelong Dai,

Songtao Guo,

Bin Xiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yanjie and Li, Yiquan and Dai, Xuelong and Guo, Songtao and Xiao, Bin},
  title     = {Physical-World Optical Adversarial Attacks on {3D} Face Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24699--24708}
}
Raw Image Reconstruction With Learned Compact Metadata: Yufei Wang,

Yi Yu,

Wenhan Yang,

Lanqing Guo,

Lap-Pui Chau,

Alex C. Kot,

Bihan Wen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yufei and Yu, Yi and Yang, Wenhan and Guo, Lanqing and Chau, Lap-Pui and Kot, Alex C. and Wen, Bihan},
  title     = {Raw Image Reconstruction With Learned Compact Metadata},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18206--18215}
}
Semi-Supervised Video Inpainting With Cycle Consistency Constraints: Zhiliang Wu,

Hanyu Xuan,

Changchang Sun,

Weili Guan,

Kang Zhang,

Yan Yan; [pdf] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Zhiliang and Xuan, Hanyu and Sun, Changchang and Guan, Weili and Zhang, Kang and Yan, Yan},
  title     = {Semi-Supervised Video Inpainting With Cycle Consistency Constraints},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22586--22595}
}
Level-S$^2$fM: Structure From Motion on Neural Level Set of Implicit Surfaces: Yuxi Xiao,

Nan Xue,

Tianfu Wu,

Gui-Song Xia; [pdf] [supp]
[bibtex]
@InProceedings{Xiao_2023_CVPR,
  author    = {Xiao, Yuxi and Xue, Nan and Wu, Tianfu and Xia, Gui-Song},
  title     = {{Level-S$^2$fM}: Structure From Motion on Neural Level Set of Implicit Surfaces},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17205--17214}
}
Neuron Structure Modeling for Generalizable Remote Physiological Measurement: Hao Lu,

Zitong Yu,

Xuesong Niu,

Ying-Cong Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Hao and Yu, Zitong and Niu, Xuesong and Chen, Ying-Cong},
  title     = {Neuron Structure Modeling for Generalizable Remote Physiological Measurement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18589--18599}
}
Out-of-Candidate Rectification for Weakly Supervised Semantic Segmentation: Zesen Cheng,

Pengchong Qiao,

Kehan Li,

Siheng Li,

Pengxu Wei,

Xiangyang Ji,

Li Yuan,

Chang Liu,

Jie Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_CVPR,
  author    = {Cheng, Zesen and Qiao, Pengchong and Li, Kehan and Li, Siheng and Wei, Pengxu and Ji, Xiangyang and Yuan, Li and Liu, Chang and Chen, Jie},
  title     = {Out-of-Candidate Rectification for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23673--23684}
}
MonoATT: Online Monocular 3D Object Detection With Adaptive Token Transformer: Yunsong Zhou,

Hongzi Zhu,

Quan Liu,

Shan Chang,

Minyi Guo; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Yunsong and Zhu, Hongzi and Liu, Quan and Chang, Shan and Guo, Minyi},
  title     = {{MonoATT}: Online Monocular {3D} Object Detection With Adaptive Token Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17493--17503}
}
Image Quality-Aware Diagnosis via Meta-Knowledge Co-Embedding: Haoxuan Che,

Siyu Chen,

Hao Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Che_2023_CVPR,
  author    = {Che, Haoxuan and Chen, Siyu and Chen, Hao},
  title     = {Image Quality-Aware Diagnosis via Meta-Knowledge Co-Embedding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19819--19829}
}
Learning 3D Representations From 2D Pre-Trained Models via Image-to-Point Masked Autoencoders: Renrui Zhang,

Liuhui Wang,

Yu Qiao,

Peng Gao,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Renrui and Wang, Liuhui and Qiao, Yu and Gao, Peng and Li, Hongsheng},
  title     = {Learning {3D} Representations From {2D} Pre-Trained Models via Image-to-Point Masked Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21769--21780}
}
BEVFormer v2: Adapting Modern Image Backbones to Bird's-Eye-View Recognition via Perspective Supervision: Chenyu Yang,

Yuntao Chen,

Hao Tian,

Chenxin Tao,

Xizhou Zhu,

Zhaoxiang Zhang,

Gao Huang,

Hongyang Li,

Yu Qiao,

Lewei Lu,

Jie Zhou,

Jifeng Dai; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Chenyu and Chen, Yuntao and Tian, Hao and Tao, Chenxin and Zhu, Xizhou and Zhang, Zhaoxiang and Huang, Gao and Li, Hongyang and Qiao, Yu and Lu, Lewei and Zhou, Jie and Dai, Jifeng},
  title     = {{BEVFormer} v2: Adapting Modern Image Backbones to Bird's-Eye-View Recognition via Perspective Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17830--17839}
}
Object Discovery From Motion-Guided Tokens: Zhipeng Bao,

Pavel Tokmakov,

Yu-Xiong Wang,

Adrien Gaidon,

Martial Hebert; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2023_CVPR,
  author    = {Bao, Zhipeng and Tokmakov, Pavel and Wang, Yu-Xiong and Gaidon, Adrien and Hebert, Martial},
  title     = {Object Discovery From Motion-Guided Tokens},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22972--22981}
}
Event-Based Video Frame Interpolation With Cross-Modal Asymmetric Bidirectional Motion Fields: Taewoo Kim,

Yujeong Chae,

Hyun-Kurl Jang,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Taewoo and Chae, Yujeong and Jang, Hyun-Kurl and Yoon, Kuk-Jin},
  title     = {Event-Based Video Frame Interpolation With Cross-Modal Asymmetric Bidirectional Motion Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18032--18042}
}
VolRecon: Volume Rendering of Signed Ray Distance Functions for Generalizable Multi-View Reconstruction: Yufan Ren,

Fangjinhua Wang,

Tong Zhang,

Marc Pollefeys,

Sabine Süsstrunk; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_CVPR,
  author    = {Ren, Yufan and Wang, Fangjinhua and Zhang, Tong and Pollefeys, Marc and S{\"u}sstrunk, Sabine},
  title     = {{VolRecon}: Volume Rendering of Signed Ray Distance Functions for Generalizable Multi-View Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16685--16695}
}
DA-DETR: Domain Adaptive Detection Transformer With Information Fusion: Jingyi Zhang,

Jiaxing Huang,

Zhipeng Luo,

Gongjie Zhang,

Xiaoqin Zhang,

Shijian Lu; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Jingyi and Huang, Jiaxing and Luo, Zhipeng and Zhang, Gongjie and Zhang, Xiaoqin and Lu, Shijian},
  title     = {{DA-DETR}: Domain Adaptive Detection Transformer With Information Fusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23787--23798}
}
Vision Transformers Are Good Mask Auto-Labelers: Shiyi Lan,

Xitong Yang,

Zhiding Yu,

Zuxuan Wu,

Jose M. Alvarez,

Anima Anandkumar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lan_2023_CVPR,
  author    = {Lan, Shiyi and Yang, Xitong and Yu, Zhiding and Wu, Zuxuan and Alvarez, Jose M. and Anandkumar, Anima},
  title     = {Vision Transformers Are Good Mask Auto-Labelers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23745--23755}
}
Neural Transformation Fields for Arbitrary-Styled Font Generation: Bin Fu,

Junjun He,

Jianjun Wang,

Yu Qiao; [pdf] [supp]
[bibtex]
@InProceedings{Fu_2023_CVPR,
  author    = {Fu, Bin and He, Junjun and Wang, Jianjun and Qiao, Yu},
  title     = {Neural Transformation Fields for Arbitrary-Styled Font Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22438--22447}
}
EDICT: Exact Diffusion Inversion via Coupled Transformations: Bram Wallace,

Akash Gokul,

Nikhil Naik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wallace_2023_CVPR,
  author    = {Wallace, Bram and Gokul, Akash and Naik, Nikhil},
  title     = {{EDICT}: Exact Diffusion Inversion via Coupled Transformations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22532--22541}
}
AeDet: Azimuth-Invariant Multi-View 3D Object Detection: Chengjian Feng,

Zequn Jie,

Yujie Zhong,

Xiangxiang Chu,

Lin Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_CVPR,
  author    = {Feng, Chengjian and Jie, Zequn and Zhong, Yujie and Chu, Xiangxiang and Ma, Lin},
  title     = {{AeDet}: Azimuth-Invariant Multi-View {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21580--21588}
}
OCELOT: Overlapped Cell on Tissue Dataset for Histopathology: Jeongun Ryu,

Aaron Valero Puche,

JaeWoong Shin,

Seonwook Park,

Biagio Brattoli,

Jinhee Lee,

Wonkyung Jung,

Soo Ick Cho,

Kyunghyun Paeng,

Chan-Young Ock,

Donggeun Yoo,

Sérgio Pereira; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ryu_2023_CVPR,
  author    = {Ryu, Jeongun and Puche, Aaron Valero and Shin, JaeWoong and Park, Seonwook and Brattoli, Biagio and Lee, Jinhee and Jung, Wonkyung and Cho, Soo Ick and Paeng, Kyunghyun and Ock, Chan-Young and Yoo, Donggeun and Pereira, S{\'e}rgio},
  title     = {{OCELOT}: Overlapped Cell on Tissue Dataset for Histopathology},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23902--23912}
}
Unsupervised Sampling Promoting for Stochastic Human Trajectory Prediction: Guangyi Chen,

Zhenhao Chen,

Shunxing Fan,

Kun Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Guangyi and Chen, Zhenhao and Fan, Shunxing and Zhang, Kun},
  title     = {Unsupervised Sampling Promoting for Stochastic Human Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17874--17884}
}
Safe Latent Diffusion: Mitigating Inappropriate Degeneration in Diffusion Models: Patrick Schramowski,

Manuel Brack,

Björn Deiseroth,

Kristian Kersting; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Schramowski_2023_CVPR,
  author    = {Schramowski, Patrick and Brack, Manuel and Deiseroth, Bj{\"o}rn and Kersting, Kristian},
  title     = {Safe Latent Diffusion: Mitigating Inappropriate Degeneration in Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22522--22531}
}
Superclass Learning With Representation Enhancement: Zeyu Gan,

Suyun Zhao,

Jinlong Kang,

Liyuan Shang,

Hong Chen,

Cuiping Li; [pdf] [supp]
[bibtex]
@InProceedings{Gan_2023_CVPR,
  author    = {Gan, Zeyu and Zhao, Suyun and Kang, Jinlong and Shang, Liyuan and Chen, Hong and Li, Cuiping},
  title     = {Superclass Learning With Representation Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24060--24069}
}
Visual Prompt Tuning for Generative Transfer Learning: Kihyuk Sohn,

Huiwen Chang,

José Lezama,

Luisa Polania,

Han Zhang,

Yuan Hao,

Irfan Essa,

Lu Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sohn_2023_CVPR,
  author    = {Sohn, Kihyuk and Chang, Huiwen and Lezama, Jos{\'e} and Polania, Luisa and Zhang, Han and Hao, Yuan and Essa, Irfan and Jiang, Lu},
  title     = {Visual Prompt Tuning for Generative Transfer Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19840--19851}
}
ReLight My NeRF: A Dataset for Novel View Synthesis and Relighting of Real World Objects: Marco Toschi,

Riccardo De Matteo,

Riccardo Spezialetti,

Daniele De Gregorio,

Luigi Di Stefano,

Samuele Salti; [pdf] [arXiv]
[bibtex]
@InProceedings{Toschi_2023_CVPR,
  author    = {Toschi, Marco and De Matteo, Riccardo and Spezialetti, Riccardo and De Gregorio, Daniele and Di Stefano, Luigi and Salti, Samuele},
  title     = {{ReLight} My {NeRF}: A Dataset for Novel View Synthesis and Relighting of Real World Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20762--20772}
}
Content-Aware Token Sharing for Efficient Semantic Segmentation With Vision Transformers: Chenyang Lu,

Daan de Geus,

Gijs Dubbelman; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Chenyang and de Geus, Daan and Dubbelman, Gijs},
  title     = {Content-Aware Token Sharing for Efficient Semantic Segmentation With Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23631--23640}
}
Are Binary Annotations Sufficient? Video Moment Retrieval via Hierarchical Uncertainty-Based Active Learning: Wei Ji,

Renjie Liang,

Zhedong Zheng,

Wenqiao Zhang,

Shengyu Zhang,

Juncheng Li,

Mengze Li,

Tat-seng Chua; [pdf]
[bibtex]
@InProceedings{Ji_2023_CVPR,
  author    = {Ji, Wei and Liang, Renjie and Zheng, Zhedong and Zhang, Wenqiao and Zhang, Shengyu and Li, Juncheng and Li, Mengze and Chua, Tat-seng},
  title     = {Are Binary Annotations Sufficient? Video Moment Retrieval via Hierarchical Uncertainty-Based Active Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23013--23022}
}
VGFlow: Visibility Guided Flow Network for Human Reposing: Rishabh Jain,

Krishna Kumar Singh,

Mayur Hemani,

Jingwan Lu,

Mausoom Sarkar,

Duygu Ceylan,

Balaji Krishnamurthy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jain_2023_CVPR,
  author    = {Jain, Rishabh and Singh, Krishna Kumar and Hemani, Mayur and Lu, Jingwan and Sarkar, Mausoom and Ceylan, Duygu and Krishnamurthy, Balaji},
  title     = {{VGFlow}: Visibility Guided Flow Network for Human Reposing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21088--21097}
}
Improving Selective Visual Question Answering by Learning From Your Peers: Corentin Dancette,

Spencer Whitehead,

Rishabh Maheshwary,

Ramakrishna Vedantam,

Stefan Scherer,

Xinlei Chen,

Matthieu Cord,

Marcus Rohrbach; [pdf] [supp]
[bibtex]
@InProceedings{Dancette_2023_CVPR,
  author    = {Dancette, Corentin and Whitehead, Spencer and Maheshwary, Rishabh and Vedantam, Ramakrishna and Scherer, Stefan and Chen, Xinlei and Cord, Matthieu and Rohrbach, Marcus},
  title     = {Improving Selective Visual Question Answering by Learning From Your Peers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24049--24059}
}
Look, Radiate, and Learn: Self-Supervised Localisation via Radio-Visual Correspondence: Mohammed Alloulah,

Maximilian Arnold; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alloulah_2023_CVPR,
  author    = {Alloulah, Mohammed and Arnold, Maximilian},
  title     = {Look, Radiate, and Learn: Self-Supervised Localisation via Radio-Visual Correspondence},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17430--17440}
}
Shape-Erased Feature Learning for Visible-Infrared Person Re-Identification: Jiawei Feng,

Ancong Wu,

Wei-Shi Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_CVPR,
  author    = {Feng, Jiawei and Wu, Ancong and Zheng, Wei-Shi},
  title     = {Shape-Erased Feature Learning for Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22752--22761}
}
On Calibrating Semantic Segmentation Models: Analyses and an Algorithm: Dongdong Wang,

Boqing Gong,

Liqiang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Dongdong and Gong, Boqing and Wang, Liqiang},
  title     = {On Calibrating Semantic Segmentation Models: Analyses and an Algorithm},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23652--23662}
}
Visual Atoms: Pre-Training Vision Transformers With Sinusoidal Waves: Sora Takashima,

Ryo Hayamizu,

Nakamasa Inoue,

Hirokatsu Kataoka,

Rio Yokota; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Takashima_2023_CVPR,
  author    = {Takashima, Sora and Hayamizu, Ryo and Inoue, Nakamasa and Kataoka, Hirokatsu and Yokota, Rio},
  title     = {Visual Atoms: Pre-Training Vision Transformers With Sinusoidal Waves},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18579--18588}
}
Masked Autoencoding Does Not Help Natural Language Supervision at Scale: Floris Weers,

Vaishaal Shankar,

Angelos Katharopoulos,

Yinfei Yang,

Tom Gunter; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Weers_2023_CVPR,
  author    = {Weers, Floris and Shankar, Vaishaal and Katharopoulos, Angelos and Yang, Yinfei and Gunter, Tom},
  title     = {Masked Autoencoding Does Not Help Natural Language Supervision at Scale},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23432--23444}
}
Transductive Few-Shot Learning With Prototype-Based Label Propagation by Iterative Graph Refinement: Hao Zhu,

Piotr Koniusz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Hao and Koniusz, Piotr},
  title     = {Transductive Few-Shot Learning With Prototype-Based Label Propagation by Iterative Graph Refinement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23996--24006}
}
Binary Latent Diffusion: Ze Wang,

Jiang Wang,

Zicheng Liu,

Qiang Qiu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Ze and Wang, Jiang and Liu, Zicheng and Qiu, Qiang},
  title     = {Binary Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22576--22585}
}
FLAG3D: A 3D Fitness Activity Dataset With Language Instruction: Yansong Tang,

Jinpeng Liu,

Aoyang Liu,

Bin Yang,

Wenxun Dai,

Yongming Rao,

Jiwen Lu,

Jie Zhou,

Xiu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Yansong and Liu, Jinpeng and Liu, Aoyang and Yang, Bin and Dai, Wenxun and Rao, Yongming and Lu, Jiwen and Zhou, Jie and Li, Xiu},
  title     = {{FLAG3D}: A {3D} Fitness Activity Dataset With Language Instruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22106--22117}
}
NeuralUDF: Learning Unsigned Distance Fields for Multi-View Reconstruction of Surfaces With Arbitrary Topologies: Xiaoxiao Long,

Cheng Lin,

Lingjie Liu,

Yuan Liu,

Peng Wang,

Christian Theobalt,

Taku Komura,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Long_2023_CVPR,
  author    = {Long, Xiaoxiao and Lin, Cheng and Liu, Lingjie and Liu, Yuan and Wang, Peng and Theobalt, Christian and Komura, Taku and Wang, Wenping},
  title     = {{NeuralUDF}: Learning Unsigned Distance Fields for Multi-View Reconstruction of Surfaces With Arbitrary Topologies},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20834--20843}
}
Collaborative Static and Dynamic Vision-Language Streams for Spatio-Temporal Video Grounding: Zihang Lin,

Chaolei Tan,

Jian-Fang Hu,

Zhi Jin,

Tiancai Ye,

Wei-Shi Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Zihang and Tan, Chaolei and Hu, Jian-Fang and Jin, Zhi and Ye, Tiancai and Zheng, Wei-Shi},
  title     = {Collaborative Static and Dynamic Vision-Language Streams for Spatio-Temporal Video Grounding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23100--23109}
}
Residual Degradation Learning Unfolding Framework With Mixing Priors Across Spectral and Spatial for Compressive Spectral Imaging: Yubo Dong,

Dahua Gao,

Tian Qiu,

Yuyan Li,

Minxi Yang,

Guangming Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_CVPR,
  author    = {Dong, Yubo and Gao, Dahua and Qiu, Tian and Li, Yuyan and Yang, Minxi and Shi, Guangming},
  title     = {Residual Degradation Learning Unfolding Framework With Mixing Priors Across Spectral and Spatial for Compressive Spectral Imaging},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22262--22271}
}
GamutMLP: A Lightweight MLP for Color Loss Recovery: Hoang M. Le,

Brian Price,

Scott Cohen,

Michael S. Brown; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Le_2023_CVPR,
  author    = {Le, Hoang M. and Price, Brian and Cohen, Scott and Brown, Michael S.},
  title     = {{GamutMLP}: A Lightweight {MLP} for Color Loss Recovery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18268--18277}
}
Instance-Aware Domain Generalization for Face Anti-Spoofing: Qianyu Zhou,

Ke-Yue Zhang,

Taiping Yao,

Xuequan Lu,

Ran Yi,

Shouhong Ding,

Lizhuang Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Qianyu and Zhang, Ke-Yue and Yao, Taiping and Lu, Xuequan and Yi, Ran and Ding, Shouhong and Ma, Lizhuang},
  title     = {Instance-Aware Domain Generalization for Face Anti-Spoofing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20453--20463}
}
Robust and Scalable Gaussian Process Regression and Its Applications: Yifan Lu,

Jiayi Ma,

Leyuan Fang,

Xin Tian,

Junjun Jiang; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Yifan and Ma, Jiayi and Fang, Leyuan and Tian, Xin and Jiang, Junjun},
  title     = {Robust and Scalable {Gaussian} Process Regression and Its Applications},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21950--21959}
}
Shepherding Slots to Objects: Towards Stable and Robust Object-Centric Learning: Jinwoo Kim,

Janghyuk Choi,

Ho-Jin Choi,

Seon Joo Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Jinwoo and Choi, Janghyuk and Choi, Ho-Jin and Kim, Seon Joo},
  title     = {Shepherding Slots to Objects: Towards Stable and Robust Object-Centric Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19198--19207}
}
High-Fidelity Event-Radiance Recovery via Transient Event Frequency: Jin Han,

Yuta Asano,

Boxin Shi,

Yinqiang Zheng,

Imari Sato; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_CVPR,
  author    = {Han, Jin and Asano, Yuta and Shi, Boxin and Zheng, Yinqiang and Sato, Imari},
  title     = {High-Fidelity Event-Radiance Recovery via Transient Event Frequency},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20616--20625}
}
NeMo: Learning 3D Neural Motion Fields From Multiple Video Instances of the Same Action: Kuan-Chieh Wang,

Zhenzhen Weng,

Maria Xenochristou,

João Pedro Araújo,

Jeffrey Gu,

Karen Liu,

Serena Yeung; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Kuan-Chieh and Weng, Zhenzhen and Xenochristou, Maria and Ara{\'u}jo, Jo{\~a}o Pedro and Gu, Jeffrey and Liu, Karen and Yeung, Serena},
  title     = {{NeMo}: Learning {3D} Neural Motion Fields From Multiple Video Instances of the Same Action},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22129--22138}
}
RIATIG: Reliable and Imperceptible Adversarial Text-to-Image Generation With Natural Prompts: Han Liu,

Yuhao Wu,

Shixuan Zhai,

Bo Yuan,

Ning Zhang; [pdf]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Han and Wu, Yuhao and Zhai, Shixuan and Yuan, Bo and Zhang, Ning},
  title     = {{RIATIG}: Reliable and Imperceptible Adversarial Text-to-Image Generation With Natural Prompts},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20585--20594}
}
GLIGEN: Open-Set Grounded Text-to-Image Generation: Yuheng Li,

Haotian Liu,

Qingyang Wu,

Fangzhou Mu,

Jianwei Yang,

Jianfeng Gao,

Chunyuan Li,

Yong Jae Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yuheng and Liu, Haotian and Wu, Qingyang and Mu, Fangzhou and Yang, Jianwei and Gao, Jianfeng and Li, Chunyuan and Lee, Yong Jae},
  title     = {{GLIGEN}: Open-Set Grounded Text-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22511--22521}
}
Learning Geometry-Aware Representations by Sketching: Hyundo Lee,

Inwoo Hwang,

Hyunsung Go,

Won-Seok Choi,

Kibeom Kim,

Byoung-Tak Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Hyundo and Hwang, Inwoo and Go, Hyunsung and Choi, Won-Seok and Kim, Kibeom and Zhang, Byoung-Tak},
  title     = {Learning Geometry-Aware Representations by Sketching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23315--23326}
}
SVFormer: Semi-Supervised Video Transformer for Action Recognition: Zhen Xing,

Qi Dai,

Han Hu,

Jingjing Chen,

Zuxuan Wu,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xing_2023_CVPR,
  author    = {Xing, Zhen and Dai, Qi and Hu, Han and Chen, Jingjing and Wu, Zuxuan and Jiang, Yu-Gang},
  title     = {{SVFormer}: Semi-Supervised Video Transformer for Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18816--18826}
}
X-Avatar: Expressive Human Avatars: Kaiyue Shen,

Chen Guo,

Manuel Kaufmann,

Juan Jose Zarate,

Julien Valentin,

Jie Song,

Otmar Hilliges; [pdf] [supp]
[bibtex]
@InProceedings{Shen_2023_CVPR, author = {Shen, Kaiyue and Guo, Chen and Kaufmann, Manuel and Zarate, Juan Jose and Valentin, Julien and Song, Jie and Hilliges, Otmar}, title = {{X-Avatar}: Expressive Human Avatars}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16911--16921} }
AccelIR: Task-Aware Image Compression for Accelerating Neural Restoration: Juncheol Ye,

Hyunho Yeo,

Jinwoo Park,

Dongsu Han; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_CVPR, author = {Ye, Juncheol and Yeo, Hyunho and Park, Jinwoo and Han, Dongsu}, title = {{AccelIR}: Task-Aware Image Compression for Accelerating Neural Restoration}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18216--18226} }
BEV-Guided Multi-Modality Fusion for Driving Perception: Yunze Man,

Liang-Yan Gui,

Yu-Xiong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Man_2023_CVPR, author = {Man, Yunze and Gui, Liang-Yan and Wang, Yu-Xiong}, title = {{BEV}-Guided Multi-Modality Fusion for Driving Perception}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21960--21969} }
Proximal Splitting Adversarial Attack for Semantic Segmentation: Jérôme Rony,

Jean-Christophe Pesquet,

Ismail Ben Ayed; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rony_2023_CVPR, author = {Rony, J{\'e}r{\^o}me and Pesquet, Jean-Christophe and Ben Ayed, Ismail}, title = {Proximal Splitting Adversarial Attack for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20524--20533} }
Improved Test-Time Adaptation for Domain Generalization: Liang Chen,

Yong Zhang,

Yibing Song,

Ying Shan,

Lingqiao Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR, author = {Chen, Liang and Zhang, Yong and Song, Yibing and Shan, Ying and Liu, Lingqiao}, title = {Improved Test-Time Adaptation for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24172--24182} }
Correspondence Transformers With Asymmetric Feature Learning and Matching Flow Super-Resolution: Yixuan Sun,

Dongyang Zhao,

Zhangyue Yin,

Yiwen Huang,

Tao Gui,

Wenqiang Zhang,

Weifeng Ge; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_CVPR, author = {Sun, Yixuan and Zhao, Dongyang and Yin, Zhangyue and Huang, Yiwen and Gui, Tao and Zhang, Wenqiang and Ge, Weifeng}, title = {Correspondence Transformers With Asymmetric Feature Learning and Matching Flow Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17787--17796} }
Adjustment and Alignment for Unbiased Open Set Domain Adaptation: Wuyang Li,

Jie Liu,

Bo Han,

Yixuan Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR, author = {Li, Wuyang and Liu, Jie and Han, Bo and Yuan, Yixuan}, title = {Adjustment and Alignment for Unbiased Open Set Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24110--24119} }
ESLAM: Efficient Dense SLAM System Based on Hybrid Representation of Signed Distance Fields: Mohammad Mahdi Johari,

Camilla Carta,

François Fleuret; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Johari_2023_CVPR, author = {Johari, Mohammad Mahdi and Carta, Camilla and Fleuret, Fran{\c{c}}ois}, title = {{ESLAM}: Efficient Dense {SLAM} System Based on Hybrid Representation of Signed Distance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17408--17419} }
Unsupervised Space-Time Network for Temporally-Consistent Segmentation of Multiple Motions: Etienne Meunier,

Patrick Bouthemy; [pdf] [supp]
[bibtex]
@InProceedings{Meunier_2023_CVPR, author = {Meunier, Etienne and Bouthemy, Patrick}, title = {Unsupervised Space-Time Network for Temporally-Consistent Segmentation of Multiple Motions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22139--22148} }
iDisc: Internal Discretization for Monocular Depth Estimation: Luigi Piccinelli,

Christos Sakaridis,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Piccinelli_2023_CVPR, author = {Piccinelli, Luigi and Sakaridis, Christos and Yu, Fisher}, title = {{iDisc}: Internal Discretization for Monocular Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21477--21487} }
Balancing Logit Variation for Long-Tailed Semantic Segmentation: Yuchao Wang,

Jingjing Fei,

Haochen Wang,

Wei Li,

Tianpeng Bao,

Liwei Wu,

Rui Zhao,

Yujun Shen; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Yuchao and Fei, Jingjing and Wang, Haochen and Li, Wei and Bao, Tianpeng and Wu, Liwei and Zhao, Rui and Shen, Yujun}, title = {Balancing Logit Variation for Long-Tailed Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19561--19573} }
Single Image Depth Prediction Made Better: A Multivariate Gaussian Take: Ce Liu,

Suryansh Kumar,

Shuhang Gu,

Radu Timofte,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR, author = {Liu, Ce and Kumar, Suryansh and Gu, Shuhang and Timofte, Radu and Van Gool, Luc}, title = {Single Image Depth Prediction Made Better: A Multivariate {Gaussian} Take}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17346--17356} }
Query-Centric Trajectory Prediction: Zikang Zhou,

Jianping Wang,

Yung-Hui Li,

Yu-Kai Huang; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_CVPR, author = {Zhou, Zikang and Wang, Jianping and Li, Yung-Hui and Huang, Yu-Kai}, title = {Query-Centric Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17863--17873} }
The Enemy of My Enemy Is My Friend: Exploring Inverse Adversaries for Improving Adversarial Training: Junhao Dong,

Seyed-Mohsen Moosavi-Dezfooli,

Jianhuang Lai,

Xiaohua Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_CVPR, author = {Dong, Junhao and Moosavi-Dezfooli, Seyed-Mohsen and Lai, Jianhuang and Xie, Xiaohua}, title = {The Enemy of My Enemy Is My Friend: Exploring Inverse Adversaries for Improving Adversarial Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24678--24687} }
Exploring Motion Ambiguity and Alignment for High-Quality Video Frame Interpolation: Kun Zhou,

Wenbo Li,

Xiaoguang Han,

Jiangbo Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR, author = {Zhou, Kun and Li, Wenbo and Han, Xiaoguang and Lu, Jiangbo}, title = {Exploring Motion Ambiguity and Alignment for High-Quality Video Frame Interpolation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22169--22179} }
Knowledge Distillation for 6D Pose Estimation by Aligning Distributions of Local Predictions: Shuxuan Guo,

Yinlin Hu,

Jose M. Alvarez,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_CVPR, author = {Guo, Shuxuan and Hu, Yinlin and Alvarez, Jose M. and Salzmann, Mathieu}, title = {Knowledge Distillation for {6D} Pose Estimation by Aligning Distributions of Local Predictions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18633--18642} }
Adaptive Annealing for Robust Geometric Estimation: Chitturi Sidhartha,

Lalit Manam,

Venu Madhav Govindu; [pdf] [supp]
[bibtex]
@InProceedings{Sidhartha_2023_CVPR, author = {Sidhartha, Chitturi and Manam, Lalit and Govindu, Venu Madhav}, title = {Adaptive Annealing for Robust Geometric Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21929--21939} }
PointListNet: Deep Learning on 3D Point Lists: Hehe Fan,

Linchao Zhu,

Yi Yang,

Mohan Kankanhalli; [pdf] [supp]
[bibtex]
@InProceedings{Fan_2023_CVPR, author = {Fan, Hehe and Zhu, Linchao and Yang, Yi and Kankanhalli, Mohan}, title = {{PointListNet}: Deep Learning on {3D} Point Lists}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17692--17701} }
Upcycling Models Under Domain and Category Shift: Sanqing Qu,

Tianpei Zou,

Florian Röhrbein,

Cewu Lu,

Guang Chen,

Dacheng Tao,

Changjun Jiang; [pdf] [supp]
[bibtex]
@InProceedings{Qu_2023_CVPR, author = {Qu, Sanqing and Zou, Tianpei and R{\"o}hrbein, Florian and Lu, Cewu and Chen, Guang and Tao, Dacheng and Jiang, Changjun}, title = {Upcycling Models Under Domain and Category Shift}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20019--20028} }
Single Domain Generalization for LiDAR Semantic Segmentation: Hyeonseong Kim,

Yoonsu Kang,

Changgyoon Oh,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_CVPR, author = {Kim, Hyeonseong and Kang, Yoonsu and Oh, Changgyoon and Yoon, Kuk-Jin}, title = {Single Domain Generalization for {LiDAR} Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17587--17598} }
SLACK: Stable Learning of Augmentations With Cold-Start and KL Regularization: Juliette Marrie,

Michael Arbel,

Diane Larlus,

Julien Mairal; [pdf] [supp]
[bibtex]
@InProceedings{Marrie_2023_CVPR, author = {Marrie, Juliette and Arbel, Michael and Larlus, Diane and Mairal, Julien}, title = {{SLACK}: Stable Learning of Augmentations With Cold-Start and {KL} Regularization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24306--24314} }
Gradient Norm Aware Minimization Seeks First-Order Flatness and Improves Generalization: Xingxuan Zhang,

Renzhe Xu,

Han Yu,

Hao Zou,

Peng Cui; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xingxuan and Xu, Renzhe and Yu, Han and Zou, Hao and Cui, Peng}, title = {Gradient Norm Aware Minimization Seeks First-Order Flatness and Improves Generalization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20247--20257} }
Latency Matters: Real-Time Action Forecasting Transformer: Harshayu Girase,

Nakul Agarwal,

Chiho Choi,

Karttikeya Mangalam; [pdf] [supp]
[bibtex]
@InProceedings{Girase_2023_CVPR, author = {Girase, Harshayu and Agarwal, Nakul and Choi, Chiho and Mangalam, Karttikeya}, title = {Latency Matters: Real-Time Action Forecasting Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18759--18769} }
HierVL: Learning Hierarchical Video-Language Embeddings: Kumar Ashutosh,

Rohit Girdhar,

Lorenzo Torresani,

Kristen Grauman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ashutosh_2023_CVPR, author = {Ashutosh, Kumar and Girdhar, Rohit and Torresani, Lorenzo and Grauman, Kristen}, title = {{HierVL}: Learning Hierarchical Video-Language Embeddings}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {23066--23078} }
GraVoS: Voxel Selection for 3D Point-Cloud Detection: Oren Shrout,

Yizhak Ben-Shabat,

Ayellet Tal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shrout_2023_CVPR, author = {Shrout, Oren and Ben-Shabat, Yizhak and Tal, Ayellet}, title = {{GraVoS}: Voxel Selection for {3D} Point-Cloud Detection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21684--21693} }
RobustNeRF: Ignoring Distractors With Robust Losses: Sara Sabour,

Suhani Vora,

Daniel Duckworth,

Ivan Krasin,

David J. Fleet,

Andrea Tagliasacchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sabour_2023_CVPR, author = {Sabour, Sara and Vora, Suhani and Duckworth, Daniel and Krasin, Ivan and Fleet, David J. and Tagliasacchi, Andrea}, title = {{RobustNeRF}: Ignoring Distractors With Robust Losses}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20626--20636} }
Spherical Transformer for LiDAR-Based 3D Recognition: Xin Lai,

Yukang Chen,

Fanbin Lu,

Jianhui Liu,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lai_2023_CVPR, author = {Lai, Xin and Chen, Yukang and Lu, Fanbin and Liu, Jianhui and Jia, Jiaya}, title = {Spherical Transformer for {LiDAR}-Based {3D} Recognition}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17545--17555} }
Watch or Listen: Robust Audio-Visual Speech Recognition With Visual Corruption Modeling and Reliability Scoring: Joanna Hong,

Minsu Kim,

Jeongsoo Choi,

Yong Man Ro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_CVPR, author = {Hong, Joanna and Kim, Minsu and Choi, Jeongsoo and Ro, Yong Man}, title = {Watch or Listen: Robust Audio-Visual Speech Recognition With Visual Corruption Modeling and Reliability Scoring}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18783--18794} }
VisFusion: Visibility-Aware Online 3D Scene Reconstruction From Videos: Huiyu Gao,

Wei Mao,

Miaomiao Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_CVPR, author = {Gao, Huiyu and Mao, Wei and Liu, Miaomiao}, title = {{VisFusion}: Visibility-Aware Online {3D} Scene Reconstruction From Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17317--17326} }
Towards Transferable Targeted Adversarial Examples: Zhibo Wang,

Hongshan Yang,

Yunhe Feng,

Peng Sun,

Hengchang Guo,

Zhifei Zhang,

Kui Ren; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Zhibo and Yang, Hongshan and Feng, Yunhe and Sun, Peng and Guo, Hengchang and Zhang, Zhifei and Ren, Kui}, title = {Towards Transferable Targeted Adversarial Examples}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20534--20543} }
C-SFDA: A Curriculum Learning Aided Self-Training Framework for Efficient Source Free Domain Adaptation: Nazmul Karim,

Niluthpol Chowdhury Mithun,

Abhinav Rajvanshi,

Han-pang Chiu,

Supun Samarasekera,

Nazanin Rahnavard; [pdf] [supp]
[bibtex]
@InProceedings{Karim_2023_CVPR, author = {Karim, Nazmul and Mithun, Niluthpol Chowdhury and Rajvanshi, Abhinav and Chiu, Han-pang and Samarasekera, Supun and Rahnavard, Nazanin}, title = {{C-SFDA}: A Curriculum Learning Aided Self-Training Framework for Efficient Source Free Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24120--24131} }
Modeling the Distributional Uncertainty for Salient Object Detection Models: Xinyu Tian,

Jing Zhang,

Mochu Xiang,

Yuchao Dai; [pdf]
[bibtex]
@InProceedings{Tian_2023_CVPR, author = {Tian, Xinyu and Zhang, Jing and Xiang, Mochu and Dai, Yuchao}, title = {Modeling the Distributional Uncertainty for Salient Object Detection Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19660--19670} }
Kernel Aware Resampler: Michael Bernasconi,

Abdelaziz Djelouah,

Farnood Salehi,

Markus Gross,

Christopher Schroers; [pdf] [supp]
[bibtex]
@InProceedings{Bernasconi_2023_CVPR, author = {Bernasconi, Michael and Djelouah, Abdelaziz and Salehi, Farnood and Gross, Markus and Schroers, Christopher}, title = {Kernel Aware Resampler}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22347--22355} }
LaserMix for Semi-Supervised LiDAR Semantic Segmentation: Lingdong Kong,

Jiawei Ren,

Liang Pan,

Ziwei Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kong_2023_CVPR, author = {Kong, Lingdong and Ren, Jiawei and Pan, Liang and Liu, Ziwei}, title = {{LaserMix} for Semi-Supervised {LiDAR} Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21705--21715} }
Complementary Intrinsics From Neural Radiance Fields and CNNs for Outdoor Scene Relighting: Siqi Yang,

Xuanning Cui,

Yongjie Zhu,

Jiajun Tang,

Si Li,

Zhaofei Yu,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_CVPR, author = {Yang, Siqi and Cui, Xuanning and Zhu, Yongjie and Tang, Jiajun and Li, Si and Yu, Zhaofei and Shi, Boxin}, title = {Complementary Intrinsics From Neural Radiance Fields and {CNNs} for Outdoor Scene Relighting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16600--16609} }
Azimuth Super-Resolution for FMCW Radar in Autonomous Driving: Yu-Jhe Li,

Shawn Hunt,

Jinhyung Park,

Matthew O’Toole,

Kris Kitani; [pdf]
[bibtex]
@InProceedings{Li_2023_CVPR, author = {Li, Yu-Jhe and Hunt, Shawn and Park, Jinhyung and O{\textquoteright}Toole, Matthew and Kitani, Kris}, title = {Azimuth Super-Resolution for {FMCW} Radar in Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17504--17513} }
VQACL: A Novel Visual Question Answering Continual Learning Setting: Xi Zhang,

Feifei Zhang,

Changsheng Xu; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xi and Zhang, Feifei and Xu, Changsheng}, title = {{VQACL}: A Novel Visual Question Answering Continual Learning Setting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19102--19112} }
High-Res Facial Appearance Capture From Polarized Smartphone Images: Dejan Azinović,

Olivier Maury,

Christophe Hery,

Matthias Nießner,

Justus Thies; [pdf] [supp]
[bibtex]
@InProceedings{Azinovic_2023_CVPR, author = {Azinovi{\'c}, Dejan and Maury, Olivier and Hery, Christophe and Nie{\ss}ner, Matthias and Thies, Justus}, title = {High-Res Facial Appearance Capture From Polarized Smartphone Images}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16836--16846} }
JAWS: Just a Wild Shot for Cinematic Transfer in Neural Radiance Fields: Xi Wang,

Robin Courant,

Jinglei Shi,

Eric Marchand,

Marc Christie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Xi and Courant, Robin and Shi, Jinglei and Marchand, Eric and Christie, Marc}, title = {{JAWS}: Just a Wild Shot for Cinematic Transfer in Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16933--16942} }
EfficientSCI: Densely Connected Network With Space-Time Factorization for Large-Scale Video Snapshot Compressive Imaging: Lishun Wang,

Miao Cao,

Xin Yuan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Lishun and Cao, Miao and Yuan, Xin}, title = {{EfficientSCI}: Densely Connected Network With Space-Time Factorization for Large-Scale Video Snapshot Compressive Imaging}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18477--18486} }
MotionTrack: Learning Robust Short-Term and Long-Term Motions for Multi-Object Tracking: Zheng Qin,

Sanping Zhou,

Le Wang,

Jinghai Duan,

Gang Hua,

Wei Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qin_2023_CVPR, author = {Qin, Zheng and Zhou, Sanping and Wang, Le and Duan, Jinghai and Hua, Gang and Tang, Wei}, title = {{MotionTrack}: Learning Robust Short-Term and Long-Term Motions for Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17939--17948} }
3D Registration With Maximal Cliques: Xiyu Zhang,

Jiaqi Yang,

Shikun Zhang,

Yanning Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Xiyu and Yang, Jiaqi and Zhang, Shikun and Zhang, Yanning}, title = {{3D} Registration With Maximal Cliques}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17745--17754} }
MetaPortrait: Identity-Preserving Talking Head Generation With Fast Personalized Adaptation: Bowen Zhang,

Chenyang Qi,

Pan Zhang,

Bo Zhang,

HsiangTao Wu,

Dong Chen,

Qifeng Chen,

Yong Wang,

Fang Wen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Bowen and Qi, Chenyang and Zhang, Pan and Zhang, Bo and Wu, HsiangTao and Chen, Dong and Chen, Qifeng and Wang, Yong and Wen, Fang}, title = {{MetaPortrait}: Identity-Preserving Talking Head Generation With Fast Personalized Adaptation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22096--22105} }
UniHCP: A Unified Model for Human-Centric Perceptions: Yuanzheng Ci,

Yizhou Wang,

Meilin Chen,

Shixiang Tang,

Lei Bai,

Feng Zhu,

Rui Zhao,

Fengwei Yu,

Donglian Qi,

Wanli Ouyang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ci_2023_CVPR, author = {Ci, Yuanzheng and Wang, Yizhou and Chen, Meilin and Tang, Shixiang and Bai, Lei and Zhu, Feng and Zhao, Rui and Yu, Fengwei and Qi, Donglian and Ouyang, Wanli}, title = {{UniHCP}: A Unified Model for Human-Centric Perceptions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17840--17852} }
VoxelNeXt: Fully Sparse VoxelNet for 3D Object Detection and Tracking: Yukang Chen,

Jianhui Liu,

Xiangyu Zhang,

Xiaojuan Qi,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR, author = {Chen, Yukang and Liu, Jianhui and Zhang, Xiangyu and Qi, Xiaojuan and Jia, Jiaya}, title = {{VoxelNeXt}: Fully Sparse {VoxelNet} for {3D} Object Detection and Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21674--21683} }
Bias in Pruned Vision Models: In-Depth Analysis and Countermeasures: Eugenia Iofinova,

Alexandra Peste,

Dan Alistarh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Iofinova_2023_CVPR, author = {Iofinova, Eugenia and Peste, Alexandra and Alistarh, Dan}, title = {Bias in Pruned Vision Models: In-Depth Analysis and Countermeasures}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24364--24373} }
AttentionShift: Iteratively Estimated Part-Based Attention Map for Pointly Supervised Instance Segmentation: Mingxiang Liao,

Zonghao Guo,

Yuze Wang,

Peng Yuan,

Bailan Feng,

Fang Wan; [pdf] [supp]
[bibtex]
@InProceedings{Liao_2023_CVPR, author = {Liao, Mingxiang and Guo, Zonghao and Wang, Yuze and Yuan, Peng and Feng, Bailan and Wan, Fang}, title = {{AttentionShift}: Iteratively Estimated Part-Based Attention Map for Pointly Supervised Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19519--19528} }
PlaneDepth: Self-Supervised Depth Estimation via Orthogonal Planes: Ruoyu Wang,

Zehao Yu,

Shenghua Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Ruoyu and Yu, Zehao and Gao, Shenghua}, title = {{PlaneDepth}: Self-Supervised Depth Estimation via Orthogonal Planes}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21425--21434} }
Semantic-Conditional Diffusion Networks for Image Captioning: Jianjie Luo,

Yehao Li,

Yingwei Pan,

Ting Yao,

Jianlin Feng,

Hongyang Chao,

Tao Mei; [pdf] [arXiv]
[bibtex]
@InProceedings{Luo_2023_CVPR, author = {Luo, Jianjie and Li, Yehao and Pan, Yingwei and Yao, Ting and Feng, Jianlin and Chao, Hongyang and Mei, Tao}, title = {Semantic-Conditional Diffusion Networks for Image Captioning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {23359--23368} }
TranSG: Transformer-Based Skeleton Graph Prototype Contrastive Learning With Structure-Trajectory Prompted Reconstruction for Person Re-Identification: Haocong Rao,

Chunyan Miao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rao_2023_CVPR, author = {Rao, Haocong and Miao, Chunyan}, title = {{TranSG}: Transformer-Based Skeleton Graph Prototype Contrastive Learning With Structure-Trajectory Prompted Reconstruction for Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22118--22128} }
All Are Worth Words: A ViT Backbone for Diffusion Models: Fan Bao,

Shen Nie,

Kaiwen Xue,

Yue Cao,

Chongxuan Li,

Hang Su,

Jun Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2023_CVPR, author = {Bao, Fan and Nie, Shen and Xue, Kaiwen and Cao, Yue and Li, Chongxuan and Su, Hang and Zhu, Jun}, title = {All Are Worth Words: A {ViT} Backbone for Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22669--22679} }
SteerNeRF: Accelerating NeRF Rendering via Smooth Viewpoint Trajectory: Sicheng Li,

Hao Li,

Yue Wang,

Yiyi Liao,

Lu Yu; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR, author = {Li, Sicheng and Li, Hao and Wang, Yue and Liao, Yiyi and Yu, Lu}, title = {{SteerNeRF}: Accelerating {NeRF} Rendering via Smooth Viewpoint Trajectory}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20701--20711} }
Spatial-Frequency Mutual Learning for Face Super-Resolution: Chenyang Wang,

Junjun Jiang,

Zhiwei Zhong,

Xianming Liu; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Chenyang and Jiang, Junjun and Zhong, Zhiwei and Liu, Xianming}, title = {Spatial-Frequency Mutual Learning for Face Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22356--22366} }
Being Comes From Not-Being: Open-Vocabulary Text-to-Motion Generation With Wordless Training: Junfan Lin,

Jianlong Chang,

Lingbo Liu,

Guanbin Li,

Liang Lin,

Qi Tian,

Chang-Wen Chen; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_CVPR, author = {Lin, Junfan and Chang, Jianlong and Liu, Lingbo and Li, Guanbin and Lin, Liang and Tian, Qi and Chen, Chang-Wen}, title = {Being Comes From Not-Being: Open-Vocabulary Text-to-Motion Generation With Wordless Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {23222--23231} }
MonoHuman: Animatable Human Neural Field From Monocular Video: Zhengming Yu,

Wei Cheng,

Xian Liu,

Wayne Wu,

Kwan-Yee Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR, author = {Yu, Zhengming and Cheng, Wei and Liu, Xian and Wu, Wayne and Lin, Kwan-Yee}, title = {{MonoHuman}: Animatable Human Neural Field From Monocular Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16943--16953} }
SINE: Semantic-Driven Image-Based NeRF Editing With Prior-Guided Editing Field: Chong Bao,

Yinda Zhang,

Bangbang Yang,

Tianxing Fan,

Zesong Yang,

Hujun Bao,

Guofeng Zhang,

Zhaopeng Cui; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2023_CVPR, author = {Bao, Chong and Zhang, Yinda and Yang, Bangbang and Fan, Tianxing and Yang, Zesong and Bao, Hujun and Zhang, Guofeng and Cui, Zhaopeng}, title = {{SINE}: Semantic-Driven Image-Based {NeRF} Editing With Prior-Guided Editing Field}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20919--20929} }
MetaCLUE: Towards Comprehensive Visual Metaphors Research: Arjun R. Akula,

Brendan Driscoll,

Pradyumna Narayana,

Soravit Changpinyo,

Zhiwei Jia,

Suyash Damle,

Garima Pruthi,

Sugato Basu,

Leonidas Guibas,

William T. Freeman,

Yuanzhen Li,

Varun Jampani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Akula_2023_CVPR, author = {Akula, Arjun R. and Driscoll, Brendan and Narayana, Pradyumna and Changpinyo, Soravit and Jia, Zhiwei and Damle, Suyash and Pruthi, Garima and Basu, Sugato and Guibas, Leonidas and Freeman, William T. and Li, Yuanzhen and Jampani, Varun}, title = {{MetaCLUE}: Towards Comprehensive Visual Metaphors Research}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {23201--23211} }
Towards End-to-End Generative Modeling of Long Videos With Memory-Efficient Bidirectional Transformers: Jaehoon Yoo,

Semin Kim,

Doyup Lee,

Chiheon Kim,

Seunghoon Hong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yoo_2023_CVPR, author = {Yoo, Jaehoon and Kim, Semin and Lee, Doyup and Kim, Chiheon and Hong, Seunghoon}, title = {Towards End-to-End Generative Modeling of Long Videos With Memory-Efficient Bidirectional Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22888--22897} }
HaLP: Hallucinating Latent Positives for Skeleton-Based Self-Supervised Learning of Actions: Anshul Shah,

Aniket Roy,

Ketul Shah,

Shlok Mishra,

David Jacobs,

Anoop Cherian,

Rama Chellappa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shah_2023_CVPR, author = {Shah, Anshul and Roy, Aniket and Shah, Ketul and Mishra, Shlok and Jacobs, David and Cherian, Anoop and Chellappa, Rama}, title = {{HaLP}: Hallucinating Latent Positives for Skeleton-Based Self-Supervised Learning of Actions}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18846--18856} }
FLEX: Full-Body Grasping Without Full-Body Grasps: Purva Tendulkar,

Dídac Surís,

Carl Vondrick; [pdf] [supp]
[bibtex]
@InProceedings{Tendulkar_2023_CVPR,
  author    = {Tendulkar, Purva and Sur{\'\i}s, D{\'\i}dac and Vondrick, Carl},
  title     = {{FLEX}: Full-Body Grasping Without Full-Body Grasps},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21179--21189},
}
EVA: Exploring the Limits of Masked Visual Representation Learning at Scale: Yuxin Fang,

Wen Wang,

Binhui Xie,

Quan Sun,

Ledell Wu,

Xinggang Wang,

Tiejun Huang,

Xinlong Wang,

Yue Cao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2023_CVPR,
  author    = {Fang, Yuxin and Wang, Wen and Xie, Binhui and Sun, Quan and Wu, Ledell and Wang, Xinggang and Huang, Tiejun and Wang, Xinlong and Cao, Yue},
  title     = {{EVA}: Exploring the Limits of Masked Visual Representation Learning at Scale},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19358--19369},
}
Discrete Point-Wise Attack Is Not Enough: Generalized Manifold Adversarial Attack for Face Recognition: Qian Li,

Yuxiao Hu,

Ye Liu,

Dongxiao Zhang,

Xin Jin,

Yuntian Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Qian and Hu, Yuxiao and Liu, Ye and Zhang, Dongxiao and Jin, Xin and Chen, Yuntian},
  title     = {Discrete Point-Wise Attack Is Not Enough: Generalized Manifold Adversarial Attack for Face Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20575--20584},
}
FREDOM: Fairness Domain Adaptation Approach to Semantic Scene Understanding: Thanh-Dat Truong,

Ngan Le,

Bhiksha Raj,

Jackson Cothren,

Khoa Luu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Truong_2023_CVPR,
  author    = {Truong, Thanh-Dat and Le, Ngan and Raj, Bhiksha and Cothren, Jackson and Luu, Khoa},
  title     = {{FREDOM}: Fairness Domain Adaptation Approach to Semantic Scene Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19988--19997},
}
IMP: Iterative Matching and Pose Estimation With Adaptive Pooling: Fei Xue,

Ignas Budvytis,

Roberto Cipolla; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xue_2023_CVPR,
  author    = {Xue, Fei and Budvytis, Ignas and Cipolla, Roberto},
  title     = {{IMP}: Iterative Matching and Pose Estimation With Adaptive Pooling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21317--21326},
}
PATS: Patch Area Transportation With Subdivision for Local Feature Matching: Junjie Ni,

Yijin Li,

Zhaoyang Huang,

Hongsheng Li,

Hujun Bao,

Zhaopeng Cui,

Guofeng Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ni_2023_CVPR,
  author    = {Ni, Junjie and Li, Yijin and Huang, Zhaoyang and Li, Hongsheng and Bao, Hujun and Cui, Zhaopeng and Zhang, Guofeng},
  title     = {{PATS}: Patch Area Transportation With Subdivision for Local Feature Matching},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17776--17786},
}
MEDIC: Remove Model Backdoors via Importance Driven Cloning: Qiuling Xu,

Guanhong Tao,

Jean Honorio,

Yingqi Liu,

Shengwei An,

Guangyu Shen,

Siyuan Cheng,

Xiangyu Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Qiuling and Tao, Guanhong and Honorio, Jean and Liu, Yingqi and An, Shengwei and Shen, Guangyu and Cheng, Siyuan and Zhang, Xiangyu},
  title     = {{MEDIC}: Remove Model Backdoors via Importance Driven Cloning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20485--20494},
}
SimpleNet: A Simple Network for Image Anomaly Detection and Localization: Zhikang Liu,

Yiming Zhou,

Yuansheng Xu,

Zilei Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Zhikang and Zhou, Yiming and Xu, Yuansheng and Wang, Zilei},
  title     = {{SimpleNet}: A Simple Network for Image Anomaly Detection and Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20402--20411},
}
G-MSM: Unsupervised Multi-Shape Matching With Graph-Based Affinity Priors: Marvin Eisenberger,

Aysim Toker,

Laura Leal-Taixé,

Daniel Cremers; [pdf] [supp]
[bibtex]
@InProceedings{Eisenberger_2023_CVPR,
  author    = {Eisenberger, Marvin and Toker, Aysim and Leal-Taix{\'e}, Laura and Cremers, Daniel},
  title     = {{G-MSM}: Unsupervised Multi-Shape Matching With Graph-Based Affinity Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22762--22772},
}
Mixed Autoencoder for Self-Supervised Visual Representation Learning: Kai Chen,

Zhili Liu,

Lanqing Hong,

Hang Xu,

Zhenguo Li,

Dit-Yan Yeung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Kai and Liu, Zhili and Hong, Lanqing and Xu, Hang and Li, Zhenguo and Yeung, Dit-Yan},
  title     = {Mixed Autoencoder for Self-Supervised Visual Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22742--22751},
}
ProphNet: Efficient Agent-Centric Motion Forecasting With Anchor-Informed Proposals: Xishun Wang,

Tong Su,

Fang Da,

Xiaodong Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Xishun and Su, Tong and Da, Fang and Yang, Xiaodong},
  title     = {{ProphNet}: Efficient Agent-Centric Motion Forecasting With Anchor-Informed Proposals},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21995--22003},
}
Learning Multi-Modal Class-Specific Tokens for Weakly Supervised Dense Object Localization: Lian Xu,

Wanli Ouyang,

Mohammed Bennamoun,

Farid Boussaid,

Dan Xu; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Lian and Ouyang, Wanli and Bennamoun, Mohammed and Boussaid, Farid and Xu, Dan},
  title     = {Learning Multi-Modal Class-Specific Tokens for Weakly Supervised Dense Object Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19596--19605},
}
GlassesGAN: Eyewear Personalization Using Synthetic Appearance Discovery and Targeted Subspace Modeling: Richard Plesh,

Peter Peer,

Vitomir Struc; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Plesh_2023_CVPR,
  author    = {Plesh, Richard and Peer, Peter and Struc, Vitomir},
  title     = {{GlassesGAN}: Eyewear Personalization Using Synthetic Appearance Discovery and Targeted Subspace Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16847--16857},
}
Deep Hashing With Minimal-Distance-Separated Hash Centers: Liangdao Wang,

Yan Pan,

Cong Liu,

Hanjiang Lai,

Jian Yin,

Ye Liu; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Liangdao and Pan, Yan and Liu, Cong and Lai, Hanjiang and Yin, Jian and Liu, Ye},
  title     = {Deep Hashing With Minimal-Distance-Separated Hash Centers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23455--23464},
}
VL-SAT: Visual-Linguistic Semantics Assisted Training for 3D Semantic Scene Graph Prediction in Point Cloud: Ziqin Wang,

Bowen Cheng,

Lichen Zhao,

Dong Xu,

Yang Tang,

Lu Sheng; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Ziqin and Cheng, Bowen and Zhao, Lichen and Xu, Dong and Tang, Yang and Sheng, Lu},
  title     = {{VL-SAT}: Visual-Linguistic Semantics Assisted Training for {3D} Semantic Scene Graph Prediction in Point Cloud},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21560--21569},
}
Learning Emotion Representations From Verbal and Nonverbal Communication: Sitao Zhang,

Yimu Pan,

James Z. Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Sitao and Pan, Yimu and Wang, James Z.},
  title     = {Learning Emotion Representations From Verbal and Nonverbal Communication},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18993--19004},
}
Architectural Backdoors in Neural Networks: Mikel Bober-Irizar,

Ilia Shumailov,

Yiren Zhao,

Robert Mullins,

Nicolas Papernot; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bober-Irizar_2023_CVPR,
  author    = {Bober-Irizar, Mikel and Shumailov, Ilia and Zhao, Yiren and Mullins, Robert and Papernot, Nicolas},
  title     = {Architectural Backdoors in Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24595--24604},
}
Semantic Human Parsing via Scalable Semantic Transfer Over Multiple Label Domains: Jie Yang,

Chaoqun Wang,

Zhen Li,

Junle Wang,

Ruimao Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Jie and Wang, Chaoqun and Li, Zhen and Wang, Junle and Zhang, Ruimao},
  title     = {Semantic Human Parsing via Scalable Semantic Transfer Over Multiple Label Domains},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19424--19433},
}
GEN: Pushing the Limits of Softmax-Based Out-of-Distribution Detection: Xixi Liu,

Yaroslava Lochman,

Christopher Zach; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xixi and Lochman, Yaroslava and Zach, Christopher},
  title     = {{GEN}: Pushing the Limits of Softmax-Based Out-of-Distribution Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23946--23955},
}
Learnable Skeleton-Aware 3D Point Cloud Sampling: Cheng Wen,

Baosheng Yu,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Wen_2023_CVPR,
  author    = {Wen, Cheng and Yu, Baosheng and Tao, Dacheng},
  title     = {Learnable Skeleton-Aware {3D} Point Cloud Sampling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17671--17681},
}
Boundary-Enhanced Co-Training for Weakly Supervised Semantic Segmentation: Shenghai Rong,

Bohai Tu,

Zilei Wang,

Junjie Li; [pdf] [supp]
[bibtex]
@InProceedings{Rong_2023_CVPR,
  author    = {Rong, Shenghai and Tu, Bohai and Wang, Zilei and Li, Junjie},
  title     = {Boundary-Enhanced Co-Training for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19574--19584},
}
Sample-Level Multi-View Graph Clustering: Yuze Tan,

Yixi Liu,

Shudong Huang,

Wentao Feng,

Jiancheng Lv; [pdf]
[bibtex]
@InProceedings{Tan_2023_CVPR,
  author    = {Tan, Yuze and Liu, Yixi and Huang, Shudong and Feng, Wentao and Lv, Jiancheng},
  title     = {Sample-Level Multi-View Graph Clustering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23966--23975},
}
Next3D: Generative Neural Texture Rasterization for 3D-Aware Head Avatars: Jingxiang Sun,

Xuan Wang,

Lizhen Wang,

Xiaoyu Li,

Yong Zhang,

Hongwen Zhang,

Yebin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Jingxiang and Wang, Xuan and Wang, Lizhen and Li, Xiaoyu and Zhang, Yong and Zhang, Hongwen and Liu, Yebin},
  title     = {{Next3D}: Generative Neural Texture Rasterization for {3D}-Aware Head Avatars},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20991--21002},
}
Linking Garment With Person via Semantically Associated Landmarks for Virtual Try-On: Keyu Yan,

Tingwei Gao,

Hui Zhang,

Chengjun Xie; [pdf] [supp]
[bibtex]
@InProceedings{Yan_2023_CVPR,
  author    = {Yan, Keyu and Gao, Tingwei and Zhang, Hui and Xie, Chengjun},
  title     = {Linking Garment With Person via Semantically Associated Landmarks for Virtual Try-On},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17194--17204},
}
Devil's on the Edges: Selective Quad Attention for Scene Graph Generation: Deunsol Jung,

Sanghyun Kim,

Won Hwa Kim,

Minsu Cho; [pdf] [supp]
[bibtex]
@InProceedings{Jung_2023_CVPR,
  author    = {Jung, Deunsol and Kim, Sanghyun and Kim, Won Hwa and Cho, Minsu},
  title     = {Devil's on the Edges: Selective Quad Attention for Scene Graph Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18664--18674},
}
NIFF: Alleviating Forgetting in Generalized Few-Shot Object Detection via Neural Instance Feature Forging: Karim Guirguis,

Johannes Meier,

George Eskandar,

Matthias Kayser,

Bin Yang,

Jürgen Beyerer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guirguis_2023_CVPR,
  author    = {Guirguis, Karim and Meier, Johannes and Eskandar, George and Kayser, Matthias and Yang, Bin and Beyerer, J{\"u}rgen},
  title     = {{NIFF}: Alleviating Forgetting in Generalized Few-Shot Object Detection via Neural Instance Feature Forging},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24193--24202},
}
Post-Processing Temporal Action Detection: Sauradip Nag,

Xiatian Zhu,

Yi-Zhe Song,

Tao Xiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nag_2023_CVPR,
  author    = {Nag, Sauradip and Zhu, Xiatian and Song, Yi-Zhe and Xiang, Tao},
  title     = {Post-Processing Temporal Action Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18837--18845},
}
ConZIC: Controllable Zero-Shot Image Captioning by Sampling-Based Polishing: Zequn Zeng,

Hao Zhang,

Ruiying Lu,

Dongsheng Wang,

Bo Chen,

Zhengjue Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zeng_2023_CVPR,
  author    = {Zeng, Zequn and Zhang, Hao and Lu, Ruiying and Wang, Dongsheng and Chen, Bo and Wang, Zhengjue},
  title     = {{ConZIC}: Controllable Zero-Shot Image Captioning by Sampling-Based Polishing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23465--23476},
}
Learning From Noisy Labels With Decoupled Meta Label Purifier: Yuanpeng Tu,

Boshen Zhang,

Yuxi Li,

Liang Liu,

Jian Li,

Yabiao Wang,

Chengjie Wang,

Cai Rong Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tu_2023_CVPR,
  author    = {Tu, Yuanpeng and Zhang, Boshen and Li, Yuxi and Liu, Liang and Li, Jian and Wang, Yabiao and Wang, Chengjie and Zhao, Cai Rong},
  title     = {Learning From Noisy Labels With Decoupled Meta Label Purifier},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19934--19943},
}
Language in a Bottle: Language Model Guided Concept Bottlenecks for Interpretable Image Classification: Yue Yang,

Artemis Panagopoulou,

Shenghao Zhou,

Daniel Jin,

Chris Callison-Burch,

Mark Yatskar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Yue and Panagopoulou, Artemis and Zhou, Shenghao and Jin, Daniel and Callison-Burch, Chris and Yatskar, Mark},
  title     = {Language in a Bottle: Language Model Guided Concept Bottlenecks for Interpretable Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19187--19197},
}
ViPLO: Vision Transformer Based Pose-Conditioned Self-Loop Graph for Human-Object Interaction Detection: Jeeseung Park,

Jin-Woo Park,

Jong-Seok Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_CVPR,
  author    = {Park, Jeeseung and Park, Jin-Woo and Lee, Jong-Seok},
  title     = {{ViPLO}: Vision Transformer Based Pose-Conditioned Self-Loop Graph for Human-Object Interaction Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17152--17162},
}
MSINet: Twins Contrastive Search of Multi-Scale Interaction for Object ReID: Jianyang Gu,

Kai Wang,

Hao Luo,

Chen Chen,

Wei Jiang,

Yuqiang Fang,

Shanghang Zhang,

Yang You,

Jian Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gu_2023_CVPR,
  author    = {Gu, Jianyang and Wang, Kai and Luo, Hao and Chen, Chen and Jiang, Wei and Fang, Yuqiang and Zhang, Shanghang and You, Yang and Zhao, Jian},
  title     = {{MSINet}: Twins Contrastive Search of Multi-Scale Interaction for Object {ReID}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19243--19253},
}
WIRE: Wavelet Implicit Neural Representations: Vishwanath Saragadam,

Daniel LeJeune,

Jasper Tan,

Guha Balakrishnan,

Ashok Veeraraghavan,

Richard G. Baraniuk; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saragadam_2023_CVPR,
  author    = {Saragadam, Vishwanath and LeJeune, Daniel and Tan, Jasper and Balakrishnan, Guha and Veeraraghavan, Ashok and Baraniuk, Richard G.},
  title     = {{WIRE}: Wavelet Implicit Neural Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18507--18516},
}
Bringing Inputs to Shared Domains for 3D Interacting Hands Recovery in the Wild: Gyeongsik Moon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moon_2023_CVPR,
  author    = {Moon, Gyeongsik},
  title     = {Bringing Inputs to Shared Domains for {3D} Interacting Hands Recovery in the Wild},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17028--17037},
}
Deep Deterministic Uncertainty: A New Simple Baseline: Jishnu Mukhoti,

Andreas Kirsch,

Joost van Amersfoort,

Philip H.S. Torr,

Yarin Gal; [pdf] [supp]
[bibtex]
@InProceedings{Mukhoti_2023_CVPR,
  author    = {Mukhoti, Jishnu and Kirsch, Andreas and van Amersfoort, Joost and Torr, Philip H. S. and Gal, Yarin},
  title     = {Deep Deterministic Uncertainty: A New Simple Baseline},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24384--24394},
}
NeRDi: Single-View NeRF Synthesis With Language-Guided Diffusion As General Image Priors: Congyue Deng,

Chiyu “Max” Jiang,

Charles R. Qi,

Xinchen Yan,

Yin Zhou,

Leonidas Guibas,

Dragomir Anguelov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2023_CVPR,
  author    = {Deng, Congyue and Jiang, Chiyu {\textquotedblleft}Max{\textquotedblright} and Qi, Charles R. and Yan, Xinchen and Zhou, Yin and Guibas, Leonidas and Anguelov, Dragomir},
  title     = {{NeRDi}: Single-View {NeRF} Synthesis With Language-Guided Diffusion As General Image Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20637--20647},
}
InstantAvatar: Learning Avatars From Monocular Video in 60 Seconds: Tianjian Jiang,

Xu Chen,

Jie Song,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Tianjian and Chen, Xu and Song, Jie and Hilliges, Otmar},
  title     = {{InstantAvatar}: Learning Avatars From Monocular Video in 60 Seconds},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16922--16932},
}
You Only Segment Once: Towards Real-Time Panoptic Segmentation: Jie Hu,

Linyan Huang,

Tianhe Ren,

Shengchuan Zhang,

Rongrong Ji,

Liujuan Cao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Jie and Huang, Linyan and Ren, Tianhe and Zhang, Shengchuan and Ji, Rongrong and Cao, Liujuan},
  title     = {You Only Segment Once: Towards Real-Time Panoptic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17819--17829},
}
Robust Single Image Reflection Removal Against Adversarial Attacks: Zhenbo Song,

Zhenyuan Zhang,

Kaihao Zhang,

Wenhan Luo,

Zhaoxin Fan,

Wenqi Ren,

Jianfeng Lu; [pdf]
[bibtex]
@InProceedings{Song_2023_CVPR,
  author    = {Song, Zhenbo and Zhang, Zhenyuan and Zhang, Kaihao and Luo, Wenhan and Fan, Zhaoxin and Ren, Wenqi and Lu, Jianfeng},
  title     = {Robust Single Image Reflection Removal Against Adversarial Attacks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24688--24698},
}
PartMix: Regularization Strategy To Learn Part Discovery for Visible-Infrared Person Re-Identification: Minsu Kim,

Seungryong Kim,

Jungin Park,

Seongheon Park,

Kwanghoon Sohn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Minsu and Kim, Seungryong and Park, Jungin and Park, Seongheon and Sohn, Kwanghoon},
  title     = {{PartMix}: Regularization Strategy To Learn Part Discovery for Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18621--18632},
}
Feature Representation Learning With Adaptive Displacement Generation and Transformer Fusion for Micro-Expression Recognition: Zhijun Zhai,

Jianhui Zhao,

Chengjiang Long,

Wenju Xu,

Shuangjiang He,

Huijuan Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_CVPR,
  author    = {Zhai, Zhijun and Zhao, Jianhui and Long, Chengjiang and Xu, Wenju and He, Shuangjiang and Zhao, Huijuan},
  title     = {Feature Representation Learning With Adaptive Displacement Generation and Transformer Fusion for Micro-Expression Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22086--22095},
}
ViewNet: A Novel Projection-Based Backbone With View Pooling for Few-Shot Point Cloud Classification: Jiajing Chen,

Minmin Yang,

Senem Velipasalar; [pdf]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Jiajing and Yang, Minmin and Velipasalar, Senem},
  title     = {{ViewNet}: A Novel Projection-Based Backbone With View Pooling for Few-Shot Point Cloud Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17652--17660},
}
ANetQA: A Large-Scale Benchmark for Fine-Grained Compositional Reasoning Over Untrimmed Videos: Zhou Yu,

Lixiang Zheng,

Zhou Zhao,

Fei Wu,

Jianping Fan,

Kui Ren,

Jun Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Zhou and Zheng, Lixiang and Zhao, Zhou and Wu, Fei and Fan, Jianping and Ren, Kui and Yu, Jun},
  title     = {{ANetQA}: A Large-Scale Benchmark for Fine-Grained Compositional Reasoning Over Untrimmed Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23191--23200},
}
CLAMP: Prompt-Based Contrastive Learning for Connecting Language and Animal Pose: Xu Zhang,

Wen Wang,

Zhe Chen,

Yufei Xu,

Jing Zhang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Xu and Wang, Wen and Chen, Zhe and Xu, Yufei and Zhang, Jing and Tao, Dacheng},
  title     = {{CLAMP}: Prompt-Based Contrastive Learning for Connecting Language and Animal Pose},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23272--23281},
}
Standing Between Past and Future: Spatio-Temporal Modeling for Multi-Camera 3D Multi-Object Tracking: Ziqi Pang,

Jie Li,

Pavel Tokmakov,

Dian Chen,

Sergey Zagoruyko,

Yu-Xiong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pang_2023_CVPR,
  author    = {Pang, Ziqi and Li, Jie and Tokmakov, Pavel and Chen, Dian and Zagoruyko, Sergey and Wang, Yu-Xiong},
  title     = {Standing Between Past and Future: Spatio-Temporal Modeling for Multi-Camera {3D} Multi-Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17928--17938},
}
TTA-COPE: Test-Time Adaptation for Category-Level Object Pose Estimation: Taeyeop Lee,

Jonathan Tremblay,

Valts Blukis,

Bowen Wen,

Byeong-Uk Lee,

Inkyu Shin,

Stan Birchfield,

In So Kweon,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Taeyeop and Tremblay, Jonathan and Blukis, Valts and Wen, Bowen and Lee, Byeong-Uk and Shin, Inkyu and Birchfield, Stan and Kweon, In So and Yoon, Kuk-Jin},
  title     = {{TTA-COPE}: Test-Time Adaptation for Category-Level Object Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21285--21295},
}
Geometry and Uncertainty-Aware 3D Point Cloud Class-Incremental Semantic Segmentation: Yuwei Yang,

Munawar Hayat,

Zhao Jin,

Chao Ren,

Yinjie Lei; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Yuwei and Hayat, Munawar and Jin, Zhao and Ren, Chao and Lei, Yinjie},
  title     = {Geometry and Uncertainty-Aware {3D} Point Cloud Class-Incremental Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21759--21768},
}
Cooperation or Competition: Avoiding Player Domination for Multi-Target Robustness via Adaptive Budgets: Yimu Wang,

Dinghuai Zhang,

Yihan Wu,

Heng Huang,

Hongyang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yimu and Zhang, Dinghuai and Wu, Yihan and Huang, Heng and Zhang, Hongyang},
  title     = {Cooperation or Competition: Avoiding Player Domination for Multi-Target Robustness via Adaptive Budgets},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20564--20574},
}
CAT: LoCalization and IdentificAtion Cascade Detection Transformer for Open-World Object Detection: Shuailei Ma,

Yuefeng Wang,

Ying Wei,

Jiaqi Fan,

Thomas H. Li,

Hongli Liu,

Fanbing Lv; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Shuailei and Wang, Yuefeng and Wei, Ying and Fan, Jiaqi and Li, Thomas H. and Liu, Hongli and Lv, Fanbing},
  title     = {{CAT}: {LoCalization} and {IdentificAtion} Cascade Detection Transformer for Open-World Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19681--19690},
}
TruFor: Leveraging All-Round Clues for Trustworthy Image Forgery Detection and Localization: Fabrizio Guillaro,

Davide Cozzolino,

Avneesh Sud,

Nicholas Dufour,

Luisa Verdoliva; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guillaro_2023_CVPR,
  author    = {Guillaro, Fabrizio and Cozzolino, Davide and Sud, Avneesh and Dufour, Nicholas and Verdoliva, Luisa},
  title     = {{TruFor}: Leveraging All-Round Clues for Trustworthy Image Forgery Detection and Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20606--20615},
}
LANA: A Language-Capable Navigator for Instruction Following and Generation: Xiaohan Wang,

Wenguan Wang,

Jiayi Shao,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Xiaohan and Wang, Wenguan and Shao, Jiayi and Yang, Yi},
  title     = {{LANA}: A Language-Capable Navigator for Instruction Following and Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19048--19058},
}
CAPE: Camera View Position Embedding for Multi-View 3D Object Detection: Kaixin Xiong,

Shi Gong,

Xiaoqing Ye,

Xiao Tan,

Ji Wan,

Errui Ding,

Jingdong Wang,

Xiang Bai; [pdf] [arXiv]
[bibtex]
@InProceedings{Xiong_2023_CVPR,
  author    = {Xiong, Kaixin and Gong, Shi and Ye, Xiaoqing and Tan, Xiao and Wan, Ji and Ding, Errui and Wang, Jingdong and Bai, Xiang},
  title     = {{CAPE}: Camera View Position Embedding for Multi-View {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21570--21579},
}
Bi-Directional Distribution Alignment for Transductive Zero-Shot Learning: Zhicai Wang,

Yanbin Hao,

Tingting Mu,

Ouxiang Li,

Shuo Wang,

Xiangnan He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Zhicai and Hao, Yanbin and Mu, Tingting and Li, Ouxiang and Wang, Shuo and He, Xiangnan},
  title     = {Bi-Directional Distribution Alignment for Transductive Zero-Shot Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19893--19902},
}
FlexNeRF: Photorealistic Free-Viewpoint Rendering of Moving Humans From Sparse Views: Vinoj Jayasundara,

Amit Agrawal,

Nicolas Heron,

Abhinav Shrivastava,

Larry S. Davis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jayasundara_2023_CVPR,
  author    = {Jayasundara, Vinoj and Agrawal, Amit and Heron, Nicolas and Shrivastava, Abhinav and Davis, Larry S.},
  title     = {{FlexNeRF}: Photorealistic Free-Viewpoint Rendering of Moving Humans From Sparse Views},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21118--21127},
}
Towards Better Gradient Consistency for Neural Signed Distance Functions via Level Set Alignment: Baorui Ma,

Junsheng Zhou,

Yu-Shen Liu,

Zhizhong Han; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Baorui and Zhou, Junsheng and Liu, Yu-Shen and Han, Zhizhong},
  title     = {Towards Better Gradient Consistency for Neural Signed Distance Functions via Level Set Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17724--17734},
}
Zero-Shot Everything Sketch-Based Image Retrieval, and in Explainable Style: Fengyin Lin,

Mingkang Li,

Da Li,

Timothy Hospedales,

Yi-Zhe Song,

Yonggang Qi; [pdf] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Fengyin and Li, Mingkang and Li, Da and Hospedales, Timothy and Song, Yi-Zhe and Qi, Yonggang},
  title     = {Zero-Shot Everything Sketch-Based Image Retrieval, and in Explainable Style},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23349--23358},
}
Graph Representation for Order-Aware Visual Transformation: Yue Qiu,

Yanjun Sun,

Fumiya Matsuzawa,

Kenji Iwata,

Hirokatsu Kataoka; [pdf] [supp]
[bibtex]
@InProceedings{Qiu_2023_CVPR,
  author    = {Qiu, Yue and Sun, Yanjun and Matsuzawa, Fumiya and Iwata, Kenji and Kataoka, Hirokatsu},
  title     = {Graph Representation for Order-Aware Visual Transformation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22793--22802},
}
StarCraftImage: A Dataset for Prototyping Spatial Reasoning Methods for Multi-Agent Environments: Sean Kulinski,

Nicholas R. Waytowich,

James Z. Hare,

David I. Inouye; [pdf] [supp]
[bibtex]
@InProceedings{Kulinski_2023_CVPR,
  author    = {Kulinski, Sean and Waytowich, Nicholas R. and Hare, James Z. and Inouye, David I.},
  title     = {{StarCraftImage}: A Dataset for Prototyping Spatial Reasoning Methods for Multi-Agent Environments},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22004--22013},
}
Quality-Aware Pre-Trained Models for Blind Image Quality Assessment: Kai Zhao,

Kun Yuan,

Ming Sun,

Mading Li,

Xing Wen; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Kai and Yuan, Kun and Sun, Ming and Li, Mading and Wen, Xing},
  title     = {Quality-Aware Pre-Trained Models for Blind Image Quality Assessment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22302--22313},
}
Network Expansion for Practical Training Acceleration: Ning Ding,

Yehui Tang,

Kai Han,

Chao Xu,

Yunhe Wang; [pdf]
[bibtex]
@InProceedings{Ding_2023_CVPR,
  author    = {Ding, Ning and Tang, Yehui and Han, Kai and Xu, Chao and Wang, Yunhe},
  title     = {Network Expansion for Practical Training Acceleration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20269--20279},
}
FCC: Feature Clusters Compression for Long-Tailed Visual Recognition: Jian Li,

Ziyao Meng,

Daqian Shi,

Rui Song,

Xiaolei Diao,

Jingwen Wang,

Hao Xu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jian and Meng, Ziyao and Shi, Daqian and Song, Rui and Diao, Xiaolei and Wang, Jingwen and Xu, Hao},
  title     = {{FCC}: Feature Clusters Compression for Long-Tailed Visual Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24080--24089},
}
Rethinking the Learning Paradigm for Dynamic Facial Expression Recognition: Hanyang Wang,

Bo Li,

Shuang Wu,

Siyuan Shen,

Feng Liu,

Shouhong Ding,

Aimin Zhou; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Hanyang and Li, Bo and Wu, Shuang and Shen, Siyuan and Liu, Feng and Ding, Shouhong and Zhou, Aimin},
  title     = {Rethinking the Learning Paradigm for Dynamic Facial Expression Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17958--17968},
}
Self-Supervised Learning for Multimodal Non-Rigid 3D Shape Matching: Dongliang Cao,

Florian Bernard; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_CVPR,
  author    = {Cao, Dongliang and Bernard, Florian},
  title     = {Self-Supervised Learning for Multimodal Non-Rigid {3D} Shape Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17735--17744},
}
Ham2Pose: Animating Sign Language Notation Into Pose Sequences: Rotem Shalev Arkushin,

Amit Moryossef,

Ohad Fried; [pdf] [supp]
[bibtex]
@InProceedings{Arkushin_2023_CVPR,
  author    = {Arkushin, Rotem Shalev and Moryossef, Amit and Fried, Ohad},
  title     = {{Ham2Pose}: Animating Sign Language Notation Into Pose Sequences},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21046--21056},
}
Open-Set Likelihood Maximization for Few-Shot Learning: Malik Boudiaf,

Etienne Bennequin,

Myriam Tami,

Antoine Toubhans,

Pablo Piantanida,

Celine Hudelot,

Ismail Ben Ayed; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Boudiaf_2023_CVPR,
  author    = {Boudiaf, Malik and Bennequin, Etienne and Tami, Myriam and Toubhans, Antoine and Piantanida, Pablo and Hudelot, Celine and Ben Ayed, Ismail},
  title     = {Open-Set Likelihood Maximization for Few-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24007--24016},
}
Boosting Accuracy and Robustness of Student Models via Adaptive Adversarial Distillation: Bo Huang,

Mingyang Chen,

Yi Wang,

Junda Lu,

Minhao Cheng,

Wei Wang; [pdf]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Bo and Chen, Mingyang and Wang, Yi and Lu, Junda and Cheng, Minhao and Wang, Wei},
  title     = {Boosting Accuracy and Robustness of Student Models via Adaptive Adversarial Distillation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24668--24677},
}
PixHt-Lab: Pixel Height Based Light Effect Generation for Image Compositing: Yichen Sheng,

Jianming Zhang,

Julien Philip,

Yannick Hold-Geoffroy,

Xin Sun,

He Zhang,

Lu Ling,

Bedrich Benes; [pdf] [supp]
[bibtex]
@InProceedings{Sheng_2023_CVPR,
  author    = {Sheng, Yichen and Zhang, Jianming and Philip, Julien and Hold-Geoffroy, Yannick and Sun, Xin and Zhang, He and Ling, Lu and Benes, Bedrich},
  title     = {{PixHt-Lab}: Pixel Height Based Light Effect Generation for Image Compositing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16643--16653},
}
RGB No More: Minimally-Decoded JPEG Vision Transformers: Jeongsoo Park,

Justin Johnson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_CVPR,
  author    = {Park, Jeongsoo and Johnson, Justin},
  title     = {{RGB} No More: Minimally-Decoded {JPEG} Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22334--22346},
}
Hybrid Active Learning via Deep Clustering for Video Action Detection: Aayush J. Rana,

Yogesh S. Rawat; [pdf] [supp]
[bibtex]
@InProceedings{Rana_2023_CVPR,
  author    = {Rana, Aayush J. and Rawat, Yogesh S.},
  title     = {Hybrid Active Learning via Deep Clustering for Video Action Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18867--18877},
}
Fine-Grained Image-Text Matching by Cross-Modal Hard Aligning Network: Zhengxin Pan,

Fangyu Wu,

Bailing Zhang; [pdf]
[bibtex]
@InProceedings{Pan_2023_CVPR,
  author    = {Pan, Zhengxin and Wu, Fangyu and Zhang, Bailing},
  title     = {Fine-Grained Image-Text Matching by Cross-Modal Hard Aligning Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19275--19284},
}
Sparsifiner: Learning Sparse Instance-Dependent Attention for Efficient Vision Transformers: Cong Wei,

Brendan Duke,

Ruowei Jiang,

Parham Aarabi,

Graham W. Taylor,

Florian Shkurti; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Cong and Duke, Brendan and Jiang, Ruowei and Aarabi, Parham and Taylor, Graham W. and Shkurti, Florian},
  title     = {Sparsifiner: Learning Sparse Instance-Dependent Attention for Efficient Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22680--22689},
}
Structured Sparsity Learning for Efficient Video Super-Resolution: Bin Xia,

Jingwen He,

Yulun Zhang,

Yitong Wang,

Yapeng Tian,

Wenming Yang,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_CVPR,
  author    = {Xia, Bin and He, Jingwen and Zhang, Yulun and Wang, Yitong and Tian, Yapeng and Yang, Wenming and Van Gool, Luc},
  title     = {Structured Sparsity Learning for Efficient Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22638--22647},
}
"Seeing" Electric Network Frequency From Events: Lexuan Xu,

Guang Hua,

Haijian Zhang,

Lei Yu,

Ning Qiao; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Lexuan and Hua, Guang and Zhang, Haijian and Yu, Lei and Qiao, Ning},
  title     = {{``Seeing''} Electric Network Frequency From Events},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18022--18031},
}
MMVC: Learned Multi-Mode Video Compression With Block-Based Prediction Mode Selection and Density-Adaptive Entropy Coding: Bowen Liu,

Yu Chen,

Rakesh Chowdary Machineni,

Shiyu Liu,

Hun-Seok Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Bowen and Chen, Yu and Machineni, Rakesh Chowdary and Liu, Shiyu and Kim, Hun-Seok},
  title     = {{MMVC}: Learned Multi-Mode Video Compression With Block-Based Prediction Mode Selection and Density-Adaptive Entropy Coding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18487--18496},
}
Omni Aggregation Networks for Lightweight Image Super-Resolution: Hang Wang,

Xuanhong Chen,

Bingbing Ni,

Yutian Liu,

Jinfan Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Hang and Chen, Xuanhong and Ni, Bingbing and Liu, Yutian and Liu, Jinfan},
  title     = {Omni Aggregation Networks for Lightweight Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22378--22387},
}
Exploring the Effect of Primitives for Compositional Generalization in Vision-and-Language: Chuanhao Li,

Zhen Li,

Chenchen Jing,

Yunde Jia,

Yuwei Wu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Chuanhao and Li, Zhen and Jing, Chenchen and Jia, Yunde and Wu, Yuwei},
  title     = {Exploring the Effect of Primitives for Compositional Generalization in Vision-and-Language},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19092--19101},
}
DC2: Dual-Camera Defocus Control by Learning To Refocus: Hadi Alzayer,

Abdullah Abuolaim,

Leung Chun Chan,

Yang Yang,

Ying Chen Lou,

Jia-Bin Huang,

Abhishek Kar; [pdf] [supp]
[bibtex]
@InProceedings{Alzayer_2023_CVPR,
  author    = {Alzayer, Hadi and Abuolaim, Abdullah and Chan, Leung Chun and Yang, Yang and Lou, Ying Chen and Huang, Jia-Bin and Kar, Abhishek},
  title     = {{DC2}: Dual-Camera Defocus Control by Learning To Refocus},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21488--21497},
}
Looking Through the Glass: Neural Surface Reconstruction Against High Specular Reflections: Jiaxiong Qiu,

Peng-Tao Jiang,

Yifan Zhu,

Ze-Xin Yin,

Ming-Ming Cheng,

Bo Ren; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qiu_2023_CVPR,
  author    = {Qiu, Jiaxiong and Jiang, Peng-Tao and Zhu, Yifan and Yin, Ze-Xin and Cheng, Ming-Ming and Ren, Bo},
  title     = {Looking Through the Glass: Neural Surface Reconstruction Against High Specular Reflections},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20823--20833},
}
PartSLIP: Low-Shot Part Segmentation for 3D Point Clouds via Pretrained Image-Language Models: Minghua Liu,

Yinhao Zhu,

Hong Cai,

Shizhong Han,

Zhan Ling,

Fatih Porikli,

Hao Su; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Minghua and Zhu, Yinhao and Cai, Hong and Han, Shizhong and Ling, Zhan and Porikli, Fatih and Su, Hao},
  title     = {{PartSLIP}: Low-Shot Part Segmentation for {3D} Point Clouds via Pretrained Image-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21736--21746},
}
MAGVLT: Masked Generative Vision-and-Language Transformer: Sungwoong Kim,

Daejin Jo,

Donghoon Lee,

Jongmin Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Sungwoong and Jo, Daejin and Lee, Donghoon and Kim, Jongmin},
  title     = {{MAGVLT}: Masked Generative Vision-and-Language Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23338--23348},
}
Decoupling Human and Camera Motion From Videos in the Wild: Vickie Ye,

Georgios Pavlakos,

Jitendra Malik,

Angjoo Kanazawa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_CVPR,
  author    = {Ye, Vickie and Pavlakos, Georgios and Malik, Jitendra and Kanazawa, Angjoo},
  title     = {Decoupling Human and Camera Motion From Videos in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21222--21232},
}
DetCLIPv2: Scalable Open-Vocabulary Object Detection Pre-Training via Word-Region Alignment: Lewei Yao,

Jianhua Han,

Xiaodan Liang,

Dan Xu,

Wei Zhang,

Zhenguo Li,

Hang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yao_2023_CVPR,
  author    = {Yao, Lewei and Han, Jianhua and Liang, Xiaodan and Xu, Dan and Zhang, Wei and Li, Zhenguo and Xu, Hang},
  title     = {{DetCLIPv2}: Scalable Open-Vocabulary Object Detection Pre-Training via Word-Region Alignment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23497--23506},
}
GrowSP: Unsupervised Semantic Segmentation of 3D Point Clouds: Zihui Zhang,

Bo Yang,

Bing Wang,

Bo Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zihui and Yang, Bo and Wang, Bing and Li, Bo},
  title     = {{GrowSP}: Unsupervised Semantic Segmentation of {3D} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17619--17629},
}
One-Stage 3D Whole-Body Mesh Recovery With Component Aware Transformer: Jing Lin,

Ailing Zeng,

Haoqian Wang,

Lei Zhang,

Yu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Jing and Zeng, Ailing and Wang, Haoqian and Zhang, Lei and Li, Yu},
  title     = {One-Stage {3D} Whole-Body Mesh Recovery With Component Aware Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21159--21168},
}
Masked Jigsaw Puzzle: A Versatile Position Embedding for Vision Transformers: Bin Ren,

Yahui Liu,

Yue Song,

Wei Bi,

Rita Cucchiara,

Nicu Sebe,

Wei Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_CVPR,
  author    = {Ren, Bin and Liu, Yahui and Song, Yue and Bi, Wei and Cucchiara, Rita and Sebe, Nicu and Wang, Wei},
  title     = {Masked Jigsaw Puzzle: A Versatile Position Embedding for Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20382--20391},
}
LayoutDiffusion: Controllable Diffusion Model for Layout-to-Image Generation: Guangcong Zheng,

Xianpan Zhou,

Xuewei Li,

Zhongang Qi,

Ying Shan,

Xi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Guangcong and Zhou, Xianpan and Li, Xuewei and Qi, Zhongang and Shan, Ying and Li, Xi},
  title     = {{LayoutDiffusion}: Controllable Diffusion Model for Layout-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22490--22499},
}
DISC: Learning From Noisy Labels via Dynamic Instance-Specific Selection and Correction: Yifan Li,

Hu Han,

Shiguang Shan,

Xilin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yifan and Han, Hu and Shan, Shiguang and Chen, Xilin},
  title     = {{DISC}: Learning From Noisy Labels via Dynamic Instance-Specific Selection and Correction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24070--24079},
}
Imagen Editor and EditBench: Advancing and Evaluating Text-Guided Image Inpainting: Su Wang,

Chitwan Saharia,

Ceslee Montgomery,

Jordi Pont-Tuset,

Shai Noy,

Stefano Pellegrini,

Yasumasa Onoe,

Sarah Laszlo,

David J. Fleet,

Radu Soricut,

Jason Baldridge,

Mohammad Norouzi,

Peter Anderson,

William Chan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Su and Saharia, Chitwan and Montgomery, Ceslee and Pont-Tuset, Jordi and Noy, Shai and Pellegrini, Stefano and Onoe, Yasumasa and Laszlo, Sarah and Fleet, David J. and Soricut, Radu and Baldridge, Jason and Norouzi, Mohammad and Anderson, Peter and Chan, William},
  title     = {{Imagen Editor} and {EditBench}: Advancing and Evaluating Text-Guided Image Inpainting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18359--18369},
}
Text With Knowledge Graph Augmented Transformer for Video Captioning: Xin Gu,

Guang Chen,

Yufei Wang,

Libo Zhang,

Tiejian Luo,

Longyin Wen; [pdf] [arXiv]
[bibtex]
@InProceedings{Gu_2023_CVPR,
  author    = {Gu, Xin and Chen, Guang and Wang, Yufei and Zhang, Libo and Luo, Tiejian and Wen, Longyin},
  title     = {Text With Knowledge Graph Augmented Transformer for Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18941--18951},
}
Devil Is in the Queries: Advancing Mask Transformers for Real-World Medical Image Segmentation and Out-of-Distribution Localization: Mingze Yuan,

Yingda Xia,

Hexin Dong,

Zifan Chen,

Jiawen Yao,

Mingyan Qiu,

Ke Yan,

Xiaoli Yin,

Yu Shi,

Xin Chen,

Zaiyi Liu,

Bin Dong,

Jingren Zhou,

Le Lu,

Ling Zhang,

Li Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_CVPR,
  author    = {Yuan, Mingze and Xia, Yingda and Dong, Hexin and Chen, Zifan and Yao, Jiawen and Qiu, Mingyan and Yan, Ke and Yin, Xiaoli and Shi, Yu and Chen, Xin and Liu, Zaiyi and Dong, Bin and Zhou, Jingren and Lu, Le and Zhang, Ling and Zhang, Li},
  title     = {Devil Is in the Queries: Advancing Mask Transformers for Real-World Medical Image Segmentation and Out-of-Distribution Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23879--23889},
}
T-SEA: Transfer-Based Self-Ensemble Attack on Object Detection: Hao Huang,

Ziyan Chen,

Huanran Chen,

Yongtao Wang,

Kevin Zhang; [pdf]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Hao and Chen, Ziyan and Chen, Huanran and Wang, Yongtao and Zhang, Kevin},
  title     = {{T-SEA}: Transfer-Based Self-Ensemble Attack on Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20514--20523},
}
PSVT: End-to-End Multi-Person 3D Pose and Shape Estimation With Progressive Video Transformers: Zhongwei Qiu,

Qiansheng Yang,

Jian Wang,

Haocheng Feng,

Junyu Han,

Errui Ding,

Chang Xu,

Dongmei Fu,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qiu_2023_CVPR,
  author    = {Qiu, Zhongwei and Yang, Qiansheng and Wang, Jian and Feng, Haocheng and Han, Junyu and Ding, Errui and Xu, Chang and Fu, Dongmei and Wang, Jingdong},
  title     = {{PSVT}: End-to-End Multi-Person {3D} Pose and Shape Estimation With Progressive Video Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21254--21263},
}
Unifying Vision, Text, and Layout for Universal Document Processing: Zineng Tang,

Ziyi Yang,

Guoxin Wang,

Yuwei Fang,

Yang Liu,

Chenguang Zhu,

Michael Zeng,

Cha Zhang,

Mohit Bansal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Zineng and Yang, Ziyi and Wang, Guoxin and Fang, Yuwei and Liu, Yang and Zhu, Chenguang and Zeng, Michael and Zhang, Cha and Bansal, Mohit},
  title     = {Unifying Vision, Text, and Layout for Universal Document Processing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19254--19264},
}
SparsePose: Sparse-View Camera Pose Regression and Refinement: Samarth Sinha,

Jason Y. Zhang,

Andrea Tagliasacchi,

Igor Gilitschenski,

David B. Lindell; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sinha_2023_CVPR,
  author    = {Sinha, Samarth and Zhang, Jason Y. and Tagliasacchi, Andrea and Gilitschenski, Igor and Lindell, David B.},
  title     = {{SparsePose}: Sparse-View Camera Pose Regression and Refinement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21349--21359},
}
Flow Supervision for Deformable NeRF: Chaoyang Wang,

Lachlan Ewen MacDonald,

László A. Jeni,

Simon Lucey; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Chaoyang and MacDonald, Lachlan Ewen and Jeni, L{\'a}szl{\'o} A. and Lucey, Simon},
  title     = {Flow Supervision for Deformable {NeRF}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21128--21137},
}
Zero-Shot Text-to-Parameter Translation for Game Character Auto-Creation: Rui Zhao,

Wei Li,

Zhipeng Hu,

Lincheng Li,

Zhengxia Zou,

Zhenwei Shi,

Changjie Fan; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Rui and Li, Wei and Hu, Zhipeng and Li, Lincheng and Zou, Zhengxia and Shi, Zhenwei and Fan, Changjie},
  title     = {Zero-Shot Text-to-Parameter Translation for Game Character Auto-Creation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21013--21023},
}
PIVOT: Prompting for Video Continual Learning: Andrés Villa,

Juan León Alcázar,

Motasem Alfarra,

Kumail Alhamoud,

Julio Hurtado,

Fabian Caba Heilbron,

Alvaro Soto,

Bernard Ghanem; [pdf] [supp]
[bibtex]
@InProceedings{Villa_2023_CVPR,
  author    = {Villa, Andr{\'e}s and Alc{\'a}zar, Juan Le{\'o}n and Alfarra, Motasem and Alhamoud, Kumail and Hurtado, Julio and Heilbron, Fabian Caba and Soto, Alvaro and Ghanem, Bernard},
  title     = {{PIVOT}: Prompting for Video Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24214--24223},
}
Panoptic Video Scene Graph Generation: Jingkang Yang,

Wenxuan Peng,

Xiangtai Li,

Zujin Guo,

Liangyu Chen,

Bo Li,

Zheng Ma,

Kaiyang Zhou,

Wayne Zhang,

Chen Change Loy,

Ziwei Liu; [pdf]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Jingkang and Peng, Wenxuan and Li, Xiangtai and Guo, Zujin and Chen, Liangyu and Li, Bo and Ma, Zheng and Zhou, Kaiyang and Zhang, Wayne and Loy, Chen Change and Liu, Ziwei},
  title     = {Panoptic Video Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18675--18685},
}
Understanding Imbalanced Semantic Segmentation Through Neural Collapse: Zhisheng Zhong,

Jiequan Cui,

Yibo Yang,

Xiaoyang Wu,

Xiaojuan Qi,

Xiangyu Zhang,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhong_2023_CVPR,
  author    = {Zhong, Zhisheng and Cui, Jiequan and Yang, Yibo and Wu, Xiaoyang and Qi, Xiaojuan and Zhang, Xiangyu and Jia, Jiaya},
  title     = {Understanding Imbalanced Semantic Segmentation Through Neural Collapse},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19550--19560},
}
HOICLIP: Efficient Knowledge Transfer for HOI Detection With Vision-Language Models: Shan Ning,

Longtian Qiu,

Yongfei Liu,

Xuming He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ning_2023_CVPR,
  author    = {Ning, Shan and Qiu, Longtian and Liu, Yongfei and He, Xuming},
  title     = {{HOICLIP}: Efficient Knowledge Transfer for {HOI} Detection With Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23507--23517},
}
Focused and Collaborative Feedback Integration for Interactive Image Segmentation: Qiaoqiao Wei,

Hui Zhang,

Jun-Hai Yong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Qiaoqiao and Zhang, Hui and Yong, Jun-Hai},
  title     = {Focused and Collaborative Feedback Integration for Interactive Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18643--18652},
}
Class Prototypes Based Contrastive Learning for Classifying Multi-Label and Fine-Grained Educational Videos: Rohit Gupta,

Anirban Roy,

Claire Christensen,

Sujeong Kim,

Sarah Gerard,

Madeline Cincebeaux,

Ajay Divakaran,

Todd Grindal,

Mubarak Shah; [pdf] [supp]
[bibtex]
@InProceedings{Gupta_2023_CVPR,
  author    = {Gupta, Rohit and Roy, Anirban and Christensen, Claire and Kim, Sujeong and Gerard, Sarah and Cincebeaux, Madeline and Divakaran, Ajay and Grindal, Todd and Shah, Mubarak},
  title     = {Class Prototypes Based Contrastive Learning for Classifying Multi-Label and Fine-Grained Educational Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19923--19933},
}
Source-Free Adaptive Gaze Estimation by Uncertainty Reduction: Xin Cai,

Jiabei Zeng,

Shiguang Shan,

Xilin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_CVPR,
  author    = {Cai, Xin and Zeng, Jiabei and Shan, Shiguang and Chen, Xilin},
  title     = {Source-Free Adaptive Gaze Estimation by Uncertainty Reduction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22035--22045},
}
SuperDisco: Super-Class Discovery Improves Visual Recognition for the Long-Tail: Yingjun Du,

Jiayi Shen,

Xiantong Zhen,

Cees G. M. Snoek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Du_2023_CVPR,
  author    = {Du, Yingjun and Shen, Jiayi and Zhen, Xiantong and Snoek, Cees G. M.},
  title     = {{SuperDisco}: Super-Class Discovery Improves Visual Recognition for the Long-Tail},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19944--19954},
}
Im2Hands: Learning Attentive Implicit Representation of Interacting Two-Hand Shapes: Jihyun Lee,

Minhyuk Sung,

Honggyu Choi,

Tae-Kyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_CVPR,
  author    = {Lee, Jihyun and Sung, Minhyuk and Choi, Honggyu and Kim, Tae-Kyun},
  title     = {{Im2Hands}: Learning Attentive Implicit Representation of Interacting Two-Hand Shapes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21169--21178},
}
Long-Term Visual Localization With Mobile Sensors: Shen Yan,

Yu Liu,

Long Wang,

Zehong Shen,

Zhen Peng,

Haomin Liu,

Maojun Zhang,

Guofeng Zhang,

Xiaowei Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Yan_2023_CVPR,
  author    = {Yan, Shen and Liu, Yu and Wang, Long and Shen, Zehong and Peng, Zhen and Liu, Haomin and Zhang, Maojun and Zhang, Guofeng and Zhou, Xiaowei},
  title     = {Long-Term Visual Localization With Mobile Sensors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17245--17255},
}
Data-Efficient Large Scale Place Recognition With Graded Similarity Supervision: María Leyva-Vallina,

Nicola Strisciuglio,

Nicolai Petkov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Leyva-Vallina_2023_CVPR,
  author    = {Leyva-Vallina, Mar{\'\i}a and Strisciuglio, Nicola and Petkov, Nicolai},
  title     = {Data-Efficient Large Scale Place Recognition With Graded Similarity Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23487--23496},
}
Weakly Supervised Class-Agnostic Motion Prediction for Autonomous Driving: Ruibo Li,

Hanyu Shi,

Ziang Fu,

Zhe Wang,

Guosheng Lin; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Ruibo and Shi, Hanyu and Fu, Ziang and Wang, Zhe and Lin, Guosheng},
  title     = {Weakly Supervised Class-Agnostic Motion Prediction for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17599--17608},
}
Where We Are and What We're Looking At: Query Based Worldwide Image Geo-Localization Using Hierarchies and Scenes: Brandon Clark,

Alec Kerrigan,

Parth Parag Kulkarni,

Vicente Vivanco Cepeda,

Mubarak Shah; [pdf] [supp]
[bibtex]
@InProceedings{Clark_2023_CVPR,
  author    = {Clark, Brandon and Kerrigan, Alec and Kulkarni, Parth Parag and Cepeda, Vicente Vivanco and Shah, Mubarak},
  title     = {Where We Are and What We're Looking At: Query Based Worldwide Image Geo-Localization Using Hierarchies and Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23182--23190},
}
Critical Learning Periods for Multisensory Integration in Deep Networks: Michael Kleinman,

Alessandro Achille,

Stefano Soatto; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kleinman_2023_CVPR,
  author    = {Kleinman, Michael and Achille, Alessandro and Soatto, Stefano},
  title     = {Critical Learning Periods for Multisensory Integration in Deep Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24296--24305},
}
GarmentTracking: Category-Level Garment Pose Tracking: Han Xue,

Wenqiang Xu,

Jieyi Zhang,

Tutian Tang,

Yutong Li,

Wenxin Du,

Ruolin Ye,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xue_2023_CVPR,
  author    = {Xue, Han and Xu, Wenqiang and Zhang, Jieyi and Tang, Tutian and Li, Yutong and Du, Wenxin and Ye, Ruolin and Lu, Cewu},
  title     = {{GarmentTracking}: Category-Level Garment Pose Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21233--21242},
}
MagicNet: Semi-Supervised Multi-Organ Segmentation via Magic-Cube Partition and Recovery: Duowen Chen,

Yunhao Bai,

Wei Shen,

Qingli Li,

Lequan Yu,

Yan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Duowen and Bai, Yunhao and Shen, Wei and Li, Qingli and Yu, Lequan and Wang, Yan},
  title     = {{MagicNet}: Semi-Supervised Multi-Organ Segmentation via Magic-Cube Partition and Recovery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23869--23878},
}
Neural Intrinsic Embedding for Non-Rigid Point Cloud Matching: Puhua Jiang,

Mingze Sun,

Ruqi Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Puhua and Sun, Mingze and Huang, Ruqi},
  title     = {Neural Intrinsic Embedding for Non-Rigid Point Cloud Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21835--21845},
}
Few-Shot Geometry-Aware Keypoint Localization: Xingzhe He,

Gaurav Bharaj,

David Ferman,

Helge Rhodin,

Pablo Garrido; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{He_2023_CVPR,
  author    = {He, Xingzhe and Bharaj, Gaurav and Ferman, David and Rhodin, Helge and Garrido, Pablo},
  title     = {Few-Shot Geometry-Aware Keypoint Localization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21337-21348}
}
Neural Vector Fields: Implicit Representation by Explicit Learning: Xianghui Yang,

Guosheng Lin,

Zhenghao Chen,

Luping Zhou; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Yang_2023_CVPR,
  author    = {Yang, Xianghui and Lin, Guosheng and Chen, Zhenghao and Zhou, Luping},
  title     = {Neural Vector Fields: Implicit Representation by Explicit Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {16727-16738}
}
Think Twice Before Driving: Towards Scalable Decoders for End-to-End Autonomous Driving: Xiaosong Jia,

Penghao Wu,

Li Chen,

Jiangwei Xie,

Conghui He,

Junchi Yan,

Hongyang Li; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Jia_2023_CVPR,
  author    = {Jia, Xiaosong and Wu, Penghao and Chen, Li and Xie, Jiangwei and He, Conghui and Yan, Junchi and Li, Hongyang},
  title     = {Think Twice Before Driving: Towards Scalable Decoders for End-to-End Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21983-21994}
}
Disentangling Orthogonal Planes for Indoor Panoramic Room Layout Estimation With Cross-Scale Distortion Awareness: Zhijie Shen,

Zishuo Zheng,

Chunyu Lin,

Lang Nie,

Kang Liao,

Shuai Zheng,

Yao Zhao; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Shen_2023_CVPR,
  author    = {Shen, Zhijie and Zheng, Zishuo and Lin, Chunyu and Nie, Lang and Liao, Kang and Zheng, Shuai and Zhao, Yao},
  title     = {Disentangling Orthogonal Planes for Indoor Panoramic Room Layout Estimation With Cross-Scale Distortion Awareness},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17337-17345}
}
Neural Map Prior for Autonomous Driving: Xuan Xiong,

Yicheng Liu,

Tianyuan Yuan,

Yue Wang,

Yilun Wang,

Hang Zhao; [pdf] [arXiv]
[bibtex]
@inproceedings{Xiong_2023_CVPR,
  author    = {Xiong, Xuan and Liu, Yicheng and Yuan, Tianyuan and Wang, Yue and Wang, Yilun and Zhao, Hang},
  title     = {Neural Map Prior for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17535-17544}
}
PEAL: Prior-Embedded Explicit Attention Learning for Low-Overlap Point Cloud Registration: Junle Yu,

Luwei Ren,

Yu Zhang,

Wenhui Zhou,

Lili Lin,

Guojun Dai; [pdf]
[bibtex]
@inproceedings{Yu_2023_CVPR,
  author    = {Yu, Junle and Ren, Luwei and Zhang, Yu and Zhou, Wenhui and Lin, Lili and Dai, Guojun},
  title     = {PEAL: Prior-Embedded Explicit Attention Learning for Low-Overlap Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17702-17711}
}
GeoVLN: Learning Geometry-Enhanced Visual Representation With Slot Attention for Vision-and-Language Navigation: Jingyang Huo,

Qiang Sun,

Boyan Jiang,

Haitao Lin,

Yanwei Fu; [pdf] [supp]
[bibtex]
@inproceedings{Huo_2023_CVPR,
  author    = {Huo, Jingyang and Sun, Qiang and Jiang, Boyan and Lin, Haitao and Fu, Yanwei},
  title     = {GeoVLN: Learning Geometry-Enhanced Visual Representation With Slot Attention for Vision-and-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23212-23221}
}
KiUT: Knowledge-Injected U-Transformer for Radiology Report Generation: Zhongzhen Huang,

Xiaofan Zhang,

Shaoting Zhang; [pdf]
[bibtex]
@inproceedings{Huang_2023_CVPR,
  author    = {Huang, Zhongzhen and Zhang, Xiaofan and Zhang, Shaoting},
  title     = {KiUT: Knowledge-Injected U-Transformer for Radiology Report Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {19809-19818}
}
Neural Video Compression With Diverse Contexts: Jiahao Li,

Bin Li,

Yan Lu; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Li_2023_CVPR,
  author    = {Li, Jiahao and Li, Bin and Lu, Yan},
  title     = {Neural Video Compression With Diverse Contexts},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {22616-22626}
}
Markerless Camera-to-Robot Pose Estimation via Self-Supervised Sim-to-Real Transfer: Jingpei Lu,

Florian Richter,

Michael C. Yip; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lu_2023_CVPR,
  author    = {Lu, Jingpei and Richter, Florian and Yip, Michael C.},
  title     = {Markerless Camera-to-Robot Pose Estimation via Self-Supervised Sim-to-Real Transfer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21296-21306}
}
CARTO: Category and Joint Agnostic Reconstruction of ARTiculated Objects: Nick Heppert,

Muhammad Zubair Irshad,

Sergey Zakharov,

Katherine Liu,

Rares Andrei Ambrus,

Jeannette Bohg,

Abhinav Valada,

Thomas Kollar; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Heppert_2023_CVPR,
  author    = {Heppert, Nick and Irshad, Muhammad Zubair and Zakharov, Sergey and Liu, Katherine and Ambrus, Rares Andrei and Bohg, Jeannette and Valada, Abhinav and Kollar, Thomas},
  title     = {CARTO: Category and Joint Agnostic Reconstruction of ARTiculated Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21201-21210}
}
Event-Guided Person Re-Identification via Sparse-Dense Complementary Learning: Chengzhi Cao,

Xueyang Fu,

Hongjian Liu,

Yukun Huang,

Kunyu Wang,

Jiebo Luo,

Zheng-Jun Zha; [pdf] [supp]
[bibtex]
@inproceedings{Cao_2023_CVPR,
  author    = {Cao, Chengzhi and Fu, Xueyang and Liu, Hongjian and Huang, Yukun and Wang, Kunyu and Luo, Jiebo and Zha, Zheng-Jun},
  title     = {Event-Guided Person Re-Identification via Sparse-Dense Complementary Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17990-17999}
}
Regularizing Second-Order Influences for Continual Learning: Zhicheng Sun,

Yadong Mu,

Gang Hua; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Sun_2023_CVPR,
  author    = {Sun, Zhicheng and Mu, Yadong and Hua, Gang},
  title     = {Regularizing Second-Order Influences for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20166-20175}
}
Super-Resolution Neural Operator: Min Wei,

Xuesong Zhang; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Wei_2023_CVPR,
  author    = {Wei, Min and Zhang, Xuesong},
  title     = {Super-Resolution Neural Operator},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18247-18256}
}
GradICON: Approximate Diffeomorphisms via Gradient Inverse Consistency: Lin Tian,

Hastings Greer,

François-Xavier Vialard,

Roland Kwitt,

Raúl San José Estépar,

Richard Jarrett Rushmore,

Nikolaos Makris,

Sylvain Bouix,

Marc Niethammer; [pdf] [supp]
[bibtex]
@inproceedings{Tian_2023_CVPR,
  author    = {Tian, Lin and Greer, Hastings and Vialard, Fran{\c{c}}ois-Xavier and Kwitt, Roland and San Jos{\'e} Est{\'e}par, Ra{\'u}l and Rushmore, Richard Jarrett and Makris, Nikolaos and Bouix, Sylvain and Niethammer, Marc},
  title     = {GradICON: Approximate Diffeomorphisms via Gradient Inverse Consistency},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18084-18094}
}
LP-DIF: Learning Local Pattern-Specific Deep Implicit Function for 3D Objects and Scenes: Meng Wang,

Yu-Shen Liu,

Yue Gao,

Kanle Shi,

Yi Fang,

Zhizhong Han; [pdf]
[bibtex]
@inproceedings{Wang_2023_CVPR,
  author    = {Wang, Meng and Liu, Yu-Shen and Gao, Yue and Shi, Kanle and Fang, Yi and Han, Zhizhong},
  title     = {LP-DIF: Learning Local Pattern-Specific Deep Implicit Function for 3D Objects and Scenes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21856-21865}
}
PeakConv: Learning Peak Receptive Field for Radar Semantic Segmentation: Liwen Zhang,

Xinyan Zhang,

Youcheng Zhang,

Yufei Guo,

Yuanpei Chen,

Xuhui Huang,

Zhe Ma; [pdf] [supp]
[bibtex]
@inproceedings{Zhang_2023_CVPR,
  author    = {Zhang, Liwen and Zhang, Xinyan and Zhang, Youcheng and Guo, Yufei and Chen, Yuanpei and Huang, Xuhui and Ma, Zhe},
  title     = {PeakConv: Learning Peak Receptive Field for Radar Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17577-17586}
}
Explaining Image Classifiers With Multiscale Directional Image Representation: Stefan Kolek,

Robert Windesheim,

Hector Andrade-Loarca,

Gitta Kutyniok,

Ron Levie; [pdf] [supp]
[bibtex]
@inproceedings{Kolek_2023_CVPR,
  author    = {Kolek, Stefan and Windesheim, Robert and Andrade-Loarca, Hector and Kutyniok, Gitta and Levie, Ron},
  title     = {Explaining Image Classifiers With Multiscale Directional Image Representation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18600-18609}
}
Deep Polarization Reconstruction With PDAVIS Events: Haiyang Mei,

Zuowen Wang,

Xin Yang,

Xiaopeng Wei,

Tobi Delbruck; [pdf] [supp]
[bibtex]
@inproceedings{Mei_2023_CVPR,
  author    = {Mei, Haiyang and Wang, Zuowen and Yang, Xin and Wei, Xiaopeng and Delbruck, Tobi},
  title     = {Deep Polarization Reconstruction With PDAVIS Events},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {22149-22158}
}
VideoTrack: Learning To Track Objects via Video Transformer: Fei Xie,

Lei Chu,

Jiahao Li,

Yan Lu,

Chao Ma; [pdf] [supp]
[bibtex]
@inproceedings{Xie_2023_CVPR,
  author    = {Xie, Fei and Chu, Lei and Li, Jiahao and Lu, Yan and Ma, Chao},
  title     = {VideoTrack: Learning To Track Objects via Video Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {22826-22835}
}
Distilling Self-Supervised Vision Transformers for Weakly-Supervised Few-Shot Classification & Segmentation: Dahyun Kang,

Piotr Koniusz,

Minsu Cho,

Naila Murray; [pdf] [supp]
[bibtex]
@inproceedings{Kang_2023_CVPR,
  author    = {Kang, Dahyun and Koniusz, Piotr and Cho, Minsu and Murray, Naila},
  title     = {Distilling Self-Supervised Vision Transformers for Weakly-Supervised Few-Shot Classification \& Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {19627-19638}
}
Collaborative Noisy Label Cleaner: Learning Scene-Aware Trailers for Multi-Modal Highlight Detection in Movies: Bei Gan,

Xiujun Shu,

Ruizhi Qiao,

Haoqian Wu,

Keyu Chen,

Hanjun Li,

Bo Ren; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Gan_2023_CVPR,
  author    = {Gan, Bei and Shu, Xiujun and Qiao, Ruizhi and Wu, Haoqian and Chen, Keyu and Li, Hanjun and Ren, Bo},
  title     = {Collaborative Noisy Label Cleaner: Learning Scene-Aware Trailers for Multi-Modal Highlight Detection in Movies},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18898-18907}
}
ContraNeRF: Generalizable Neural Radiance Fields for Synthetic-to-Real Novel View Synthesis via Contrastive Learning: Hao Yang,

Lanqing Hong,

Aoxue Li,

Tianyang Hu,

Zhenguo Li,

Gim Hee Lee,

Liwei Wang; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Yang_2023_CVPR,
  author    = {Yang, Hao and Hong, Lanqing and Li, Aoxue and Hu, Tianyang and Li, Zhenguo and Lee, Gim Hee and Wang, Liwei},
  title     = {ContraNeRF: Generalizable Neural Radiance Fields for Synthetic-to-Real Novel View Synthesis via Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {16508-16517}
}
PaletteNeRF: Palette-Based Appearance Editing of Neural Radiance Fields: Zhengfei Kuang,

Fujun Luan,

Sai Bi,

Zhixin Shu,

Gordon Wetzstein,

Kalyan Sunkavalli; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Kuang_2023_CVPR,
  author    = {Kuang, Zhengfei and Luan, Fujun and Bi, Sai and Shu, Zhixin and Wetzstein, Gordon and Sunkavalli, Kalyan},
  title     = {PaletteNeRF: Palette-Based Appearance Editing of Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20691-20700}
}
Contrastive Mean Teacher for Domain Adaptive Object Detectors: Shengcao Cao,

Dhiraj Joshi,

Liang-Yan Gui,

Yu-Xiong Wang; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Cao_2023_CVPR,
  author    = {Cao, Shengcao and Joshi, Dhiraj and Gui, Liang-Yan and Wang, Yu-Xiong},
  title     = {Contrastive Mean Teacher for Domain Adaptive Object Detectors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23839-23848}
}
Learning Transferable Spatiotemporal Representations From Natural Script Knowledge: Ziyun Zeng,

Yuying Ge,

Xihui Liu,

Bin Chen,

Ping Luo,

Shu-Tao Xia,

Yixiao Ge; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Zeng_2023_CVPR,
  author    = {Zeng, Ziyun and Ge, Yuying and Liu, Xihui and Chen, Bin and Luo, Ping and Xia, Shu-Tao and Ge, Yixiao},
  title     = {Learning Transferable Spatiotemporal Representations From Natural Script Knowledge},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23079-23089}
}
CiCo: Domain-Aware Sign Language Retrieval via Cross-Lingual Contrastive Learning: Yiting Cheng,

Fangyun Wei,

Jianmin Bao,

Dong Chen,

Wenqiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Cheng_2023_CVPR,
  author    = {Cheng, Yiting and Wei, Fangyun and Bao, Jianmin and Chen, Dong and Zhang, Wenqiang},
  title     = {CiCo: Domain-Aware Sign Language Retrieval via Cross-Lingual Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {19016-19026}
}
Video Dehazing via a Multi-Range Temporal Alignment Network With Physical Prior: Jiaqi Xu,

Xiaowei Hu,

Lei Zhu,

Qi Dou,

Jifeng Dai,

Yu Qiao,

Pheng-Ann Heng; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Xu_2023_CVPR,
  author    = {Xu, Jiaqi and Hu, Xiaowei and Zhu, Lei and Dou, Qi and Dai, Jifeng and Qiao, Yu and Heng, Pheng-Ann},
  title     = {Video Dehazing via a Multi-Range Temporal Alignment Network With Physical Prior},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18053-18062}
}
Integrally Pre-Trained Transformer Pyramid Networks: Yunjie Tian,

Lingxi Xie,

Zhaozhi Wang,

Longhui Wei,

Xiaopeng Zhang,

Jianbin Jiao,

Yaowei Wang,

Qi Tian,

Qixiang Ye; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Tian_2023_CVPR,
  author    = {Tian, Yunjie and Xie, Lingxi and Wang, Zhaozhi and Wei, Longhui and Zhang, Xiaopeng and Jiao, Jianbin and Wang, Yaowei and Tian, Qi and Ye, Qixiang},
  title     = {Integrally Pre-Trained Transformer Pyramid Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18610-18620}
}
Adaptive Channel Sparsity for Federated Learning Under System Heterogeneity: Dongping Liao,

Xitong Gao,

Yiren Zhao,

Cheng-Zhong Xu; [pdf] [supp]
[bibtex]
@inproceedings{Liao_2023_CVPR,
  author    = {Liao, Dongping and Gao, Xitong and Zhao, Yiren and Xu, Cheng-Zhong},
  title     = {Adaptive Channel Sparsity for Federated Learning Under System Heterogeneity},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20432-20441}
}
Sequential Training of GANs Against GAN-Classifiers Reveals Correlated "Knowledge Gaps" Present Among Independently Trained GAN Instances: Arkanath Pathak,

Nicholas Dufour; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Pathak_2023_CVPR,
  author    = {Pathak, Arkanath and Dufour, Nicholas},
  title     = {Sequential Training of GANs Against GAN-Classifiers Reveals Correlated ``Knowledge Gaps'' Present Among Independently Trained GAN Instances},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {24460-24469}
}
TriVol: Point Cloud Rendering via Triple Volumes: Tao Hu,

Xiaogang Xu,

Ruihang Chu,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Hu_2023_CVPR,
  author    = {Hu, Tao and Xu, Xiaogang and Chu, Ruihang and Jia, Jiaya},
  title     = {TriVol: Point Cloud Rendering via Triple Volumes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20732-20741}
}
(ML)$^2$P-Encoder: On Exploration of Channel-Class Correlation for Multi-Label Zero-Shot Learning: Ziming Liu,

Song Guo,

Xiaocheng Lu,

Jingcai Guo,

Jiewei Zhang,

Yue Zeng,

Fushuo Huo; [pdf] [supp]
[bibtex]
@inproceedings{Liu_2023_CVPR,
  author    = {Liu, Ziming and Guo, Song and Lu, Xiaocheng and Guo, Jingcai and Zhang, Jiewei and Zeng, Yue and Huo, Fushuo},
  title     = {{(ML)$^2$P-Encoder}: On Exploration of Channel-Class Correlation for Multi-Label Zero-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23859-23868}
}
Image as a Foreign Language: BEiT Pretraining for Vision and Vision-Language Tasks: Wenhui Wang,

Hangbo Bao,

Li Dong,

Johan Bjorck,

Zhiliang Peng,

Qiang Liu,

Kriti Aggarwal,

Owais Khan Mohammed,

Saksham Singhal,

Subhojit Som,

Furu Wei; [pdf] [supp]
[bibtex]
@inproceedings{Wang_2023_CVPR,
  author    = {Wang, Wenhui and Bao, Hangbo and Dong, Li and Bjorck, Johan and Peng, Zhiliang and Liu, Qiang and Aggarwal, Kriti and Mohammed, Owais Khan and Singhal, Saksham and Som, Subhojit and Wei, Furu},
  title     = {Image as a Foreign Language: BEiT Pretraining for Vision and Vision-Language Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {19175-19186}
}
Density-Insensitive Unsupervised Domain Adaption on 3D Object Detection: Qianjiang Hu,

Daizong Liu,

Wei Hu; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Hu_2023_CVPR,
  author    = {Hu, Qianjiang and Liu, Daizong and Hu, Wei},
  title     = {Density-Insensitive Unsupervised Domain Adaption on 3D Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17556-17566}
}
Learning Action Changes by Measuring Verb-Adverb Textual Relationships: Davide Moltisanti,

Frank Keller,

Hakan Bilen,

Laura Sevilla-Lara; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Moltisanti_2023_CVPR,
  author    = {Moltisanti, Davide and Keller, Frank and Bilen, Hakan and Sevilla-Lara, Laura},
  title     = {Learning Action Changes by Measuring Verb-Adverb Textual Relationships},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23110-23118}
}
Context-Aware Pretraining for Efficient Blind Image Decomposition: Chao Wang,

Zhedong Zheng,

Ruijie Quan,

Yifan Sun,

Yi Yang; [pdf] [supp]
[bibtex]
@inproceedings{Wang_2023_CVPR,
  author    = {Wang, Chao and Zheng, Zhedong and Quan, Ruijie and Sun, Yifan and Yang, Yi},
  title     = {Context-Aware Pretraining for Efficient Blind Image Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18186-18195}
}
Weakly Supervised Posture Mining for Fine-Grained Classification: Zhenchao Tang,

Hualin Yang,

Calvin Yu-Chian Chen; [pdf] [supp]
[bibtex]
@inproceedings{Tang_2023_CVPR,
  author    = {Tang, Zhenchao and Yang, Hualin and Chen, Calvin Yu-Chian},
  title     = {Weakly Supervised Posture Mining for Fine-Grained Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23735-23744}
}
LAVENDER: Unifying Video-Language Understanding As Masked Language Modeling: Linjie Li,

Zhe Gan,

Kevin Lin,

Chung-Ching Lin,

Zicheng Liu,

Ce Liu,

Lijuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Li_2023_CVPR,
  author    = {Li, Linjie and Gan, Zhe and Lin, Kevin and Lin, Chung-Ching and Liu, Zicheng and Liu, Ce and Wang, Lijuan},
  title     = {LAVENDER: Unifying Video-Language Understanding As Masked Language Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23119-23129}
}
Robust Unsupervised StyleGAN Image Restoration: Yohan Poirier-Ginter,

Jean-François Lalonde; [pdf] [arXiv]
[bibtex]
@inproceedings{Poirier-Ginter_2023_CVPR,
  author    = {Poirier-Ginter, Yohan and Lalonde, Jean-Fran{\c{c}}ois},
  title     = {Robust Unsupervised StyleGAN Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {22292-22301}
}
Event-Based Frame Interpolation With Ad-Hoc Deblurring: Lei Sun,

Christos Sakaridis,

Jingyun Liang,

Peng Sun,

Jiezhang Cao,

Kai Zhang,

Qi Jiang,

Kaiwei Wang,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Sun_2023_CVPR,
  author    = {Sun, Lei and Sakaridis, Christos and Liang, Jingyun and Sun, Peng and Cao, Jiezhang and Zhang, Kai and Jiang, Qi and Wang, Kaiwei and Van Gool, Luc},
  title     = {Event-Based Frame Interpolation With Ad-Hoc Deblurring},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18043-18052}
}
OvarNet: Towards Open-Vocabulary Object Attribute Recognition: Keyan Chen,

Xiaolong Jiang,

Yao Hu,

Xu Tang,

Yan Gao,

Jianqi Chen,

Weidi Xie; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Chen_2023_CVPR,
  author    = {Chen, Keyan and Jiang, Xiaolong and Hu, Yao and Tang, Xu and Gao, Yan and Chen, Jianqi and Xie, Weidi},
  title     = {OvarNet: Towards Open-Vocabulary Object Attribute Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23518-23527}
}
3D Line Mapping Revisited: Shaohui Liu,

Yifan Yu,

Rémi Pautrat,

Marc Pollefeys,

Viktor Larsson; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Liu_2023_CVPR,
  author    = {Liu, Shaohui and Yu, Yifan and Pautrat, R{\'e}mi and Pollefeys, Marc and Larsson, Viktor},
  title     = {3D Line Mapping Revisited},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21445-21455}
}
Efficient and Explicit Modelling of Image Hierarchies for Image Restoration: Yawei Li,

Yuchen Fan,

Xiaoyu Xiang,

Denis Demandolx,

Rakesh Ranjan,

Radu Timofte,

Luc Van Gool; [pdf] [arXiv]
[bibtex]
@inproceedings{Li_2023_CVPR,
  author    = {Li, Yawei and Fan, Yuchen and Xiang, Xiaoyu and Demandolx, Denis and Ranjan, Rakesh and Timofte, Radu and Van Gool, Luc},
  title     = {Efficient and Explicit Modelling of Image Hierarchies for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18278-18289}
}
DKT: Diverse Knowledge Transfer Transformer for Class Incremental Learning: Xinyuan Gao,

Yuhang He,

Songlin Dong,

Jie Cheng,

Xing Wei,

Yihong Gong; [pdf] [supp]
[bibtex]
@inproceedings{Gao_2023_CVPR,
  author    = {Gao, Xinyuan and He, Yuhang and Dong, Songlin and Cheng, Jie and Wei, Xing and Gong, Yihong},
  title     = {DKT: Diverse Knowledge Transfer Transformer for Class Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {24236-24245}
}
TarViS: A Unified Approach for Target-Based Video Segmentation: Ali Athar,

Alexander Hermans,

Jonathon Luiten,

Deva Ramanan,

Bastian Leibe; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Athar_2023_CVPR,
  author    = {Athar, Ali and Hermans, Alexander and Luiten, Jonathon and Ramanan, Deva and Leibe, Bastian},
  title     = {TarViS: A Unified Approach for Target-Based Video Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18738-18748}
}
IDGI: A Framework To Eliminate Explanation Noise From Integrated Gradients: Ruo Yang,

Binghui Wang,

Mustafa Bilgic; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Yang_2023_CVPR,
  author    = {Yang, Ruo and Wang, Binghui and Bilgic, Mustafa},
  title     = {IDGI: A Framework To Eliminate Explanation Noise From Integrated Gradients},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {23725-23734}
}
Implicit Surface Contrastive Clustering for LiDAR Point Clouds: Zaiwei Zhang,

Min Bai,

Erran Li; [pdf] [supp]
[bibtex]
@inproceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zaiwei and Bai, Min and Li, Erran},
  title     = {Implicit Surface Contrastive Clustering for LiDAR Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {21716-21725}
}
Semantic Ray: Learning a Generalizable Semantic Field With Cross-Reprojection Attention: Fangfu Liu,

Chubin Zhang,

Yu Zheng,

Yueqi Duan; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Liu_2023_CVPR,
  author    = {Liu, Fangfu and Zhang, Chubin and Zheng, Yu and Duan, Yueqi},
  title     = {Semantic Ray: Learning a Generalizable Semantic Field With Cross-Reprojection Attention},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17386-17396}
}
ORCa: Glossy Objects As Radiance-Field Cameras: Kushagra Tiwary,

Akshat Dave,

Nikhil Behari,

Tzofi Klinghoffer,

Ashok Veeraraghavan,

Ramesh Raskar; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Tiwary_2023_CVPR,
  author    = {Tiwary, Kushagra and Dave, Akshat and Behari, Nikhil and Klinghoffer, Tzofi and Veeraraghavan, Ashok and Raskar, Ramesh},
  title     = {ORCa: Glossy Objects As Radiance-Field Cameras},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20773-20782}
}
SECAD-Net: Self-Supervised CAD Reconstruction by Learning Sketch-Extrude Operations: Pu Li,

Jianwei Guo,

Xiaopeng Zhang,

Dong-Ming Yan; [pdf] [supp]
[bibtex]
@inproceedings{Li_2023_CVPR,
  author    = {Li, Pu and Guo, Jianwei and Zhang, Xiaopeng and Yan, Dong-Ming},
  title     = {SECAD-Net: Self-Supervised CAD Reconstruction by Learning Sketch-Extrude Operations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {16816-16826}
}
MDL-NAS: A Joint Multi-Domain Learning Framework for Vision Transformer: Shiguang Wang,

Tao Xie,

Jian Cheng,

Xingcheng Zhang,

Haijun Liu; [pdf] [supp]
[bibtex]
@inproceedings{Wang_2023_CVPR,
  author    = {Wang, Shiguang and Xie, Tao and Cheng, Jian and Zhang, Xingcheng and Liu, Haijun},
  title     = {MDL-NAS: A Joint Multi-Domain Learning Framework for Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20094-20104}
}
Dual Alignment Unsupervised Domain Adaptation for Video-Text Retrieval: Xiaoshuai Hao,

Wanqian Zhang,

Dayan Wu,

Fei Zhu,

Bo Li; [pdf]
[bibtex]
@inproceedings{Hao_2023_CVPR,
  author    = {Hao, Xiaoshuai and Zhang, Wanqian and Wu, Dayan and Zhu, Fei and Li, Bo},
  title     = {Dual Alignment Unsupervised Domain Adaptation for Video-Text Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18962-18972}
}
Computational Flash Photography Through Intrinsics: Sepideh Sarajian Maralan,

Chris Careaga,

Yagiz Aksoy; [pdf] [supp]
[bibtex]
@inproceedings{Maralan_2023_CVPR,
  author    = {Maralan, Sepideh Sarajian and Careaga, Chris and Aksoy, Yagiz},
  title     = {Computational Flash Photography Through Intrinsics},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {16654-16662}
}
SpaText: Spatio-Textual Representation for Controllable Image Generation: Omri Avrahami,

Thomas Hayes,

Oran Gafni,

Sonal Gupta,

Yaniv Taigman,

Devi Parikh,

Dani Lischinski,

Ohad Fried,

Xi Yin; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Avrahami_2023_CVPR,
  author    = {Avrahami, Omri and Hayes, Thomas and Gafni, Oran and Gupta, Sonal and Taigman, Yaniv and Parikh, Devi and Lischinski, Dani and Fried, Ohad and Yin, Xi},
  title     = {SpaText: Spatio-Textual Representation for Controllable Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {18370-18380}
}
The ObjectFolder Benchmark: Multisensory Learning With Neural and Real Objects: Ruohan Gao,

Yiming Dou,

Hao Li,

Tanmay Agarwal,

Jeannette Bohg,

Yunzhu Li,

Li Fei-Fei,

Jiajun Wu; [pdf]
[bibtex]
@inproceedings{Gao_2023_CVPR,
  author    = {Gao, Ruohan and Dou, Yiming and Li, Hao and Agarwal, Tanmay and Bohg, Jeannette and Li, Yunzhu and Fei-Fei, Li and Wu, Jiajun},
  title     = {The ObjectFolder Benchmark: Multisensory Learning With Neural and Real Objects},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {17276-17286}
}
ScaleFL: Resource-Adaptive Federated Learning With Heterogeneous Clients: Fatih Ilhan,

Gong Su,

Ling Liu; [pdf] [supp]
[bibtex]
@inproceedings{Ilhan_2023_CVPR,
  author    = {Ilhan, Fatih and Su, Gong and Liu, Ling},
  title     = {ScaleFL: Resource-Adaptive Federated Learning With Heterogeneous Clients},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {24532-24541}
}
Reliable and Interpretable Personalized Federated Learning: Zixuan Qin,

Liu Yang,

Qilong Wang,

Yahong Han,

Qinghua Hu; [pdf]
[bibtex]
@inproceedings{Qin_2023_CVPR,
  author    = {Qin, Zixuan and Yang, Liu and Wang, Qilong and Han, Yahong and Hu, Qinghua},
  title     = {Reliable and Interpretable Personalized Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = {June},
  year      = {2023},
  pages     = {20422-20431}
}
Optimal Transport Minimization: Crowd Localization on Density Maps for Semi-Supervised Counting: Wei Lin,

Antoni B. Chan; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_CVPR, author = {Lin, Wei and Chan, Antoni B.}, title = {Optimal Transport Minimization: Crowd Localization on Density Maps for Semi-Supervised Counting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21663--21673} }
AdamsFormer for Spatial Action Localization in the Future: Hyung-gun Chi,

Kwonjoon Lee,

Nakul Agarwal,

Yi Xu,

Karthik Ramani,

Chiho Choi; [pdf] [supp]
[bibtex]
@InProceedings{Chi_2023_CVPR, author = {Chi, Hyung-gun and Lee, Kwonjoon and Agarwal, Nakul and Xu, Yi and Ramani, Karthik and Choi, Chiho}, title = {{AdamsFormer} for Spatial Action Localization in the Future}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17885--17895} }
Leveraging per Image-Token Consistency for Vision-Language Pre-Training: Yunhao Gou,

Tom Ko,

Hansi Yang,

James Kwok,

Yu Zhang,

Mingxuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gou_2023_CVPR, author = {Gou, Yunhao and Ko, Tom and Yang, Hansi and Kwok, James and Zhang, Yu and Wang, Mingxuan}, title = {Leveraging per Image-Token Consistency for Vision-Language Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19155--19164} }
UTM: A Unified Multiple Object Tracking Model With Identity-Aware Feature Enhancement: Sisi You,

Hantao Yao,

Bing-Kun Bao,

Changsheng Xu; [pdf] [supp]
[bibtex]
@InProceedings{You_2023_CVPR, author = {You, Sisi and Yao, Hantao and Bao, Bing-Kun and Xu, Changsheng}, title = {{UTM}: A Unified Multiple Object Tracking Model With Identity-Aware Feature Enhancement}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21876--21886} }
On the Stability-Plasticity Dilemma of Class-Incremental Learning: Dongwan Kim,

Bohyung Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR, author = {Kim, Dongwan and Han, Bohyung}, title = {On the Stability-Plasticity Dilemma of Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20196--20204} }
Generalization Matters: Loss Minima Flattening via Parameter Hybridization for Efficient Online Knowledge Distillation: Tianli Zhang,

Mengqi Xue,

Jiangtao Zhang,

Haofei Zhang,

Yu Wang,

Lechao Cheng,

Jie Song,

Mingli Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Tianli and Xue, Mengqi and Zhang, Jiangtao and Zhang, Haofei and Wang, Yu and Cheng, Lechao and Song, Jie and Song, Mingli}, title = {Generalization Matters: Loss Minima Flattening via Parameter Hybridization for Efficient Online Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20176--20185} }
L-CoIns: Language-Based Colorization With Instance Awareness: Zheng Chang,

Shuchen Weng,

Peixuan Zhang,

Yu Li,

Si Li,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Chang_2023_CVPR, author = {Chang, Zheng and Weng, Shuchen and Zhang, Peixuan and Li, Yu and Li, Si and Shi, Boxin}, title = {{L-CoIns}: Language-Based Colorization With Instance Awareness}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19221--19230} }
On the Effects of Self-Supervision and Contrastive Alignment in Deep Multi-View Clustering: Daniel J. Trosten,

Sigurd Løkse,

Robert Jenssen,

Michael C. Kampffmeyer; [pdf] [supp]
[bibtex]
@InProceedings{Trosten_2023_CVPR, author = {Trosten, Daniel J. and L{\o}kse, Sigurd and Jenssen, Robert and Kampffmeyer, Michael C.}, title = {On the Effects of Self-Supervision and Contrastive Alignment in Deep Multi-View Clustering}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {23976--23985} }
Activating More Pixels in Image Super-Resolution Transformer: Xiangyu Chen,

Xintao Wang,

Jiantao Zhou,

Yu Qiao,

Chao Dong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR, author = {Chen, Xiangyu and Wang, Xintao and Zhou, Jiantao and Qiao, Yu and Dong, Chao}, title = {Activating More Pixels in Image Super-Resolution Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22367--22377} }
BEV-SAN: Accurate BEV 3D Object Detection via Slice Attention Networks: Xiaowei Chi,

Jiaming Liu,

Ming Lu,

Rongyu Zhang,

Zhaoqing Wang,

Yandong Guo,

Shanghang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Chi_2023_CVPR, author = {Chi, Xiaowei and Liu, Jiaming and Lu, Ming and Zhang, Rongyu and Wang, Zhaoqing and Guo, Yandong and Zhang, Shanghang}, title = {{BEV-SAN}: Accurate {BEV} {3D} Object Detection via Slice Attention Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17461--17470} }
The Dark Side of Dynamic Routing Neural Networks: Towards Efficiency Backdoor Injection: Simin Chen,

Hanlin Chen,

Mirazul Haque,

Cong Liu,

Wei Yang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR, author = {Chen, Simin and Chen, Hanlin and Haque, Mirazul and Liu, Cong and Yang, Wei}, title = {The Dark Side of Dynamic Routing Neural Networks: Towards Efficiency Backdoor Injection}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24585--24594} }
NeRF in the Palm of Your Hand: Corrective Augmentation for Robotics via Novel-View Synthesis: Allan Zhou,

Moo Jin Kim,

Lirui Wang,

Pete Florence,

Chelsea Finn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR, author = {Zhou, Allan and Kim, Moo Jin and Wang, Lirui and Florence, Pete and Finn, Chelsea}, title = {{NeRF} in the Palm of Your Hand: Corrective Augmentation for Robotics via Novel-View Synthesis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17907--17917} }
Building Rearticulable Models for Arbitrary 3D Objects From 4D Point Clouds: Shaowei Liu,

Saurabh Gupta,

Shenlong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR, author = {Liu, Shaowei and Gupta, Saurabh and Wang, Shenlong}, title = {Building Rearticulable Models for Arbitrary {3D} Objects From {4D} Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21138--21147} }
Neural Congealing: Aligning Images to a Joint Semantic Atlas: Dolev Ofri-Amar,

Michal Geyer,

Yoni Kasten,

Tali Dekel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ofri-Amar_2023_CVPR, author = {Ofri-Amar, Dolev and Geyer, Michal and Kasten, Yoni and Dekel, Tali}, title = {Neural Congealing: Aligning Images to a Joint Semantic Atlas}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19403--19412} }
Adaptive Spot-Guided Transformer for Consistent Local Feature Matching: Jiahuan Yu,

Jiahao Chang,

Jianfeng He,

Tianzhu Zhang,

Jiyang Yu,

Feng Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR, author = {Yu, Jiahuan and Chang, Jiahao and He, Jianfeng and Zhang, Tianzhu and Yu, Jiyang and Wu, Feng}, title = {Adaptive Spot-Guided Transformer for Consistent Local Feature Matching}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21898--21908} }
Wide-Angle Rectification via Content-Aware Conformal Mapping: Qi Zhang,

Hongdong Li,

Qing Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR, author = {Zhang, Qi and Li, Hongdong and Wang, Qing}, title = {Wide-Angle Rectification via Content-Aware Conformal Mapping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17357--17365} }
Token Turing Machines: Michael S. Ryoo,

Keerthana Gopalakrishnan,

Kumara Kahatapitiya,

Ted Xiao,

Kanishka Rao,

Austin Stone,

Yao Lu,

Julian Ibarz,

Anurag Arnab; [pdf] [arXiv]
[bibtex]
@InProceedings{Ryoo_2023_CVPR, author = {Ryoo, Michael S. and Gopalakrishnan, Keerthana and Kahatapitiya, Kumara and Xiao, Ted and Rao, Kanishka and Stone, Austin and Lu, Yao and Ibarz, Julian and Arnab, Anurag}, title = {Token {Turing} Machines}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19070--19081} }
Solving 3D Inverse Problems Using Pre-Trained 2D Diffusion Models: Hyungjin Chung,

Dohoon Ryu,

Michael T. McCann,

Marc L. Klasky,

Jong Chul Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chung_2023_CVPR, author = {Chung, Hyungjin and Ryu, Dohoon and McCann, Michael T. and Klasky, Marc L. and Ye, Jong Chul}, title = {Solving {3D} Inverse Problems Using Pre-Trained {2D} Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22542--22551} }
DyNCA: Real-Time Dynamic Texture Synthesis Using Neural Cellular Automata: Ehsan Pajouheshgar,

Yitao Xu,

Tong Zhang,

Sabine Süsstrunk; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pajouheshgar_2023_CVPR, author = {Pajouheshgar, Ehsan and Xu, Yitao and Zhang, Tong and S{\"u}sstrunk, Sabine}, title = {{DyNCA}: Real-Time Dynamic Texture Synthesis Using Neural Cellular Automata}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20742--20751} }
Semantic-Promoted Debiasing and Background Disambiguation for Zero-Shot Instance Segmentation: Shuting He,

Henghui Ding,

Wei Jiang; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_CVPR, author = {He, Shuting and Ding, Henghui and Jiang, Wei}, title = {Semantic-Promoted Debiasing and Background Disambiguation for Zero-Shot Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19498--19507} }
RelightableHands: Efficient Neural Relighting of Articulated Hand Models: Shun Iwase,

Shunsuke Saito,

Tomas Simon,

Stephen Lombardi,

Timur Bagautdinov,

Rohan Joshi,

Fabian Prada,

Takaaki Shiratori,

Yaser Sheikh,

Jason Saragih; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Iwase_2023_CVPR, author = {Iwase, Shun and Saito, Shunsuke and Simon, Tomas and Lombardi, Stephen and Bagautdinov, Timur and Joshi, Rohan and Prada, Fabian and Shiratori, Takaaki and Sheikh, Yaser and Saragih, Jason}, title = {{RelightableHands}: Efficient Neural Relighting of Articulated Hand Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16663--16673} }
Paired-Point Lifting for Enhanced Privacy-Preserving Visual Localization: Chunghwan Lee,

Jaihoon Kim,

Chanhyuk Yun,

Je Hyeong Hong; [pdf]
[bibtex]
@InProceedings{Lee_2023_CVPR, author = {Lee, Chunghwan and Kim, Jaihoon and Yun, Chanhyuk and Hong, Je Hyeong}, title = {Paired-Point Lifting for Enhanced Privacy-Preserving Visual Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17266--17275} }
What Happened 3 Seconds Ago? Inferring the Past With Thermal Imaging: Zitian Tang,

Wenjie Ye,

Wei-Chiu Ma,

Hang Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR, author = {Tang, Zitian and Ye, Wenjie and Ma, Wei-Chiu and Zhao, Hang}, title = {What Happened 3 Seconds Ago? Inferring the Past With Thermal Imaging}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17111--17120} }
Vector Quantization With Self-Attention for Quality-Independent Representation Learning: Zhou Yang,

Weisheng Dong,

Xin Li,

Mengluan Huang,

Yulin Sun,

Guangming Shi; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_CVPR, author = {Yang, Zhou and Dong, Weisheng and Li, Xin and Huang, Mengluan and Sun, Yulin and Shi, Guangming}, title = {Vector Quantization With Self-Attention for Quality-Independent Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24438--24448} }
Generating Anomalies for Video Anomaly Detection With Prompt-Based Feature Mapping: Zuhao Liu,

Xiao-Ming Wu,

Dian Zheng,

Kun-Yu Lin,

Wei-Shi Zheng; [pdf]
[bibtex]
@InProceedings{Liu_2023_CVPR, author = {Liu, Zuhao and Wu, Xiao-Ming and Zheng, Dian and Lin, Kun-Yu and Zheng, Wei-Shi}, title = {Generating Anomalies for Video Anomaly Detection With Prompt-Based Feature Mapping}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24500--24510} }
Diffusion-Based Signed Distance Fields for 3D Shape Generation: Jaehyeok Shim,

Changwoo Kang,

Kyungdon Joo; [pdf] [supp]
[bibtex]
@InProceedings{Shim_2023_CVPR, author = {Shim, Jaehyeok and Kang, Changwoo and Joo, Kyungdon}, title = {Diffusion-Based Signed Distance Fields for {3D} Shape Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20887--20897} }
Hierarchical Temporal Transformer for 3D Hand Pose Estimation and Action Recognition From Egocentric RGB Videos: Yilin Wen,

Hao Pan,

Lei Yang,

Jia Pan,

Taku Komura,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wen_2023_CVPR, author = {Wen, Yilin and Pan, Hao and Yang, Lei and Pan, Jia and Komura, Taku and Wang, Wenping}, title = {Hierarchical Temporal Transformer for {3D} Hand Pose Estimation and Action Recognition From Egocentric {RGB} Videos}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21243--21253} }
CAP-VSTNet: Content Affinity Preserved Versatile Style Transfer: Linfeng Wen,

Chengying Gao,

Changqing Zou; [pdf] [supp]
[bibtex]
@InProceedings{Wen_2023_CVPR, author = {Wen, Linfeng and Gao, Chengying and Zou, Changqing}, title = {{CAP-VSTNet}: Content Affinity Preserved Versatile Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18300--18309} }
Tunable Convolutions With Parametric Multi-Loss Optimization: Matteo Maggioni,

Thomas Tanay,

Francesca Babiloni,

Steven McDonagh,

Aleš Leonardis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Maggioni_2023_CVPR, author = {Maggioni, Matteo and Tanay, Thomas and Babiloni, Francesca and McDonagh, Steven and Leonardis, Ale{\v{s}}}, title = {Tunable Convolutions With Parametric Multi-Loss Optimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20226--20236} }
DeepSolo: Let Transformer Decoder With Explicit Points Solo for Text Spotting: Maoyuan Ye,

Jing Zhang,

Shanshan Zhao,

Juhua Liu,

Tongliang Liu,

Bo Du,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_CVPR, author = {Ye, Maoyuan and Zhang, Jing and Zhao, Shanshan and Liu, Juhua and Liu, Tongliang and Du, Bo and Tao, Dacheng}, title = {{DeepSolo}: Let Transformer Decoder With Explicit Points Solo for Text Spotting}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19348--19357} }
DreamBooth: Fine Tuning Text-to-Image Diffusion Models for Subject-Driven Generation: Nataniel Ruiz,

Yuanzhen Li,

Varun Jampani,

Yael Pritch,

Michael Rubinstein,

Kfir Aberman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ruiz_2023_CVPR, author = {Ruiz, Nataniel and Li, Yuanzhen and Jampani, Varun and Pritch, Yael and Rubinstein, Michael and Aberman, Kfir}, title = {{DreamBooth}: Fine Tuning Text-to-Image Diffusion Models for Subject-Driven Generation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22500--22510} }
MOSO: Decomposing MOtion, Scene and Object for Video Prediction: Mingzhen Sun,

Weining Wang,

Xinxin Zhu,

Jing Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_CVPR, author = {Sun, Mingzhen and Wang, Weining and Zhu, Xinxin and Liu, Jing}, title = {{MOSO}: Decomposing {MOtion}, Scene and Object for Video Prediction}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18727--18737} }
Learning the Distribution of Errors in Stereo Matching for Joint Disparity and Uncertainty Estimation: Liyan Chen,

Weihan Wang,

Philippos Mordohai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR, author = {Chen, Liyan and Wang, Weihan and Mordohai, Philippos}, title = {Learning the Distribution of Errors in Stereo Matching for Joint Disparity and Uncertainty Estimation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17235--17244} }
Samples With Low Loss Curvature Improve Data Efficiency: Isha Garg,

Kaushik Roy; [pdf] [supp]
[bibtex]
@InProceedings{Garg_2023_CVPR, author = {Garg, Isha and Roy, Kaushik}, title = {Samples With Low Loss Curvature Improve Data Efficiency}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20290--20300} }
TINC: Tree-Structured Implicit Neural Compression: Runzhao Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR, author = {Yang, Runzhao}, title = {{TINC}: Tree-Structured Implicit Neural Compression}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18517--18526} }
Unifying Short and Long-Term Tracking With Graph Hierarchies: Orcun Cetintas,

Guillem Brasó,

Laura Leal-Taixé; [pdf] [supp]
[bibtex]
@InProceedings{Cetintas_2023_CVPR, author = {Cetintas, Orcun and Bras{\'o}, Guillem and Leal-Taix{\'e}, Laura}, title = {Unifying Short and Long-Term Tracking With Graph Hierarchies}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22877--22887} }
Re-Basin via Implicit Sinkhorn Differentiation: Fidel A. Guerrero Peña,

Heitor Rapela Medeiros,

Thomas Dubail,

Masih Aminbeidokhti,

Eric Granger,

Marco Pedersoli; [pdf] [supp]
[bibtex]
@InProceedings{Pena_2023_CVPR, author = {Guerrero Pe{\~n}a, Fidel A. and Medeiros, Heitor Rapela and Dubail, Thomas and Aminbeidokhti, Masih and Granger, Eric and Pedersoli, Marco}, title = {Re-Basin via Implicit {Sinkhorn} Differentiation}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20237--20246} }
Supervised Masked Knowledge Distillation for Few-Shot Transformers: Han Lin,

Guangxing Han,

Jiawei Ma,

Shiyuan Huang,

Xudong Lin,

Shih-Fu Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR, author = {Lin, Han and Han, Guangxing and Ma, Jiawei and Huang, Shiyuan and Lin, Xudong and Chang, Shih-Fu}, title = {Supervised Masked Knowledge Distillation for Few-Shot Transformers}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19649--19659} }
RIDCP: Revitalizing Real Image Dehazing via High-Quality Codebook Priors: Rui-Qi Wu,

Zheng-Peng Duan,

Chun-Le Guo,

Zhi Chai,

Chongyi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR, author = {Wu, Rui-Qi and Duan, Zheng-Peng and Guo, Chun-Le and Chai, Zhi and Li, Chongyi}, title = {{RIDCP}: Revitalizing Real Image Dehazing via High-Quality Codebook Priors}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22282--22291} }
Recurrence Without Recurrence: Stable Video Landmark Detection With Deep Equilibrium Models: Paul Micaelli,

Arash Vahdat,

Hongxu Yin,

Jan Kautz,

Pavlo Molchanov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Micaelli_2023_CVPR, author = {Micaelli, Paul and Vahdat, Arash and Yin, Hongxu and Kautz, Jan and Molchanov, Pavlo}, title = {Recurrence Without Recurrence: Stable Video Landmark Detection With Deep Equilibrium Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22814--22825} }
Generalized Relation Modeling for Transformer Tracking: Shenyuan Gao,

Chunluan Zhou,

Jun Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_CVPR, author = {Gao, Shenyuan and Zhou, Chunluan and Zhang, Jun}, title = {Generalized Relation Modeling for Transformer Tracking}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18686--18695} }
Non-Line-of-Sight Imaging With Signal Superresolution Network: Jianyu Wang,

Xintong Liu,

Leping Xiao,

Zuoqiang Shi,

Lingyun Qiu,

Xing Fu; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Jianyu and Liu, Xintong and Xiao, Leping and Shi, Zuoqiang and Qiu, Lingyun and Fu, Xing}, title = {Non-Line-of-Sight Imaging With Signal Superresolution Network}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17420--17429} }
MixNeRF: Modeling a Ray With Mixture Density for Novel View Synthesis From Sparse Inputs: Seunghyeon Seo,

Donghoon Han,

Yeonjin Chang,

Nojun Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Seo_2023_CVPR, author = {Seo, Seunghyeon and Han, Donghoon and Chang, Yeonjin and Kwak, Nojun}, title = {{MixNeRF}: Modeling a Ray With Mixture Density for Novel View Synthesis From Sparse Inputs}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20659--20668} }
Cross-Domain 3D Hand Pose Estimation With Dual Modalities: Qiuxia Lin,

Linlin Yang,

Angela Yao; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_CVPR, author = {Lin, Qiuxia and Yang, Linlin and Yao, Angela}, title = {Cross-Domain {3D} Hand Pose Estimation With Dual Modalities}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17184--17193} }
Delving Into Discrete Normalizing Flows on SO(3) Manifold for Probabilistic Rotation Modeling: Yulin Liu,

Haoran Liu,

Yingda Yin,

Yang Wang,

Baoquan Chen,

He Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR, author = {Liu, Yulin and Liu, Haoran and Yin, Yingda and Wang, Yang and Chen, Baoquan and Wang, He}, title = {Delving Into Discrete Normalizing Flows on {SO(3)} Manifold for Probabilistic Rotation Modeling}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21264--21273} }
SfM-TTR: Using Structure From Motion for Test-Time Refinement of Single-View Depth Networks: Sergio Izquierdo,

Javier Civera; [pdf] [supp]
[bibtex]
@InProceedings{Izquierdo_2023_CVPR, author = {Izquierdo, Sergio and Civera, Javier}, title = {{SfM-TTR}: Using Structure From Motion for Test-Time Refinement of Single-View Depth Networks}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21466--21476} }
MELTR: Meta Loss Transformer for Learning To Fine-Tune Video Foundation Models: Dohwan Ko,

Joonmyung Choi,

Hyeong Kyu Choi,

Kyoung-Woon On,

Byungseok Roh,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ko_2023_CVPR, author = {Ko, Dohwan and Choi, Joonmyung and Choi, Hyeong Kyu and On, Kyoung-Woon and Roh, Byungseok and Kim, Hyunwoo J.}, title = {{MELTR}: Meta Loss Transformer for Learning To Fine-Tune Video Foundation Models}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {20105--20115} }
Meta-Personalizing Vision-Language Models To Find Named Instances in Video: Chun-Hsiao Yeh,

Bryan Russell,

Josef Sivic,

Fabian Caba Heilbron,

Simon Jenni; [pdf] [supp]
[bibtex]
@InProceedings{Yeh_2023_CVPR, author = {Yeh, Chun-Hsiao and Russell, Bryan and Sivic, Josef and Caba Heilbron, Fabian and Jenni, Simon}, title = {Meta-Personalizing Vision-Language Models To Find Named Instances in Video}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {19123--19132} }
Egocentric Audio-Visual Object Localization: Chao Huang,

Yapeng Tian,

Anurag Kumar,

Chenliang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR, author = {Huang, Chao and Tian, Yapeng and Kumar, Anurag and Xu, Chenliang}, title = {Egocentric Audio-Visual Object Localization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22910--22921} }
DropKey for Vision Transformer: Bonan Li,

Yinhan Hu,

Xuecheng Nie,

Congying Han,

Xiangjian Jiang,

Tiande Guo,

Luoqi Liu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR, author = {Li, Bonan and Hu, Yinhan and Nie, Xuecheng and Han, Congying and Jiang, Xiangjian and Guo, Tiande and Liu, Luoqi}, title = {{DropKey} for Vision Transformer}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22700--22709} }
Meta Architecture for Point Cloud Analysis: Haojia Lin,

Xiawu Zheng,

Lijiang Li,

Fei Chao,

Shanshan Wang,

Yan Wang,

Yonghong Tian,

Rongrong Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR, author = {Lin, Haojia and Zheng, Xiawu and Li, Lijiang and Chao, Fei and Wang, Shanshan and Wang, Yan and Tian, Yonghong and Ji, Rongrong}, title = {Meta Architecture for Point Cloud Analysis}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {17682--17691} }
CIRCLE: Capture in Rich Contextual Environments: João Pedro Araújo,

Jiaman Li,

Karthik Vetrivel,

Rishi Agarwal,

Jiajun Wu,

Deepak Gopinath,

Alexander William Clegg,

Karen Liu; [pdf] [supp]
[bibtex]
@InProceedings{Araujo_2023_CVPR, author = {Ara{\'u}jo, Jo{\~a}o Pedro and Li, Jiaman and Vetrivel, Karthik and Agarwal, Rishi and Wu, Jiajun and Gopinath, Deepak and Clegg, Alexander William and Liu, Karen}, title = {{CIRCLE}: Capture in Rich Contextual Environments}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {21211--21221} }
PyPose: A Library for Robot Learning With Physics-Based Optimization: Chen Wang,

Dasong Gao,

Kuan Xu,

Junyi Geng,

Yaoyu Hu,

Yuheng Qiu,

Bowen Li,

Fan Yang,

Brady Moon,

Abhinav Pandey,

Aryan,

Jiahe Xu,

Tianhao Wu,

Haonan He,

Daning Huang,

Zhongqiang Ren,

Shibo Zhao,

Taimeng Fu,

Pranay Reddy,

Xiao Lin,

Wenshan Wang,

Jingnan Shi,

Rajat Talak,

Kun Cao,

Yi Du,

Han Wang,

Huai Yu,

Shanzhao Wang,

Siyu Chen,

Ananth Kashyap,

Rohan Bandaru,

Karthik Dantu,

Jiajun Wu,

Lihua Xie,

Luca Carlone,

Marco Hutter,

Sebastian Scherer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Chen and Gao, Dasong and Xu, Kuan and Geng, Junyi and Hu, Yaoyu and Qiu, Yuheng and Li, Bowen and Yang, Fan and Moon, Brady and Pandey, Abhinav and Aryan and Xu, Jiahe and Wu, Tianhao and He, Haonan and Huang, Daning and Ren, Zhongqiang and Zhao, Shibo and Fu, Taimeng and Reddy, Pranay and Lin, Xiao and Wang, Wenshan and Shi, Jingnan and Talak, Rajat and Cao, Kun and Du, Yi and Wang, Han and Yu, Huai and Wang, Shanzhao and Chen, Siyu and Kashyap, Ananth and Bandaru, Rohan and Dantu, Karthik and Wu, Jiajun and Xie, Lihua and Carlone, Luca and Hutter, Marco and Scherer, Sebastian}, title = {{PyPose}: A Library for Robot Learning With Physics-Based Optimization}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {22024--22034} }
Make Landscape Flatter in Differentially Private Federated Learning: Yifan Shi,

Yingqi Liu,

Kang Wei,

Li Shen,

Xueqian Wang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2023_CVPR, author = {Shi, Yifan and Liu, Yingqi and Wei, Kang and Shen, Li and Wang, Xueqian and Tao, Dacheng}, title = {Make Landscape Flatter in Differentially Private Federated Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24552--24562} }
BlackVIP: Black-Box Visual Prompting for Robust Transfer Learning: Changdae Oh,

Hyeji Hwang,

Hee-young Lee,

YongTaek Lim,

Geunyoung Jung,

Jiyoung Jung,

Hosik Choi,

Kyungwoo Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Oh_2023_CVPR, author = {Oh, Changdae and Hwang, Hyeji and Lee, Hee-young and Lim, YongTaek and Jung, Geunyoung and Jung, Jiyoung and Choi, Hosik and Song, Kyungwoo}, title = {{BlackVIP}: Black-Box Visual Prompting for Robust Transfer Learning}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {24224--24235} }
DeepVecFont-v2: Exploiting Transformers To Synthesize Vector Fonts With Higher Quality: Yuqing Wang,

Yizhi Wang,

Longhui Yu,

Yuesheng Zhu,

Zhouhui Lian; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR, author = {Wang, Yuqing and Wang, Yizhi and Yu, Longhui and Zhu, Yuesheng and Lian, Zhouhui}, title = {{DeepVecFont-v2}: Exploiting Transformers To Synthesize Vector Fonts With Higher Quality}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {18320--18328} }
pCON: Polarimetric Coordinate Networks for Neural Scene Representations: Henry Peters,

Yunhao Ba,

Achuta Kadambi; [pdf] [supp]
[bibtex]
@InProceedings{Peters_2023_CVPR, author = {Peters, Henry and Ba, Yunhao and Kadambi, Achuta}, title = {{pCON}: Polarimetric Coordinate Networks for Neural Scene Representations}, booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, month = jun, year = {2023}, pages = {16579--16589} }
Uncertainty-Aware Vision-Based Metric Cross-View Geolocalization: Florian Fervers,

Sebastian Bullinger,

Christoph Bodensteiner,

Michael Arens,

Rainer Stiefelhagen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fervers_2023_CVPR,
  author    = {Fervers, Florian and Bullinger, Sebastian and Bodensteiner, Christoph and Arens, Michael and Stiefelhagen, Rainer},
  title     = {Uncertainty-Aware Vision-Based Metric Cross-View Geolocalization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21621--21631},
}
Continuous Landmark Detection With 3D Queries: Prashanth Chandran,

Gaspard Zoss,

Paulo Gotardo,

Derek Bradley; [pdf] [supp]
[bibtex]
@InProceedings{Chandran_2023_CVPR,
  author    = {Chandran, Prashanth and Zoss, Gaspard and Gotardo, Paulo and Bradley, Derek},
  title     = {Continuous Landmark Detection With {3D} Queries},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16858--16867},
}
Unbiased Scene Graph Generation in Videos: Sayak Nag,

Kyle Min,

Subarna Tripathi,

Amit K. Roy-Chowdhury; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nag_2023_CVPR,
  author    = {Nag, Sayak and Min, Kyle and Tripathi, Subarna and Roy-Chowdhury, Amit K.},
  title     = {Unbiased Scene Graph Generation in Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22803--22813},
}
Visual Language Pretrained Multiple Instance Zero-Shot Transfer for Histopathology Images: Ming Y. Lu,

Bowen Chen,

Andrew Zhang,

Drew F. K. Williamson,

Richard J. Chen,

Tong Ding,

Long Phi Le,

Yung-Sung Chuang,

Faisal Mahmood; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Ming Y. and Chen, Bowen and Zhang, Andrew and Williamson, Drew F. K. and Chen, Richard J. and Ding, Tong and Le, Long Phi and Chuang, Yung-Sung and Mahmood, Faisal},
  title     = {Visual Language Pretrained Multiple Instance Zero-Shot Transfer for Histopathology Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19764--19775},
}
PMR: Prototypical Modal Rebalance for Multimodal Learning: Yunfeng Fan,

Wenchao Xu,

Haozhao Wang,

Junxiao Wang,

Song Guo; [pdf] [arXiv]
[bibtex]
@InProceedings{Fan_2023_CVPR,
  author    = {Fan, Yunfeng and Xu, Wenchao and Wang, Haozhao and Wang, Junxiao and Guo, Song},
  title     = {{PMR}: Prototypical Modal Rebalance for Multimodal Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20029--20038},
}
Multi-Sensor Large-Scale Dataset for Multi-View 3D Reconstruction: Oleg Voynov,

Gleb Bobrovskikh,

Pavel Karpyshev,

Saveliy Galochkin,

Andrei-Timotei Ardelean,

Arseniy Bozhenko,

Ekaterina Karmanova,

Pavel Kopanev,

Yaroslav Labutin-Rymsho,

Ruslan Rakhimov,

Aleksandr Safin,

Valerii Serpiva,

Alexey Artemov,

Evgeny Burnaev,

Dzmitry Tsetserukou,

Denis Zorin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Voynov_2023_CVPR,
  author    = {Voynov, Oleg and Bobrovskikh, Gleb and Karpyshev, Pavel and Galochkin, Saveliy and Ardelean, Andrei-Timotei and Bozhenko, Arseniy and Karmanova, Ekaterina and Kopanev, Pavel and Labutin-Rymsho, Yaroslav and Rakhimov, Ruslan and Safin, Aleksandr and Serpiva, Valerii and Artemov, Alexey and Burnaev, Evgeny and Tsetserukou, Dzmitry and Zorin, Denis},
  title     = {Multi-Sensor Large-Scale Dataset for Multi-View {3D} Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21392--21403},
}
PanoHead: Geometry-Aware 3D Full-Head Synthesis in 360°: Sizhe An,

Hongyi Xu,

Yichun Shi,

Guoxian Song,

Umit Y. Ogras,

Linjie Luo; [pdf] [supp]
[bibtex]
@InProceedings{An_2023_CVPR,
  author    = {An, Sizhe and Xu, Hongyi and Shi, Yichun and Song, Guoxian and Ogras, Umit Y. and Luo, Linjie},
  title     = {{PanoHead}: Geometry-Aware {3D} Full-Head Synthesis in {$360^{\circ}$}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20950--20959},
}
Rethinking Feature-Based Knowledge Distillation for Face Recognition: Jingzhi Li,

Zidong Guo,

Hui Li,

Seungju Han,

Ji-won Baek,

Min Yang,

Ran Yang,

Sungjoo Suh; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jingzhi and Guo, Zidong and Li, Hui and Han, Seungju and Baek, Ji-won and Yang, Min and Yang, Ran and Suh, Sungjoo},
  title     = {Rethinking Feature-Based Knowledge Distillation for Face Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20156--20165},
}
NeurOCS: Neural NOCS Supervision for Monocular 3D Object Localization: Zhixiang Min,

Bingbing Zhuang,

Samuel Schulter,

Buyu Liu,

Enrique Dunn,

Manmohan Chandraker; [pdf] [supp]
[bibtex]
@InProceedings{Min_2023_CVPR,
  author    = {Min, Zhixiang and Zhuang, Bingbing and Schulter, Samuel and Liu, Buyu and Dunn, Enrique and Chandraker, Manmohan},
  title     = {{NeurOCS}: Neural {NOCS} Supervision for Monocular {3D} Object Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21404--21414},
}
Revisiting Reverse Distillation for Anomaly Detection: Tran Dinh Tien,

Anh Tuan Nguyen,

Nguyen Hoang Tran,

Ta Duc Huy,

Soan T.M. Duong,

Chanh D. Tr. Nguyen,

Steven Q. H. Truong; [pdf]
[bibtex]
@InProceedings{Tien_2023_CVPR,
  author    = {Tien, Tran Dinh and Nguyen, Anh Tuan and Tran, Nguyen Hoang and Huy, Ta Duc and Duong, Soan T. M. and Nguyen, Chanh D. Tr. and Truong, Steven Q. H.},
  title     = {Revisiting Reverse Distillation for Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24511--24520},
}
Diffusion-Based Generation, Optimization, and Planning in 3D Scenes: Siyuan Huang,

Zan Wang,

Puhao Li,

Baoxiong Jia,

Tengyu Liu,

Yixin Zhu,

Wei Liang,

Song-Chun Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Siyuan and Wang, Zan and Li, Puhao and Jia, Baoxiong and Liu, Tengyu and Zhu, Yixin and Liang, Wei and Zhu, Song-Chun},
  title     = {Diffusion-Based Generation, Optimization, and Planning in {3D} Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16750--16761},
}
TMO: Textured Mesh Acquisition of Objects With a Mobile Device by Using Differentiable Rendering: Jaehoon Choi,

Dongki Jung,

Taejae Lee,

Sangwook Kim,

Youngdong Jung,

Dinesh Manocha,

Donghwan Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Choi_2023_CVPR,
  author    = {Choi, Jaehoon and Jung, Dongki and Lee, Taejae and Kim, Sangwook and Jung, Youngdong and Manocha, Dinesh and Lee, Donghwan},
  title     = {{TMO}: Textured Mesh Acquisition of Objects With a Mobile Device by Using Differentiable Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16674--16684},
}
MP-Former: Mask-Piloted Transformer for Image Segmentation: Hao Zhang,

Feng Li,

Huaizhe Xu,

Shijia Huang,

Shilong Liu,

Lionel M. Ni,

Lei Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Hao and Li, Feng and Xu, Huaizhe and Huang, Shijia and Liu, Shilong and Ni, Lionel M. and Zhang, Lei},
  title     = {{MP-Former}: Mask-Piloted Transformer for Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18074--18083},
}
TAPS3D: Text-Guided 3D Textured Shape Generation From Pseudo Supervision: Jiacheng Wei,

Hao Wang,

Jiashi Feng,

Guosheng Lin,

Kim-Hui Yap; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Jiacheng and Wang, Hao and Feng, Jiashi and Lin, Guosheng and Yap, Kim-Hui},
  title     = {{TAPS3D}: Text-Guided {3D} Textured Shape Generation From Pseudo Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16805--16815},
}
Video Test-Time Adaptation for Action Recognition: Wei Lin,

Muhammad Jehanzeb Mirza,

Mateusz Kozinski,

Horst Possegger,

Hilde Kuehne,

Horst Bischof; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Wei and Mirza, Muhammad Jehanzeb and Kozinski, Mateusz and Possegger, Horst and Kuehne, Hilde and Bischof, Horst},
  title     = {Video Test-Time Adaptation for Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22952--22961},
}
Tensor4D: Efficient Neural 4D Decomposition for High-Fidelity Dynamic Reconstruction and Rendering: Ruizhi Shao,

Zerong Zheng,

Hanzhang Tu,

Boning Liu,

Hongwen Zhang,

Yebin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_CVPR,
  author    = {Shao, Ruizhi and Zheng, Zerong and Tu, Hanzhang and Liu, Boning and Zhang, Hongwen and Liu, Yebin},
  title     = {{Tensor4D}: Efficient Neural {4D} Decomposition for High-Fidelity Dynamic Reconstruction and Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16632--16642},
}
Learning Personalized High Quality Volumetric Head Avatars From Monocular RGB Videos: Ziqian Bai,

Feitong Tan,

Zeng Huang,

Kripasindhu Sarkar,

Danhang Tang,

Di Qiu,

Abhimitra Meka,

Ruofei Du,

Mingsong Dou,

Sergio Orts-Escolano,

Rohit Pandey,

Ping Tan,

Thabo Beeler,

Sean Fanello,

Yinda Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bai_2023_CVPR,
  author    = {Bai, Ziqian and Tan, Feitong and Huang, Zeng and Sarkar, Kripasindhu and Tang, Danhang and Qiu, Di and Meka, Abhimitra and Du, Ruofei and Dou, Mingsong and Orts-Escolano, Sergio and Pandey, Rohit and Tan, Ping and Beeler, Thabo and Fanello, Sean and Zhang, Yinda},
  title     = {Learning Personalized High Quality Volumetric Head Avatars From Monocular {RGB} Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16890--16900},
}
Progressive Backdoor Erasing via Connecting Backdoor and Adversarial Attacks: Bingxu Mu,

Zhenxing Niu,

Le Wang,

Xue Wang,

Qiguang Miao,

Rong Jin,

Gang Hua; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mu_2023_CVPR,
  author    = {Mu, Bingxu and Niu, Zhenxing and Wang, Le and Wang, Xue and Miao, Qiguang and Jin, Rong and Hua, Gang},
  title     = {Progressive Backdoor Erasing via Connecting Backdoor and Adversarial Attacks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20495--20503},
}
LayoutFormer++: Conditional Graphic Layout Generation via Constraint Serialization and Decoding Space Restriction: Zhaoyun Jiang,

Jiaqi Guo,

Shizhao Sun,

Huayu Deng,

Zhongkai Wu,

Vuksan Mijovic,

Zijiang James Yang,

Jian-Guang Lou,

Dongmei Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Zhaoyun and Guo, Jiaqi and Sun, Shizhao and Deng, Huayu and Wu, Zhongkai and Mijovic, Vuksan and Yang, Zijiang James and Lou, Jian-Guang and Zhang, Dongmei},
  title     = {{LayoutFormer++}: Conditional Graphic Layout Generation via Constraint Serialization and Decoding Space Restriction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18403--18412},
}
Stare at What You See: Masked Image Modeling Without Reconstruction: Hongwei Xue,

Peng Gao,

Hongyang Li,

Yu Qiao,

Hao Sun,

Houqiang Li,

Jiebo Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xue_2023_CVPR,
  author    = {Xue, Hongwei and Gao, Peng and Li, Hongyang and Qiao, Yu and Sun, Hao and Li, Houqiang and Luo, Jiebo},
  title     = {Stare at What You See: Masked Image Modeling Without Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22732--22741},
}
Joint Visual Grounding and Tracking With Natural Language Specification: Li Zhou,

Zikun Zhou,

Kaige Mao,

Zhenyu He; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Li and Zhou, Zikun and Mao, Kaige and He, Zhenyu},
  title     = {Joint Visual Grounding and Tracking With Natural Language Specification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23151--23160},
}
Few-Shot Semantic Image Synthesis With Class Affinity Transfer: Marlène Careil,

Jakob Verbeek,

Stéphane Lathuilière; [pdf] [supp]
[bibtex]
@InProceedings{Careil_2023_CVPR,
  author    = {Careil, Marl{\`e}ne and Verbeek, Jakob and Lathuili{\`e}re, St{\'e}phane},
  title     = {Few-Shot Semantic Image Synthesis With Class Affinity Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23611--23620},
}
HIER: Metric Learning Beyond Class Labels via Hierarchical Regularization: Sungyeon Kim,

Boseung Jeong,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Sungyeon and Jeong, Boseung and Kwak, Suha},
  title     = {{HIER}: Metric Learning Beyond Class Labels via Hierarchical Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19903--19912},
}
Diffusion Probabilistic Model Made Slim: Xingyi Yang,

Daquan Zhou,

Jiashi Feng,

Xinchao Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Xingyi and Zhou, Daquan and Feng, Jiashi and Wang, Xinchao},
  title     = {Diffusion Probabilistic Model Made Slim},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22552--22562},
}
Confidence-Aware Personalized Federated Learning via Variational Expectation Maximization: Junyi Zhu,

Xingchen Ma,

Matthew B. Blaschko; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Junyi and Ma, Xingchen and Blaschko, Matthew B.},
  title     = {Confidence-Aware Personalized Federated Learning via Variational Expectation Maximization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24542--24551},
}
Hierarchical Supervision and Shuffle Data Augmentation for 3D Semi-Supervised Object Detection: Chuandong Liu,

Chenqiang Gao,

Fangcen Liu,

Pengcheng Li,

Deyu Meng,

Xinbo Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Chuandong and Gao, Chenqiang and Liu, Fangcen and Li, Pengcheng and Meng, Deyu and Gao, Xinbo},
  title     = {Hierarchical Supervision and Shuffle Data Augmentation for {3D} Semi-Supervised Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23819--23828},
}
Planning-Oriented Autonomous Driving: Yihan Hu,

Jiazhi Yang,

Li Chen,

Keyu Li,

Chonghao Sima,

Xizhou Zhu,

Siqi Chai,

Senyao Du,

Tianwei Lin,

Wenhai Wang,

Lewei Lu,

Xiaosong Jia,

Qiang Liu,

Jifeng Dai,

Yu Qiao,

Hongyang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Yihan and Yang, Jiazhi and Chen, Li and Li, Keyu and Sima, Chonghao and Zhu, Xizhou and Chai, Siqi and Du, Senyao and Lin, Tianwei and Wang, Wenhai and Lu, Lewei and Jia, Xiaosong and Liu, Qiang and Dai, Jifeng and Qiao, Yu and Li, Hongyang},
  title     = {Planning-Oriented Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17853--17862},
}
Independent Component Alignment for Multi-Task Learning: Dmitry Senushkin,

Nikolay Patakin,

Arseny Kuznetsov,

Anton Konushin; [pdf] [supp]
[bibtex]
@InProceedings{Senushkin_2023_CVPR,
  author    = {Senushkin, Dmitry and Patakin, Nikolay and Kuznetsov, Arseny and Konushin, Anton},
  title     = {Independent Component Alignment for Multi-Task Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20083--20093},
}
Edges to Shapes to Concepts: Adversarial Augmentation for Robust Vision: Aditay Tripathi,

Rishubh Singh,

Anirban Chakraborty,

Pradeep Shenoy; [pdf] [supp]
[bibtex]
@InProceedings{Tripathi_2023_CVPR,
  author    = {Tripathi, Aditay and Singh, Rishubh and Chakraborty, Anirban and Shenoy, Pradeep},
  title     = {Edges to Shapes to Concepts: Adversarial Augmentation for Robust Vision},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24470--24479},
}
ReVISE: Self-Supervised Speech Resynthesis With Visual Input for Universal and Generalized Speech Regeneration: Wei-Ning Hsu,

Tal Remez,

Bowen Shi,

Jacob Donley,

Yossi Adi; [pdf] [supp]
[bibtex]
@InProceedings{Hsu_2023_CVPR,
  author    = {Hsu, Wei-Ning and Remez, Tal and Shi, Bowen and Donley, Jacob and Adi, Yossi},
  title     = {{ReVISE}: Self-Supervised Speech Resynthesis With Visual Input for Universal and Generalized Speech Regeneration},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18795--18805},
}
Data-Free Knowledge Distillation via Feature Exchange and Activation Region Constraint: Shikang Yu,

Jiachen Chen,

Hu Han,

Shuqiang Jiang; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Shikang and Chen, Jiachen and Han, Hu and Jiang, Shuqiang},
  title     = {Data-Free Knowledge Distillation via Feature Exchange and Activation Region Constraint},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24266--24275},
}
CLIP-Sculptor: Zero-Shot Generation of High-Fidelity and Diverse Shapes From Natural Language: Aditya Sanghi,

Rao Fu,

Vivian Liu,

Karl D.D. Willis,

Hooman Shayani,

Amir H. Khasahmadi,

Srinath Sridhar,

Daniel Ritchie; [pdf] [supp]
[bibtex]
@InProceedings{Sanghi_2023_CVPR,
  author    = {Sanghi, Aditya and Fu, Rao and Liu, Vivian and Willis, Karl D. D. and Shayani, Hooman and Khasahmadi, Amir H. and Sridhar, Srinath and Ritchie, Daniel},
  title     = {{CLIP-Sculptor}: Zero-Shot Generation of High-Fidelity and Diverse Shapes From Natural Language},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18339--18348},
}
Mask-Free Video Instance Segmentation: Lei Ke,

Martin Danelljan,

Henghui Ding,

Yu-Wing Tai,

Chi-Keung Tang,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ke_2023_CVPR,
  author    = {Ke, Lei and Danelljan, Martin and Ding, Henghui and Tai, Yu-Wing and Tang, Chi-Keung and Yu, Fisher},
  title     = {Mask-Free Video Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22857--22866},
}
Continual Detection Transformer for Incremental Object Detection: Yaoyao Liu,

Bernt Schiele,

Andrea Vedaldi,

Christian Rupprecht; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Yaoyao and Schiele, Bernt and Vedaldi, Andrea and Rupprecht, Christian},
  title     = {Continual Detection Transformer for Incremental Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23799--23808},
}
Two-Stream Networks for Weakly-Supervised Temporal Action Localization With Semantic-Aware Mechanisms: Yu Wang,

Yadong Li,

Hongbin Wang; [pdf]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yu and Li, Yadong and Wang, Hongbin},
  title     = {Two-Stream Networks for Weakly-Supervised Temporal Action Localization With Semantic-Aware Mechanisms},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18878--18887},
}
HyperMatch: Noise-Tolerant Semi-Supervised Learning via Relaxed Contrastive Constraint: Beitong Zhou,

Jing Lu,

Kerui Liu,

Yunlu Xu,

Zhanzhan Cheng,

Yi Niu; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Beitong and Lu, Jing and Liu, Kerui and Xu, Yunlu and Cheng, Zhanzhan and Niu, Yi},
  title     = {{HyperMatch}: Noise-Tolerant Semi-Supervised Learning via Relaxed Contrastive Constraint},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24017--24026},
}
LEGO-Net: Learning Regular Rearrangements of Objects in Rooms: Qiuhong Anna Wei,

Sijie Ding,

Jeong Joon Park,

Rahul Sajnani,

Adrien Poulenard,

Srinath Sridhar,

Leonidas Guibas; [pdf] [supp]
[bibtex]
@InProceedings{Wei_2023_CVPR,
  author    = {Wei, Qiuhong Anna and Ding, Sijie and Park, Jeong Joon and Sajnani, Rahul and Poulenard, Adrien and Sridhar, Srinath and Guibas, Leonidas},
  title     = {{LEGO-Net}: Learning Regular Rearrangements of Objects in Rooms},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19037--19047},
}
FastInst: A Simple Query-Based Model for Real-Time Instance Segmentation: Junjie He,

Pengyu Li,

Yifeng Geng,

Xuansong Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_CVPR,
  author    = {He, Junjie and Li, Pengyu and Geng, Yifeng and Xie, Xuansong},
  title     = {{FastInst}: A Simple Query-Based Model for Real-Time Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23663--23672},
}
Self-Supervised Representation Learning for CAD: Benjamin T. Jones,

Michael Hu,

Milin Kodnongbua,

Vladimir G. Kim,

Adriana Schulz; [pdf] [supp]
[bibtex]
@InProceedings{Jones_2023_CVPR,
  author    = {Jones, Benjamin T. and Hu, Michael and Kodnongbua, Milin and Kim, Vladimir G. and Schulz, Adriana},
  title     = {Self-Supervised Representation Learning for {CAD}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21327--21336},
}
DETRs With Hybrid Matching: Ding Jia,

Yuhui Yuan,

Haodi He,

Xiaopei Wu,

Haojun Yu,

Weihong Lin,

Lei Sun,

Chao Zhang,

Han Hu; [pdf] [arXiv]
[bibtex]
@InProceedings{Jia_2023_CVPR,
  author    = {Jia, Ding and Yuan, Yuhui and He, Haodi and Wu, Xiaopei and Yu, Haojun and Lin, Weihong and Sun, Lei and Zhang, Chao and Hu, Han},
  title     = {{DETRs} With Hybrid Matching},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19702--19712},
}
Angelic Patches for Improving Third-Party Object Detector Performance: Wenwen Si,

Shuo Li,

Sangdon Park,

Insup Lee,

Osbert Bastani; [pdf] [supp]
[bibtex]
@InProceedings{Si_2023_CVPR,
  author    = {Si, Wenwen and Li, Shuo and Park, Sangdon and Lee, Insup and Bastani, Osbert},
  title     = {Angelic Patches for Improving Third-Party Object Detector Performance},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24638--24647},
}
Mask-Free OVIS: Open-Vocabulary Instance Segmentation Without Manual Mask Annotations: Vibashan VS,

Ning Yu,

Chen Xing,

Can Qin,

Mingfei Gao,

Juan Carlos Niebles,

Vishal M. Patel,

Ran Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{VS_2023_CVPR,
  author    = {VS, Vibashan and Yu, Ning and Xing, Chen and Qin, Can and Gao, Mingfei and Niebles, Juan Carlos and Patel, Vishal M. and Xu, Ran},
  title     = {Mask-Free {OVIS}: Open-Vocabulary Instance Segmentation Without Manual Mask Annotations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23539--23549},
}
Complete-to-Partial 4D Distillation for Self-Supervised Point Cloud Sequence Representation Learning: Zhuoyang Zhang,

Yuhao Dong,

Yunze Liu,

Li Yi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zhuoyang and Dong, Yuhao and Liu, Yunze and Yi, Li},
  title     = {Complete-to-Partial {4D} Distillation for Self-Supervised Point Cloud Sequence Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17661--17670},
}
Multi-Modal Gait Recognition via Effective Spatial-Temporal Feature Fusion: Yufeng Cui,

Yimei Kang; [pdf]
[bibtex]
@InProceedings{Cui_2023_CVPR,
  author    = {Cui, Yufeng and Kang, Yimei},
  title     = {Multi-Modal Gait Recognition via Effective Spatial-Temporal Feature Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17949--17957},
}
Hierarchical Discriminative Learning Improves Visual Representations of Biomedical Microscopy: Cheng Jiang,

Xinhai Hou,

Akhil Kondepudi,

Asadur Chowdury,

Christian W. Freudiger,

Daniel A. Orringer,

Honglak Lee,

Todd C. Hollon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Cheng and Hou, Xinhai and Kondepudi, Akhil and Chowdury, Asadur and Freudiger, Christian W. and Orringer, Daniel A. and Lee, Honglak and Hollon, Todd C.},
  title     = {Hierarchical Discriminative Learning Improves Visual Representations of Biomedical Microscopy},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19798--19808},
}
ProD: Prompting-To-Disentangle Domain Knowledge for Cross-Domain Few-Shot Image Classification: Tianyi Ma,

Yifan Sun,

Zongxin Yang,

Yi Yang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_CVPR,
  author    = {Ma, Tianyi and Sun, Yifan and Yang, Zongxin and Yang, Yi},
  title     = {{ProD}: Prompting-To-Disentangle Domain Knowledge for Cross-Domain Few-Shot Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19754--19763},
}
ImageNet-E: Benchmarking Neural Network Robustness via Attribute Editing: Xiaodan Li,

Yuefeng Chen,

Yao Zhu,

Shuhui Wang,

Rong Zhang,

Hui Xue; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Xiaodan and Chen, Yuefeng and Zhu, Yao and Wang, Shuhui and Zhang, Rong and Xue, Hui},
  title     = {{ImageNet-E}: Benchmarking Neural Network Robustness via Attribute Editing},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20371--20381},
}
Learning With Fantasy: Semantic-Aware Virtual Contrastive Constraint for Few-Shot Class-Incremental Learning: Zeyin Song,

Yifan Zhao,

Yujun Shi,

Peixi Peng,

Li Yuan,

Yonghong Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_CVPR,
  author    = {Song, Zeyin and Zhao, Yifan and Shi, Yujun and Peng, Peixi and Yuan, Li and Tian, Yonghong},
  title     = {Learning With Fantasy: Semantic-Aware Virtual Contrastive Constraint for Few-Shot Class-Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24183--24192},
}
Cascaded Local Implicit Transformer for Arbitrary-Scale Super-Resolution: Hao-Wei Chen,

Yu-Syuan Xu,

Min-Fong Hong,

Yi-Min Tsai,

Hsien-Kai Kuo,

Chun-Yi Lee; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Hao-Wei and Xu, Yu-Syuan and Hong, Min-Fong and Tsai, Yi-Min and Kuo, Hsien-Kai and Lee, Chun-Yi},
  title     = {Cascaded Local Implicit Transformer for Arbitrary-Scale Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18257--18267},
}
Network-Free, Unsupervised Semantic Segmentation With Synthetic Images: Qianli Feng,

Raghudeep Gadde,

Wentong Liao,

Eduard Ramon,

Aleix Martinez; [pdf] [supp]
[bibtex]
@InProceedings{Feng_2023_CVPR,
  author    = {Feng, Qianli and Gadde, Raghudeep and Liao, Wentong and Ramon, Eduard and Martinez, Aleix},
  title     = {Network-Free, Unsupervised Semantic Segmentation With Synthetic Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23602--23610},
}
Hierarchical Dense Correlation Distillation for Few-Shot Segmentation: Bohao Peng,

Zhuotao Tian,

Xiaoyang Wu,

Chengyao Wang,

Shu Liu,

Jingyong Su,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_CVPR,
  author    = {Peng, Bohao and Tian, Zhuotao and Wu, Xiaoyang and Wang, Chengyao and Liu, Shu and Su, Jingyong and Jia, Jiaya},
  title     = {Hierarchical Dense Correlation Distillation for Few-Shot Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23641--23651},
}
Hi4D: 4D Instance Segmentation of Close Human Interaction: Yifei Yin,

Chen Guo,

Manuel Kaufmann,

Juan Jose Zarate,

Jie Song,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yin_2023_CVPR,
  author    = {Yin, Yifei and Guo, Chen and Kaufmann, Manuel and Zarate, Juan Jose and Song, Jie and Hilliges, Otmar},
  title     = {{Hi4D}: {4D} Instance Segmentation of Close Human Interaction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17016--17027},
}
SQUID: Deep Feature In-Painting for Unsupervised Anomaly Detection: Tiange Xiang,

Yixiao Zhang,

Yongyi Lu,

Alan L. Yuille,

Chaoyi Zhang,

Weidong Cai,

Zongwei Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiang_2023_CVPR,
  author    = {Xiang, Tiange and Zhang, Yixiao and Lu, Yongyi and Yuille, Alan L. and Zhang, Chaoyi and Cai, Weidong and Zhou, Zongwei},
  title     = {{SQUID}: Deep Feature In-Painting for Unsupervised Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23890--23901},
}
On the Convergence of IRLS and Its Variants in Outlier-Robust Estimation: Liangzu Peng,

Christian Kümmerle,

René Vidal; [pdf] [supp]
[bibtex]
@InProceedings{Peng_2023_CVPR,
  author    = {Peng, Liangzu and K{\"u}mmerle, Christian and Vidal, Ren{\'e}},
  title     = {On the Convergence of {IRLS} and Its Variants in Outlier-Robust Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17808--17818},
}
A New Comprehensive Benchmark for Semi-Supervised Video Anomaly Detection and Anticipation: Congqi Cao,

Yue Lu,

Peng Wang,

Yanning Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Cao_2023_CVPR,
  author    = {Cao, Congqi and Lu, Yue and Wang, Peng and Zhang, Yanning},
  title     = {A New Comprehensive Benchmark for Semi-Supervised Video Anomaly Detection and Anticipation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20392--20401},
}
HumanBench: Towards General Human-Centric Perception With Projector Assisted Pretraining: Shixiang Tang,

Cheng Chen,

Qingsong Xie,

Meilin Chen,

Yizhou Wang,

Yuanzheng Ci,

Lei Bai,

Feng Zhu,

Haiyang Yang,

Li Yi,

Rui Zhao,

Wanli Ouyang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Shixiang and Chen, Cheng and Xie, Qingsong and Chen, Meilin and Wang, Yizhou and Ci, Yuanzheng and Bai, Lei and Zhu, Feng and Yang, Haiyang and Yi, Li and Zhao, Rui and Ouyang, Wanli},
  title     = {{HumanBench}: Towards General Human-Centric Perception With Projector Assisted Pretraining},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21970--21982}
}
Deep Graph Reprogramming: Yongcheng Jing,

Chongbin Yuan,

Li Ju,

Yiding Yang,

Xinchao Wang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jing_2023_CVPR,
  author    = {Jing, Yongcheng and Yuan, Chongbin and Ju, Li and Yang, Yiding and Wang, Xinchao and Tao, Dacheng},
  title     = {Deep Graph Reprogramming},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24345--24354}
}
Compacting Binary Neural Networks by Sparse Kernel Selection: Yikai Wang,

Wenbing Huang,

Yinpeng Dong,

Fuchun Sun,

Anbang Yao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yikai and Huang, Wenbing and Dong, Yinpeng and Sun, Fuchun and Yao, Anbang},
  title     = {Compacting Binary Neural Networks by Sparse Kernel Selection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24374--24383}
}
Unified Mask Embedding and Correspondence Learning for Self-Supervised Video Segmentation: Liulei Li,

Wenguan Wang,

Tianfei Zhou,

Jianwu Li,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Liulei and Wang, Wenguan and Zhou, Tianfei and Li, Jianwu and Yang, Yi},
  title     = {Unified Mask Embedding and Correspondence Learning for Self-Supervised Video Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18706--18716}
}
Seeing Beyond the Brain: Conditional Diffusion Model With Sparse Masked Modeling for Vision Decoding: Zijiao Chen,

Jiaxin Qing,

Tiange Xiang,

Wan Lin Yue,

Juan Helen Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Zijiao and Qing, Jiaxin and Xiang, Tiange and Yue, Wan Lin and Zhou, Juan Helen},
  title     = {Seeing Beyond the Brain: Conditional Diffusion Model With Sparse Masked Modeling for Vision Decoding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22710--22720}
}
PointAvatar: Deformable Point-Based Head Avatars From Videos: Yufeng Zheng,

Wang Yifan,

Gordon Wetzstein,

Michael J. Black,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Yufeng and Yifan, Wang and Wetzstein, Gordon and Black, Michael J. and Hilliges, Otmar},
  title     = {{PointAvatar}: Deformable Point-Based Head Avatars From Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21057--21067}
}
OrienterNet: Visual Localization in 2D Public Maps With Neural Matching: Paul-Edouard Sarlin,

Daniel DeTone,

Tsun-Yi Yang,

Armen Avetisyan,

Julian Straub,

Tomasz Malisiewicz,

Samuel Rota Bulò,

Richard Newcombe,

Peter Kontschieder,

Vasileios Balntas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sarlin_2023_CVPR,
  author    = {Sarlin, Paul-Edouard and DeTone, Daniel and Yang, Tsun-Yi and Avetisyan, Armen and Straub, Julian and Malisiewicz, Tomasz and Bul{\`o}, Samuel Rota and Newcombe, Richard and Kontschieder, Peter and Balntas, Vasileios},
  title     = {{OrienterNet}: Visual Localization in {2D} Public Maps With Neural Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21632--21642}
}
PMatch: Paired Masked Image Modeling for Dense Geometric Matching: Shengjie Zhu,

Xiaoming Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Shengjie and Liu, Xiaoming},
  title     = {{PMatch}: Paired Masked Image Modeling for Dense Geometric Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21909--21918}
}
Masked and Adaptive Transformer for Exemplar Based Image Translation: Chang Jiang,

Fei Gao,

Biao Ma,

Yuhao Lin,

Nannan Wang,

Gang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Chang and Gao, Fei and Ma, Biao and Lin, Yuhao and Wang, Nannan and Xu, Gang},
  title     = {Masked and Adaptive Transformer for Exemplar Based Image Translation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22418--22427}
}
You Are Catching My Attention: Are Vision Transformers Bad Learners Under Backdoor Attacks?: Zenghui Yuan,

Pan Zhou,

Kai Zou,

Yu Cheng; [pdf] [supp]
[bibtex]
@InProceedings{Yuan_2023_CVPR,
  author    = {Yuan, Zenghui and Zhou, Pan and Zou, Kai and Cheng, Yu},
  title     = {You Are Catching My Attention: Are Vision Transformers Bad Learners Under Backdoor Attacks?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24605--24615}
}
Contrastive Grouping With Transformer for Referring Image Segmentation: Jiajin Tang,

Ge Zheng,

Cheng Shi,

Sibei Yang; [pdf]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Jiajin and Zheng, Ge and Shi, Cheng and Yang, Sibei},
  title     = {Contrastive Grouping With Transformer for Referring Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23570--23580}
}
PaCa-ViT: Learning Patch-to-Cluster Attention in Vision Transformers: Ryan Grainger,

Thomas Paniagua,

Xi Song,

Naresh Cuntoor,

Mun Wai Lee,

Tianfu Wu; [pdf] [supp]
[bibtex]
@InProceedings{Grainger_2023_CVPR,
  author    = {Grainger, Ryan and Paniagua, Thomas and Song, Xi and Cuntoor, Naresh and Lee, Mun Wai and Wu, Tianfu},
  title     = {{PaCa-ViT}: Learning Patch-to-Cluster Attention in Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18568--18578}
}
Pix2map: Cross-Modal Retrieval for Inferring Street Maps From Images: Xindi Wu,

KwunFung Lau,

Francesco Ferroni,

Aljoša Ošep,

Deva Ramanan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Xindi and Lau, KwunFung and Ferroni, Francesco and O{\v{s}}ep, Aljo{\v{s}}a and Ramanan, Deva},
  title     = {Pix2map: Cross-Modal Retrieval for Inferring Street Maps From Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17514--17523}
}
Unsupervised Inference of Signed Distance Functions From Single Sparse Point Clouds Without Learning Priors: Chao Chen,

Yu-Shen Liu,

Zhizhong Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Chao and Liu, Yu-Shen and Han, Zhizhong},
  title     = {Unsupervised Inference of Signed Distance Functions From Single Sparse Point Clouds Without Learning Priors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17712--17723}
}
Deep Discriminative Spatial and Temporal Network for Efficient Video Deblurring: Jinshan Pan,

Boming Xu,

Jiangxin Dong,

Jianjun Ge,

Jinhui Tang; [pdf] [supp]
[bibtex]
@InProceedings{Pan_2023_CVPR,
  author    = {Pan, Jinshan and Xu, Boming and Dong, Jiangxin and Ge, Jianjun and Tang, Jinhui},
  title     = {Deep Discriminative Spatial and Temporal Network for Efficient Video Deblurring},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22191--22200}
}
Prototype-Based Embedding Network for Scene Graph Generation: Chaofan Zheng,

Xinyu Lyu,

Lianli Gao,

Bo Dai,

Jingkuan Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Chaofan and Lyu, Xinyu and Gao, Lianli and Dai, Bo and Song, Jingkuan},
  title     = {Prototype-Based Embedding Network for Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22783--22792}
}
Efficient Movie Scene Detection Using State-Space Transformers: Md Mohaiminul Islam,

Mahmudul Hasan,

Kishan Shamsundar Athrey,

Tony Braskich,

Gedas Bertasius; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Islam_2023_CVPR,
  author    = {Islam, Md Mohaiminul and Hasan, Mahmudul and Athrey, Kishan Shamsundar and Braskich, Tony and Bertasius, Gedas},
  title     = {Efficient Movie Scene Detection Using State-Space Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18749--18758}
}
Efficient Semantic Segmentation by Altering Resolutions for Compressed Videos: Yubin Hu,

Yuze He,

Yanghao Li,

Jisheng Li,

Yuxing Han,

Jiangtao Wen,

Yong-Jin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Yubin and He, Yuze and Li, Yanghao and Li, Jisheng and Han, Yuxing and Wen, Jiangtao and Liu, Yong-Jin},
  title     = {Efficient Semantic Segmentation by Altering Resolutions for Compressed Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22627--22637}
}
Discriminating Known From Unknown Objects via Structure-Enhanced Recurrent Variational AutoEncoder: Aming Wu,

Cheng Deng; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Aming and Deng, Cheng},
  title     = {Discriminating Known From Unknown Objects via Structure-Enhanced Recurrent Variational AutoEncoder},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23956--23965}
}
Occlusion-Free Scene Recovery via Neural Radiance Fields: Chengxuan Zhu,

Renjie Wan,

Yunkai Tang,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Chengxuan and Wan, Renjie and Tang, Yunkai and Shi, Boxin},
  title     = {Occlusion-Free Scene Recovery via Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20722--20731}
}
Semi-Supervised Domain Adaptation With Source Label Adaptation: Yu-Chu Yu,

Hsuan-Tien Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Yu-Chu and Lin, Hsuan-Tien},
  title     = {Semi-Supervised Domain Adaptation With Source Label Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24100--24109}
}
Range-Nullspace Video Frame Interpolation With Focalized Motion Estimation: Zhiyang Yu,

Yu Zhang,

Dongqing Zou,

Xijun Chen,

Jimmy S. Ren,

Shunqing Ren; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Zhiyang and Zhang, Yu and Zou, Dongqing and Chen, Xijun and Ren, Jimmy S. and Ren, Shunqing},
  title     = {Range-Nullspace Video Frame Interpolation With Focalized Motion Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22159--22168}
}
FlowGrad: Controlling the Output of Generative ODEs With Gradients: Xingchao Liu,

Lemeng Wu,

Shujian Zhang,

Chengyue Gong,

Wei Ping,

Qiang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Xingchao and Wu, Lemeng and Zhang, Shujian and Gong, Chengyue and Ping, Wei and Liu, Qiang},
  title     = {{FlowGrad}: Controlling the Output of Generative {ODEs} With Gradients},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24335--24344}
}
Learning Weather-General and Weather-Specific Features for Image Restoration Under Multiple Adverse Weather Conditions: Yurui Zhu,

Tianyu Wang,

Xueyang Fu,

Xuanyu Yang,

Xin Guo,

Jifeng Dai,

Yu Qiao,

Xiaowei Hu; [pdf]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Yurui and Wang, Tianyu and Fu, Xueyang and Yang, Xuanyu and Guo, Xin and Dai, Jifeng and Qiao, Yu and Hu, Xiaowei},
  title     = {Learning Weather-General and Weather-Specific Features for Image Restoration Under Multiple Adverse Weather Conditions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21747--21758}
}
Generalized Deep 3D Shape Prior via Part-Discretized Diffusion Process: Yuhan Li,

Yishun Dou,

Xuanhong Chen,

Bingbing Ni,

Yilin Sun,

Yutian Liu,

Fuzhen Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yuhan and Dou, Yishun and Chen, Xuanhong and Ni, Bingbing and Sun, Yilin and Liu, Yutian and Wang, Fuzhen},
  title     = {Generalized Deep {3D} Shape Prior via Part-Discretized Diffusion Process},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16784--16794}
}
Conflict-Based Cross-View Consistency for Semi-Supervised Semantic Segmentation: Zicheng Wang,

Zhen Zhao,

Xiaoxia Xing,

Dong Xu,

Xiangyu Kong,

Luping Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Zicheng and Zhao, Zhen and Xing, Xiaoxia and Xu, Dong and Kong, Xiangyu and Zhou, Luping},
  title     = {Conflict-Based Cross-View Consistency for Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19585--19595}
}
SCoDA: Domain Adaptive Shape Completion for Real Scans: Yushuang Wu,

Zizheng Yan,

Ce Chen,

Lai Wei,

Xiao Li,

Guanbin Li,

Yihao Li,

Shuguang Cui,

Xiaoguang Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Yushuang and Yan, Zizheng and Chen, Ce and Wei, Lai and Li, Xiao and Li, Guanbin and Li, Yihao and Cui, Shuguang and Han, Xiaoguang},
  title     = {{SCoDA}: Domain Adaptive Shape Completion for Real Scans},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17630--17641}
}
TransFlow: Transformer As Flow Learner: Yawen Lu,

Qifan Wang,

Siqi Ma,

Tong Geng,

Yingjie Victor Chen,

Huaijin Chen,

Dongfang Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Yawen and Wang, Qifan and Ma, Siqi and Geng, Tong and Chen, Yingjie Victor and Chen, Huaijin and Liu, Dongfang},
  title     = {{TransFlow}: Transformer As Flow Learner},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18063--18073}
}
AutoFocusFormer: Image Segmentation off the Grid: Chen Ziwen,

Kaushik Patnaik,

Shuangfei Zhai,

Alvin Wan,

Zhile Ren,

Alexander G. Schwing,

Alex Colburn,

Li Fuxin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ziwen_2023_CVPR,
  author    = {Ziwen, Chen and Patnaik, Kaushik and Zhai, Shuangfei and Wan, Alvin and Ren, Zhile and Schwing, Alexander G. and Colburn, Alex and Fuxin, Li},
  title     = {{AutoFocusFormer}: Image Segmentation off the Grid},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18227--18236}
}
CLIP2Protect: Protecting Facial Privacy Using Text-Guided Makeup via Adversarial Latent Search: Fahad Shamshad,

Muzammal Naseer,

Karthik Nandakumar; [pdf] [supp]
[bibtex]
@InProceedings{Shamshad_2023_CVPR,
  author    = {Shamshad, Fahad and Naseer, Muzammal and Nandakumar, Karthik},
  title     = {{CLIP2Protect}: Protecting Facial Privacy Using Text-Guided Makeup via Adversarial Latent Search},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20595--20605}
}
Improving Weakly Supervised Temporal Action Localization by Bridging Train-Test Gap in Pseudo Labels: Jingqiu Zhou,

Linjiang Huang,

Liang Wang,

Si Liu,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Jingqiu and Huang, Linjiang and Wang, Liang and Liu, Si and Li, Hongsheng},
  title     = {Improving Weakly Supervised Temporal Action Localization by Bridging Train-Test Gap in Pseudo Labels},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23003--23012}
}
REVEAL: Retrieval-Augmented Visual-Language Pre-Training With Multi-Source Multimodal Knowledge Memory: Ziniu Hu,

Ahmet Iscen,

Chen Sun,

Zirui Wang,

Kai-Wei Chang,

Yizhou Sun,

Cordelia Schmid,

David A. Ross,

Alireza Fathi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Ziniu and Iscen, Ahmet and Sun, Chen and Wang, Zirui and Chang, Kai-Wei and Sun, Yizhou and Schmid, Cordelia and Ross, David A. and Fathi, Alireza},
  title     = {{REVEAL}: Retrieval-Augmented Visual-Language Pre-Training With Multi-Source Multimodal Knowledge Memory},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23369--23379}
}
Why Is the Winner the Best?: Matthias Eisenmann,

Annika Reinke,

Vivienn Weru,

Minu D. Tizabi,

Fabian Isensee,

Tim J. Adler,

Sharib Ali,

Vincent Andrearczyk,

Marc Aubreville,

Ujjwal Baid,

Spyridon Bakas,

Niranjan Balu,

Sophia Bano,

Jorge Bernal,

Sebastian Bodenstedt,

Alessandro Casella,

Veronika Cheplygina,

Marie Daum,

Marleen de Bruijne,

Adrien Depeursinge,

Reuben Dorent,

Jan Egger,

David G. Ellis,

Sandy Engelhardt,

Melanie Ganz,

Noha Ghatwary,

Gabriel Girard,

Patrick Godau,

Anubha Gupta,

Lasse Hansen,

Kanako Harada,

Mattias P. Heinrich,

Nicholas Heller,

Alessa Hering,

Arnaud Huaulmé,

Pierre Jannin,

Ali Emre Kavur,

Oldřich Kodym,

Michal Kozubek,

Jianning Li,

Hongwei Li,

Jun Ma,

Carlos Martín-Isla,

Bjoern Menze,

Alison Noble,

Valentin Oreiller,

Nicolas Padoy,

Sarthak Pati,

Kelly Payette,

Tim Rädsch,

Jonathan Rafael-Patiño,

Vivek Singh Bawa,

Stefanie Speidel,

Carole H. Sudre,

Kimberlin van Wijnen,

Martin Wagner,

Donglai Wei,

Amine Yamlahi,

Moi Hoon Yap,

Chun Yuan,

Maximilian Zenk,

Aneeq Zia,

David Zimmerer,

Dogu Baran Aydogan,

Binod Bhattarai,

Louise Bloch,

Raphael Brüngel,

Jihoon Cho,

Chanyeol Choi,

Qi Dou,

Ivan Ezhov,

Christoph M. Friedrich,

Clifton D. Fuller,

Rebati Raman Gaire,

Adrian Galdran,

Álvaro García Faura,

Maria Grammatikopoulou,

SeulGi Hong,

Mostafa Jahanifar,

Ikbeom Jang,

Abdolrahim Kadkhodamohammadi,

Inha Kang,

Florian Kofler,

Satoshi Kondo,

Hugo Kuijf,

Mingxing Li,

Minh Luu,

Tomaž Martinčič,

Pedro Morais,

Mohamed A. Naser,

Bruno Oliveira,

David Owen,

Subeen Pang,

Jinah Park,

Sung-Hong Park,

Szymon Plotka,

Elodie Puybareau,

Nasir Rajpoot,

Kanghyun Ryu,

Numan Saeed,

Adam Shephard,

Pengcheng Shi,

Dejan Štepec,

Ronast Subedi,

Guillaume Tochon,

Helena R. Torres,

Helene Urien,

João L. Vilaça,

Kareem A. Wahid,

Haojie Wang,

Jiacheng Wang,

Liansheng Wang,

Xiyue Wang,

Benedikt Wiestler,

Marek Wodzinski,

Fangfang Xia,

Juanying Xie,

Zhiwei Xiong,

Sen Yang,

Yanwu Yang,

Zixuan Zhao,

Klaus Maier-Hein,

Paul F. Jäger,

Annette Kopp-Schneider,

Lena Maier-Hein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Eisenmann_2023_CVPR,
  author    = {Eisenmann, Matthias and Reinke, Annika and Weru, Vivienn and Tizabi, Minu D. and
               Isensee, Fabian and Adler, Tim J. and Ali, Sharib and Andrearczyk, Vincent and
               Aubreville, Marc and Baid, Ujjwal and Bakas, Spyridon and Balu, Niranjan and
               Bano, Sophia and Bernal, Jorge and Bodenstedt, Sebastian and Casella, Alessandro and
               Cheplygina, Veronika and Daum, Marie and de Bruijne, Marleen and Depeursinge, Adrien and
               Dorent, Reuben and Egger, Jan and Ellis, David G. and Engelhardt, Sandy and
               Ganz, Melanie and Ghatwary, Noha and Girard, Gabriel and Godau, Patrick and
               Gupta, Anubha and Hansen, Lasse and Harada, Kanako and Heinrich, Mattias P. and
               Heller, Nicholas and Hering, Alessa and Huaulm{\'e}, Arnaud and Jannin, Pierre and
               Kavur, Ali Emre and Kodym, Old{\v{r}}ich and Kozubek, Michal and Li, Jianning and
               Li, Hongwei and Ma, Jun and Mart{\'\i}n-Isla, Carlos and Menze, Bjoern and
               Noble, Alison and Oreiller, Valentin and Padoy, Nicolas and Pati, Sarthak and
               Payette, Kelly and R{\"a}dsch, Tim and Rafael-Pati{\~n}o, Jonathan and Bawa, Vivek Singh and
               Speidel, Stefanie and Sudre, Carole H. and van Wijnen, Kimberlin and Wagner, Martin and
               Wei, Donglai and Yamlahi, Amine and Yap, Moi Hoon and Yuan, Chun and
               Zenk, Maximilian and Zia, Aneeq and Zimmerer, David and Aydogan, Dogu Baran and
               Bhattarai, Binod and Bloch, Louise and Br{\"u}ngel, Raphael and Cho, Jihoon and
               Choi, Chanyeol and Dou, Qi and Ezhov, Ivan and Friedrich, Christoph M. and
               Fuller, Clifton D. and Gaire, Rebati Raman and Galdran, Adrian and Faura, {\'A}lvaro Garc{\'\i}a and
               Grammatikopoulou, Maria and Hong, SeulGi and Jahanifar, Mostafa and Jang, Ikbeom and
               Kadkhodamohammadi, Abdolrahim and Kang, Inha and Kofler, Florian and Kondo, Satoshi and
               Kuijf, Hugo and Li, Mingxing and Luu, Minh and Martin{\v{c}}i{\v{c}}, Toma{\v{z}} and
               Morais, Pedro and Naser, Mohamed A. and Oliveira, Bruno and Owen, David and
               Pang, Subeen and Park, Jinah and Park, Sung-Hong and Plotka, Szymon and
               Puybareau, Elodie and Rajpoot, Nasir and Ryu, Kanghyun and Saeed, Numan and
               Shephard, Adam and Shi, Pengcheng and {\v{S}}tepec, Dejan and Subedi, Ronast and
               Tochon, Guillaume and Torres, Helena R. and Urien, Helene and Vila{\c{c}}a, Jo{\~a}o L. and
               Wahid, Kareem A. and Wang, Haojie and Wang, Jiacheng and Wang, Liansheng and
               Wang, Xiyue and Wiestler, Benedikt and Wodzinski, Marek and Xia, Fangfang and
               Xie, Juanying and Xiong, Zhiwei and Yang, Sen and Yang, Yanwu and
               Zhao, Zixuan and Maier-Hein, Klaus and J{\"a}ger, Paul F. and Kopp-Schneider, Annette and
               Maier-Hein, Lena},
  title     = {Why Is the Winner the Best?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19955--19966}
}
HGNet: Learning Hierarchical Geometry From Points, Edges, and Surfaces: Ting Yao,

Yehao Li,

Yingwei Pan,

Tao Mei; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_CVPR,
  author    = {Yao, Ting and Li, Yehao and Pan, Yingwei and Mei, Tao},
  title     = {{HGNet}: Learning Hierarchical Geometry From Points, Edges, and Surfaces},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21846--21855}
}
PAniC-3D: Stylized Single-View 3D Reconstruction From Portraits of Anime Characters: Shuhong Chen,

Kevin Zhang,

Yichun Shi,

Heng Wang,

Yiheng Zhu,

Guoxian Song,

Sizhe An,

Janus Kristjansson,

Xiao Yang,

Matthias Zwicker; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Shuhong and Zhang, Kevin and Shi, Yichun and Wang, Heng and Zhu, Yiheng and Song, Guoxian and An, Sizhe and Kristjansson, Janus and Yang, Xiao and Zwicker, Matthias},
  title     = {{PAniC-3D}: Stylized Single-View {3D} Reconstruction From Portraits of Anime Characters},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21068--21077}
}
SunStage: Portrait Reconstruction and Relighting Using the Sun as a Light Stage: Yifan Wang,

Aleksander Holynski,

Xiuming Zhang,

Xuaner Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yifan and Holynski, Aleksander and Zhang, Xiuming and Zhang, Xuaner},
  title     = {{SunStage}: Portrait Reconstruction and Relighting Using the Sun as a Light Stage},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20792--20802}
}
Private Image Generation With Dual-Purpose Auxiliary Classifier: Chen Chen,

Daochang Liu,

Siqi Ma,

Surya Nepal,

Chang Xu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Chen and Liu, Daochang and Ma, Siqi and Nepal, Surya and Xu, Chang},
  title     = {Private Image Generation With Dual-Purpose Auxiliary Classifier},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20361--20370}
}
3D-POP - An Automated Annotation Approach to Facilitate Markerless 2D-3D Tracking of Freely Moving Birds With Marker-Based Motion Capture: Hemal Naik,

Alex Hoi Hang Chan,

Junran Yang,

Mathilde Delacoux,

Iain D. Couzin,

Fumihiro Kano,

Máté Nagy; [pdf] [supp]
[bibtex]
@InProceedings{Naik_2023_CVPR,
  author    = {Naik, Hemal and Chan, Alex Hoi Hang and Yang, Junran and Delacoux, Mathilde and Couzin, Iain D. and Kano, Fumihiro and Nagy, M{\'a}t{\'e}},
  title     = {{3D-POP} - An Automated Annotation Approach to Facilitate Markerless {2D-3D} Tracking of Freely Moving Birds With Marker-Based Motion Capture},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21274--21284}
}
Unified Keypoint-Based Action Recognition Framework via Structured Keypoint Pooling: Ryo Hachiuma,

Fumiaki Sato,

Taiki Sekii; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hachiuma_2023_CVPR,
  author    = {Hachiuma, Ryo and Sato, Fumiaki and Sekii, Taiki},
  title     = {Unified Keypoint-Based Action Recognition Framework via Structured Keypoint Pooling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22962--22971}
}
Multi-View Reconstruction Using Signed Ray Distance Functions (SRDF): Pierre Zins,

Yuanlu Xu,

Edmond Boyer,

Stefanie Wuhrer,

Tony Tung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zins_2023_CVPR,
  author    = {Zins, Pierre and Xu, Yuanlu and Boyer, Edmond and Wuhrer, Stefanie and Tung, Tony},
  title     = {Multi-View Reconstruction Using Signed Ray Distance Functions ({SRDF})},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16696--16706}
}
Improving Cross-Modal Retrieval With Set of Diverse Embeddings: Dongwon Kim,

Namyup Kim,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Dongwon and Kim, Namyup and Kwak, Suha},
  title     = {Improving Cross-Modal Retrieval With Set of Diverse Embeddings},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23422--23431}
}
Policy Adaptation From Foundation Model Feedback: Yuying Ge,

Annabella Macaluso,

Li Erran Li,

Ping Luo,

Xiaolong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ge_2023_CVPR,
  author    = {Ge, Yuying and Macaluso, Annabella and Li, Li Erran and Luo, Ping and Wang, Xiaolong},
  title     = {Policy Adaptation From Foundation Model Feedback},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19059--19069}
}
Semi-DETR: Semi-Supervised Object Detection With Detection Transformers: Jiacheng Zhang,

Xiangru Lin,

Wei Zhang,

Kuo Wang,

Xiao Tan,

Junyu Han,

Errui Ding,

Jingdong Wang,

Guanbin Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Jiacheng and Lin, Xiangru and Zhang, Wei and Wang, Kuo and Tan, Xiao and Han, Junyu and Ding, Errui and Wang, Jingdong and Li, Guanbin},
  title     = {{Semi-DETR}: Semi-Supervised Object Detection With Detection Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23809--23818}
}
GP-VTON: Towards General Purpose Virtual Try-On via Collaborative Local-Flow Global-Parsing Learning: Zhenyu Xie,

Zaiyu Huang,

Xin Dong,

Fuwei Zhao,

Haoye Dong,

Xijin Zhang,

Feida Zhu,

Xiaodan Liang; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_CVPR,
  author    = {Xie, Zhenyu and Huang, Zaiyu and Dong, Xin and Zhao, Fuwei and Dong, Haoye and Zhang, Xijin and Zhu, Feida and Liang, Xiaodan},
  title     = {{GP-VTON}: Towards General Purpose Virtual Try-On via Collaborative Local-Flow Global-Parsing Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23550--23559}
}
Decomposed Soft Prompt Guided Fusion Enhancing for Compositional Zero-Shot Learning: Xiaocheng Lu,

Song Guo,

Ziming Liu,

Jingcai Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_CVPR,
  author    = {Lu, Xiaocheng and Guo, Song and Liu, Ziming and Guo, Jingcai},
  title     = {Decomposed Soft Prompt Guided Fusion Enhancing for Compositional Zero-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23560--23569}
}
Hierarchical Semantic Contrast for Scene-Aware Video Anomaly Detection: Shengyang Sun,

Xiaojin Gong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Shengyang and Gong, Xiaojin},
  title     = {Hierarchical Semantic Contrast for Scene-Aware Video Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22846--22856}
}
All-in-Focus Imaging From Event Focal Stack: Hanyue Lou,

Minggui Teng,

Yixin Yang,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Lou_2023_CVPR,
  author    = {Lou, Hanyue and Teng, Minggui and Yang, Yixin and Shi, Boxin},
  title     = {All-in-Focus Imaging From Event Focal Stack},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17366--17375}
}
Video Probabilistic Diffusion Models in Projected Latent Space: Sihyun Yu,

Kihyuk Sohn,

Subin Kim,

Jinwoo Shin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Sihyun and Sohn, Kihyuk and Kim, Subin and Shin, Jinwoo},
  title     = {Video Probabilistic Diffusion Models in Projected Latent Space},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18456--18466}
}
Defining and Quantifying the Emergence of Sparse Concepts in DNNs: Jie Ren,

Mingjie Li,

Qirui Chen,

Huiqi Deng,

Quanshi Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_CVPR,
  author    = {Ren, Jie and Li, Mingjie and Chen, Qirui and Deng, Huiqi and Zhang, Quanshi},
  title     = {Defining and Quantifying the Emergence of Sparse Concepts in {DNNs}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20280--20289}
}
FreeSeg: Unified, Universal and Open-Vocabulary Image Segmentation: Jie Qin,

Jie Wu,

Pengxiang Yan,

Ming Li,

Ren Yuxi,

Xuefeng Xiao,

Yitong Wang,

Rui Wang,

Shilei Wen,

Xin Pan,

Xingang Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Qin_2023_CVPR,
  author    = {Qin, Jie and Wu, Jie and Yan, Pengxiang and Li, Ming and Yuxi, Ren and Xiao, Xuefeng and Wang, Yitong and Wang, Rui and Wen, Shilei and Pan, Xin and Wang, Xingang},
  title     = {{FreeSeg}: Unified, Universal and Open-Vocabulary Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19446--19455}
}
AVFormer: Injecting Vision Into Frozen Speech Models for Zero-Shot AV-ASR: Paul Hongsuck Seo,

Arsha Nagrani,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Seo_2023_CVPR,
  author    = {Seo, Paul Hongsuck and Nagrani, Arsha and Schmid, Cordelia},
  title     = {{AVFormer}: Injecting Vision Into Frozen Speech Models for Zero-Shot {AV-ASR}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22922--22931}
}
Self-Guided Diffusion Models: Vincent Tao Hu,

David W. Zhang,

Yuki M. Asano,

Gertjan J. Burghouts,

Cees G. M. Snoek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Vincent Tao and Zhang, David W. and Asano, Yuki M. and Burghouts, Gertjan J. and Snoek, Cees G. M.},
  title     = {Self-Guided Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18413--18422}
}
One-Shot High-Fidelity Talking-Head Synthesis With Deformable Neural Radiance Field: Weichuang Li,

Longhao Zhang,

Dong Wang,

Bin Zhao,

Zhigang Wang,

Mulin Chen,

Bang Zhang,

Zhongjian Wang,

Liefeng Bo,

Xuelong Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Weichuang and Zhang, Longhao and Wang, Dong and Zhao, Bin and Wang, Zhigang and Chen, Mulin and Zhang, Bang and Wang, Zhongjian and Bo, Liefeng and Li, Xuelong},
  title     = {One-Shot High-Fidelity Talking-Head Synthesis With Deformable Neural Radiance Field},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17969--17978}
}
Trajectory-Aware Body Interaction Transformer for Multi-Person Pose Forecasting: Xiaogang Peng,

Siyuan Mao,

Zizhao Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Peng_2023_CVPR,
  author    = {Peng, Xiaogang and Mao, Siyuan and Wu, Zizhao},
  title     = {Trajectory-Aware Body Interaction Transformer for Multi-Person Pose Forecasting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17121--17130}
}
Conditional Image-to-Video Generation With Latent Flow Diffusion Models: Haomiao Ni,

Changhao Shi,

Kai Li,

Sharon X. Huang,

Martin Renqiang Min; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ni_2023_CVPR,
  author    = {Ni, Haomiao and Shi, Changhao and Li, Kai and Huang, Sharon X. and Min, Martin Renqiang},
  title     = {Conditional Image-to-Video Generation With Latent Flow Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18444--18455}
}
Virtual Sparse Convolution for Multimodal 3D Object Detection: Hai Wu,

Chenglu Wen,

Shaoshuai Shi,

Xin Li,

Cheng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Hai and Wen, Chenglu and Shi, Shaoshuai and Li, Xin and Wang, Cheng},
  title     = {Virtual Sparse Convolution for Multimodal {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21653--21662}
}
Towards Universal Fake Image Detectors That Generalize Across Generative Models: Utkarsh Ojha,

Yuheng Li,

Yong Jae Lee; [pdf] [arXiv]
[bibtex]
@InProceedings{Ojha_2023_CVPR,
  author    = {Ojha, Utkarsh and Li, Yuheng and Lee, Yong Jae},
  title     = {Towards Universal Fake Image Detectors That Generalize Across Generative Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24480--24489}
}
A Large-Scale Homography Benchmark: Daniel Barath,

Dmytro Mishkin,

Michal Polic,

Wolfgang Förstner,

Jiri Matas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Barath_2023_CVPR,
  author    = {Barath, Daniel and Mishkin, Dmytro and Polic, Michal and F{\"o}rstner, Wolfgang and Matas, Jiri},
  title     = {A Large-Scale Homography Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21360--21370}
}
Weakly Supervised Video Emotion Detection and Prediction via Cross-Modal Temporal Erasing Network: Zhicheng Zhang,

Lijuan Wang,

Jufeng Yang; [pdf]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zhicheng and Wang, Lijuan and Yang, Jufeng},
  title     = {Weakly Supervised Video Emotion Detection and Prediction via Cross-Modal Temporal Erasing Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18888--18897}
}
Consistent View Synthesis With Pose-Guided Diffusion Models: Hung-Yu Tseng,

Qinbo Li,

Changil Kim,

Suhib Alsisan,

Jia-Bin Huang,

Johannes Kopf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tseng_2023_CVPR,
  author    = {Tseng, Hung-Yu and Li, Qinbo and Kim, Changil and Alsisan, Suhib and Huang, Jia-Bin and Kopf, Johannes},
  title     = {Consistent View Synthesis With Pose-Guided Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16773--16783}
}
MSMDFusion: Fusing LiDAR and Camera at Multiple Scales With Multi-Depth Seeds for 3D Object Detection: Yang Jiao,

Zequn Jie,

Shaoxiang Chen,

Jingjing Chen,

Lin Ma,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiao_2023_CVPR,
  author    = {Jiao, Yang and Jie, Zequn and Chen, Shaoxiang and Chen, Jingjing and Ma, Lin and Jiang, Yu-Gang},
  title     = {{MSMDFusion}: Fusing {LiDAR} and Camera at Multiple Scales With Multi-Depth Seeds for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21643--21652}
}
Dense-Localizing Audio-Visual Events in Untrimmed Videos: A Large-Scale Benchmark and Baseline: Tiantian Geng,

Teng Wang,

Jinming Duan,

Runmin Cong,

Feng Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Geng_2023_CVPR,
  author    = {Geng, Tiantian and Wang, Teng and Duan, Jinming and Cong, Runmin and Zheng, Feng},
  title     = {Dense-Localizing Audio-Visual Events in Untrimmed Videos: A Large-Scale Benchmark and Baseline},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22942--22951}
}
Weak-Shot Object Detection Through Mutual Knowledge Transfer: Xuanyi Du,

Weitao Wan,

Chong Sun,

Chen Li; [pdf]
[bibtex]
@InProceedings{Du_2023_CVPR,
  author    = {Du, Xuanyi and Wan, Weitao and Sun, Chong and Li, Chen},
  title     = {Weak-Shot Object Detection Through Mutual Knowledge Transfer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19671--19680}
}
Toward Stable, Interpretable, and Lightweight Hyperspectral Super-Resolution: Wen-jin Guo,

Weiying Xie,

Kai Jiang,

Yunsong Li,

Jie Lei,

Leyuan Fang; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Wen-jin and Xie, Weiying and Jiang, Kai and Li, Yunsong and Lei, Jie and Fang, Leyuan},
  title     = {Toward Stable, Interpretable, and Lightweight Hyperspectral Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22272--22281}
}
Masked Auto-Encoders Meet Generative Adversarial Networks and Beyond: Zhengcong Fei,

Mingyuan Fan,

Li Zhu,

Junshi Huang,

Xiaoming Wei,

Xiaolin Wei; [pdf] [supp]
[bibtex]
@InProceedings{Fei_2023_CVPR,
  author    = {Fei, Zhengcong and Fan, Mingyuan and Zhu, Li and Huang, Junshi and Wei, Xiaoming and Wei, Xiaolin},
  title     = {Masked Auto-Encoders Meet Generative Adversarial Networks and Beyond},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24449--24459}
}
RILS: Masked Visual Reconstruction in Language Semantic Space: Shusheng Yang,

Yixiao Ge,

Kun Yi,

Dian Li,

Ying Shan,

Xiaohu Qie,

Xinggang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Shusheng and Ge, Yixiao and Yi, Kun and Li, Dian and Shan, Ying and Qie, Xiaohu and Wang, Xinggang},
  title     = {{RILS}: Masked Visual Reconstruction in Language Semantic Space},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23304--23314}
}
Decoupling Learning and Remembering: A Bilevel Memory Framework With Knowledge Projection for Task-Incremental Learning: Wenju Sun,

Qingyong Li,

Jing Zhang,

Wen Wang,

Yangli-ao Geng; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Wenju and Li, Qingyong and Zhang, Jing and Wang, Wen and Geng, Yangli-ao},
  title     = {Decoupling Learning and Remembering: A Bilevel Memory Framework With Knowledge Projection for Task-Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20186--20195}
}
R2Former: Unified Retrieval and Reranking Transformer for Place Recognition: Sijie Zhu,

Linjie Yang,

Chen Chen,

Mubarak Shah,

Xiaohui Shen,

Heng Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Sijie and Yang, Linjie and Chen, Chen and Shah, Mubarak and Shen, Xiaohui and Wang, Heng},
  title     = {{R2Former}: Unified Retrieval and Reranking Transformer for Place Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19370--19380}
}
Modality-Agnostic Debiasing for Single Domain Generalization: Sanqing Qu,

Yingwei Pan,

Guang Chen,

Ting Yao,

Changjun Jiang,

Tao Mei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qu_2023_CVPR,
  author    = {Qu, Sanqing and Pan, Yingwei and Chen, Guang and Yao, Ting and Jiang, Changjun and Mei, Tao},
  title     = {Modality-Agnostic Debiasing for Single Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24142--24151}
}
Difficulty-Based Sampling for Debiased Contrastive Representation Learning: Taeuk Jang,

Xiaoqian Wang; [pdf] [supp]
[bibtex]
@InProceedings{Jang_2023_CVPR,
  author    = {Jang, Taeuk and Wang, Xiaoqian},
  title     = {Difficulty-Based Sampling for Debiased Contrastive Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24039--24048}
}
CompletionFormer: Depth Completion With Convolutions and Vision Transformers: Youmin Zhang,

Xianda Guo,

Matteo Poggi,

Zheng Zhu,

Guan Huang,

Stefano Mattoccia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Youmin and Guo, Xianda and Poggi, Matteo and Zhu, Zheng and Huang, Guan and Mattoccia, Stefano},
  title     = {{CompletionFormer}: Depth Completion With Convolutions and Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18527--18536}
}
Improving Visual Grounding by Encouraging Consistent Gradient-Based Explanations: Ziyan Yang,

Kushal Kafle,

Franck Dernoncourt,

Vicente Ordonez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Ziyan and Kafle, Kushal and Dernoncourt, Franck and Ordonez, Vicente},
  title     = {Improving Visual Grounding by Encouraging Consistent Gradient-Based Explanations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19165--19174}
}
Physically Realizable Natural-Looking Clothing Textures Evade Person Detectors via 3D Modeling: Zhanhao Hu,

Wenda Chu,

Xiaopei Zhu,

Hui Zhang,

Bo Zhang,

Xiaolin Hu; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Zhanhao and Chu, Wenda and Zhu, Xiaopei and Zhang, Hui and Zhang, Bo and Hu, Xiaolin},
  title     = {Physically Realizable Natural-Looking Clothing Textures Evade Person Detectors via {3D} Modeling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16975--16984}
}
Camouflaged Object Detection With Feature Decomposition and Edge Reconstruction: Chunming He,

Kai Li,

Yachao Zhang,

Longxiang Tang,

Yulun Zhang,

Zhenhua Guo,

Xiu Li; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_CVPR,
  author    = {He, Chunming and Li, Kai and Zhang, Yachao and Tang, Longxiang and Zhang, Yulun and Guo, Zhenhua and Li, Xiu},
  title     = {Camouflaged Object Detection With Feature Decomposition and Edge Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22046--22055}
}
ALOFT: A Lightweight MLP-Like Architecture With Dynamic Low-Frequency Transform for Domain Generalization: Jintao Guo,

Na Wang,

Lei Qi,

Yinghuan Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Jintao and Wang, Na and Qi, Lei and Shi, Yinghuan},
  title     = {{ALOFT}: A Lightweight {MLP}-Like Architecture With Dynamic Low-Frequency Transform for Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24132--24141}
}
Learning Visual Representations via Language-Guided Sampling: Mohamed El Banani,

Karan Desai,

Justin Johnson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{El_Banani_2023_CVPR,
  author    = {El Banani, Mohamed and Desai, Karan and Johnson, Justin},
  title     = {Learning Visual Representations via Language-Guided Sampling},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19208--19220}
}
Master: Meta Style Transformer for Controllable Zero-Shot and Few-Shot Artistic Style Transfer: Hao Tang,

Songhua Liu,

Tianwei Lin,

Shaoli Huang,

Fu Li,

Dongliang He,

Xinchao Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Hao and Liu, Songhua and Lin, Tianwei and Huang, Shaoli and Li, Fu and He, Dongliang and Wang, Xinchao},
  title     = {Master: Meta Style Transformer for Controllable Zero-Shot and Few-Shot Artistic Style Transfer},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18329--18338}
}
Affordance Diffusion: Synthesizing Hand-Object Interactions: Yufei Ye,

Xueting Li,

Abhinav Gupta,

Shalini De Mello,

Stan Birchfield,

Jiaming Song,

Shubham Tulsiani,

Sifei Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_CVPR,
  author    = {Ye, Yufei and Li, Xueting and Gupta, Abhinav and De Mello, Shalini and Birchfield, Stan and Song, Jiaming and Tulsiani, Shubham and Liu, Sifei},
  title     = {Affordance Diffusion: Synthesizing Hand-Object Interactions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22479--22489}
}
Towards Artistic Image Aesthetics Assessment: A Large-Scale Dataset and a New Method: Ran Yi,

Haoyuan Tian,

Zhihao Gu,

Yu-Kun Lai,

Paul L. Rosin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yi_2023_CVPR,
  author    = {Yi, Ran and Tian, Haoyuan and Gu, Zhihao and Lai, Yu-Kun and Rosin, Paul L.},
  title     = {Towards Artistic Image Aesthetics Assessment: A Large-Scale Dataset and a New Method},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22388--22397}
}
Inverting the Imaging Process by Learning an Implicit Camera Model: Xin Huang,

Qi Zhang,

Ying Feng,

Hongdong Li,

Qing Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Xin and Zhang, Qi and Feng, Ying and Li, Hongdong and Wang, Qing},
  title     = {Inverting the Imaging Process by Learning an Implicit Camera Model},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21456--21465}
}
Enhanced Training of Query-Based Object Detection via Selective Query Recollection: Fangyi Chen,

Han Zhang,

Kai Hu,

Yu-Kai Huang,

Chenchen Zhu,

Marios Savvides; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Fangyi and Zhang, Han and Hu, Kai and Huang, Yu-Kai and Zhu, Chenchen and Savvides, Marios},
  title     = {Enhanced Training of Query-Based Object Detection via Selective Query Recollection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23756--23765}
}
Detecting Human-Object Contact in Images: Yixin Chen,

Sai Kumar Dwivedi,

Michael J. Black,

Dimitrios Tzionas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yixin and Dwivedi, Sai Kumar and Black, Michael J. and Tzionas, Dimitrios},
  title     = {Detecting Human-Object Contact in Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17100--17110}
}
PointClustering: Unsupervised Point Cloud Pre-Training Using Transformation Invariance in Clustering: Fuchen Long,

Ting Yao,

Zhaofan Qiu,

Lusong Li,

Tao Mei; [pdf]
[bibtex]
@InProceedings{Long_2023_CVPR,
  author    = {Long, Fuchen and Yao, Ting and Qiu, Zhaofan and Li, Lusong and Mei, Tao},
  title     = {{PointClustering}: Unsupervised Point Cloud Pre-Training Using Transformation Invariance in Clustering},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21824--21834}
}
Out-of-Distributed Semantic Pruning for Robust Semi-Supervised Learning: Yu Wang,

Pengchong Qiao,

Chang Liu,

Guoli Song,

Xiawu Zheng,

Jie Chen; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yu and Qiao, Pengchong and Liu, Chang and Song, Guoli and Zheng, Xiawu and Chen, Jie},
  title     = {Out-of-Distributed Semantic Pruning for Robust Semi-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23849--23858}
}
Understanding and Improving Visual Prompting: A Label-Mapping Perspective: Aochuan Chen,

Yuguang Yao,

Pin-Yu Chen,

Yihua Zhang,

Sijia Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Aochuan and Yao, Yuguang and Chen, Pin-Yu and Zhang, Yihua and Liu, Sijia},
  title     = {Understanding and Improving Visual Prompting: A Label-Mapping Perspective},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19133--19143}
}
DegAE: A New Pretraining Paradigm for Low-Level Vision: Yihao Liu,

Jingwen He,

Jinjin Gu,

Xiangtao Kong,

Yu Qiao,

Chao Dong; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Yihao and He, Jingwen and Gu, Jinjin and Kong, Xiangtao and Qiao, Yu and Dong, Chao},
  title     = {{DegAE}: A New Pretraining Paradigm for Low-Level Vision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23292--23303}
}
The Differentiable Lens: Compound Lens Search Over Glass Surfaces and Materials for Object Detection: Geoffroi Côté,

Fahim Mannan,

Simon Thibault,

Jean-François Lalonde,

Felix Heide; [pdf] [supp]
[bibtex]
@InProceedings{Cote_2023_CVPR,
  author    = {C{\^o}t{\'e}, Geoffroi and Mannan, Fahim and Thibault, Simon and Lalonde, Jean-Fran{\c{c}}ois and Heide, Felix},
  title     = {The Differentiable Lens: Compound Lens Search Over Glass Surfaces and Materials for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20803--20812}
}
Adversarially Masking Synthetic To Mimic Real: Adaptive Noise Injection for Point Cloud Segmentation Adaptation: Guangrui Li,

Guoliang Kang,

Xiaohan Wang,

Yunchao Wei,

Yi Yang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Guangrui and Kang, Guoliang and Wang, Xiaohan and Wei, Yunchao and Yang, Yi},
  title     = {Adversarially Masking Synthetic To Mimic Real: Adaptive Noise Injection for Point Cloud Segmentation Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20464--20474}
}
Understanding Deep Generative Models With Generalized Empirical Likelihoods: Suman Ravuri,

Mélanie Rey,

Shakir Mohamed,

Marc Peter Deisenroth; [pdf] [supp]
[bibtex]
@InProceedings{Ravuri_2023_CVPR,
  author    = {Ravuri, Suman and Rey, M{\'e}lanie and Mohamed, Shakir and Deisenroth, Marc Peter},
  title     = {Understanding Deep Generative Models With Generalized Empirical Likelihoods},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24395--24405}
}
CLIPPING: Distilling CLIP-Based Models With a Student Base for Video-Language Retrieval: Renjing Pei,

Jianzhuang Liu,

Weimian Li,

Bin Shao,

Songcen Xu,

Peng Dai,

Juwei Lu,

Youliang Yan; [pdf] [supp]
[bibtex]
@InProceedings{Pei_2023_CVPR,
  author    = {Pei, Renjing and Liu, Jianzhuang and Li, Weimian and Shao, Bin and Xu, Songcen and Dai, Peng and Lu, Juwei and Yan, Youliang},
  title     = {{CLIPPING}: Distilling {CLIP}-Based Models With a Student Base for Video-Language Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18983--18992}
}
BEVHeight: A Robust Framework for Vision-Based Roadside 3D Object Detection: Lei Yang,

Kaicheng Yu,

Tao Tang,

Jun Li,

Kun Yuan,

Li Wang,

Xinyu Zhang,

Peng Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Lei and Yu, Kaicheng and Tang, Tao and Li, Jun and Yuan, Kun and Wang, Li and Zhang, Xinyu and Chen, Peng},
  title     = {{BEVHeight}: A Robust Framework for Vision-Based Roadside {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21611--21620}
}
LASP: Text-to-Text Optimization for Language-Aware Soft Prompting of Vision & Language Models: Adrian Bulat,

Georgios Tzimiropoulos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bulat_2023_CVPR,
  author    = {Bulat, Adrian and Tzimiropoulos, Georgios},
  title     = {{LASP}: Text-to-Text Optimization for Language-Aware Soft Prompting of Vision \& Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23232--23241}
}
AutoAD: Movie Description in Context: Tengda Han,

Max Bain,

Arsha Nagrani,

Gül Varol,

Weidi Xie,

Andrew Zisserman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_CVPR,
  author    = {Han, Tengda and Bain, Max and Nagrani, Arsha and Varol, G{\"u}l and Xie, Weidi and Zisserman, Andrew},
  title     = {{AutoAD}: Movie Description in Context},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18930--18940}
}
SceneComposer: Any-Level Semantic Image Synthesis: Yu Zeng,

Zhe Lin,

Jianming Zhang,

Qing Liu,

John Collomosse,

Jason Kuen,

Vishal M. Patel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zeng_2023_CVPR,
  author    = {Zeng, Yu and Lin, Zhe and Zhang, Jianming and Liu, Qing and Collomosse, John and Kuen, Jason and Patel, Vishal M.},
  title     = {{SceneComposer}: Any-Level Semantic Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22468--22478}
}
MaPLe: Multi-Modal Prompt Learning: Muhammad Uzair Khattak,

Hanoona Rasheed,

Muhammad Maaz,

Salman Khan,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Khattak_2023_CVPR,
  author    = {Khattak, Muhammad Uzair and Rasheed, Hanoona and Maaz, Muhammad and Khan, Salman and Khan, Fahad Shahbaz},
  title     = {{MaPLe}: Multi-Modal Prompt Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19113--19122}
}
Scaling Language-Image Pre-Training via Masking: Yanghao Li,

Haoqi Fan,

Ronghang Hu,

Christoph Feichtenhofer,

Kaiming He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Yanghao and Fan, Haoqi and Hu, Ronghang and Feichtenhofer, Christoph and He, Kaiming},
  title     = {Scaling Language-Image Pre-Training via Masking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23390--23400}
}
DNF: Decouple and Feedback Network for Seeing in the Dark: Xin Jin,

Ling-Hao Han,

Zhen Li,

Chun-Le Guo,

Zhi Chai,

Chongyi Li; [pdf] [supp]
[bibtex]
@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Xin and Han, Ling-Hao and Li, Zhen and Guo, Chun-Le and Chai, Zhi and Li, Chongyi},
  title     = {{DNF}: Decouple and Feedback Network for Seeing in the Dark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18135--18144}
}
Deformable Mesh Transformer for 3D Human Mesh Recovery: Yusuke Yoshiyasu; [pdf] [supp]
[bibtex]
@InProceedings{Yoshiyasu_2023_CVPR,
  author    = {Yoshiyasu, Yusuke},
  title     = {Deformable Mesh Transformer for {3D} Human Mesh Recovery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17006--17015}
}
Vita-CLIP: Video and Text Adaptive CLIP via Multimodal Prompting: Syed Talal Wasim,

Muzammal Naseer,

Salman Khan,

Fahad Shahbaz Khan,

Mubarak Shah; [pdf]
[bibtex]
@InProceedings{Wasim_2023_CVPR,
  author    = {Wasim, Syed Talal and Naseer, Muzammal and Khan, Salman and Khan, Fahad Shahbaz and Shah, Mubarak},
  title     = {{Vita-CLIP}: Video and Text Adaptive {CLIP} via Multimodal Prompting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23034--23044}
}
HS-Pose: Hybrid Scope Feature Extraction for Category-Level Object Pose Estimation: Linfang Zheng,

Chen Wang,

Yinghan Sun,

Esha Dasgupta,

Hua Chen,

Aleš Leonardis,

Wei Zhang,

Hyung Jin Chang; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2023_CVPR,
  author    = {Zheng, Linfang and Wang, Chen and Sun, Yinghan and Dasgupta, Esha and Chen, Hua and Leonardis, Ale{\v{s}} and Zhang, Wei and Chang, Hyung Jin},
  title     = {{HS-Pose}: Hybrid Scope Feature Extraction for Category-Level Object Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17163--17173}
}
LayoutDM: Transformer-Based Diffusion Model for Layout Generation: Shang Chai,

Liansheng Zhuang,

Fengying Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chai_2023_CVPR,
  author    = {Chai, Shang and Zhuang, Liansheng and Yan, Fengying},
  title     = {{LayoutDM}: Transformer-Based Diffusion Model for Layout Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18349--18358}
}
HandNeRF: Neural Radiance Fields for Animatable Interacting Hands: Zhiyang Guo,

Wengang Zhou,

Min Wang,

Li Li,

Houqiang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Zhiyang and Zhou, Wengang and Wang, Min and Li, Li and Li, Houqiang},
  title     = {{HandNeRF}: Neural Radiance Fields for Animatable Interacting Hands},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21078--21087}
}
Introducing Competition To Boost the Transferability of Targeted Adversarial Examples Through Clean Feature Mixup: Junyoung Byun,

Myung-Joon Kwon,

Seungju Cho,

Yoonji Kim,

Changick Kim; [pdf] [supp]
[bibtex]
@InProceedings{Byun_2023_CVPR,
  author    = {Byun, Junyoung and Kwon, Myung-Joon and Cho, Seungju and Kim, Yoonji and Kim, Changick},
  title     = {Introducing Competition To Boost the Transferability of Targeted Adversarial Examples Through Clean Feature Mixup},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {24648--24657}
}
A Whac-a-Mole Dilemma: Shortcuts Come in Multiples Where Mitigating One Amplifies Others: Zhiheng Li,

Ivan Evtimov,

Albert Gordo,

Caner Hazirbas,

Tal Hassner,

Cristian Canton Ferrer,

Chenliang Xu,

Mark Ibrahim; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Zhiheng and Evtimov, Ivan and Gordo, Albert and Hazirbas, Caner and Hassner, Tal and Ferrer, Cristian Canton and Xu, Chenliang and Ibrahim, Mark},
  title     = {A {Whac-a-Mole} Dilemma: Shortcuts Come in Multiples Where Mitigating One Amplifies Others},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20071--20082}
}
Efficient Scale-Invariant Generator With Column-Row Entangled Pixel Synthesis: Thuan Hoang Nguyen,

Thanh Van Le,

Anh Tran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nguyen_2023_CVPR,
  author    = {Nguyen, Thuan Hoang and Van Le, Thanh and Tran, Anh},
  title     = {Efficient Scale-Invariant Generator With Column-Row Entangled Pixel Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22408--22417}
}
H2ONet: Hand-Occlusion-and-Orientation-Aware Network for Real-Time 3D Hand Mesh Reconstruction: Hao Xu,

Tianyu Wang,

Xiao Tang,

Chi-Wing Fu; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Hao and Wang, Tianyu and Tang, Xiao and Fu, Chi-Wing},
  title     = {{H2ONet}: Hand-Occlusion-and-Orientation-Aware Network for Real-Time {3D} Hand Mesh Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17048--17058}
}
Interventional Bag Multi-Instance Learning on Whole-Slide Pathological Images: Tiancheng Lin,

Zhimiao Yu,

Hongyu Hu,

Yi Xu,

Chang-Wen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Tiancheng and Yu, Zhimiao and Hu, Hongyu and Xu, Yi and Chen, Chang-Wen},
  title     = {Interventional Bag Multi-Instance Learning on Whole-Slide Pathological Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19830--19839}
}
RankMix: Data Augmentation for Weakly Supervised Learning of Classifying Whole Slide Images With Diverse Sizes and Imbalanced Categories: Yuan-Chih Chen,

Chun-Shien Lu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yuan-Chih and Lu, Chun-Shien},
  title     = {{RankMix}: Data Augmentation for Weakly Supervised Learning of Classifying Whole Slide Images With Diverse Sizes and Imbalanced Categories},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23936--23945}
}
ActMAD: Activation Matching To Align Distributions for Test-Time-Training: Muhammad Jehanzeb Mirza,

Pol Jané Soneira,

Wei Lin,

Mateusz Kozinski,

Horst Possegger,

Horst Bischof; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mirza_2023_CVPR,
  author    = {Mirza, Muhammad Jehanzeb and Soneira, Pol Jan{\'e} and Lin, Wei and Kozinski, Mateusz and Possegger, Horst and Bischof, Horst},
  title     = {{ActMAD}: Activation Matching To Align Distributions for Test-Time-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24152--24161}
}
DKM: Dense Kernelized Feature Matching for Geometry Estimation: Johan Edstedt,

Ioannis Athanasiadis,

Mårten Wadenbäck,

Michael Felsberg; [pdf] [supp]
[bibtex]
@InProceedings{Edstedt_2023_CVPR,
  author    = {Edstedt, Johan and Athanasiadis, Ioannis and Wadenb{\"a}ck, M{\r{a}}rten and Felsberg, Michael},
  title     = {{DKM}: Dense Kernelized Feature Matching for Geometry Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17765--17775}
}
Structured 3D Features for Reconstructing Controllable Avatars: Enric Corona,

Mihai Zanfir,

Thiemo Alldieck,

Eduard Gabriel Bazavan,

Andrei Zanfir,

Cristian Sminchisescu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Corona_2023_CVPR,
  author    = {Corona, Enric and Zanfir, Mihai and Alldieck, Thiemo and Bazavan, Eduard Gabriel and Zanfir, Andrei and Sminchisescu, Cristian},
  title     = {Structured {3D} Features for Reconstructing Controllable Avatars},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16954--16964}
}
Active Finetuning: Exploiting Annotation Budget in the Pretraining-Finetuning Paradigm: Yichen Xie,

Han Lu,

Junchi Yan,

Xiaokang Yang,

Masayoshi Tomizuka,

Wei Zhan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_CVPR,
  author    = {Xie, Yichen and Lu, Han and Yan, Junchi and Yang, Xiaokang and Tomizuka, Masayoshi and Zhan, Wei},
  title     = {Active Finetuning: Exploiting Annotation Budget in the Pretraining-Finetuning Paradigm},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23715--23724}
}
In-Hand 3D Object Scanning From an RGB Sequence: Shreyas Hampali,

Tomas Hodan,

Luan Tran,

Lingni Ma,

Cem Keskin,

Vincent Lepetit; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hampali_2023_CVPR,
  author    = {Hampali, Shreyas and Hodan, Tomas and Tran, Luan and Ma, Lingni and Keskin, Cem and Lepetit, Vincent},
  title     = {In-Hand {3D} Object Scanning From an {RGB} Sequence},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17079--17088}
}
Zero-Shot Referring Image Segmentation With Global-Local Context Features: Seonghoon Yu,

Paul Hongsuck Seo,

Jeany Son; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_CVPR,
  author    = {Yu, Seonghoon and Seo, Paul Hongsuck and Son, Jeany},
  title     = {Zero-Shot Referring Image Segmentation With Global-Local Context Features},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19456--19465}
}
SketchXAI: A First Look at Explainability for Human Sketches: Zhiyu Qu,

Yulia Gryaditskaya,

Ke Li,

Kaiyue Pang,

Tao Xiang,

Yi-Zhe Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qu_2023_CVPR,
  author    = {Qu, Zhiyu and Gryaditskaya, Yulia and Li, Ke and Pang, Kaiyue and Xiang, Tao and Song, Yi-Zhe},
  title     = {{SketchXAI}: A First Look at Explainability for Human Sketches},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23327--23337}
}
Rebalancing Batch Normalization for Exemplar-Based Class-Incremental Learning: Sungmin Cha,

Sungjun Cho,

Dasol Hwang,

Sunwon Hong,

Moontae Lee,

Taesup Moon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cha_2023_CVPR,
  author    = {Cha, Sungmin and Cho, Sungjun and Hwang, Dasol and Hong, Sunwon and Lee, Moontae and Moon, Taesup},
  title     = {Rebalancing Batch Normalization for Exemplar-Based Class-Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20127--20136}
}
OmniVidar: Omnidirectional Depth Estimation From Multi-Fisheye Images: Sheng Xie,

Daochuan Wang,

Yun-Hui Liu; [pdf]
[bibtex]
@InProceedings{Xie_2023_CVPR,
  author    = {Xie, Sheng and Wang, Daochuan and Liu, Yun-Hui},
  title     = {{OmniVidar}: Omnidirectional Depth Estimation From Multi-Fisheye Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21529--21538}
}
RWSC-Fusion: Region-Wise Style-Controlled Fusion Network for the Prohibited X-Ray Security Image Synthesis: Luwen Duan,

Min Wu,

Lijian Mao,

Jun Yin,

Jianping Xiong,

Xi Li; [pdf] [supp]
[bibtex]
@InProceedings{Duan_2023_CVPR,
  author    = {Duan, Luwen and Wu, Min and Mao, Lijian and Yin, Jun and Xiong, Jianping and Li, Xi},
  title     = {{RWSC-Fusion}: Region-Wise Style-Controlled Fusion Network for the Prohibited {X-Ray} Security Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22398--22407}
}
Octree Guided Unoriented Surface Reconstruction: Chamin Hewa Koneputugodage,

Yizhak Ben-Shabat,

Stephen Gould; [pdf] [supp]
[bibtex]
@InProceedings{Koneputugodage_2023_CVPR,
  author    = {Koneputugodage, Chamin Hewa and Ben-Shabat, Yizhak and Gould, Stephen},
  title     = {Octree Guided Unoriented Surface Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16717--16726}
}
ToThePoint: Efficient Contrastive Learning of 3D Point Clouds via Recycling: Xinglin Li,

Jiajing Chen,

Jinhui Ouyang,

Hanhui Deng,

Senem Velipasalar,

Di Wu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Xinglin and Chen, Jiajing and Ouyang, Jinhui and Deng, Hanhui and Velipasalar, Senem and Wu, Di},
  title     = {{ToThePoint}: Efficient Contrastive Learning of {3D} Point Clouds via Recycling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21781--21790}
}
Weakly Supervised Monocular 3D Object Detection Using Multi-View Projection and Direction Consistency: Runzhou Tao,

Wencheng Han,

Zhongying Qiu,

Cheng-Zhong Xu,

Jianbing Shen; [pdf] [arXiv]
[bibtex]
@InProceedings{Tao_2023_CVPR,
  author    = {Tao, Runzhou and Han, Wencheng and Qiu, Zhongying and Xu, Cheng-Zhong and Shen, Jianbing},
  title     = {Weakly Supervised Monocular {3D} Object Detection Using Multi-View Projection and Direction Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17482--17492}
}
EDA: Explicit Text-Decoupling and Dense Alignment for 3D Visual Grounding: Yanmin Wu,

Xinhua Cheng,

Renrui Zhang,

Zesen Cheng,

Jian Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_CVPR,
  author    = {Wu, Yanmin and Cheng, Xinhua and Zhang, Renrui and Cheng, Zesen and Zhang, Jian},
  title     = {{EDA}: Explicit Text-Decoupling and Dense Alignment for {3D} Visual Grounding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19231--19242}
}
MixPHM: Redundancy-Aware Parameter-Efficient Tuning for Low-Resource Visual Question Answering: Jingjing Jiang,

Nanning Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_CVPR,
  author    = {Jiang, Jingjing and Zheng, Nanning},
  title     = {{MixPHM}: Redundancy-Aware Parameter-Efficient Tuning for Low-Resource Visual Question Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24203--24213}
}
DejaVu: Conditional Regenerative Learning To Enhance Dense Prediction: Shubhankar Borse,

Debasmit Das,

Hyojin Park,

Hong Cai,

Risheek Garrepalli,

Fatih Porikli; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Borse_2023_CVPR,
  author    = {Borse, Shubhankar and Das, Debasmit and Park, Hyojin and Cai, Hong and Garrepalli, Risheek and Porikli, Fatih},
  title     = {{DejaVu}: Conditional Regenerative Learning To Enhance Dense Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19466--19477}
}
SmartBrush: Text and Shape Guided Object Inpainting With Diffusion Model: Shaoan Xie,

Zhifei Zhang,

Zhe Lin,

Tobias Hinz,

Kun Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xie_2023_CVPR,
  author    = {Xie, Shaoan and Zhang, Zhifei and Lin, Zhe and Hinz, Tobias and Zhang, Kun},
  title     = {{SmartBrush}: Text and Shape Guided Object Inpainting With Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22428--22437}
}
RUST: Latent Neural Scene Representations From Unposed Imagery: Mehdi S. M. Sajjadi,

Aravindh Mahendran,

Thomas Kipf,

Etienne Pot,

Daniel Duckworth,

Mario Lučić,

Klaus Greff; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sajjadi_2023_CVPR,
  author    = {Sajjadi, Mehdi S. M. and Mahendran, Aravindh and Kipf, Thomas and Pot, Etienne and Duckworth, Daniel and Lu{\v{c}}i{\'c}, Mario and Greff, Klaus},
  title     = {{RUST}: Latent Neural Scene Representations From Unposed Imagery},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17297--17306}
}
Open Set Action Recognition via Multi-Label Evidential Learning: Chen Zhao,

Dawei Du,

Anthony Hoogs,

Christopher Funk; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_CVPR,
  author    = {Zhao, Chen and Du, Dawei and Hoogs, Anthony and Funk, Christopher},
  title     = {Open Set Action Recognition via Multi-Label Evidential Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22982--22991}
}
MAP: Multimodal Uncertainty-Aware Vision-Language Pre-Training Model: Yatai Ji,

Junjie Wang,

Yuan Gong,

Lin Zhang,

Yanru Zhu,

Hongfa Wang,

Jiaxing Zhang,

Tetsuya Sakai,

Yujiu Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ji_2023_CVPR,
  author    = {Ji, Yatai and Wang, Junjie and Gong, Yuan and Zhang, Lin and Zhu, Yanru and Wang, Hongfa and Zhang, Jiaxing and Sakai, Tetsuya and Yang, Yujiu},
  title     = {{MAP}: Multimodal Uncertainty-Aware Vision-Language Pre-Training Model},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23262--23271}
}
DualRel: Semi-Supervised Mitochondria Segmentation From a Prototype Perspective: Huayu Mai,

Rui Sun,

Tianzhu Zhang,

Zhiwei Xiong,

Feng Wu; [pdf] [supp]
[bibtex]
@InProceedings{Mai_2023_CVPR,
  author    = {Mai, Huayu and Sun, Rui and Zhang, Tianzhu and Xiong, Zhiwei and Wu, Feng},
  title     = {{DualRel}: Semi-Supervised Mitochondria Segmentation From a Prototype Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19617--19626}
}
Gated Multi-Resolution Transfer Network for Burst Restoration and Enhancement: Nancy Mehta,

Akshay Dudhane,

Subrahmanyam Murala,

Syed Waqas Zamir,

Salman Khan,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mehta_2023_CVPR,
  author    = {Mehta, Nancy and Dudhane, Akshay and Murala, Subrahmanyam and Zamir, Syed Waqas and Khan, Salman and Khan, Fahad Shahbaz},
  title     = {Gated Multi-Resolution Transfer Network for Burst Restoration and Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22201--22210}
}
PIDNet: A Real-Time Semantic Segmentation Network Inspired by PID Controllers: Jiacong Xu,

Zixiang Xiong,

Shankar P. Bhattacharyya; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Jiacong and Xiong, Zixiang and Bhattacharyya, Shankar P.},
  title     = {{PIDNet}: A Real-Time Semantic Segmentation Network Inspired by {PID} Controllers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19529--19539}
}
Frustratingly Easy Regularization on Representation Can Boost Deep Reinforcement Learning: Qiang He,

Huangyuan Su,

Jieyu Zhang,

Xinwen Hou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_CVPR,
  author    = {He, Qiang and Su, Huangyuan and Zhang, Jieyu and Hou, Xinwen},
  title     = {Frustratingly Easy Regularization on Representation Can Boost Deep Reinforcement Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20215--20225}
}
PointDistiller: Structured Knowledge Distillation Towards Efficient and Compact 3D Detection: Linfeng Zhang,

Runpei Dong,

Hung-Shuo Tai,

Kaisheng Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Linfeng and Dong, Runpei and Tai, Hung-Shuo and Ma, Kaisheng},
  title     = {{PointDistiller}: Structured Knowledge Distillation Towards Efficient and Compact {3D} Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21791--21801}
}
LEMaRT: Label-Efficient Masked Region Transform for Image Harmonization: Sheng Liu,

Cong Phuoc Huynh,

Cong Chen,

Maxim Arap,

Raffay Hamid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Sheng and Huynh, Cong Phuoc and Chen, Cong and Arap, Maxim and Hamid, Raffay},
  title     = {{LEMaRT}: Label-Efficient Masked Region Transform for Image Harmonization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18290--18299}
}
Discriminator-Cooperated Feature Map Distillation for GAN Compression: Tie Hu,

Mingbao Lin,

Lizhou You,

Fei Chao,

Rongrong Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Tie and Lin, Mingbao and You, Lizhou and Chao, Fei and Ji, Rongrong},
  title     = {Discriminator-Cooperated Feature Map Distillation for {GAN} Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20351--20360}
}
StyleAdv: Meta Style Adversarial Training for Cross-Domain Few-Shot Learning: Yuqian Fu,

Yu Xie,

Yanwei Fu,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_CVPR,
  author    = {Fu, Yuqian and Xie, Yu and Fu, Yanwei and Jiang, Yu-Gang},
  title     = {{StyleAdv}: Meta Style Adversarial Training for Cross-Domain Few-Shot Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24575--24584}
}
Long-Tailed Visual Recognition via Self-Heterogeneous Integration With Knowledge Excavation: Yan Jin,

Mengke Li,

Yang Lu,

Yiu-ming Cheung,

Hanzi Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Jin_2023_CVPR,
  author    = {Jin, Yan and Li, Mengke and Lu, Yang and Cheung, Yiu-ming and Wang, Hanzi},
  title     = {Long-Tailed Visual Recognition via Self-Heterogeneous Integration With Knowledge Excavation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23695--23704}
}
Context De-Confounded Emotion Recognition: Dingkang Yang,

Zhaoyu Chen,

Yuzheng Wang,

Shunli Wang,

Mingcheng Li,

Siao Liu,

Xiao Zhao,

Shuai Huang,

Zhiyan Dong,

Peng Zhai,

Lihua Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Dingkang and Chen, Zhaoyu and Wang, Yuzheng and Wang, Shunli and Li, Mingcheng and Liu, Siao and Zhao, Xiao and Huang, Shuai and Dong, Zhiyan and Zhai, Peng and Zhang, Lihua},
  title     = {Context De-Confounded Emotion Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19005--19015}
}
InstructPix2Pix: Learning To Follow Image Editing Instructions: Tim Brooks,

Aleksander Holynski,

Alexei A. Efros; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Brooks_2023_CVPR,
  author    = {Brooks, Tim and Holynski, Aleksander and Efros, Alexei A.},
  title     = {{InstructPix2Pix}: Learning To Follow Image Editing Instructions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18392--18402}
}
Progressive Disentangled Representation Learning for Fine-Grained Controllable Talking Head Synthesis: Duomin Wang,

Yu Deng,

Zixin Yin,

Heung-Yeung Shum,

Baoyuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Duomin and Deng, Yu and Yin, Zixin and Shum, Heung-Yeung and Wang, Baoyuan},
  title     = {Progressive Disentangled Representation Learning for Fine-Grained Controllable Talking Head Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {17979--17989}
}
Breaking the "Object" in Video Object Segmentation: Pavel Tokmakov,

Jie Li,

Adrien Gaidon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tokmakov_2023_CVPR,
  author    = {Tokmakov, Pavel and Li, Jie and Gaidon, Adrien},
  title     = {Breaking the {``Object''} in Video Object Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22836--22845}
}
CoWs on Pasture: Baselines and Benchmarks for Language-Driven Zero-Shot Object Navigation: Samir Yitzhak Gadre,

Mitchell Wortsman,

Gabriel Ilharco,

Ludwig Schmidt,

Shuran Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gadre_2023_CVPR,
  author    = {Gadre, Samir Yitzhak and Wortsman, Mitchell and Ilharco, Gabriel and Schmidt, Ludwig and Song, Shuran},
  title     = {{CoWs} on Pasture: Baselines and Benchmarks for Language-Driven Zero-Shot Object Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23171--23181}
}
CIGAR: Cross-Modality Graph Reasoning for Domain Adaptive Object Detection: Yabo Liu,

Jinghua Wang,

Chao Huang,

Yaowei Wang,

Yong Xu; [pdf]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Yabo and Wang, Jinghua and Huang, Chao and Wang, Yaowei and Xu, Yong},
  title     = {{CIGAR}: Cross-Modality Graph Reasoning for Domain Adaptive Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23776--23786}
}
HOOD: Hierarchical Graphs for Generalized Modelling of Clothing Dynamics: Artur Grigorev,

Michael J. Black,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Grigorev_2023_CVPR,
  author    = {Grigorev, Artur and Black, Michael J. and Hilliges, Otmar},
  title     = {{HOOD}: Hierarchical Graphs for Generalized Modelling of Clothing Dynamics},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16965--16974}
}
HyperReel: High-Fidelity 6-DoF Video With Ray-Conditioned Sampling: Benjamin Attal,

Jia-Bin Huang,

Christian Richardt,

Michael Zollhöfer,

Johannes Kopf,

Matthew O’Toole,

Changil Kim; [pdf] [supp]
[bibtex]
@InProceedings{Attal_2023_CVPR,
  author    = {Attal, Benjamin and Huang, Jia-Bin and Richardt, Christian and Zollh{\"o}fer, Michael and Kopf, Johannes and O'Toole, Matthew and Kim, Changil},
  title     = {{HyperReel}: High-Fidelity {6-DoF} Video With Ray-Conditioned Sampling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16610--16620}
}
PCR: Proxy-Based Contrastive Replay for Online Class-Incremental Continual Learning: Huiwei Lin,

Baoquan Zhang,

Shanshan Feng,

Xutao Li,

Yunming Ye; [pdf] [arXiv]
[bibtex]
@InProceedings{Lin_2023_CVPR,
  author    = {Lin, Huiwei and Zhang, Baoquan and Feng, Shanshan and Li, Xutao and Ye, Yunming},
  title     = {{PCR}: Proxy-Based Contrastive Replay for Online Class-Incremental Continual Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24246--24255}
}
Token Boosting for Robust Self-Supervised Visual Transformer Pre-Training: Tianjiao Li,

Lin Geng Foo,

Ping Hu,

Xindi Shang,

Hossein Rahmani,

Zehuan Yuan,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Tianjiao and Foo, Lin Geng and Hu, Ping and Shang, Xindi and Rahmani, Hossein and Yuan, Zehuan and Liu, Jun},
  title     = {Token Boosting for Robust Self-Supervised Visual Transformer Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {24027--24038}
}
MaskCon: Masked Contrastive Learning for Coarse-Labelled Dataset: Chen Feng,

Ioannis Patras; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_CVPR,
  author    = {Feng, Chen and Patras, Ioannis},
  title     = {{MaskCon}: Masked Contrastive Learning for Coarse-Labelled Dataset},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19913--19922}
}
AGAIN: Adversarial Training With Attribution Span Enlargement and Hybrid Feature Fusion: Shenglin Yin,

Kelu Yao,

Sheng Shi,

Yangzhou Du,

Zhen Xiao; [pdf] [supp]
[bibtex]
@InProceedings{Yin_2023_CVPR,
  author    = {Yin, Shenglin and Yao, Kelu and Shi, Sheng and Du, Yangzhou and Xiao, Zhen},
  title     = {{AGAIN}: Adversarial Training With Attribution Span Enlargement and Hybrid Feature Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20544--20553}
}
ABLE-NeRF: Attention-Based Rendering With Learnable Embeddings for Neural Radiance Field: Zhe Jun Tang,

Tat-Jen Cham,

Haiyu Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Tang_2023_CVPR,
  author    = {Tang, Zhe Jun and Cham, Tat-Jen and Zhao, Haiyu},
  title     = {{ABLE-NeRF}: Attention-Based Rendering With Learnable Embeddings for Neural Radiance Field},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {16559--16568}
}
WinCLIP: Zero-/Few-Shot Anomaly Classification and Segmentation: Jongheon Jeong,

Yang Zou,

Taewan Kim,

Dongqing Zhang,

Avinash Ravichandran,

Onkar Dabeer; [pdf] [supp]
[bibtex]
@InProceedings{Jeong_2023_CVPR,
  author    = {Jeong, Jongheon and Zou, Yang and Kim, Taewan and Zhang, Dongqing and Ravichandran, Avinash and Dabeer, Onkar},
  title     = {{WinCLIP}: Zero-/Few-Shot Anomaly Classification and Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19606--19616}
}
TriDet: Temporal Action Detection With Relative Boundary Modeling: Dingfeng Shi,

Yujie Zhong,

Qiong Cao,

Lin Ma,

Jia Li,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2023_CVPR,
  author    = {Shi, Dingfeng and Zhong, Yujie and Cao, Qiong and Ma, Lin and Li, Jia and Tao, Dacheng},
  title     = {{TriDet}: Temporal Action Detection With Relative Boundary Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18857--18866}
}
Dream3D: Zero-Shot Text-to-3D Synthesis Using 3D Shape Prior and Text-to-Image Diffusion Models: Jiale Xu,

Xintao Wang,

Weihao Cheng,

Yan-Pei Cao,

Ying Shan,

Xiaohu Qie,

Shenghua Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Jiale and Wang, Xintao and Cheng, Weihao and Cao, Yan-Pei and Shan, Ying and Qie, Xiaohu and Gao, Shenghua},
  title     = {{Dream3D}: Zero-Shot {Text-to-3D} Synthesis Using {3D} Shape Prior and Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20908--20918}
}
Reinforcement Learning-Based Black-Box Model Inversion Attacks: Gyojin Han,

Jaehyun Choi,

Haeil Lee,

Junmo Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_CVPR,
  author    = {Han, Gyojin and Choi, Jaehyun and Lee, Haeil and Kim, Junmo},
  title     = {Reinforcement Learning-Based Black-Box Model Inversion Attacks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20504--20513}
}
Learning a Deep Color Difference Metric for Photographic Images: Haoyu Chen,

Zhihua Wang,

Yang Yang,

Qilin Sun,

Kede Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Haoyu and Wang, Zhihua and Yang, Yang and Sun, Qilin and Ma, Kede},
  title     = {Learning a Deep Color Difference Metric for Photographic Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22242--22251}
}
1000 FPS HDR Video With a Spike-RGB Hybrid Camera: Yakun Chang,

Chu Zhou,

Yuchen Hong,

Liwen Hu,

Chao Xu,

Tiejun Huang,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Chang_2023_CVPR,
  author    = {Chang, Yakun and Zhou, Chu and Hong, Yuchen and Hu, Liwen and Xu, Chao and Huang, Tiejun and Shi, Boxin},
  title     = {1000 {FPS} {HDR} Video With a {Spike-RGB} Hybrid Camera},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22180--22190}
}
DINN360: Deformable Invertible Neural Network for Latitude-Aware 360° Image Rescaling: Yichen Guo,

Mai Xu,

Lai Jiang,

Leonid Sigal,

Yunjin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Yichen and Xu, Mai and Jiang, Lai and Sigal, Leonid and Chen, Yunjin},
  title     = {{DINN360}: Deformable Invertible Neural Network for Latitude-Aware {$360^\circ$} Image Rescaling},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21519--21528}
}
Learning Geometric-Aware Properties in 2D Representation Using Lightweight CAD Models, or Zero Real 3D Pairs: Pattaramanee Arsomngern,

Sarana Nutanong,

Supasorn Suwajanakorn; [pdf] [supp]
[bibtex]
@InProceedings{Arsomngern_2023_CVPR,
  author    = {Arsomngern, Pattaramanee and Nutanong, Sarana and Suwajanakorn, Supasorn},
  title     = {Learning Geometric-Aware Properties in {2D} Representation Using Lightweight {CAD} Models, or Zero Real {3D} Pairs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21371--21381}
}
Few-Shot Learning With Visual Distribution Calibration and Cross-Modal Distribution Alignment: Runqi Wang,

Hao Zheng,

Xiaoyue Duan,

Jianzhuang Liu,

Yuning Lu,

Tian Wang,

Songcen Xu,

Baochang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Runqi and Zheng, Hao and Duan, Xiaoyue and Liu, Jianzhuang and Lu, Yuning and Wang, Tian and Xu, Songcen and Zhang, Baochang},
  title     = {Few-Shot Learning With Visual Distribution Calibration and Cross-Modal Distribution Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {23445--23454}
}
Finetune Like You Pretrain: Improved Finetuning of Zero-Shot Vision Models: Sachin Goyal,

Ananya Kumar,

Sankalp Garg,

Zico Kolter,

Aditi Raghunathan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Goyal_2023_CVPR,
  author    = {Goyal, Sachin and Kumar, Ananya and Garg, Sankalp and Kolter, Zico and Raghunathan, Aditi},
  title     = {Finetune Like You Pretrain: Improved Finetuning of Zero-Shot Vision Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {19338--19347}
}
Weakly Supervised Temporal Sentence Grounding With Uncertainty-Guided Self-Training: Yifei Huang,

Lijin Yang,

Yoichi Sato; [pdf]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Yifei and Yang, Lijin and Sato, Yoichi},
  title     = {Weakly Supervised Temporal Sentence Grounding With Uncertainty-Guided Self-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {18908--18918}
}
AutoRecon: Automated 3D Object Discovery and Reconstruction: Yuang Wang,

Xingyi He,

Sida Peng,

Haotong Lin,

Hujun Bao,

Xiaowei Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Yuang and He, Xingyi and Peng, Sida and Lin, Haotong and Bao, Hujun and Zhou, Xiaowei},
  title     = {{AutoRecon}: Automated {3D} Object Discovery and Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21382--21391}
}
Learning a Practical SDR-to-HDRTV Up-Conversion Using New Dataset and Degradation Models: Cheng Guo,

Leidong Fan,

Ziyu Xue,

Xiuhua Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_CVPR,
  author    = {Guo, Cheng and Fan, Leidong and Xue, Ziyu and Jiang, Xiuhua},
  title     = {Learning a Practical {SDR-to-HDRTV} Up-Conversion Using New Dataset and Degradation Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {22231--22241}
}
Learning To Fuse Monocular and Multi-View Cues for Multi-Frame Depth Estimation in Dynamic Scenes: Rui Li,

Dong Gong,

Wei Yin,

Hao Chen,

Yu Zhu,

Kaixuan Wang,

Xiaozhi Chen,

Jinqiu Sun,

Yanning Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Rui and Gong, Dong and Yin, Wei and Chen, Hao and Zhu, Yu and Wang, Kaixuan and Chen, Xiaozhi and Sun, Jinqiu and Zhang, Yanning},
  title     = {Learning To Fuse Monocular and Multi-View Cues for Multi-Frame Depth Estimation in Dynamic Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {21539--21548}
}
Bias-Eliminating Augmentation Learning for Debiased Federated Learning: Yuan-Yi Xu,

Ci-Siang Lin,

Yu-Chiang Frank Wang; [pdf]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Yuan-Yi and Lin, Ci-Siang and Wang, Yu-Chiang Frank},
  title     = {Bias-Eliminating Augmentation Learning for Debiased Federated Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2023},
  pages     = {20442--20452}
}
Understanding the Robustness of 3D Object Detection With Bird's-Eye-View Representations in Autonomous Driving: Zijian Zhu,

Yichi Zhang,

Hai Chen,

Yinpeng Dong,

Shu Zhao,

Wenbo Ding,

Jiachen Zhong,

Shibao Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_CVPR,
  author    = {Zhu, Zijian and Zhang, Yichi and Chen, Hai and Dong, Yinpeng and Zhao, Shu and Ding, Wenbo and Zhong, Jiachen and Zheng, Shibao},
  title     = {Understanding the Robustness of {3D} Object Detection With Bird's-Eye-View Representations in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21600--21610},
}
Generalist: Decoupling Natural and Robust Generalization: Hongjun Wang,

Yisen Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Hongjun and Wang, Yisen},
  title     = {Generalist: Decoupling Natural and Robust Generalization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20554--20563},
}
Explicit Visual Prompting for Low-Level Structure Segmentations: Weihuang Liu,

Xi Shen,

Chi-Man Pun,

Xiaodong Cun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Weihuang and Shen, Xi and Pun, Chi-Man and Cun, Xiaodong},
  title     = {Explicit Visual Prompting for Low-Level Structure Segmentations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19434--19445},
}
Practical Network Acceleration With Tiny Sets: Guo-Hua Wang,

Jianxin Wu; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Guo-Hua and Wu, Jianxin},
  title     = {Practical Network Acceleration With Tiny Sets},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20331--20340},
}
NeRF-RPN: A General Framework for Object Detection in NeRFs: Benran Hu,

Junkai Huang,

Yichen Liu,

Yu-Wing Tai,

Chi-Keung Tang; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_CVPR,
  author    = {Hu, Benran and Huang, Junkai and Liu, Yichen and Tai, Yu-Wing and Tang, Chi-Keung},
  title     = {{NeRF-RPN}: A General Framework for Object Detection in {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {23528--23538},
}
Masked Wavelet Representation for Compact Neural Radiance Fields: Daniel Rho,

Byeonghyeon Lee,

Seungtae Nam,

Joo Chan Lee,

Jong Hwan Ko,

Eunbyung Park; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rho_2023_CVPR,
  author    = {Rho, Daniel and Lee, Byeonghyeon and Nam, Seungtae and Lee, Joo Chan and Ko, Jong Hwan and Park, Eunbyung},
  title     = {Masked Wavelet Representation for Compact Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20680--20690},
}
ObjectStitch: Object Compositing With Diffusion Model: Yizhi Song,

Zhifei Zhang,

Zhe Lin,

Scott Cohen,

Brian Price,

Jianming Zhang,

Soo Ye Kim,

Daniel Aliaga; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_CVPR,
  author    = {Song, Yizhi and Zhang, Zhifei and Lin, Zhe and Cohen, Scott and Price, Brian and Zhang, Jianming and Kim, Soo Ye and Aliaga, Daniel},
  title     = {{ObjectStitch}: Object Compositing With Diffusion Model},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18310--18319},
}
Anchor3DLane: Learning To Regress 3D Anchors for Monocular 3D Lane Detection: Shaofei Huang,

Zhenwei Shen,

Zehao Huang,

Zi-han Ding,

Jiao Dai,

Jizhong Han,

Naiyan Wang,

Si Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Huang_2023_CVPR,
  author    = {Huang, Shaofei and Shen, Zhenwei and Huang, Zehao and Ding, Zi-han and Dai, Jiao and Han, Jizhong and Wang, Naiyan and Liu, Si},
  title     = {{Anchor3DLane}: Learning To Regress {3D} Anchors for Monocular {3D} Lane Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17451--17460},
}
Class-Balancing Diffusion Models: Yiming Qin,

Huangjie Zheng,

Jiangchao Yao,

Mingyuan Zhou,

Ya Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qin_2023_CVPR,
  author    = {Qin, Yiming and Zheng, Huangjie and Yao, Jiangchao and Zhou, Mingyuan and Zhang, Ya},
  title     = {Class-Balancing Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18434--18443},
}
AstroNet: When Astrocyte Meets Artificial Neural Network: Mengqiao Han,

Liyuan Pan,

Xiabi Liu; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_CVPR,
  author    = {Han, Mengqiao and Pan, Liyuan and Liu, Xiabi},
  title     = {{AstroNet}: When Astrocyte Meets Artificial Neural Network},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20258--20268},
}
Feature Alignment and Uniformity for Test Time Adaptation: Shuai Wang,

Daoan Zhang,

Zipei Yan,

Jianguo Zhang,

Rui Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_CVPR,
  author    = {Wang, Shuai and Zhang, Daoan and Yan, Zipei and Zhang, Jianguo and Li, Rui},
  title     = {Feature Alignment and Uniformity for Test Time Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20050--20060},
}
Balanced Product of Calibrated Experts for Long-Tailed Recognition: Emanuel Sanchez Aimar,

Arvi Jonnarth,

Michael Felsberg,

Marco Kuhlmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Aimar_2023_CVPR,
  author    = {Aimar, Emanuel Sanchez and Jonnarth, Arvi and Felsberg, Michael and Kuhlmann, Marco},
  title     = {Balanced Product of Calibrated Experts for Long-Tailed Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19967--19977},
}
PanoSwin: A Pano-Style Swin Transformer for Panorama Understanding: Zhixin Ling,

Zhen Xing,

Xiangdong Zhou,

Manliang Cao,

Guichun Zhou; [pdf] [supp]
[bibtex]
@InProceedings{Ling_2023_CVPR,
  author    = {Ling, Zhixin and Xing, Zhen and Zhou, Xiangdong and Cao, Manliang and Zhou, Guichun},
  title     = {{PanoSwin}: A Pano-Style {Swin} Transformer for Panorama Understanding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17755--17764},
}
Parameter Efficient Local Implicit Image Function Network for Face Segmentation: Mausoom Sarkar,

Nikitha SR,

Mayur Hemani,

Rishabh Jain,

Balaji Krishnamurthy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sarkar_2023_CVPR,
  author    = {Sarkar, Mausoom and Nikitha, SR and Hemani, Mayur and Jain, Rishabh and Krishnamurthy, Balaji},
  title     = {Parameter Efficient Local Implicit Image Function Network for Face Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20970--20980},
}
Referring Image Matting: Jizhizi Li,

Jing Zhang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Jizhizi and Zhang, Jing and Tao, Dacheng},
  title     = {Referring Image Matting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22448--22457},
}
Modality-Invariant Visual Odometry for Embodied Vision: Marius Memmel,

Roman Bachmann,

Amir Zamir; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Memmel_2023_CVPR,
  author    = {Memmel, Marius and Bachmann, Roman and Zamir, Amir},
  title     = {Modality-Invariant Visual Odometry for Embodied Vision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21549--21559},
}
What You Can Reconstruct From a Shadow: Ruoshi Liu,

Sachit Menon,

Chengzhi Mao,

Dennis Park,

Simon Stent,

Carl Vondrick; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_CVPR,
  author    = {Liu, Ruoshi and Menon, Sachit and Mao, Chengzhi and Park, Dennis and Stent, Simon and Vondrick, Carl},
  title     = {What You Can Reconstruct From a Shadow},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17059--17068},
}
Lite DETR: An Interleaved Multi-Scale Encoder for Efficient DETR: Feng Li,

Ailing Zeng,

Shilong Liu,

Hao Zhang,

Hongyang Li,

Lei Zhang,

Lionel M. Ni; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_CVPR,
  author    = {Li, Feng and Zeng, Ailing and Liu, Shilong and Zhang, Hao and Li, Hongyang and Zhang, Lei and Ni, Lionel M.},
  title     = {Lite {DETR}: An Interleaved Multi-Scale Encoder for Efficient {DETR}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18558--18567},
}
MobileNeRF: Exploiting the Polygon Rasterization Pipeline for Efficient Neural Field Rendering on Mobile Architectures: Zhiqin Chen,

Thomas Funkhouser,

Peter Hedman,

Andrea Tagliasacchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Zhiqin and Funkhouser, Thomas and Hedman, Peter and Tagliasacchi, Andrea},
  title     = {{MobileNeRF}: Exploiting the Polygon Rasterization Pipeline for Efficient Neural Field Rendering on Mobile Architectures},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16569--16578},
}
Pseudo-Label Guided Contrastive Learning for Semi-Supervised Medical Image Segmentation: Hritam Basak,

Zhaozheng Yin; [pdf]
[bibtex]
@InProceedings{Basak_2023_CVPR,
  author    = {Basak, Hritam and Yin, Zhaozheng},
  title     = {Pseudo-Label Guided Contrastive Learning for Semi-Supervised Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19786--19797},
}
Self-Supervised Geometry-Aware Encoder for Style-Based 3D GAN Inversion: Yushi Lan,

Xuyi Meng,

Shuai Yang,

Chen Change Loy,

Bo Dai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lan_2023_CVPR,
  author    = {Lan, Yushi and Meng, Xuyi and Yang, Shuai and Loy, Chen Change and Dai, Bo},
  title     = {Self-Supervised Geometry-Aware Encoder for Style-Based {3D} {GAN} Inversion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20940--20949},
}
POEM: Reconstructing Hand in a Point Embedded Multi-View Stereo: Lixin Yang,

Jian Xu,

Licheng Zhong,

Xinyu Zhan,

Zhicheng Wang,

Kejian Wu,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_CVPR,
  author    = {Yang, Lixin and Xu, Jian and Zhong, Licheng and Zhan, Xinyu and Wang, Zhicheng and Wu, Kejian and Lu, Cewu},
  title     = {{POEM}: Reconstructing Hand in a Point Embedded Multi-View Stereo},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21108--21117},
}
Progressively Optimized Local Radiance Fields for Robust View Synthesis: Andréas Meuleman,

Yu-Lun Liu,

Chen Gao,

Jia-Bin Huang,

Changil Kim,

Min H. Kim,

Johannes Kopf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Meuleman_2023_CVPR,
  author    = {Meuleman, Andr{\'e}as and Liu, Yu-Lun and Gao, Chen and Huang, Jia-Bin and Kim, Changil and Kim, Min H. and Kopf, Johannes},
  title     = {Progressively Optimized Local Radiance Fields for Robust View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16539--16548},
}
GeoMVSNet: Learning Multi-View Stereo With Geometry Perception: Zhe Zhang,

Rui Peng,

Yuxi Hu,

Ronggang Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Zhe and Peng, Rui and Hu, Yuxi and Wang, Ronggang},
  title     = {{GeoMVSNet}: Learning Multi-View Stereo With Geometry Perception},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21508--21518},
}
TeSLA: Test-Time Self-Learning With Automatic Adversarial Augmentation: Devavrat Tomar,

Guillaume Vray,

Behzad Bozorgtabar,

Jean-Philippe Thiran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tomar_2023_CVPR,
  author    = {Tomar, Devavrat and Vray, Guillaume and Bozorgtabar, Behzad and Thiran, Jean-Philippe},
  title     = {{TeSLA}: Test-Time Self-Learning With Automatic Adversarial Augmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20341--20350},
}
RefTeacher: A Strong Baseline for Semi-Supervised Referring Expression Comprehension: Jiamu Sun,

Gen Luo,

Yiyi Zhou,

Xiaoshuai Sun,

Guannan Jiang,

Zhiyu Wang,

Rongrong Ji; [pdf]
[bibtex]
@InProceedings{Sun_2023_CVPR,
  author    = {Sun, Jiamu and Luo, Gen and Zhou, Yiyi and Sun, Xiaoshuai and Jiang, Guannan and Wang, Zhiyu and Ji, Rongrong},
  title     = {{RefTeacher}: A Strong Baseline for Semi-Supervised Referring Expression Comprehension},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19144--19154},
}
Handwritten Text Generation From Visual Archetypes: Vittorio Pippi,

Silvia Cascianelli,

Rita Cucchiara; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pippi_2023_CVPR,
  author    = {Pippi, Vittorio and Cascianelli, Silvia and Cucchiara, Rita},
  title     = {Handwritten Text Generation From Visual Archetypes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22458--22467},
}
Unicode Analogies: An Anti-Objectivist Visual Reasoning Challenge: Steven Spratley,

Krista A. Ehinger,

Tim Miller; [pdf] [supp]
[bibtex]
@InProceedings{Spratley_2023_CVPR,
  author    = {Spratley, Steven and Ehinger, Krista A. and Miller, Tim},
  title     = {Unicode Analogies: An Anti-Objectivist Visual Reasoning Challenge},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19082--19091},
}
FFF: Fragment-Guided Flexible Fitting for Building Complete Protein Structures: Weijie Chen,

Xinyan Wang,

Yuhang Wang; [pdf]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Weijie and Wang, Xinyan and Wang, Yuhang},
  title     = {{FFF}: Fragment-Guided Flexible Fitting for Building Complete Protein Structures},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19776--19785},
}
Align Your Latents: High-Resolution Video Synthesis With Latent Diffusion Models: Andreas Blattmann,

Robin Rombach,

Huan Ling,

Tim Dockhorn,

Seung Wook Kim,

Sanja Fidler,

Karsten Kreis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Blattmann_2023_CVPR,
  author    = {Blattmann, Andreas and Rombach, Robin and Ling, Huan and Dockhorn, Tim and Kim, Seung Wook and Fidler, Sanja and Kreis, Karsten},
  title     = {Align Your Latents: High-Resolution Video Synthesis With Latent Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22563--22575},
}
Implicit 3D Human Mesh Recovery Using Consistency With Pose and Shape From Unseen-View: Hanbyel Cho,

Yooshin Cho,

Jaesung Ahn,

Junmo Kim; [pdf] [supp]
[bibtex]
@InProceedings{Cho_2023_CVPR,
  author    = {Cho, Hanbyel and Cho, Yooshin and Ahn, Jaesung and Kim, Junmo},
  title     = {Implicit {3D} Human Mesh Recovery Using Consistency With Pose and Shape From Unseen-View},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {21148--21158},
}
Teleidoscopic Imaging System for Microscale 3D Shape Reconstruction: Ryo Kawahara,

Meng-Yu Jennifer Kuo,

Shohei Nobuhara; [pdf] [supp]
[bibtex]
@InProceedings{Kawahara_2023_CVPR,
  author    = {Kawahara, Ryo and Kuo, Meng-Yu Jennifer and Nobuhara, Shohei},
  title     = {Teleidoscopic Imaging System for Microscale {3D} Shape Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20813--20822},
}
UV Volumes for Real-Time Rendering of Editable Free-View Human Performance: Yue Chen,

Xuan Wang,

Xingyu Chen,

Qi Zhang,

Xiaoyu Li,

Yu Guo,

Jue Wang,

Fei Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_CVPR,
  author    = {Chen, Yue and Wang, Xuan and Chen, Xingyu and Zhang, Qi and Li, Xiaoyu and Guo, Yu and Wang, Jue and Wang, Fei},
  title     = {{UV} Volumes for Real-Time Rendering of Editable Free-View Human Performance},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16621--16631},
}
JacobiNeRF: NeRF Shaping With Mutual Information Gradients: Xiaomeng Xu,

Yanchao Yang,

Kaichun Mo,

Boxiao Pan,

Li Yi,

Leonidas Guibas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_CVPR,
  author    = {Xu, Xiaomeng and Yang, Yanchao and Mo, Kaichun and Pan, Boxiao and Yi, Li and Guibas, Leonidas},
  title     = {{JacobiNeRF}: {NeRF} Shaping With Mutual Information Gradients},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16498--16507},
}
Open-Set Representation Learning Through Combinatorial Embedding: Geeho Kim,

Junoh Kang,

Bohyung Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_CVPR,
  author    = {Kim, Geeho and Kang, Junoh and Han, Bohyung},
  title     = {Open-Set Representation Learning Through Combinatorial Embedding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19744--19753},
}
Multi-View Stereo Representation Revist: Region-Aware MVSNet: Yisu Zhang,

Jianke Zhu,

Lixiang Lin; [pdf]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Yisu and Zhu, Jianke and Lin, Lixiang},
  title     = {Multi-View Stereo Representation Revist: Region-Aware {MVSNet}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {17376--17385},
}
A Unified HDR Imaging Method With Pixel and Patch Level: Qingsen Yan,

Weiye Chen,

Song Zhang,

Yu Zhu,

Jinqiu Sun,

Yanning Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yan_2023_CVPR,
  author    = {Yan, Qingsen and Chen, Weiye and Zhang, Song and Zhu, Yu and Sun, Jinqiu and Zhang, Yanning},
  title     = {A Unified {HDR} Imaging Method With Pixel and Patch Level},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22211--22220},
}
Partial Network Cloning: Jingwen Ye,

Songhua Liu,

Xinchao Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_CVPR,
  author    = {Ye, Jingwen and Liu, Songhua and Wang, Xinchao},
  title     = {Partial Network Cloning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {20137--20146},
}
MOTRv2: Bootstrapping End-to-End Multi-Object Tracking by Pretrained Object Detectors: Yuang Zhang,

Tiancai Wang,

Xiangyu Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_CVPR,
  author    = {Zhang, Yuang and Wang, Tiancai and Zhang, Xiangyu},
  title     = {{MOTRv2}: Bootstrapping End-to-End Multi-Object Tracking by Pretrained Object Detectors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {22056--22065},
}
Principles of Forgetting in Domain-Incremental Semantic Segmentation in Adverse Weather Conditions: Tobias Kalb,

Jürgen Beyerer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kalb_2023_CVPR,
  author    = {Kalb, Tobias and Beyerer, J{\"u}rgen},
  title     = {Principles of Forgetting in Domain-Incremental Semantic Segmentation in Adverse Weather Conditions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {19508--19518},
}
Neural Texture Synthesis With Guided Correspondence: Yang Zhou,

Kaijian Chen,

Rongjun Xiao,

Hui Huang; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_CVPR,
  author    = {Zhou, Yang and Chen, Kaijian and Xiao, Rongjun and Huang, Hui},
  title     = {Neural Texture Synthesis With Guided Correspondence},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {18095--18104},
}
Interactive Cartoonization With Controllable Perceptual Factors: Namhyuk Ahn,

Patrick Kwon,

Jihye Back,

Kibeom Hong,

Seungkwon Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ahn_2023_CVPR,
  author    = {Ahn, Namhyuk and Kwon, Patrick and Back, Jihye and Hong, Kibeom and Kim, Seungkwon},
  title     = {Interactive Cartoonization With Controllable Perceptual Factors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2023},
  pages     = {16827--16835},
}; Back