Papers
- Back
Towards Attack-tolerant Federated Learning via Critical Parameter Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Sungwon and Park, Sungwon and Wu, Fangzhao and Kim, Sundong and Zhu, Bin and Xie, Xing and Cha, Meeyoung},
  title     = {Towards Attack-tolerant Federated Learning via Critical Parameter Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4999--5008},
}
Stochastic Segmentation with Conditional Categorical Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Zbinden_2023_ICCV,
  author    = {Zbinden, Lukas and Doorenbos, Lars and Pissas, Theodoros and Huber, Adrian Thomas and Sznitman, Raphael and M{\'a}rquez-Neila, Pablo},
  title     = {Stochastic Segmentation with Conditional Categorical Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1119--1129},
}
Diff-Retinex: Rethinking Low-light Image Enhancement with A Generative Diffusion Model-
[pdf]
[bibtex]
@InProceedings{Yi_2023_ICCV,
  author    = {Yi, Xunpeng and Xu, Han and Zhang, Hao and Tang, Linfeng and Ma, Jiayi},
  title     = {{Diff-Retinex}: Rethinking Low-light Image Enhancement with A Generative Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12302--12311},
}
Bird's-Eye-View Scene Graph for Vision-Language Navigation-
[pdf]
[supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Rui and Wang, Xiaohan and Wang, Wenguan and Yang, Yi},
  title     = {Bird's-Eye-View Scene Graph for Vision-Language Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10968--10980},
}
PVT++: A Simple End-to-End Latency-Aware Visual Tracking Framework-
[pdf]
[supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Bowen and Huang, Ziyuan and Ye, Junjie and Li, Yiming and Scherer, Sebastian and Zhao, Hang and Fu, Changhong},
  title     = {{PVT++}: A Simple End-to-End Latency-Aware Visual Tracking Framework},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10006--10016},
}
A Dynamic Dual-Processing Object Detection Framework Inspired by the Brain's Recognition Mechanism-
[pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Minying and Bu, Tianpeng and Hu, Lulu},
  title     = {A Dynamic Dual-Processing Object Detection Framework Inspired by the Brain's Recognition Mechanism},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6264--6274},
}
Hard No-Box Adversarial Attack on Skeleton-Based Human Action Recognition with Skeleton-Motion-Informed Gradient-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Zhengzhi and Wang, He and Chang, Ziyi and Yang, Guoan and Shum, Hubert P. H.},
  title     = {Hard No-Box Adversarial Attack on Skeleton-Based Human Action Recognition with Skeleton-Motion-Informed Gradient},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4597--4606},
}
GameFormer: Game-theoretic Modeling and Learning of Transformer-based Interactive Prediction and Planning for Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhiyu and Liu, Haochen and Lv, Chen},
  title     = {{GameFormer}: Game-theoretic Modeling and Learning of Transformer-based Interactive Prediction and Planning for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3903--3913},
}
Towards Better Robustness against Common Corruptions for Unsupervised Domain Adaptation-
[pdf]
[supp]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Zhiqiang and Huang, Kaizhu and Zhang, Rui and Liu, Dawei and Ma, Jieming},
  title     = {Towards Better Robustness against Common Corruptions for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18882--18893},
}
Learning in Imperfect Environment: Multi-Label Classification with Long-Tailed Distribution and Partial Labels-
[pdf]
[arXiv]
[bibtex]
@comment{Key was Zhang_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Zhang_2023_ICCV_ImperfectEnvironment,
  author    = {Zhang, Wenqiao and Liu, Changshuo and Zeng, Lingze and Ooi, Bengchin and Tang, Siliang and Zhuang, Yueting},
  title     = {Learning in Imperfect Environment: Multi-Label Classification with Long-Tailed Distribution and Partial Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1423--1432},
}
Flexible Visual Recognition by Evidential Modeling of Confusion and Ignorance-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Lei and Liu, Bo and Li, Haoxiang and Wu, Ying and Hua, Gang},
  title     = {Flexible Visual Recognition by Evidential Modeling of Confusion and Ignorance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1338--1347},
}
Texture Generation on 3D Meshes with Point-UV Diffusion-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Xin and Dai, Peng and Li, Wenbo and Ma, Lan and Liu, Zhengzhe and Qi, Xiaojuan},
  title     = {Texture Generation on {3D} Meshes with {Point-UV} Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4206--4216},
}
Supervised Homography Learning with Realistic Dataset Generation-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Hai and Li, Haipeng and Han, Songchen and Fan, Haoqiang and Zeng, Bing and Liu, Shuaicheng},
  title     = {Supervised Homography Learning with Realistic Dataset Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9806--9815},
}
E2E-LOAD: End-to-End Long-form Online Action Detection-
[pdf]
[supp]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Shuqiang and Luo, Weixin and Wang, Bairui and Zhang, Wei and Ma, Lin},
  title     = {{E2E-LOAD}: End-to-End Long-form Online Action Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10422--10432},
}
TALL: Thumbnail Layout for Deepfake Video Detection-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yuting and Liang, Jian and Jia, Gengyun and Yang, Ziming and Zhang, Yanhao and He, Ran},
  title     = {{TALL}: Thumbnail Layout for Deepfake Video Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22658--22668},
}
Enhanced Soft Label for Semi-Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Jie and Wang, Chuan and Liu, Yang and Lin, Liang and Li, Guanbin},
  title     = {Enhanced Soft Label for Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1185--1195},
}
Self-supervised Monocular Depth Estimation: Let's Talk About The Weather-
[pdf]
[supp]
[bibtex]
@InProceedings{Saunders_2023_ICCV,
  author    = {Saunders, Kieran and Vogiatzis, George and Manso, Luis J.},
  title     = {Self-supervised Monocular Depth Estimation: Let's Talk About The Weather},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8907--8917},
}
Bidirectional Alignment for Domain Adaptive Detection with Transformers-
[pdf]
[supp]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Liqiang and Wang, Wei and Chen, Albert and Sun, Min and Kuo, Cheng-Hao and Todorovic, Sinisa},
  title     = {Bidirectional Alignment for Domain Adaptive Detection with Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18775--18785},
}
Fast Neural Scene Flow-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Li_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Li_2023_ICCV_SceneFlow,
  author    = {Li, Xueqian and Zheng, Jianqiao and Ferroni, Francesco and Pontes, Jhony Kaesemodel and Lucey, Simon},
  title     = {Fast Neural Scene Flow},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9878--9890},
}
CAME: Contrastive Automated Model Evaluation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Ru and Duan, Qiuyang and Wang, Haobo and Ma, Jiachen and Jiang, Yanbo and Tu, Yongjun and Jiang, Xiu and Zhao, Junbo},
  title     = {{CAME}: Contrastive Automated Model Evaluation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20121--20132},
}
ExposureDiffusion: Learning to Expose for Low-light Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yufei and Yu, Yi and Yang, Wenhan and Guo, Lanqing and Chau, Lap-Pui and Kot, Alex C. and Wen, Bihan},
  title     = {{ExposureDiffusion}: Learning to Expose for Low-light Image Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12438--12448},
}
HM-ViT: Hetero-Modal Vehicle-to-Vehicle Cooperative Perception with Vision Transformer-
[pdf]
[supp]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Hao and Xu, Runsheng and Ma, Jiaqi},
  title     = {{HM-ViT}: Hetero-Modal Vehicle-to-Vehicle Cooperative Perception with Vision Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {284--295},
}
HyperReenact: One-Shot Reenactment via Jointly Learning to Refine and Retarget Faces-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Bounareli_2023_ICCV,
  author    = {Bounareli, Stella and Tzelepis, Christos and Argyriou, Vasileios and Patras, Ioannis and Tzimiropoulos, Georgios},
  title     = {{HyperReenact}: One-Shot Reenactment via Jointly Learning to Refine and Retarget Faces},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7149--7159},
}
Order-preserving Consistency Regularization for Domain Adaptation and Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Jing_2023_ICCV,
  author    = {Jing, Mengmeng and Zhen, Xiantong and Li, Jingjing and Snoek, Cees G. M.},
  title     = {Order-preserving Consistency Regularization for Domain Adaptation and Generalization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18916--18927},
}
RefEgo: Referring Expression Comprehension Dataset from First-Person Perception of Ego4D-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Kurita_2023_ICCV,
  author    = {Kurita, Shuhei and Katsura, Naoki and Onami, Eri},
  title     = {{RefEgo}: Referring Expression Comprehension Dataset from First-Person Perception of {Ego4D}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15214--15224},
}
Exploring Temporal Frequency Spectrum in Deep Video Deblurring-
[pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Qi and Zhou, Man and Zheng, Naishan and Li, Chongyi and Huang, Jie and Zhao, Feng},
  title     = {Exploring Temporal Frequency Spectrum in Deep Video Deblurring},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12428--12437},
}
Unified Visual Relationship Detection with Vision and Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Long and Yuan, Liangzhe and Gong, Boqing and Cui, Yin and Schroff, Florian and Yang, Ming-Hsuan and Adam, Hartwig and Liu, Ting},
  title     = {Unified Visual Relationship Detection with Vision and Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6962--6973},
}
Occ^2Net: Robust Image Matching Based on 3D Occupancy Estimation for Occluded Regions-
[pdf]
[bibtex]
@comment{Key was Fan_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Fan_2023_ICCV_Occ2Net,
  author    = {Fan, Miao and Chen, Mingrui and Hu, Chen and Zhou, Shuchang},
  title     = {{Occ$^2$Net}: Robust Image Matching Based on {3D} Occupancy Estimation for Occluded Regions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9652--9662},
}
Make-An-Animation: Large-Scale Text-conditional 3D Human Motion Generation-
[pdf]
[bibtex]
@InProceedings{Azadi_2023_ICCV,
  author    = {Azadi, Samaneh and Shah, Akbar and Hayes, Thomas and Parikh, Devi and Gupta, Sonal},
  title     = {{Make-An-Animation}: Large-Scale Text-conditional {3D} Human Motion Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15039--15048},
}
Rickrolling the Artist: Injecting Backdoors into Text Encoders for Text-to-Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Struppek_2023_ICCV,
  author    = {Struppek, Lukas and Hintersdorf, Dominik and Kersting, Kristian},
  title     = {Rickrolling the Artist: Injecting Backdoors into Text Encoders for Text-to-Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4584--4596},
}
LD-ZNet: A Latent Diffusion Approach for Text-Based Image Segmentation-
[pdf]
[supp]
[bibtex]
@InProceedings{PNVR_2023_ICCV,
  author    = {PNVR, Koutilya and Singh, Bharat and Ghosh, Pallabi and Siddiquie, Behjat and Jacobs, David},
  title     = {{LD-ZNet}: A Latent Diffusion Approach for Text-Based Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4157--4168},
}
Workie-Talkie: Accelerating Federated Learning by Overlapping Computing and Communications via Contrastive Regularization-
[pdf]
[supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Rui and Wan, Qiyu and Prakash, Pavana and Zhang, Lan and Yuan, Xu and Gong, Yanmin and Fu, Xin and Pan, Miao},
  title     = {{Workie-Talkie}: Accelerating Federated Learning by Overlapping Computing and Communications via Contrastive Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16999--17009},
}
Downstream-agnostic Adversarial Examples-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Ziqi and Hu, Shengshan and Zhao, Ruizhi and Wang, Qian and Zhang, Leo Yu and Hou, Junhui and Jin, Hai},
  title     = {Downstream-agnostic Adversarial Examples},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4345--4355},
}
Late Stopping: Avoiding Confidently Learning from Mislabeled Examples-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Suqin and Feng, Lei and Liu, Tongliang},
  title     = {Late Stopping: Avoiding Confidently Learning from Mislabeled Examples},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16079--16088},
}
AerialVLN: Vision-and-Language Navigation for UAVs-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Liu_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Liu_2023_ICCV_AerialVLN,
  author    = {Liu, Shubo and Zhang, Hongsheng and Qi, Yuankai and Wang, Peng and Zhang, Yanning and Wu, Qi},
  title     = {{AerialVLN}: Vision-and-Language Navigation for {UAVs}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15384--15394},
}
On the Robustness of Open-World Test-Time Training: Self-Training with Dynamic Prototype Expansion-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Li_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Li_2023_ICCV_TestTimeTraining,
  author    = {Li, Yushu and Xu, Xun and Su, Yongyi and Jia, Kui},
  title     = {On the Robustness of Open-World Test-Time Training: Self-Training with Dynamic Prototype Expansion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11836--11846},
}
Studying How to Efficiently and Effectively Guide Models with Explanations-
[pdf]
[supp]
[bibtex]
@InProceedings{Rao_2023_ICCV,
  author    = {Rao, Sukrut and B{\"o}hle, Moritz and Parchami-Araghi, Amin and Schiele, Bernt},
  title     = {Studying How to Efficiently and Effectively Guide Models with Explanations},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1922--1933},
}
Most Important Person-Guided Dual-Branch Cross-Patch Attention for Group Affect Recognition-
[pdf]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Hongxia and Lee, Ming-Xian and Chen, Tzu-Jui and Chen, Hung-Jen and Liu, Hou-I and Shuai, Hong-Han and Cheng, Wen-Huang},
  title     = {Most Important Person-Guided Dual-Branch Cross-Patch Attention for Group Affect Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20598--20608},
}
SkeletonMAE: Graph-based Masked Autoencoder for Skeleton Sequence Pre-training-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Hong and Liu, Yang and Wei, Yushen and Li, Zhen and Li, Guanbin and Lin, Liang},
  title     = {{SkeletonMAE}: Graph-based Masked Autoencoder for Skeleton Sequence Pre-training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5606--5618},
}
Achievement-Based Training Progress Balancing for Multi-Task Learning-
[pdf]
[supp]
[bibtex]
@InProceedings{Yun_2023_ICCV,
  author    = {Yun, Hayoung and Cho, Hanjoo},
  title     = {Achievement-Based Training Progress Balancing for Multi-Task Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16935--16944},
}
Pose-Free Neural Radiance Fields via Implicit Pose Regularization-
[pdf]
[arXiv]
[bibtex]
@comment{Key was Zhang_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Zhang_2023_ICCV_PoseFree,
  author    = {Zhang, Jiahui and Zhan, Fangneng and Yu, Yingchen and Liu, Kunhao and Wu, Rongliang and Zhang, Xiaoqin and Shao, Ling and Lu, Shijian},
  title     = {Pose-Free Neural Radiance Fields via Implicit Pose Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3534--3543},
}
Self-supervised Learning to Bring Dual Reversed Rolling Shutter Images Alive-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Shang_2023_ICCV,
  author    = {Shang, Wei and Ren, Dongwei and Feng, Chaoyu and Wang, Xiaotao and Lei, Lei and Zuo, Wangmeng},
  title     = {Self-supervised Learning to Bring Dual Reversed Rolling Shutter Images Alive},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13086--13094},
}
Logic-induced Diagnostic Reasoning for Semi-supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Chen and Wang, Wenguan and Miao, Jiaxu and Yang, Yi},
  title     = {Logic-induced Diagnostic Reasoning for Semi-supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16197--16208},
}
Self-Supervised Monocular Depth Estimation by Direction-aware Cumulative Convolution Network-
[pdf]
[arXiv]
[bibtex]
@comment{Key was Han_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Han_2023_ICCV_DirectionAware,
  author    = {Han, Wencheng and Yin, Junbo and Shen, Jianbing},
  title     = {Self-Supervised Monocular Depth Estimation by Direction-aware Cumulative Convolution Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8613--8623},
}
Encyclopedic VQA: Visual Questions About Detailed Properties of Fine-Grained Categories-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Mensink_2023_ICCV,
  author    = {Mensink, Thomas and Uijlings, Jasper and Castrejon, Lluis and Goel, Arushi and Cadar, Felipe and Zhou, Howard and Sha, Fei and Araujo, Andr{\'e} and Ferrari, Vittorio},
  title     = {Encyclopedic {VQA}: Visual Questions About Detailed Properties of Fine-Grained Categories},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3113--3124},
}
Towards Understanding the Generalization of Deepfake Detectors from a Game-Theoretical View-
[pdf]
[supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Kelu and Wang, Jin and Diao, Boyu and Li, Chao},
  title     = {Towards Understanding the Generalization of Deepfake Detectors from a Game-Theoretical View},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2031--2041},
}
Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics-
[pdf]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Juntae and Jain, Mihir and Yun, Sungrack},
  title     = {Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10214--10223},
}
Physically-Plausible Illumination Distribution Estimation-
[pdf]
[bibtex]
@InProceedings{Ershov_2023_ICCV,
  author    = {Ershov, Egor and Tesalin, Vasily and Ermakov, Ivan and Brown, Michael S.},
  title     = {Physically-Plausible Illumination Distribution Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12928--12936},
}
3DPPE: 3D Point Positional Encoding for Transformer-based Multi-Camera 3D Object Detection-
[pdf]
[supp]
[bibtex]
@InProceedings{Shu_2023_ICCV,
  author    = {Shu, Changyong and Deng, Jiajun and Yu, Fisher and Liu, Yifan},
  title     = {{3DPPE}: {3D} Point Positional Encoding for Transformer-based Multi-Camera {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3580--3589},
}
Revisiting Foreground and Background Separation in Weakly-supervised Temporal Action Localization: A Clustering-based Approach-
[pdf]
[supp]
[bibtex]
@comment{Key was Liu_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Liu_2023_ICCV_Clustering,
  author    = {Liu, Qinying and Wang, Zilei and Rong, Shenghai and Li, Junjie and Zhang, Yixin},
  title     = {Revisiting Foreground and Background Separation in Weakly-supervised Temporal Action Localization: A Clustering-based Approach},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10433--10443},
}
VertexSerum: Poisoning Graph Neural Networks for Link Inference-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Ruyi and Duan, Shijin and Xu, Xiaolin and Fei, Yunsi},
  title     = {{VertexSerum}: Poisoning Graph Neural Networks for Link Inference},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4532--4541},
}
NeRF-Det: Learning Geometry-Aware Volumetric Representation for Multi-View 3D Object Detection-
[pdf]
[supp]
[bibtex]
@comment{Key was Xu_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Xu_2023_ICCV_NeRFDet,
  author    = {Xu, Chenfeng and Wu, Bichen and Hou, Ji and Tsai, Sam and Li, Ruilong and Wang, Jialiang and Zhan, Wei and He, Zijian and Vajda, Peter and Keutzer, Kurt and Tomizuka, Masayoshi},
  title     = {{NeRF-Det}: Learning Geometry-Aware Volumetric Representation for Multi-View {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23320--23330},
}
Spatio-Temporal Domain Awareness for Multi-Agent Collaborative Perception-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Kun and Yang, Dingkang and Zhang, Jingyu and Li, Mingcheng and Liu, Yang and Liu, Jing and Wang, Hanqi and Sun, Peng and Song, Liang},
  title     = {Spatio-Temporal Domain Awareness for Multi-Agent Collaborative Perception},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23383--23392},
}
LPFF: A Portrait Dataset for Face Generators Across Large Poses-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yiqian and Zhang, Jing and Fu, Hongbo and Jin, Xiaogang},
  title     = {{LPFF}: A Portrait Dataset for Face Generators Across Large Poses},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20327--20337},
}
Pseudo-label Alignment for Semi-supervised Instance Segmentation-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Jie and Chen, Chen and Cao, Liujuan and Zhang, Shengchuan and Shu, Annan and Jiang, Guannan and Ji, Rongrong},
  title     = {Pseudo-label Alignment for Semi-supervised Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16337--16347},
}
Deep Geometrized Cartoon Line Inbetweening-
[pdf]
[supp]
[bibtex]
@InProceedings{Siyao_2023_ICCV,
  author    = {Siyao, Li and Gu, Tianpei and Xiao, Weiye and Ding, Henghui and Liu, Ziwei and Loy, Chen Change},
  title     = {Deep Geometrized Cartoon Line Inbetweening},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7291--7300},
}
MixBag: Bag-Level Data Augmentation for Learning from Label Proportions-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Asanomi_2023_ICCV,
  author    = {Asanomi, Takanori and Matsuo, Shinnosuke and Suehiro, Daiki and Bise, Ryoma},
  title     = {{MixBag}: Bag-Level Data Augmentation for Learning from Label Proportions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16570--16579},
}
Effective Real Image Editing with Accelerated Iterative Diffusion Inversion-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Zhihong and Gherardi, Riccardo and Xie, Xiufeng and Huang, Stephen},
  title     = {Effective Real Image Editing with Accelerated Iterative Diffusion Inversion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15912--15921},
}
3D-Aware Neural Body Fitting for Occlusion Robust 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Zhang_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Zhang_2023_ICCV_BodyFitting,
  author    = {Zhang, Yi and Ji, Pengliang and Wang, Angtian and Mei, Jieru and Kortylewski, Adam and Yuille, Alan},
  title     = {{3D}-Aware Neural Body Fitting for Occlusion Robust {3D} Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9399--9410},
}
Chinese Text Recognition with A Pre-Trained CLIP-Like Model Through Image-IDS Aligning-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Yu_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Yu_2023_ICCV_ChineseText,
  author    = {Yu, Haiyang and Wang, Xiaocong and Li, Bin and Xue, Xiangyang},
  title     = {{Chinese} Text Recognition with A Pre-Trained {CLIP}-Like Model Through Image-{IDS} Aligning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11943--11952},
}
MatrixCity: A Large-scale City Dataset for City-scale Neural Rendering and Beyond-
[pdf]
[supp]
[bibtex]
@comment{Key was Li_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Li_2023_ICCV_MatrixCity,
  author    = {Li, Yixuan and Jiang, Lihan and Xu, Linning and Xiangli, Yuanbo and Wang, Zhenzhi and Lin, Dahua and Dai, Bo},
  title     = {{MatrixCity}: A Large-scale City Dataset for City-scale Neural Rendering and Beyond},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3205--3215},
}
LinkGAN: Linking GAN Latents to Pixels for Controllable Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Zhu_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Zhu_2023_ICCV_LinkGAN,
  author    = {Zhu, Jiapeng and Yang, Ceyuan and Shen, Yujun and Shi, Zifan and Dai, Bo and Zhao, Deli and Chen, Qifeng},
  title     = {{LinkGAN}: Linking {GAN} Latents to Pixels for Controllable Image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7656--7666},
}
Exploiting Proximity-Aware Tasks for Embodied Social Navigation-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Cancelli_2023_ICCV,
  author    = {Cancelli, Enrico and Campari, Tommaso and Serafini, Luciano and Chang, Angel X. and Ballan, Lamberto},
  title     = {Exploiting Proximity-Aware Tasks for Embodied Social Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10957--10967},
}
SVDiff: Compact Parameter Space for Diffusion Fine-Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Key was Han_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Han_2023_ICCV_SVDiff,
  author    = {Han, Ligong and Li, Yinxiao and Zhang, Han and Milanfar, Peyman and Metaxas, Dimitris and Yang, Feng},
  title     = {{SVDiff}: Compact Parameter Space for Diffusion Fine-Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7323--7334},
}
UniFace: Unified Cross-Entropy Loss for Deep Face Recognition-
[pdf]
[supp]
[bibtex]
@comment{Key was Zhou_2023_ICCV; suffixed because an earlier entry in this file already uses that key and BibTeX drops repeated keys.}
@InProceedings{Zhou_2023_ICCV_UniFace,
  author    = {Zhou, Jiancan and Jia, Xi and Li, Qiufu and Shen, Linlin and Duan, Jinming},
  title     = {{UniFace}: Unified Cross-Entropy Loss for Deep Face Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20730--20739},
}
Jumping through Local Minima: Quantization in the Loss Landscape of Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Frumkin_2023_ICCV,
  author    = {Frumkin, Natalia and Gope, Dibakar and Marculescu, Diana},
  title     = {Jumping through Local Minima: Quantization in the Loss Landscape of Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16978--16988},
}
Hierarchical Contrastive Learning for Pattern-Generalizable Image Corruption Detection-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Xin and Xu, Yifeng and Lu, Guangming and Pei, Wenjie},
  title     = {Hierarchical Contrastive Learning for Pattern-Generalizable Image Corruption Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12076--12085},
}
Learning Optical Flow from Event Camera with Rendered Dataset-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Xinglong and Luo, Kunming and Luo, Ao and Wang, Zhengning and Tan, Ping and Liu, Shuaicheng},
  title     = {Learning Optical Flow from Event Camera with Rendered Dataset},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9847--9857},
}
EPiC: Ensemble of Partial Point Clouds for Robust Classification-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Levi_2023_ICCV,
  author    = {Levi, Meir Yossef and Gilboa, Guy},
  title     = {{EPiC}: Ensemble of Partial Point Clouds for Robust Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14475--14484},
}
Distilling Large Vision-Language Model with Out-of-Distribution Generalizability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xuanlin and Fang, Yunhao and Liu, Minghua and Ling, Zhan and Tu, Zhuowen and Su, Hao}, title = {Distilling Large Vision-Language Model with Out-of-Distribution Generalizability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2492-2503} }
Cross-Modal Learning with 3D Deformable Attention for Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Sangwon and Ahn, Dasom and Ko, Byoung Chul}, title = {Cross-Modal Learning with 3D Deformable Attention for Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10265-10275} }
What do neural networks learn in image classification? A frequency shortcut perspective-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Shunxin and Veldhuis, Raymond and Brune, Christoph and Strisciuglio, Nicola}, title = {What do neural networks learn in image classification? A frequency shortcut perspective}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1433-1442} }
Tracking by 3D Model Estimation of Unknown Objects in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rozumnyi_2023_ICCV, author = {Rozumnyi, Denys and Matas, Ji\v{r}{\'\i} and Pollefeys, Marc and Ferrari, Vittorio and Oswald, Martin R.}, title = {Tracking by 3D Model Estimation of Unknown Objects in Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14086-14096} }
ScatterNeRF: Seeing Through Fog with Physically-Based Inverse Neural Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramazzina_2023_ICCV, author = {Ramazzina, Andrea and Bijelic, Mario and Walz, Stefanie and Sanvito, Alessandro and Scheuble, Dominik and Heide, Felix}, title = {ScatterNeRF: Seeing Through Fog with Physically-Based Inverse Neural Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17957-17968} }
Sigmoid Loss for Language Image Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Xiaohua and Mustafa, Basil and Kolesnikov, Alexander and Beyer, Lucas}, title = {Sigmoid Loss for Language Image Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11975-11986} }
PromptCap: Prompt-Guided Image Captioning for VQA with GPT-3-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Yushi and Hua, Hang and Yang, Zhengyuan and Shi, Weijia and Smith, Noah A. and Luo, Jiebo}, title = {PromptCap: Prompt-Guided Image Captioning for VQA with GPT-3}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2963-2975} }
Neural Video Depth Stabilizer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yiran and Shi, Min and Li, Jiaqi and Huang, Zihao and Cao, Zhiguo and Zhang, Jianming and Xian, Ke and Lin, Guosheng}, title = {Neural Video Depth Stabilizer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9466-9476} }
Learning Symmetry-Aware Geometry Correspondences for 6D Object Pose Estimation-
[pdf]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Heng and Wei, Shenxing and Shi, Dahu and Tan, Wenming and Li, Zheyang and Ren, Ye and Wei, Xing and Yang, Yi and Pu, Shiliang}, title = {Learning Symmetry-Aware Geometry Correspondences for 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14045-14054} }
TrackFlow: Multi-Object tracking with Normalizing Flows-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mancusi_2023_ICCV, author = {Mancusi, Gianluca and Panariello, Aniello and Porrello, Angelo and Fabbri, Matteo and Calderara, Simone and Cucchiara, Rita}, title = {TrackFlow: Multi-Object tracking with Normalizing Flows}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9531-9543} }
Towards Generic Image Manipulation Detection with Weakly-Supervised Self-Consistency Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Yuanhao and Luan, Tianyu and Doermann, David and Yuan, Junsong}, title = {Towards Generic Image Manipulation Detection with Weakly-Supervised Self-Consistency Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22390-22400} }
PARF: Primitive-Aware Radiance Fusion for Indoor Scene Novel View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Ying_2023_ICCV, author = {Ying, Haiyang and Jiang, Baowei and Zhang, Jinzhi and Xu, Di and Yu, Tao and Dai, Qionghai and Fang, Lu}, title = {PARF: Primitive-Aware Radiance Fusion for Indoor Scene Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17706-17716} }
DeePoint: Visual Pointing Recognition and Direction Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakamura_2023_ICCV, author = {Nakamura, Shu and Kawanishi, Yasutomo and Nobuhara, Shohei and Nishino, Ko}, title = {DeePoint: Visual Pointing Recognition and Direction Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20577-20587} }
Periodically Exchange Teacher-Student for Source-Free Object Detection-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Qipeng and Lin, Luojun and Shen, Zhifeng and Yang, Zhifeng}, title = {Periodically Exchange Teacher-Student for Source-Free Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6414-6424} }
Generating Instance-level Prompts for Rehearsal-free Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Jung_2023_ICCV, author = {Jung, Dahuin and Han, Dongyoon and Bang, Jihwan and Song, Hwanjun}, title = {Generating Instance-level Prompts for Rehearsal-free Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11847-11857} }
Deformer: Dynamic Fusion Transformer for Robust Hand Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Qichen and Liu, Xingyu and Xu, Ran and Niebles, Juan Carlos and Kitani, Kris M.}, title = {Deformer: Dynamic Fusion Transformer for Robust Hand Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23600-23611} }
HSE: Hybrid Species Embedding for Deep Metric Learning-
[pdf]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Bailin and Sun, Haoqiang and Li, Frederick W. B. and Chen, Zheng and Cai, Jianlu and Song, Chao}, title = {HSE: Hybrid Species Embedding for Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11047-11057} }
Online Continual Learning on Hierarchical Label Expansion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Byung Hyun and Jung, Okchul and Choi, Jonghyun and Chun, Se Young}, title = {Online Continual Learning on Hierarchical Label Expansion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11761-11770} }
iDAG: Invariant DAG Searching for Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zenan and Wang, Haobo and Zhao, Junbo and Zheng, Nenggan}, title = {iDAG: Invariant DAG Searching for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19169-19179} }
Spacetime Surface Regularization for Neural Dynamic Scene Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Choe_2023_ICCV, author = {Choe, Jaesung and Choy, Christopher and Park, Jaesik and Kweon, In So and Anandkumar, Anima}, title = {Spacetime Surface Regularization for Neural Dynamic Scene Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17871-17881} }
GasMono: Geometry-Aided Self-Supervised Monocular Depth Estimation for Indoor Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Chaoqiang and Poggi, Matteo and Tosi, Fabio and Zhou, Lei and Sun, Qiyu and Tang, Yang and Mattoccia, Stefano}, title = {GasMono: Geometry-Aided Self-Supervised Monocular Depth Estimation for Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16209-16220} }
3D Motion Magnification: Visualizing Subtle Motions from Time-Varying Radiance Fields-
[pdf]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Brandon Y. and Alzayer, Hadi and Rubinstein, Michael and Freeman, William T. and Huang, Jia-bin}, title = {3D Motion Magnification: Visualizing Subtle Motions from Time-Varying Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9837-9846} }
Learning to Transform for Generalizable Instance-wise Invariance-
[pdf]
[bibtex]@InProceedings{Singhal_2023_ICCV, author = {Singhal, Utkarsh and Esteves, Carlos and Makadia, Ameesh and Yu, Stella X.}, title = {Learning to Transform for Generalizable Instance-wise Invariance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6211-6221} }
Audio-Visual Deception Detection: DOLOS Dataset and Parameter-Efficient Crossmodal Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Xiaobao and Selvaraj, Nithish Muthuchamy and Yu, Zitong and Kong, Adams Wai-Kin and Shen, Bingquan and Kot, Alex}, title = {Audio-Visual Deception Detection: DOLOS Dataset and Parameter-Efficient Crossmodal Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22135-22145} }
Multiple Instance Learning Framework with Masked Hard Instance Mining for Whole Slide Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Wenhao and Huang, Sheng and Zhang, Xiaoxian and Zhou, Fengtao and Zhang, Yi and Liu, Bo}, title = {Multiple Instance Learning Framework with Masked Hard Instance Mining for Whole Slide Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4078-4087} }
Unsupervised Compositional Concepts Discovery with Text-to-Image Generative Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Nan and Du, Yilun and Li, Shuang and Tenenbaum, Joshua B. and Torralba, Antonio}, title = {Unsupervised Compositional Concepts Discovery with Text-to-Image Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2085-2095} }
Partition-And-Debias: Agnostic Biases Mitigation via a Mixture of Biases-Specific Experts-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiaxuan and Vo, Duc Minh and Nakayama, Hideki}, title = {Partition-And-Debias: Agnostic Biases Mitigation via a Mixture of Biases-Specific Experts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4924-4934} }
Spatial Self-Distillation for Object Detection with Inaccurate Bounding Boxes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Di and Chen, Pengfei and Yu, Xuehui and Li, Guorong and Han, Zhenjun and Jiao, Jianbin}, title = {Spatial Self-Distillation for Object Detection with Inaccurate Bounding Boxes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6855-6865} }
CC3D: Layout-Conditioned Generation of Compositional 3D Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bahmani_2023_ICCV, author = {Bahmani, Sherwin and Park, Jeong Joon and Paschalidou, Despoina and Yan, Xingguang and Wetzstein, Gordon and Guibas, Leonidas and Tagliasacchi, Andrea}, title = {CC3D: Layout-Conditioned Generation of Compositional 3D Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7171-7181} }
Alleviating Catastrophic Forgetting of Incremental Object Detection via Within-Class and Between-Class Knowledge Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Kang_2023_ICCV, author = {Kang, Mengxue and Zhang, Jinpeng and Zhang, Jinming and Wang, Xiashuang and Chen, Yang and Ma, Zhe and Huang, Xuhui}, title = {Alleviating Catastrophic Forgetting of Incremental Object Detection via Within-Class and Between-Class Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18894-18904} }
TextPSG: Panoptic Scene Graph Generation from Textual Descriptions-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Chengyang and Shen, Yikang and Chen, Zhenfang and Ding, Mingyu and Gan, Chuang}, title = {TextPSG: Panoptic Scene Graph Generation from Textual Descriptions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2839-2850} }
Revisiting the Parameter Efficiency of Adapters from the Perspective of Precision Redundancy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jie_2023_ICCV, author = {Jie, Shibo and Wang, Haoqing and Deng, Zhi-Hong}, title = {Revisiting the Parameter Efficiency of Adapters from the Perspective of Precision Redundancy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17217-17226} }
EMQ: Evolving Training-free Proxies for Automated Mixed Precision Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Peijie and Li, Lujun and Wei, Zimian and Niu, Xin and Tian, Zhiliang and Pan, Hengyue}, title = {EMQ: Evolving Training-free Proxies for Automated Mixed Precision Quantization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17076-17086} }
Face Clustering via Graph Convolutional Networks with Confidence Edges-
[pdf]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Yang and Ge, Zhiwei and Luo, Yuhao and Liu, Lin and Xu, Sulong}, title = {Face Clustering via Graph Convolutional Networks with Confidence Edges}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20990-20999} }
Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Zhongyan and Wang, Lei and Zhou, Luping and Koniusz, Piotr}, title = {Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11250-11259} }
Cross-modal Latent Space Alignment for Image to Avatar Translation-
[pdf]
[supp]
[bibtex]@InProceedings{de_Guevara_2023_ICCV, author = {de Guevara, Manuel Ladron and Echevarria, Jose and Li, Yijun and Hold-Geoffroy, Yannick and Smith, Cameron and Ito, Daichi}, title = {Cross-modal Latent Space Alignment for Image to Avatar Translation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {520-529} }
Inspecting the Geographical Representativeness of Images from Text-to-Image Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Basu_2023_ICCV, author = {Basu, Abhipsa and Babu, R. Venkatesh and Pruthi, Danish}, title = {Inspecting the Geographical Representativeness of Images from Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5136-5147} }
Space-time Prompting for Video Class-incremental Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Pei_2023_ICCV, author = {Pei, Yixuan and Qing, Zhiwu and Zhang, Shiwei and Wang, Xiang and Zhang, Yingya and Zhao, Deli and Qian, Xueming}, title = {Space-time Prompting for Video Class-incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11932-11942} }
Multimodal Garment Designer: Human-Centric Latent Diffusion Models for Fashion Image Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Baldrati_2023_ICCV, author = {Baldrati, Alberto and Morelli, Davide and Cartella, Giuseppe and Cornia, Marcella and Bertini, Marco and Cucchiara, Rita}, title = {Multimodal Garment Designer: Human-Centric Latent Diffusion Models for Fashion Image Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23393-23402} }
Time-to-Contact Map by Joint Estimation of Up-to-Scale Inverse Depth and Global Motion using a Single Event Camera-
[pdf]
[supp]
[bibtex]@InProceedings{Nunes_2023_ICCV, author = {Nunes, Urbano Miguel and Perrinet, Laurent Udo and Ieng, Sio-Hoi}, title = {Time-to-Contact Map by Joint Estimation of Up-to-Scale Inverse Depth and Global Motion using a Single Event Camera}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23653-23663} }
Sparse Sampling Transformer with Uncertainty-Driven Ranking for Unified Removal of Raindrops and Rain Streaks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Sixiang and Ye, Tian and Bai, Jinbin and Chen, Erkang and Shi, Jun and Zhu, Lei}, title = {Sparse Sampling Transformer with Uncertainty-Driven Ranking for Unified Removal of Raindrops and Rain Streaks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13106-13117} }
A Benchmark for Chinese-English Scene Text Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Jianqi and Liang, Zhetong and Xiang, Wangmeng and Yang, Xi and Zhang, Lei}, title = {A Benchmark for Chinese-English Scene Text Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19452-19461} }
HSR-Diff: Hyperspectral Image Super-Resolution via Conditional Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Chanyue and Wang, Dong and Bai, Yunpeng and Mao, Hanyu and Li, Ying and Shen, Qiang}, title = {HSR-Diff: Hyperspectral Image Super-Resolution via Conditional Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7083-7093} }
Replay: Multi-modal Multi-view Acted Videos for Casual Holography-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shapovalov_2023_ICCV, author = {Shapovalov, Roman and Kleiman, Yanir and Rocco, Ignacio and Novotny, David and Vedaldi, Andrea and Chen, Changan and Kokkinos, Filippos and Graham, Ben and Neverova, Natalia}, title = {Replay: Multi-modal Multi-view Acted Videos for Casual Holography}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20338-20348} }
Advancing Example Exploitation Can Alleviate Critical Challenges in Adversarial Training-
[pdf]
[supp]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Yao and Li, Yun and Han, Keji and Zhu, Junyi and Long, Xianzhong}, title = {Advancing Example Exploitation Can Alleviate Critical Challenges in Adversarial Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {145-154} }
Affine-Consistent Transformer for Multi-Class Cell Nuclei Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Junjia and Li, Haofeng and Wan, Xiang and Li, Guanbin}, title = {Affine-Consistent Transformer for Multi-Class Cell Nuclei Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21384-21393} }
Removing Anomalies as Noises for Industrial Defect Localization-
[pdf]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Fanbin and Yao, Xufeng and Fu, Chi-Wing and Jia, Jiaya}, title = {Removing Anomalies as Noises for Industrial Defect Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16166-16175} }
GPGait: Generalized Pose-based Gait Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Yang and Meng, Shibei and Hou, Saihui and Hu, Xuecai and Huang, Yongzhen}, title = {GPGait: Generalized Pose-based Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19595-19604} }
Stable and Causal Inference for Discriminative Self-supervised Deep Visual Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yuewei and Li, Hai and Chen, Yiran}, title = {Stable and Causal Inference for Discriminative Self-supervised Deep Visual Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16109-16120} }
ShiftNAS: Improving One-shot NAS via Probability Shift-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Mingyang and Yu, Xinyi and Zhao, Haodong and Ou, Linlin}, title = {ShiftNAS: Improving One-shot NAS via Probability Shift}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5919-5928} }
Semantic Attention Flow Fields for Monocular Dynamic Scene Decomposition-
[pdf]
[supp]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Yiqing and Laidlaw, Eliot and Meyerowitz, Alexander and Sridhar, Srinath and Tompkin, James}, title = {Semantic Attention Flow Fields for Monocular Dynamic Scene Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21797-21806} }
LexLIP: Lexicon-Bottlenecked Language-Image Pre-Training for Large-Scale Image-Text Sparse Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Ziyang and Zhao, Pu and Xu, Can and Geng, Xiubo and Shen, Tao and Tao, Chongyang and Ma, Jing and Lin, Qingwei and Jiang, Daxin}, title = {LexLIP: Lexicon-Bottlenecked Language-Image Pre-Training for Large-Scale Image-Text Sparse Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11206-11217} }
A Fast Unified System for 3D Object Detection and Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Heitzinger_2023_ICCV, author = {Heitzinger, Thomas and Kampel, Martin}, title = {A Fast Unified System for 3D Object Detection and Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17044-17054} }
Adaptive Testing of Computer Vision Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Irena and Ilharco, Gabriel and Lundberg, Scott and Ribeiro, Marco Tulio}, title = {Adaptive Testing of Computer Vision Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4003-4014} }
LFS-GAN: Lifelong Few-Shot Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Seo_2023_ICCV, author = {Seo, Juwon and Kang, Ji-Su and Park, Gyeong-Moon}, title = {LFS-GAN: Lifelong Few-Shot Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11356-11366} }
AIDE: A Vision-Driven Multi-View, Multi-Modal, Multi-Tasking Dataset for Assistive Driving Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Dingkang and Huang, Shuai and Xu, Zhi and Li, Zhenpeng and Wang, Shunli and Li, Mingcheng and Wang, Yuzheng and Liu, Yang and Yang, Kun and Chen, Zhaoyu and Wang, Yan and Liu, Jing and Zhang, Peixuan and Zhai, Peng and Zhang, Lihua}, title = {AIDE: A Vision-Driven Multi-View, Multi-Modal, Multi-Tasking Dataset for Assistive Driving Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20459-20470} }
Feature Proliferation -- the "Cancer" in StyleGAN and its Treatments-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Shuang and Liang, Yuanbang and Wu, Jing and Lai, Yu-Kun and Qin, Yipeng}, title = {Feature Proliferation -- the ``Cancer'' in StyleGAN and its Treatments}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2360-2370} }
Self-Supervised Character-to-Character Distillation for Text Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Guan_2023_ICCV, author = {Guan, Tongkun and Shen, Wei and Yang, Xue and Feng, Qi and Jiang, Zekun and Yang, Xiaokang}, title = {Self-Supervised Character-to-Character Distillation for Text Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19473-19484} }
MixCycle: Mixup Assisted Semi-Supervised 3D Single Object Tracking with Cycle Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Qiao and Yang, Jiaqi and Sun, Kun and Zhang, Chu'ai and Zhang, Yanning and Salzmann, Mathieu}, title = {MixCycle: Mixup Assisted Semi-Supervised 3D Single Object Tracking with Cycle Consistency}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13956-13966} }
Multi-Label Self-Supervised Learning with Scene Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Ke and Fu, Minghao and Wu, Jianxin}, title = {Multi-Label Self-Supervised Learning with Scene Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6694-6703} }
Domain Adaptive Few-Shot Open-Set Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pal_2023_ICCV, author = {Pal, Debabrata and More, Deeptej and Bhargav, Sai and Tamboli, Dipesh and Aggarwal, Vaneet and Banerjee, Biplab}, title = {Domain Adaptive Few-Shot Open-Set Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18831-18840} }
DiffFacto: Controllable Part-Based 3D Point Cloud Generation with Cross Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakayama_2023_ICCV, author = {Nakayama, George Kiyohiro and Uy, Mikaela Angelina and Huang, Jiahui and Hu, Shi-Min and Li, Ke and Guibas, Leonidas}, title = {DiffFacto: Controllable Part-Based 3D Point Cloud Generation with Cross Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14257-14267} }
Interactive Class-Agnostic Object Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Yifeng and Ranjan, Viresh and Hoai, Minh}, title = {Interactive Class-Agnostic Object Counting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22312-22322} }
Spatio-temporal Prompting Network for Robust Video Feature Extraction-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Guanxiong and Wang, Chi and Zhang, Zhaoyu and Deng, Jiankang and Zafeiriou, Stefanos and Hua, Yang}, title = {Spatio-temporal Prompting Network for Robust Video Feature Extraction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13587-13597} }
Enhancing Fine-Tuning Based Backdoor Defense with Sharpness-Aware Minimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Mingli and Wei, Shaokui and Shen, Li and Fan, Yanbo and Wu, Baoyuan}, title = {Enhancing Fine-Tuning Based Backdoor Defense with Sharpness-Aware Minimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4466-4477} }
Deep Geometry-Aware Camera Self-Calibration from Video-
[pdf]
[supp]
[bibtex]@InProceedings{Hagemann_2023_ICCV, author = {Hagemann, Annika and Knorr, Moritz and Stiller, Christoph}, title = {Deep Geometry-Aware Camera Self-Calibration from Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3438-3448} }
A Simple Vision Transformer for Weakly Semi-supervised 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Dingyuan and Liang, Dingkang and Zou, Zhikang and Li, Jingyu and Ye, Xiaoqing and Liu, Zhe and Tan, Xiao and Bai, Xiang}, title = {A Simple Vision Transformer for Weakly Semi-supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8373-8383} }
Estimator Meets Equilibrium Perspective: A Rectified Straight Through Estimator for Binary Neural Networks Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Xiao-Ming and Zheng, Dian and Liu, Zuhao and Zheng, Wei-Shi}, title = {Estimator Meets Equilibrium Perspective: A Rectified Straight Through Estimator for Binary Neural Networks Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17055-17064} }
Exploring Object-Centric Temporal Modeling for Efficient Multi-View 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Shihao and Liu, Yingfei and Wang, Tiancai and Li, Ying and Zhang, Xiangyu}, title = {Exploring Object-Centric Temporal Modeling for Efficient Multi-View 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3621-3631} }
Open-domain Visual Entity Recognition: Towards Recognizing Millions of Wikipedia Entities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Hexiang and Luan, Yi and Chen, Yang and Khandelwal, Urvashi and Joshi, Mandar and Lee, Kenton and Toutanova, Kristina and Chang, Ming-Wei}, title = {Open-domain Visual Entity Recognition: Towards Recognizing Millions of Wikipedia Entities}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12065-12075} }
MedKLIP: Medical Knowledge Enhanced Language-Image Pre-Training for X-ray Diagnosis-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Chaoyi and Zhang, Xiaoman and Zhang, Ya and Wang, Yanfeng and Xie, Weidi}, title = {MedKLIP: Medical Knowledge Enhanced Language-Image Pre-Training for X-ray Diagnosis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21372-21383} }
Automated Knowledge Distillation via Monte Carlo Tree Search-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Lujun and Dong, Peijie and Wei, Zimian and Yang, Ya}, title = {Automated Knowledge Distillation via Monte Carlo Tree Search}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17413-17424} }
EmoTalk: Speech-Driven Emotional Disentanglement for 3D Face Animation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Ziqiao and Wu, Haoyu and Song, Zhenbo and Xu, Hao and Zhu, Xiangyu and He, Jun and Liu, Hongyan and Fan, Zhaoxin}, title = {EmoTalk: Speech-Driven Emotional Disentanglement for 3D Face Animation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20687-20697} }
A Soft Nearest-Neighbor Framework for Continual Semi-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2023_ICCV, author = {Kang, Zhiqi and Fini, Enrico and Nabi, Moin and Ricci, Elisa and Alahari, Karteek}, title = {A Soft Nearest-Neighbor Framework for Continual Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11868-11877} }
Text-Conditioned Sampling Framework for Text-to-Image Generation with Masked Generative Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jaewoong and Jang, Sangwon and Jo, Jaehyeong and Yoon, Jaehong and Kim, Yunji and Kim, Jin-Hwa and Ha, Jung-Woo and Hwang, Sung Ju}, title = {Text-Conditioned Sampling Framework for Text-to-Image Generation with Masked Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23252-23262} }
ScanNet++: A High-Fidelity Dataset of 3D Indoor Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Yeshwanth_2023_ICCV, author = {Yeshwanth, Chandan and Liu, Yueh-Cheng and Nie{\ss}ner, Matthias and Dai, Angela}, title = {ScanNet++: A High-Fidelity Dataset of 3D Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12-22} }
Minimal Solutions to Uncalibrated Two-view Geometry with Known Epipoles-
[pdf]
[bibtex]@InProceedings{Nakano_2023_ICCV, author = {Nakano, Gaku}, title = {Minimal Solutions to Uncalibrated Two-view Geometry with Known Epipoles}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13361-13370} }
Improving Diversity in Zero-Shot GAN Adaptation with Semantic Variations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeon_2023_ICCV, author = {Jeon, Seogkyu and Liu, Bei and Lee, Pilhyeon and Hong, Kibeom and Fu, Jianlong and Byun, Hyeran}, title = {Improving Diversity in Zero-Shot GAN Adaptation with Semantic Variations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7258-7267} }
Context-Aware Planning and Environment-Aware Memory for Instruction Following Embodied Agents-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Byeonghwi and Kim, Jinyeon and Kim, Yuyeong and Min, Cheolhong and Choi, Jonghyun}, title = {Context-Aware Planning and Environment-Aware Memory for Instruction Following Embodied Agents}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10936-10946} }
Vox-E: Text-Guided Voxel Editing of 3D Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Sella_2023_ICCV, author = {Sella, Etai and Fiebelman, Gal and Hedman, Peter and Averbuch-Elor, Hadar}, title = {Vox-E: Text-Guided Voxel Editing of 3D Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {430-440} }
Inverse Problem Regularization with Hierarchical Variational Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Prost_2023_ICCV, author = {Prost, Jean and Houdard, Antoine and Almansa, Andr\'es and Papadakis, Nicolas}, title = {Inverse Problem Regularization with Hierarchical Variational Autoencoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22894-22905} }
Unpaired Multi-domain Attribute Translation of 3D Facial Shapes with a Square and Symmetric Geometric Map-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Zhenfeng and Zhang, Zhiheng and Yang, Shuang and Zhong, Chongyang and Cao, Min and Xia, Shihong}, title = {Unpaired Multi-domain Attribute Translation of 3D Facial Shapes with a Square and Symmetric Geometric Map}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20828-20838} }
Passive Ultra-Wideband Single-Photon Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Mian and Nousias, Sotiris and Gulve, Rahul and Lindell, David B. and Kutulakos, Kiriakos N.}, title = {Passive Ultra-Wideband Single-Photon Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8135-8146} }
Template Inversion Attack against Face Recognition Systems using 3D Face Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Shahreza_2023_ICCV, author = {Shahreza, Hatef Otroshi and Marcel, S\'ebastien}, title = {Template Inversion Attack against Face Recognition Systems using 3D Face Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19662-19672} }
ETran: Energy-Based Transferability Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gholami_2023_ICCV, author = {Gholami, Mohsen and Akbari, Mohammad and Wang, Xinglu and Kamranian, Behnam and Zhang, Yong}, title = {ETran: Energy-Based Transferability Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18613-18622} }
Predict to Detect: Prediction-guided 3D Object Detection using Sequential Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Sanmin and Kim, Youngseok and Lee, In-Jae and Kum, Dongsuk}, title = {Predict to Detect: Prediction-guided 3D Object Detection using Sequential Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18057-18066} }
Unilaterally Aggregated Contrastive Learning with Hierarchical Augmentation for Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Guodong and Wang, Yunhong and Qin, Jie and Zhang, Dongming and Bao, Xiuguo and Huang, Di}, title = {Unilaterally Aggregated Contrastive Learning with Hierarchical Augmentation for Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6888-6897} }
Learning Image-Adaptive Codebooks for Class-Agnostic Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Kechun and Jiang, Yitong and Choi, Inchang and Gu, Jinwei}, title = {Learning Image-Adaptive Codebooks for Class-Agnostic Image Restoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5373-5383} }
3D Segmentation of Humans in Point Clouds with Synthetic Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Takmaz_2023_ICCV, author = {Takmaz, Ay\c{c}a and Schult, Jonas and Kaftan, Irem and Ak\c{c}ay, Mertcan and Leibe, Bastian and Sumner, Robert and Engelmann, Francis and Tang, Siyu}, title = {3D Segmentation of Humans in Point Clouds with Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1292-1304} }
Mastering Spatial Graph Prediction of Road Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sotiris_2023_ICCV, author = {Anagnostidis, Sotiris and Lucchi, Aurelien and Hofmann, Thomas}, title = {Mastering Spatial Graph Prediction of Road Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5408-5418} }
IDiff-Face: Synthetic-based Face Recognition through Fizzy Identity-Conditioned Diffusion Model-
[pdf]
[bibtex]@InProceedings{Boutros_2023_ICCV, author = {Boutros, Fadi and Grebe, Jonas Henry and Kuijper, Arjan and Damer, Naser}, title = {IDiff-Face: Synthetic-based Face Recognition through Fizzy Identity-Conditioned Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19650-19661} }
Deep Video Demoireing via Compact Invertible Dyadic Decomposition-
[pdf]
[supp]
[bibtex]@InProceedings{Quan_2023_ICCV, author = {Quan, Yuhui and Huang, Haoran and He, Shengfeng and Xu, Ruotao}, title = {Deep Video Demoireing via Compact Invertible Dyadic Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12677-12686} }
Rethinking Multi-Contrast MRI Super-Resolution: Rectangle-Window Cross-Attention Transformer and Arbitrary-Scale Upsampling-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Guangyuan and Zhao, Lei and Sun, Jiakai and Lan, Zehua and Zhang, Zhanjie and Chen, Jiafu and Lin, Zhijie and Lin, Huaizhong and Xing, Wei}, title = {Rethinking Multi-Contrast MRI Super-Resolution: Rectangle-Window Cross-Attention Transformer and Arbitrary-Scale Upsampling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21230-21240} }
Domain Generalization via Rationale Invariance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Liang and Zhang, Yong and Song, Yibing and van den Hengel, Anton and Liu, Lingqiao}, title = {Domain Generalization via Rationale Invariance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1751-1760} }
ProbVLM: Probabilistic Adapter for Frozen Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Upadhyay_2023_ICCV, author = {Upadhyay, Uddeshya and Karthik, Shyamgopal and Mancini, Massimiliano and Akata, Zeynep}, title = {ProbVLM: Probabilistic Adapter for Frozen Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1899-1910} }
Towards Open-Set Test-Time Adaptation Utilizing the Wisdom of Crowds in Entropy Minimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jungsoo and Das, Debasmit and Choo, Jaegul and Choi, Sungha}, title = {Towards Open-Set Test-Time Adaptation Utilizing the Wisdom of Crowds in Entropy Minimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16380-16389} }
Scene Graph Contrastive Learning for Embodied Navigation-
[pdf]
[supp]
[bibtex]@InProceedings{Singh_2023_ICCV, author = {Singh, Kunal Pratap and Salvador, Jordi and Weihs, Luca and Kembhavi, Aniruddha}, title = {Scene Graph Contrastive Learning for Embodied Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10884-10894} }
Long-Range Grouping Transformer for Multi-View 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Liying and Zhu, Zhenwei and Lin, Xuxin and Nong, Jian and Liang, Yanyan}, title = {Long-Range Grouping Transformer for Multi-View 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18257-18267} }
Latent-OFER: Detect, Mask, and Reconstruct with Latent Vectors for Occluded Facial Expression Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Isack and Lee, Eungi and Yoo, Seok Bong}, title = {Latent-OFER: Detect, Mask, and Reconstruct with Latent Vectors for Occluded Facial Expression Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1536-1546} }
DenseShift: Towards Accurate and Efficient Low-Bit Power-of-Two Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xinlin and Liu, Bang and Yang, Rui Heng and Courville, Vanessa and Xing, Chao and Nia, Vahid Partovi}, title = {DenseShift: Towards Accurate and Efficient Low-Bit Power-of-Two Quantization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17010-17020} }
Preparing the Future for Continual Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Zihan and Wang, Zilei and Zhang, Yixin}, title = {Preparing the Future for Continual Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11910-11920} }
Efficient Computation Sharing for Multi-Task Visual Scene Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shoouri_2023_ICCV, author = {Shoouri, Sara and Yang, Mingyu and Fan, Zichen and Kim, Hun-Seok}, title = {Efficient Computation Sharing for Multi-Task Visual Scene Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17130-17141} }
Self-supervised Cross-view Representation Reconstruction for Change Captioning-
[pdf]
[supp]
[bibtex]@InProceedings{Tu_2023_ICCV, author = {Tu, Yunbin and Li, Liang and Su, Li and Zha, Zheng-Jun and Yan, Chenggang and Huang, Qingming}, title = {Self-supervised Cross-view Representation Reconstruction for Change Captioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2805-2815} }
Unify, Align and Refine: Multi-Level Semantic Alignment for Radiology Report Generation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yaowei and Yang, Bang and Cheng, Xuxin and Zhu, Zhihong and Li, Hongxiang and Zou, Yuexian}, title = {Unify, Align and Refine: Multi-Level Semantic Alignment for Radiology Report Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2863-2874} }
Synthesizing Diverse Human Motions in 3D Indoor Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Kaifeng and Zhang, Yan and Wang, Shaofei and Beeler, Thabo and Tang, Siyu}, title = {Synthesizing Diverse Human Motions in 3D Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14738-14749} }
Deep Optics for Video Snapshot Compressive Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ping and Wang, Lishun and Yuan, Xin}, title = {Deep Optics for Video Snapshot Compressive Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10646-10656} }
DDIT: Semantic Scene Completion via Deformable Deep Implicit Templates-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Haoang and Dong, Jinhu and Wen, Binghui and Gao, Ming and Huang, Tianyu and Liu, Yun-Hui and Cremers, Daniel}, title = {DDIT: Semantic Scene Completion via Deformable Deep Implicit Templates}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21894-21904} }
Joint Demosaicing and Deghosting of Time-Varying Exposures for Single-Shot HDR Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Jungwoo and Kim, Min H.}, title = {Joint Demosaicing and Deghosting of Time-Varying Exposures for Single-Shot HDR Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12292-12301} }
Scene-Aware Feature Matching-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Xiaoyong and Yan, Yaping and Wei, Tong and Du, Songlin}, title = {Scene-Aware Feature Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3704-3713} }
FDViT: Improve the Hierarchical Architecture of Vision Transformer-
[pdf]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yixing and Li, Chao and Li, Dong and Sheng, Xiao and Jiang, Fan and Tian, Lu and Sirasao, Ashish}, title = {FDViT: Improve the Hierarchical Architecture of Vision Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5950-5960} }
Tuning Pre-trained Model via Moment Probing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Mingze and Wang, Qilong and Lin, Zhenyi and Zhu, Pengfei and Hu, Qinghua and Zhou, Jingbo}, title = {Tuning Pre-trained Model via Moment Probing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11803-11813} }
Attention Where It Matters: Rethinking Visual Document Understanding with Selective Region Concentration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Haoyu and Bao, Changcun and Liu, Chaohu and Chen, Huang and Yin, Kun and Liu, Hao and Liu, Yinsong and Jiang, Deqiang and Sun, Xing}, title = {Attention Where It Matters: Rethinking Visual Document Understanding with Selective Region Concentration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19517-19527} }
Task Agnostic Restoration of Natural Video Dynamics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ali_2023_ICCV, author = {Ali, Muhammad Kashif and Kim, Dongjin and Kim, Tae Hyun}, title = {Task Agnostic Restoration of Natural Video Dynamics}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13534-13544} }
TMR: Text-to-Motion Retrieval Using Contrastive 3D Human Motion Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Petrovich_2023_ICCV, author = {Petrovich, Mathis and Black, Michael J. and Varol, G\"ul}, title = {TMR: Text-to-Motion Retrieval Using Contrastive 3D Human Motion Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9488-9497} }
3D Neural Embedding Likelihood: Probabilistic Inverse Graphics for Robust 6D Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Guangyao and Gothoskar, Nishad and Wang, Lirui and Tenenbaum, Joshua B. and Gutfreund, Dan and L\'azaro-Gredilla, Miguel and George, Dileep and Mansinghka, Vikash K.}, title = {3D Neural Embedding Likelihood: Probabilistic Inverse Graphics for Robust 6D Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21625-21636} }
Towards Robust Model Watermark via Reducing Parametric Vulnerability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gan_2023_ICCV, author = {Gan, Guanhao and Li, Yiming and Wu, Dongxian and Xia, Shu-Tao}, title = {Towards Robust Model Watermark via Reducing Parametric Vulnerability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4751-4761} }
SupFusion: Supervised LiDAR-Camera Fusion for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qin_2023_ICCV, author = {Qin, Yiran and Wang, Chaoqun and Kang, Zijian and Ma, Ningning and Li, Zhen and Zhang, Ruimao}, title = {SupFusion: Supervised LiDAR-Camera Fusion for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22014-22024} }
EMMN: Emotional Motion Memory Network for Audio-driven Emotional Talking Face Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Tan_2023_ICCV, author = {Tan, Shuai and Ji, Bin and Pan, Ye}, title = {EMMN: Emotional Motion Memory Network for Audio-driven Emotional Talking Face Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22146-22156} }
Rethinking Vision Transformers for MobileNet Size and Speed-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yanyu and Hu, Ju and Wen, Yang and Evangelidis, Georgios and Salahi, Kamyar and Wang, Yanzhi and Tulyakov, Sergey and Ren, Jian}, title = {Rethinking Vision Transformers for MobileNet Size and Speed}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16889-16900} }
Implicit Identity Representation Conditioned Memory Compensation Network for Talking Head video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Fa-Ting and Xu, Dan}, title = {Implicit Identity Representation Conditioned Memory Compensation Network for Talking Head video Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23062-23072} }
SINC: Self-Supervised In-Context Learning for Vision-Language Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yi-Syuan and Song, Yun-Zhu and Yeo, Cheng Yu and Liu, Bei and Fu, Jianlong and Shuai, Hong-Han}, title = {SINC: Self-Supervised In-Context Learning for Vision-Language Tasks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15430-15442} }
LEA2: A Lightweight Ensemble Adversarial Attack via Non-overlapping Vulnerable Frequency Regions-
[pdf]
[supp]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Yaguan and He, Shuke and Zhao, Chenyu and Sha, Jiaqiang and Wang, Wei and Wang, Bin}, title = {LEA2: A Lightweight Ensemble Adversarial Attack via Non-overlapping Vulnerable Frequency Regions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4510-4521} }
Chupa: Carving 3D Clothed Humans from Skinned Shape Priors using 2D Diffusion Probabilistic Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Byungjun and Kwon, Patrick and Lee, Kwangho and Lee, Myunggi and Han, Sookwan and Kim, Daesik and Joo, Hanbyul}, title = {Chupa: Carving 3D Clothed Humans from Skinned Shape Priors using 2D Diffusion Probabilistic Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15965-15976} }
Unsupervised Domain Adaptive Detection with Network Stability Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Wenzhang and Fan, Heng and Luo, Tiejian and Zhang, Libo}, title = {Unsupervised Domain Adaptive Detection with Network Stability Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6986-6995} }
Learning a Room with the Occ-SDF Hybrid: Signed Distance Function Mingled with Occupancy Aids Scene Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lyu_2023_ICCV, author = {Lyu, Xiaoyang and Dai, Peng and Li, Zizhang and Yan, Dongyu and Lin, Yi and Peng, Yifan and Qi, Xiaojuan}, title = {Learning a Room with the Occ-SDF Hybrid: Signed Distance Function Mingled with Occupancy Aids Scene Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8940-8950} }
Cloth2Body: Generating 3D Human Body Mesh from 2D Clothing-
[pdf]
[bibtex]@InProceedings{Dai_2023_ICCV, author = {Dai, Lu and Ma, Liqian and Qian, Shenhan and Liu, Hao and Liu, Ziwei and Xiong, Hui}, title = {Cloth2Body: Generating 3D Human Body Mesh from 2D Clothing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15007-15017} }
Spatially and Spectrally Consistent Deep Functional Maps-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Mingze and Mao, Shiwei and Jiang, Puhua and Ovsjanikov, Maks and Huang, Ruqi}, title = {Spatially and Spectrally Consistent Deep Functional Maps}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14497-14507} }
Sparse Point Guided 3D Lane Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Yao_2023_ICCV, author = {Yao, Chengtang and Yu, Lidong and Wu, Yuwei and Jia, Yunde}, title = {Sparse Point Guided 3D Lane Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8363-8372} }
Event-based Temporally Dense Optical Flow Estimation with Sequential Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ponghiran_2023_ICCV, author = {Ponghiran, Wachirawit and Liyanagedera, Chamika Mihiranga and Roy, Kaushik}, title = {Event-based Temporally Dense Optical Flow Estimation with Sequential Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9827-9836} }
Going Beyond Nouns With Vision & Language Models Using Synthetic Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cascante-Bonilla_2023_ICCV, author = {Cascante-Bonilla, Paola and Shehada, Khaled and Smith, James Seale and Doveh, Sivan and Kim, Donghyun and Panda, Rameswar and Varol, G\"ul and Oliva, Aude and Ordonez, Vicente and Feris, Rogerio and Karlinsky, Leonid}, title = {Going Beyond Nouns With Vision \& Language Models Using Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20155-20165} }
Continual Zero-Shot Learning through Semantically Guided Generative Random Walks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Wenxuan and Janson, Paul and Yi, Kai and Skorokhodov, Ivan and Elhoseiny, Mohamed}, title = {Continual Zero-Shot Learning through Semantically Guided Generative Random Walks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11574-11585} }
Foreground-Background Distribution Modeling Transformer for Visual Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Dawei and He, Jianfeng and Ma, Yinchao and Yu, Qianjin and Zhang, Tianzhu}, title = {Foreground-Background Distribution Modeling Transformer for Visual Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10117-10127} }
MeViS: A Large-scale Benchmark for Video Segmentation with Motion Expressions-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV, author = {Ding, Henghui and Liu, Chang and He, Shuting and Jiang, Xudong and Loy, Chen Change}, title = {MeViS: A Large-scale Benchmark for Video Segmentation with Motion Expressions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2694-2703} }
OPERA: Omni-Supervised Representation Learning with Hierarchical Supervisions-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Chengkun and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen}, title = {OPERA: Omni-Supervised Representation Learning with Hierarchical Supervisions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5559-5570} }
GPFL: Simultaneously Learning Global and Personalized Feature Information for Personalized Federated Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jianqing and Hua, Yang and Wang, Hao and Song, Tao and Xue, Zhengui and Ma, Ruhui and Cao, Jian and Guan, Haibing}, title = {GPFL: Simultaneously Learning Global and Personalized Feature Information for Personalized Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5041-5051} }
Zero-Shot Contrastive Loss for Text-Guided Diffusion Image Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Serin and Hwang, Hyunmin and Ye, Jong Chul}, title = {Zero-Shot Contrastive Loss for Text-Guided Diffusion Image Style Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22873-22882} }
Efficient Region-Aware Neural Radiance Fields for High-Fidelity Talking Portrait Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiahe and Zhang, Jiawei and Bai, Xiao and Zhou, Jun and Gu, Lin}, title = {Efficient Region-Aware Neural Radiance Fields for High-Fidelity Talking Portrait Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7568-7578} }
End2End Multi-View Feature Matching with Differentiable Pose Optimization-
[pdf]
[supp]
[bibtex]@InProceedings{Roessle_2023_ICCV, author = {Roessle, Barbara and Nie{\ss}ner, Matthias}, title = {End2End Multi-View Feature Matching with Differentiable Pose Optimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {477-487} }
Low-Light Image Enhancement with Illumination-Aware Gamma Correction and Complete Image Modelling Network-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yinglong and Liu, Zhen and Liu, Jianzhuang and Xu, Songcen and Liu, Shuaicheng}, title = {Low-Light Image Enhancement with Illumination-Aware Gamma Correction and Complete Image Modelling Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13128-13137} }
Both Diverse and Realism Matter: Physical Attribute and Style Alignment for Rainy Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Changfeng and Chen, Shiming and Chang, Yi and Song, Yibing and Yan, Luxin}, title = {Both Diverse and Realism Matter: Physical Attribute and Style Alignment for Rainy Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12387-12397} }
Exploring the Benefits of Visual Prompting in Differential Privacy-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yizhe and Tsai, Yu-Lin and Yu, Chia-Mu and Chen, Pin-Yu and Ren, Xuebin}, title = {Exploring the Benefits of Visual Prompting in Differential Privacy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5158-5167} }
Single Image Reflection Separation via Component Synergy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Qiming and Guo, Xiaojie}, title = {Single Image Reflection Separation via Component Synergy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13138-13147} }
Mining bias-target Alignment from Voronoi Cells-
[pdf]
[arXiv]
[bibtex]@InProceedings{Nahon_2023_ICCV, author = {Nahon, R\'emi and Nguyen, Van-Tam and Tartaglione, Enzo}, title = {Mining bias-target Alignment from Voronoi Cells}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4946-4955} }
The Victim and The Beneficiary: Exploiting a Poisoned Model to Train a Clean Model on Poisoned Data-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Zixuan and Wang, Rui and Zou, Cong and Jing, Lihua}, title = {The Victim and The Beneficiary: Exploiting a Poisoned Model to Train a Clean Model on Poisoned Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {155-164} }
DIFFGUARD: Semantic Mismatch-Guided Out-of-Distribution Detection Using Pre-Trained Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Ruiyuan and Zhao, Chenchen and Hong, Lanqing and Xu, Qiang}, title = {DIFFGUARD: Semantic Mismatch-Guided Out-of-Distribution Detection Using Pre-Trained Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1579-1589} }
Identity-Seeking Self-Supervised Representation Learning for Generalizable Person Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dou_2023_ICCV, author = {Dou, Zhaopeng and Wang, Zhongdao and Li, Yali and Wang, Shengjin}, title = {Identity-Seeking Self-Supervised Representation Learning for Generalizable Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15847-15858} }
3D-Aware Generative Model for Improved Side-View Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jo_2023_ICCV, author = {Jo, Kyungmin and Jin, Wonjoon and Choo, Jaegul and Lee, Hyunjoon and Cho, Sunghyun}, title = {3D-Aware Generative Model for Improved Side-View Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22862-22872} }
Tracking Anything with Decoupled Video Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Ho Kei and Oh, Seoung Wug and Price, Brian and Schwing, Alexander and Lee, Joon-Young}, title = {Tracking Anything with Decoupled Video Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1316-1326} }
Generative Gradient Inversion via Over-Parameterized Networks in Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Chi and Xiaoman, Zhang and Sotthiwat, Ekanut and Xu, Yanyu and Liu, Ping and Zhen, Liangli and Liu, Yong}, title = {Generative Gradient Inversion via Over-Parameterized Networks in Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5126-5135} }
EQ-Net: Elastic Quantization Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Ke and Han, Lei and Tian, Ye and Yang, Shangshang and Zhang, Xingyi}, title = {EQ-Net: Elastic Quantization Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1505-1514} }
OxfordTVG-HIC: Can Machine Make Humorous Captions from Images?-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Runjia and Sun, Shuyang and Elhoseiny, Mohamed and Torr, Philip}, title = {OxfordTVG-HIC: Can Machine Make Humorous Captions from Images?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20293-20303} }
Exploring Open-Vocabulary Semantic Segmentation from CLIP Vision Encoder Distillation Only-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Jun and Zhu, Deyao and Qian, Guocheng and Ghanem, Bernard and Yan, Zhicheng and Zhu, Chenchen and Xiao, Fanyi and Culatana, Sean Chang and Elhoseiny, Mohamed}, title = {Exploring Open-Vocabulary Semantic Segmentation from CLIP Vision Encoder Distillation Only}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {699-710} }
EDAPS: Enhanced Domain-Adaptive Panoptic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saha_2023_ICCV, author = {Saha, Suman and Hoyer, Lukas and Obukhov, Anton and Dai, Dengxin and Van Gool, Luc}, title = {EDAPS: Enhanced Domain-Adaptive Panoptic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19234-19245} }
Parallax-Tolerant Unsupervised Deep Image Stitching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nie_2023_ICCV, author = {Nie, Lang and Lin, Chunyu and Liao, Kang and Liu, Shuaicheng and Zhao, Yao}, title = {Parallax-Tolerant Unsupervised Deep Image Stitching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7399-7408} }
Scratch Each Other's Back: Incomplete Multi-Modal Brain Tumor Segmentation via Category Aware Group Self-Support Learning-
[pdf]
[bibtex]@InProceedings{Qiu_2023_ICCV, author = {Qiu, Yansheng and Chen, Delin and Yao, Hongdou and Xu, Yongchao and Wang, Zheng}, title = {Scratch Each Other's Back: Incomplete Multi-Modal Brain Tumor Segmentation via Category Aware Group Self-Support Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21317-21326} }
SFHarmony: Source Free Domain Adaptation for Distributed Neuroimaging Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dinsdale_2023_ICCV, author = {Dinsdale, Nicola K and Jenkinson, Mark and Namburete, Ana IL}, title = {SFHarmony: Source Free Domain Adaptation for Distributed Neuroimaging Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11494-11505} }
M2T: Masking Transformers Twice for Faster Decoding-
[pdf]
[supp]
[bibtex]@InProceedings{Mentzer_2023_ICCV, author = {Mentzer, Fabian and Agustson, Eirikur and Tschannen, Michael}, title = {M2T: Masking Transformers Twice for Faster Decoding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5340-5349} }
CoIn: Contrastive Instance Feature Mining for Outdoor 3D Object Detection with Very Limited Annotations-
[pdf]
[supp]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Qiming and Deng, Jinhao and Wen, Chenglu and Wu, Hai and Shi, Shaoshuai and Li, Xin and Wang, Cheng}, title = {CoIn: Contrastive Instance Feature Mining for Outdoor 3D Object Detection with Very Limited Annotations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6254-6263} }
3D Human Mesh Recovery with Sequentially Global Rotation Estimation-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Dongkai and Zhang, Shiliang}, title = {3D Human Mesh Recovery with Sequentially Global Rotation Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14953-14962} }
DREAMWALKER: Mental Planning for Continuous Vision-Language Navigation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Hanqing and Liang, Wei and Van Gool, Luc and Wang, Wenguan}, title = {DREAMWALKER: Mental Planning for Continuous Vision-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10873-10883} }
Computation and Data Efficient Backdoor Attacks-
[pdf]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Yutong and Han, Xingshuo and Qiu, Han and Zhang, Tianwei}, title = {Computation and Data Efficient Backdoor Attacks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4805-4814} }
Agglomerative Transformer for Human-Object Interaction Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tu_2023_ICCV, author = {Tu, Danyang and Sun, Wei and Zhai, Guangtao and Shen, Wei}, title = {Agglomerative Transformer for Human-Object Interaction Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21614-21624} }
Decouple Before Interact: Multi-Modal Prompt Learning for Continual Visual Question Answering-
[pdf]
[supp]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Zi and Wang, Xin and Duan, Xuguang and Qin, Pengda and Li, Yuhong and Zhu, Wenwu}, title = {Decouple Before Interact: Multi-Modal Prompt Learning for Continual Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2953-2962} }
Rethinking Fast Fourier Convolution in Image Inpainting-
[pdf]
[supp]
[bibtex]@InProceedings{Chu_2023_ICCV, author = {Chu, Tianyi and Chen, Jiafu and Sun, Jiakai and Lian, Shuobin and Wang, Zhizhong and Zuo, Zhiwen and Zhao, Lei and Xing, Wei and Lu, Dongming}, title = {Rethinking Fast Fourier Convolution in Image Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23195-23205} }
Learning Robust Representations with Information Bottleneck and Memory Network for RGB-D-based Gesture Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yunan and Chen, Huizhou and Feng, Guanwen and Miao, Qiguang}, title = {Learning Robust Representations with Information Bottleneck and Memory Network for RGB-D-based Gesture Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20968-20978} }
P1AC: Revisiting Absolute Pose From a Single Affine Correspondence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ventura_2023_ICCV, author = {Ventura, Jonathan and Kukelova, Zuzana and Sattler, Torsten and Bar\'ath, D\'aniel}, title = {P1AC: Revisiting Absolute Pose From a Single Affine Correspondence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19751-19761} }
LAN-HDR: Luminance-based Alignment Network for High Dynamic Range Video Reconstruction-
[pdf]
[bibtex]@InProceedings{Chung_2023_ICCV, author = {Chung, Haesoo and Cho, Nam Ik}, title = {LAN-HDR: Luminance-based Alignment Network for High Dynamic Range Video Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12760-12769} }
Dancing in the Dark: A Benchmark towards General Low-light Video Enhancement-
[pdf]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Huiyuan and Zheng, Wenkai and Wang, Xicong and Wang, Jiaxuan and Zhang, Heng and Ma, Huadong}, title = {Dancing in the Dark: A Benchmark towards General Low-light Video Enhancement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12877-12886} }
RED-PSM: Regularization by Denoising of Partially Separable Models for Dynamic Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Iskender_2023_ICCV, author = {Iskender, Berk and Klasky, Marc L. and Bresler, Yoram}, title = {RED-PSM: Regularization by Denoising of Partially Separable Models for Dynamic Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10595-10604} }
Unsupervised Manifold Linearizing and Clustering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV, author = {Ding, Tianjiao and Tong, Shengbang and Chan, Kwan Ho Ryan and Dai, Xili and Ma, Yi and Haeffele, Benjamin D.}, title = {Unsupervised Manifold Linearizing and Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5450-5461} }
Lossy and Lossless (L2) Post-training Model Size Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Yumeng and Bai, Shihao and Wei, Xiuying and Gong, Ruihao and Yang, Jianlei}, title = {Lossy and Lossless (L2) Post-training Model Size Compression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17546-17556} }
C2ST: Cross-Modal Contextualized Sequence Transduction for Continuous Sign Language Recognition-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Huaiwen and Guo, Zihang and Yang, Yang and Liu, Xin and Hu, De}, title = {C2ST: Cross-Modal Contextualized Sequence Transduction for Continuous Sign Language Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21053-21062} }
ObjectFusion: Multi-modal 3D Object Detection with Object-Centric Fusion-
[pdf]
[supp]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Qi and Pan, Yingwei and Yao, Ting and Ngo, Chong-Wah and Mei, Tao}, title = {ObjectFusion: Multi-modal 3D Object Detection with Object-Centric Fusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18067-18076} }
D-IF: Uncertainty-aware Human Digitization via Implicit Distribution Field-
[pdf]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xueting and Luo, Yihao and Xiu, Yuliang and Wang, Wei and Xu, Hao and Fan, Zhaoxin}, title = {D-IF: Uncertainty-aware Human Digitization via Implicit Distribution Field}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9122-9132} }
MMVP: Motion-Matrix-Based Video Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2023_ICCV, author = {Zhong, Yiqi and Liang, Luming and Zharkov, Ilya and Neumann, Ulrich}, title = {MMVP: Motion-Matrix-Based Video Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4273-4283} }
Human Preference Score: Better Aligning Text-to-Image Models with Human Preference-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Xiaoshi and Sun, Keqiang and Zhu, Feng and Zhao, Rui and Li, Hongsheng}, title = {Human Preference Score: Better Aligning Text-to-Image Models with Human Preference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2096-2105} }
Guided Motion Diffusion for Controllable Human Motion Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Karunratanakul_2023_ICCV, author = {Karunratanakul, Korrawe and Preechakul, Konpat and Suwajanakorn, Supasorn and Tang, Siyu}, title = {Guided Motion Diffusion for Controllable Human Motion Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2151-2162} }
AffordPose: A Large-Scale Dataset of Hand-Object Interactions with Affordance-Driven Hand Pose-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jian_2023_ICCV, author = {Jian, Juntao and Liu, Xiuping and Li, Manyi and Hu, Ruizhen and Liu, Jian}, title = {AffordPose: A Large-Scale Dataset of Hand-Object Interactions with Affordance-Driven Hand Pose}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14713-14724} }
Locomotion-Action-Manipulation: Synthesizing Human-Scene Interactions in Complex 3D Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jiye and Joo, Hanbyul}, title = {Locomotion-Action-Manipulation: Synthesizing Human-Scene Interactions in Complex 3D Environments}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9663-9674} }
NDDepth: Normal-Distance Assisted Monocular Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Shuwei and Pei, Zhongcai and Chen, Weihai and Wu, Xingming and Li, Zhengguo}, title = {NDDepth: Normal-Distance Assisted Monocular Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7931-7940} }
Sequential Texts Driven Cohesive Motions Synthesis with Natural Transitions-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Shuai and Zhuang, Sisi and Song, Wenfeng and Zhang, Xinyu and Chen, Hejia and Hao, Aimin}, title = {Sequential Texts Driven Cohesive Motions Synthesis with Natural Transitions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9498-9508} }
Efficient Converted Spiking Neural Network for 3D and 2D Classification-
[pdf]
[bibtex]@InProceedings{Lan_2023_ICCV, author = {Lan, Yuxiang and Zhang, Yachao and Ma, Xu and Qu, Yanyun and Fu, Yun}, title = {Efficient Converted Spiking Neural Network for 3D and 2D Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9211-9220} }
Eulerian Single-Photon Vision-
[pdf]
[supp]
[bibtex]@InProceedings{Gupta_2023_ICCV, author = {Gupta, Shantanu and Gupta, Mohit}, title = {Eulerian Single-Photon Vision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10465-10476} }
Adaptive Calibrator Ensemble: Navigating Test Set Difficulty in Out-of-Distribution Scenarios-
[pdf]
[supp]
[bibtex]@InProceedings{Zou_2023_ICCV, author = {Zou, Yuli and Deng, Weijian and Zheng, Liang}, title = {Adaptive Calibrator Ensemble: Navigating Test Set Difficulty in Out-of-Distribution Scenarios}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19333-19342} }
Contrastive Learning Relies More on Spatial Inductive Bias Than Supervised Learning: An Empirical Study-
[pdf]
[supp]
[bibtex]@InProceedings{Zhong_2023_ICCV, author = {Zhong, Yuanyi and Tang, Haoran and Chen, Jun-Kun and Wang, Yu-Xiong}, title = {Contrastive Learning Relies More on Spatial Inductive Bias Than Supervised Learning: An Empirical Study}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16327-16336} }
DiffuMask: Synthesizing Images with Pixel-level Annotations for Semantic Segmentation Using Diffusion Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Weijia and Zhao, Yuzhong and Shou, Mike Zheng and Zhou, Hong and Shen, Chunhua}, title = {DiffuMask: Synthesizing Images with Pixel-level Annotations for Semantic Segmentation Using Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1206-1217} }
NSF: Neural Surface Fields for Human Modeling from Monocular Depth-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xue_2023_ICCV, author = {Xue, Yuxuan and Bhatnagar, Bharat Lal and Marin, Riccardo and Sarafianos, Nikolaos and Xu, Yuanlu and Pons-Moll, Gerard and Tung, Tony}, title = {NSF: Neural Surface Fields for Human Modeling from Monocular Depth}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15049-15060} }
Unaligned 2D to 3D Translation with Conditional Vector-Quantized Code Diffusion using Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Corona-Figueroa_2023_ICCV, author = {Corona-Figueroa, Abril and Bond-Taylor, Sam and Bhowmik, Neelanjan and Gaus, Yona Falinie A. and Breckon, Toby P. and Shum, Hubert P. H. and Willcocks, Chris G.}, title = {Unaligned 2D to 3D Translation with Conditional Vector-Quantized Code Diffusion using Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14585-14594} }
DMNet: Delaunay Meshing Network for 3D Shape Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Chen and Yuan, Ganzhangqin and Tao, Wenbing}, title = {DMNet: Delaunay Meshing Network for 3D Shape Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14418-14428} }
StyleDomain: Efficient and Lightweight Parameterizations of StyleGAN for One-shot and Few-shot Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alanov_2023_ICCV, author = {Alanov, Aibek and Titov, Vadim and Nakhodnov, Maksim and Vetrov, Dmitry}, title = {StyleDomain: Efficient and Lightweight Parameterizations of StyleGAN for One-shot and Few-shot Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2184-2194} }
RankMixup: Ranking-Based Mixup Training for Network Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Noh_2023_ICCV, author = {Noh, Jongyoun and Park, Hyekang and Lee, Junghyup and Ham, Bumsub}, title = {RankMixup: Ranking-Based Mixup Training for Network Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1358-1368} }
Body Knowledge and Uncertainty Modeling for Monocular 3D Human Body Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yufei and Wang, Hanjing and Kephart, Jeffrey O. and Ji, Qiang}, title = {Body Knowledge and Uncertainty Modeling for Monocular 3D Human Body Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9020-9032} }
Randomized Quantization: A Generic Augmentation for Data Agnostic Self-supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Huimin and Lei, Chenyang and Sun, Xiao and Wang, Peng-Shuai and Chen, Qifeng and Cheng, Kwang-Ting and Lin, Stephen and Wu, Zhirong}, title = {Randomized Quantization: A Generic Augmentation for Data Agnostic Self-supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16305-16316} }
Learning to Generate Semantic Layouts for Higher Text-Image Correspondence in Text-to-Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Minho and Yun, Jooyeol and Choi, Seunghwan and Choo, Jaegul}, title = {Learning to Generate Semantic Layouts for Higher Text-Image Correspondence in Text-to-Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7591-7600} }
Neural Radiance Field with LiDAR maps-
[pdf]
[supp]
[bibtex]@InProceedings{Chang_2023_ICCV, author = {Chang, MingFang and Sharma, Akash and Kaess, Michael and Lucey, Simon}, title = {Neural Radiance Field with LiDAR maps}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17914-17923} }
AREA: Adaptive Reweighting via Effective Area for Long-Tailed Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xiaohua and Zhou, Yucan and Wu, Dayan and Yang, Chule and Li, Bo and Hu, Qinghua and Wang, Weiping}, title = {AREA: Adaptive Reweighting via Effective Area for Long-Tailed Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19277-19287} }
Erasing Concepts from Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gandikota_2023_ICCV, author = {Gandikota, Rohit and Materzynska, Joanna and Fiotto-Kaufman, Jaden and Bau, David}, title = {Erasing Concepts from Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2426-2436} }
Fully Attentional Networks with Self-emerging Token Labeling-
[pdf]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Bingyin and Yu, Zhiding and Lan, Shiyi and Cheng, Yutao and Anandkumar, Anima and Lao, Yingjie and Alvarez, Jose M.}, title = {Fully Attentional Networks with Self-emerging Token Labeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5585-5595} }
ACTIVE: Towards Highly Transferable 3D Physical Camouflage for Universal and Robust Vehicle Evasion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Suryanto_2023_ICCV, author = {Suryanto, Naufal and Kim, Yongsu and Larasati, Harashta Tatimma and Kang, Hyoeun and Le, Thi-Thu-Huong and Hong, Yoonyoung and Yang, Hunmin and Oh, Se-Yoon and Kim, Howon}, title = {ACTIVE: Towards Highly Transferable 3D Physical Camouflage for Universal and Robust Vehicle Evasion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4305-4314} }
Learning Adaptive Neighborhoods for Graph Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saha_2023_ICCV, author = {Saha, Avishkar and Mendez, Oscar and Russell, Chris and Bowden, Richard}, title = {Learning Adaptive Neighborhoods for Graph Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22541-22550} }
Equivariant Similarity for Vision-Language Foundation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Tan and Lin, Kevin and Li, Linjie and Lin, Chung-Ching and Yang, Zhengyuan and Zhang, Hanwang and Liu, Zicheng and Wang, Lijuan}, title = {Equivariant Similarity for Vision-Language Foundation Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11998-12008} }
ReST: A Reconfigurable Spatial-Temporal Graph Model for Multi-Camera Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Cheng-Che and Qiu, Min-Xuan and Chiang, Chen-Kuo and Lai, Shang-Hong}, title = {ReST: A Reconfigurable Spatial-Temporal Graph Model for Multi-Camera Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10051-10060} }
Too Large; Data Reduction for Vision-Language Pre-Training-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Alex Jinpeng and Lin, Kevin Qinghong and Zhang, David Junhao and Lei, Stan Weixian and Shou, Mike Zheng}, title = {Too Large; Data Reduction for Vision-Language Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3147-3157} }
Make-It-3D: High-fidelity 3D Creation from A Single Image with Diffusion Prior-
[pdf]
[supp]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Junshu and Wang, Tengfei and Zhang, Bo and Zhang, Ting and Yi, Ran and Ma, Lizhuang and Chen, Dong}, title = {Make-It-3D: High-fidelity 3D Creation from A Single Image with Diffusion Prior}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22819-22829} }
Towards Deeply Unified Depth-aware Panoptic Segmentation with Bi-directional Guidance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Junwen and Wang, Yifan and Wang, Lijun and Lu, Huchuan and Luo, Bin and He, Jun-Yan and Lan, Jin-Peng and Geng, Yifeng and Xie, Xuansong}, title = {Towards Deeply Unified Depth-aware Panoptic Segmentation with Bi-directional Guidance Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4111-4121} }
Taxonomy Adaptive Cross-Domain Adaptation in Medical Imaging via Optimization Trajectory Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Jianan and Liu, Dongnan and Chang, Hang and Huang, Heng and Chen, Mei and Cai, Weidong}, title = {Taxonomy Adaptive Cross-Domain Adaptation in Medical Imaging via Optimization Trajectory Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21174-21184} }
DiffTAD: Temporal Action Detection with Proposal Denoising Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nag_2023_ICCV, author = {Nag, Sauradip and Zhu, Xiatian and Deng, Jiankang and Song, Yi-Zhe and Xiang, Tao}, title = {DiffTAD: Temporal Action Detection with Proposal Denoising Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10362-10374} }
Ray Conditioning: Trading Photo-consistency for Photo-realism in Multi-view Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Eric Ming and Holalkere, Sidhanth and Yan, Ruyu and Zhang, Kai and Davis, Abe}, title = {Ray Conditioning: Trading Photo-consistency for Photo-realism in Multi-view Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23242-23251} }
SCOB: Universal Text Understanding via Character-wise Supervised Contrastive Learning with Online Text Rendering for Bridging Domain Gap-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Daehee and Kim, Yoonsik and Kim, DongHyun and Lim, Yumin and Kim, Geewook and Kil, Taeho}, title = {SCOB: Universal Text Understanding via Character-wise Supervised Contrastive Learning with Online Text Rendering for Bridging Domain Gap}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19562-19573} }
Point-Query Quadtree for Crowd Counting, Localization, and More-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Chengxin and Lu, Hao and Cao, Zhiguo and Liu, Tongliang}, title = {Point-Query Quadtree for Crowd Counting, Localization, and More}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1676-1685} }
Heterogeneous Diversity Driven Active Learning for Multi-Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Rui and Zhang, Baopeng and Liu, Jun and Liu, Wei and Zhao, Jian and Teng, Zhu}, title = {Heterogeneous Diversity Driven Active Learning for Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9932-9941} }
Domain Generalization of 3D Semantic Segmentation in Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sanchez_2023_ICCV, author = {Sanchez, Jules and Deschaud, Jean-Emmanuel and Goulette, Fran\c{c}ois}, title = {Domain Generalization of 3D Semantic Segmentation in Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18077-18087} }
HaMuCo: Hand Pose Estimation via Multiview Collaborative Self-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Xiaozheng and Wen, Chao and Xue, Zhou and Ren, Pengfei and Wang, Jingyu}, title = {HaMuCo: Hand Pose Estimation via Multiview Collaborative Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20763-20773} }
Efficient Model Personalization in Federated Learning via Client-Specific Prompt Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Fu-En and Wang, Chien-Yi and Wang, Yu-Chiang Frank}, title = {Efficient Model Personalization in Federated Learning via Client-Specific Prompt Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19159-19168} }
Dual Aggregation Transformer for Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zheng and Zhang, Yulun and Gu, Jinjin and Kong, Linghe and Yang, Xiaokang and Yu, Fisher}, title = {Dual Aggregation Transformer for Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12312-12321} }
Zero-Shot Spatial Layout Conditioning for Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Couairon_2023_ICCV, author = {Couairon, Guillaume and Careil, Marl\`ene and Cord, Matthieu and Lathuili\`ere, St\'ephane and Verbeek, Jakob}, title = {Zero-Shot Spatial Layout Conditioning for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2174-2183} }
SegGPT: Towards Segmenting Everything in Context-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xinlong and Zhang, Xiaosong and Cao, Yue and Wang, Wen and Shen, Chunhua and Huang, Tiejun}, title = {SegGPT: Towards Segmenting Everything in Context}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1130-1140} }
Semantify: Simplifying the Control of 3D Morphable Models Using CLIP-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gralnik_2023_ICCV, author = {Gralnik, Omer and Gafni, Guy and Shamir, Ariel}, title = {Semantify: Simplifying the Control of 3D Morphable Models Using CLIP}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14554-14564} }
From Sky to the Ground: A Large-scale Benchmark and Simple Baseline Towards Real Rain Removal-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Yun and Xiao, Xueyao and Chang, Yi and Deng, Shumin and Yan, Luxin}, title = {From Sky to the Ground: A Large-scale Benchmark and Simple Baseline Towards Real Rain Removal}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12097-12107} }
Knowledge Restore and Transfer for Multi-Label Class-Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Songlin and Luo, Haoyu and He, Yuhang and Wei, Xing and Cheng, Jie and Gong, Yihong}, title = {Knowledge Restore and Transfer for Multi-Label Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18711-18720} }
DDColor: Towards Photo-Realistic Image Colorization via Dual Decoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2023_ICCV, author = {Kang, Xiaoyang and Yang, Tao and Ouyang, Wenqi and Ren, Peiran and Li, Lingzhi and Xie, Xuansong}, title = {DDColor: Towards Photo-Realistic Image Colorization via Dual Decoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {328-338} }
Visual Explanations via Iterated Integrated Attributions-
[pdf]
[supp]
[bibtex]@InProceedings{Barkan_2023_ICCV, author = {Barkan, Oren and Elisha, Yehonatan and Asher, Yuval and Eshel, Amit and Koenigstein, Noam}, title = {Visual Explanations via Iterated Integrated Attributions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2073-2084} }
PanFlowNet: A Flow-Based Deep Network for Pan-Sharpening-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Gang and Cao, Xiangyong and Xiao, Wenzhe and Zhou, Man and Liu, Aiping and Chen, Xun and Meng, Deyu}, title = {PanFlowNet: A Flow-Based Deep Network for Pan-Sharpening}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16857-16867} }
Domain Generalization via Balancing Training Difficulty and Model Capability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Xueying and Huang, Jiaxing and Jin, Sheng and Lu, Shijian}, title = {Domain Generalization via Balancing Training Difficulty and Model Capability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18993-19003} }
Pairwise Similarity Learning is SimPLE-
[pdf]
[supp]
[bibtex]@InProceedings{Wen_2023_ICCV, author = {Wen, Yandong and Liu, Weiyang and Feng, Yao and Raj, Bhiksha and Singh, Rita and Weller, Adrian and Black, Michael J. and Sch\"olkopf, Bernhard}, title = {Pairwise Similarity Learning is SimPLE}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5308-5318} }
GO-SLAM: Global Optimization for Consistent 3D Instant Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Youmin and Tosi, Fabio and Mattoccia, Stefano and Poggi, Matteo}, title = {GO-SLAM: Global Optimization for Consistent 3D Instant Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3727-3737} }
JOTR: 3D Joint Contrastive Learning with Transformers for Occluded Human Mesh Recovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiahao and Yang, Zongxin and Wang, Xiaohan and Ma, Jianxin and Zhou, Chang and Yang, Yi}, title = {JOTR: 3D Joint Contrastive Learning with Transformers for Occluded Human Mesh Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9110-9121} }
CLIP-Driven Universal Model for Organ Segmentation and Tumor Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jie and Zhang, Yixiao and Chen, Jie-Neng and Xiao, Junfei and Lu, Yongyi and Landman, Bennett A. and Yuan, Yixuan and Yuille, Alan and Tang, Yucheng and Zhou, Zongwei}, title = {CLIP-Driven Universal Model for Organ Segmentation and Tumor Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21152-21164} }
NIR-assisted Video Enhancement via Unpaired 24-hour Data-
[pdf]
[supp]
[bibtex]@InProceedings{Niu_2023_ICCV, author = {Niu, Muyao and Zhong, Zhihang and Zheng, Yinqiang}, title = {NIR-assisted Video Enhancement via Unpaired 24-hour Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10778-10788} }
FACTS: First Amplify Correlations and Then Slice to Discover Bias-
[pdf]
[supp]
[bibtex]@InProceedings{Yenamandra_2023_ICCV, author = {Yenamandra, Sriram and Ramesh, Pratik and Prabhu, Viraj and Hoffman, Judy}, title = {FACTS: First Amplify Correlations and Then Slice to Discover Bias}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4794-4804} }
Anchor Structure Regularization Induced Multi-view Subspace Clustering via Enhanced Tensor Rank Minimization-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Jintian and Feng, Songhe}, title = {Anchor Structure Regularization Induced Multi-view Subspace Clustering via Enhanced Tensor Rank Minimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19343-19352} }
VeRi3D: Generative Vertex-based Radiance Fields for 3D Controllable Human Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xinya and Huang, Jiaxin and Bin, Yanrui and Yu, Lu and Liao, Yiyi}, title = {VeRi3D: Generative Vertex-based Radiance Fields for 3D Controllable Human Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8986-8997} }
MOSE: A New Dataset for Video Object Segmentation in Complex Scenes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV, author = {Ding, Henghui and Liu, Chang and He, Shuting and Jiang, Xudong and Torr, Philip H.S. and Bai, Song}, title = {MOSE: A New Dataset for Video Object Segmentation in Complex Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20224-20234} }
BoMD: Bag of Multi-label Descriptors for Noisy Chest X-ray Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yuanhong and Liu, Fengbei and Wang, Hu and Wang, Chong and Liu, Yuyuan and Tian, Yu and Carneiro, Gustavo}, title = {BoMD: Bag of Multi-label Descriptors for Noisy Chest X-ray Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21284-21295} }
Mask-Attention-Free Transformer for 3D Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lai_2023_ICCV, author = {Lai, Xin and Yuan, Yuhui and Chu, Ruihang and Chen, Yukang and Hu, Han and Jia, Jiaya}, title = {Mask-Attention-Free Transformer for 3D Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3693-3703} }
SHIFT3D: Synthesizing Hard Inputs For Tricking 3D Detectors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Hongge and Chen, Zhao and Meyer, Gregory P. and Park, Dennis and Vondrick, Carl and Shrivastava, Ashish and Chai, Yuning}, title = {SHIFT3D: Synthesizing Hard Inputs For Tricking 3D Detectors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8493-8503} }
EgoLoc: Revisiting 3D Object Localization from Egocentric Videos with Visual Queries-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mai_2023_ICCV, author = {Mai, Jinjie and Hamdi, Abdullah and Giancola, Silvio and Zhao, Chen and Ghanem, Bernard}, title = {EgoLoc: Revisiting 3D Object Localization from Egocentric Videos with Visual Queries}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {45-57} }
Coordinate Transformer: Achieving Single-stage Multi-person Mesh Recovery from Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Haoyuan and Dong, Haoye and Jia, Hanchao and Huang, Dong and Kampffmeyer, Michael C. and Lin, Liang and Liang, Xiaodan}, title = {Coordinate Transformer: Achieving Single-stage Multi-person Mesh Recovery from Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8744-8753} }
FLatten Transformer: Vision Transformer using Focused Linear Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Dongchen and Pan, Xuran and Han, Yizeng and Song, Shiji and Huang, Gao}, title = {FLatten Transformer: Vision Transformer using Focused Linear Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5961-5971} }
Q-Diffusion: Quantizing Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiuyu and Liu, Yijiang and Lian, Long and Yang, Huanrui and Dong, Zhen and Kang, Daniel and Zhang, Shanghang and Keutzer, Kurt}, title = {Q-Diffusion: Quantizing Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17535-17545} }
Robustifying Token Attention for Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Yong and Stutz, David and Schiele, Bernt}, title = {Robustifying Token Attention for Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17557-17568} }
Boosting Positive Segments for Weakly-Supervised Audio-Visual Video Parsing-
[pdf]
[supp]
[bibtex]@InProceedings{Rachavarapu_2023_ICCV, author = {Rachavarapu, Kranthi Kumar and Rajagopalan, A. N.}, title = {Boosting Positive Segments for Weakly-Supervised Audio-Visual Video Parsing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10192-10202} }
ADNet: Lane Shape Prediction via Anchor Decomposition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiao_2023_ICCV, author = {Xiao, Lingyu and Li, Xiang and Yang, Sen and Yang, Wankou}, title = {ADNet: Lane Shape Prediction via Anchor Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6404-6413} }
UniSeg: A Unified Multi-Modal LiDAR Segmentation Network and the OpenPCSeg Codebase-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Youquan and Chen, Runnan and Li, Xin and Kong, Lingdong and Yang, Yuchen and Xia, Zhaoyang and Bai, Yeqi and Zhu, Xinge and Ma, Yuexin and Li, Yikang and Qiao, Yu and Hou, Yuenan}, title = {UniSeg: A Unified Multi-Modal LiDAR Segmentation Network and the OpenPCSeg Codebase}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21662-21673} }
Sign Language Translation with Iterative Prototype-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yao_2023_ICCV, author = {Yao, Huijie and Zhou, Wengang and Feng, Hao and Hu, Hezhen and Zhou, Hao and Li, Houqiang}, title = {Sign Language Translation with Iterative Prototype}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15592-15601} }
Pixel-Wise Contrastive Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Junqiang and Guo, Zichao}, title = {Pixel-Wise Contrastive Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16359-16369} }
Efficient Deep Space Filling Curve-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Wanli and Yao, Xufeng and Zhang, Xinyun and Yu, Bei}, title = {Efficient Deep Space Filling Curve}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17525-17534} }
GlueGen: Plug and Play Multi-modal Encoders for X-to-image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Qin_2023_ICCV, author = {Qin, Can and Yu, Ning and Xing, Chen and Zhang, Shu and Chen, Zeyuan and Ermon, Stefano and Fu, Yun and Xiong, Caiming and Xu, Ran}, title = {GlueGen: Plug and Play Multi-modal Encoders for X-to-image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23085-23096} }
Humans in 4D: Reconstructing and Tracking Humans with Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Goel_2023_ICCV, author = {Goel, Shubham and Pavlakos, Georgios and Rajasegaran, Jathushan and Kanazawa, Angjoo and Malik, Jitendra}, title = {Humans in 4D: Reconstructing and Tracking Humans with Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14783-14794} }
Ponder: Point Cloud Pre-training via Neural Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Di and Peng, Sida and He, Tong and Yang, Honghui and Zhou, Xiaowei and Ouyang, Wanli}, title = {Ponder: Point Cloud Pre-training via Neural Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16089-16098} }
Perpetual Humanoid Control for Real-time Simulated Avatars-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Zhengyi and Cao, Jinkun and Winkler, Alexander and Kitani, Kris and Xu, Weipeng}, title = {Perpetual Humanoid Control for Real-time Simulated Avatars}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10895-10904} }
HollowNeRF: Pruning Hashgrid-Based NeRFs with Trainable Collision Mitigation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Xiufeng and Gherardi, Riccardo and Pan, Zhihong and Huang, Stephen}, title = {HollowNeRF: Pruning Hashgrid-Based NeRFs with Trainable Collision Mitigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3480-3490} }
A Complete Recipe for Diffusion Generative Models-
[pdf]
[supp]
[bibtex]@InProceedings{Pandey_2023_ICCV, author = {Pandey, Kushagra and Mandt, Stephan}, title = {A Complete Recipe for Diffusion Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4261-4272} }
The Devil is in the Crack Orientation: A New Perspective for Crack Detection-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zhuangzhuang and Zhang, Jin and Lai, Zhuonan and Zhu, Guanming and Liu, Zun and Chen, Jie and Li, Jianqiang}, title = {The Devil is in the Crack Orientation: A New Perspective for Crack Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6653-6663} }
FedPD: Federated Open Set Recognition with Parameter Disentanglement-
[pdf]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Chen and Zhu, Meilu and Liu, Yifan and Yuan, Yixuan}, title = {FedPD: Federated Open Set Recognition with Parameter Disentanglement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4882-4891} }
WaterMask: Instance Segmentation for Underwater Imagery-
[pdf]
[bibtex]@InProceedings{Lian_2023_ICCV, author = {Lian, Shijie and Li, Hua and Cong, Runmin and Li, Suqi and Zhang, Wei and Kwong, Sam}, title = {WaterMask: Instance Segmentation for Underwater Imagery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1305-1315} }
Score Priors Guided Deep Variational Inference for Unsupervised Real-World Single Image Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Jun and Liu, Tao and Tan, Shan}, title = {Score Priors Guided Deep Variational Inference for Unsupervised Real-World Single Image Denoising}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12937-12948} }
L-DAWA: Layer-wise Divergence Aware Weight Aggregation in Federated Self-Supervised Visual Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Rehman_2023_ICCV, author = {Rehman, Yasar Abbas Ur and Gao, Yan and de Gusmao, Pedro Porto Buarque and Alibeigi, Mina and Shen, Jiajun and Lane, Nicholas D.}, title = {L-DAWA: Layer-wise Divergence Aware Weight Aggregation in Federated Self-Supervised Visual Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16464-16473} }
Improving Transformer-based Image Matching by Cascaded Capturing Spatially Informative Keypoints-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Chenjie and Fu, Yanwei}, title = {Improving Transformer-based Image Matching by Cascaded Capturing Spatially Informative Keypoints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12129-12139} }
Controllable Guide-Space for Generalizable Face Forgery Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Ying and Zhen, Cheng and Yan, Pengfei}, title = {Controllable Guide-Space for Generalizable Face Forgery Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20818-20827} }
Calibrating Uncertainty for Semi-Supervised Crowd Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{LI_2023_ICCV, author = {Li, Chen and Hu, Xiaoling and Abousamra, Shahira and Chen, Chao}, title = {Calibrating Uncertainty for Semi-Supervised Crowd Counting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16731-16741} }
MosaiQ: Quantum Generative Adversarial Networks for Image Generation on NISQ Computers-
[pdf]
[arXiv]
[bibtex]@InProceedings{Silver_2023_ICCV, author = {Silver, Daniel and Patel, Tirthak and Cutler, William and Ranjan, Aditya and Gandhi, Harshitta and Tiwari, Devesh}, title = {MosaiQ: Quantum Generative Adversarial Networks for Image Generation on NISQ Computers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7030-7039} }
DVIS: Decoupled Video Instance Segmentation Framework-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Tao and Tian, Xingye and Wu, Yu and Ji, Shunping and Wang, Xuebo and Zhang, Yuan and Wan, Pengfei}, title = {DVIS: Decoupled Video Instance Segmentation Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1282-1291} }
Segmentation of Tubular Structures Using Iterative Training with Tailored Samples-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liao_2023_ICCV, author = {Liao, Wei}, title = {Segmentation of Tubular Structures Using Iterative Training with Tailored Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23643-23652} }
Boundary-Aware Divide and Conquer: A Diffusion-Based Solution for Unsupervised Shadow Removal-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Lanqing and Wang, Chong and Yang, Wenhan and Wang, Yufei and Wen, Bihan}, title = {Boundary-Aware Divide and Conquer: A Diffusion-Based Solution for Unsupervised Shadow Removal}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13045-13054} }
Towards Nonlinear-Motion-Aware and Occlusion-Robust Rolling Shutter Correction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qu_2023_ICCV, author = {Qu, Delin and Lao, Yizhen and Wang, Zhigang and Wang, Dong and Zhao, Bin and Li, Xuelong}, title = {Towards Nonlinear-Motion-Aware and Occlusion-Robust Rolling Shutter Correction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10680-10688} }
Surface Extraction from Neural Unsigned Distance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Congyi and Lin, Guying and Yang, Lei and Li, Xin and Komura, Taku and Schaefer, Scott and Keyser, John and Wang, Wenping}, title = {Surface Extraction from Neural Unsigned Distance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22531-22540} }
CBA: Improving Online Continual Learning via Continual Bias Adaptor-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Quanziang and Wang, Renzhen and Wu, Yichen and Jia, Xixi and Meng, Deyu}, title = {CBA: Improving Online Continual Learning via Continual Bias Adaptor}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19082-19092} }
GraphEcho: Graph-Driven Unsupervised Domain Adaptation for Echocardiogram Video Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Jiewen and Ding, Xinpeng and Zheng, Ziyang and Xu, Xiaowei and Li, Xiaomeng}, title = {GraphEcho: Graph-Driven Unsupervised Domain Adaptation for Echocardiogram Video Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11878-11887} }
Multi-view Spectral Polarization Propagation for Video Glass Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Qiao_2023_ICCV, author = {Qiao, Yu and Dong, Bo and Jin, Ao and Fu, Yu and Baek, Seung-Hwan and Heide, Felix and Peers, Pieter and Wei, Xiaopeng and Yang, Xin}, title = {Multi-view Spectral Polarization Propagation for Video Glass Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23218-23228} }
Rethinking Amodal Video Segmentation from Learning Supervised Signals with Object-centric Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Ke and Lei, Jingshi and Qian, Xuelin and Yu, Miaopeng and Xiao, Tianjun and He, Tong and Zhang, Zheng and Fu, Yanwei}, title = {Rethinking Amodal Video Segmentation from Learning Supervised Signals with Object-centric Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1272-1281} }
Augmented Box Replay: Overcoming Foreground Shift for Incremental Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yuyang and Cong, Yang and Goswami, Dipam and Liu, Xialei and van de Weijer, Joost}, title = {Augmented Box Replay: Overcoming Foreground Shift for Incremental Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11367-11377} }
Distilled Reverse Attention Network for Open-world Compositional Zero-Shot Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yun and Liu, Zhe and Jha, Saurav and Yao, Lina}, title = {Distilled Reverse Attention Network for Open-world Compositional Zero-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1782-1791} }
DandelionNet: Domain Composition with Instance Adaptive Classification for Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Lanqing and Kan, Meina and Shan, Shiguang and Chen, Xilin}, title = {DandelionNet: Domain Composition with Instance Adaptive Classification for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19050-19059} }
TexFusion: Synthesizing 3D Textures with Text-Guided Image Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Tianshi and Kreis, Karsten and Fidler, Sanja and Sharp, Nicholas and Yin, Kangxue}, title = {TexFusion: Synthesizing 3D Textures with Text-Guided Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4169-4181} }
Shift from Texture-bias to Shape-bias: Edge Deformation-based Augmentation for Robust Object Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Xilin and Lin, Qinliang and Luo, Cheng and Xie, Weicheng and Song, Siyang and Liu, Feng and Shen, Linlin}, title = {Shift from Texture-bias to Shape-bias: Edge Deformation-based Augmentation for Robust Object Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1526-1535} }
Lighting Every Darkness in Two Pairs: A Calibration-Free Pipeline for RAW Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Xin and Xiao, Jia-Wen and Han, Ling-Hao and Guo, Chunle and Zhang, Ruixun and Liu, Xialei and Li, Chongyi},
  title     = {Lighting Every Darkness in Two Pairs: A Calibration-Free Pipeline for {RAW} Denoising},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13275--13284},
}
Data-free Knowledge Distillation for Fine-grained Visual Categorization-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Renrong and Zhang, Wei and Yin, Jianhua and Wang, Jun},
  title     = {Data-free Knowledge Distillation for Fine-grained Visual Categorization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1515--1525},
}
MotionBERT: A Unified Perspective on Learning Human Motion Representations-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Wentao and Ma, Xiaoxuan and Liu, Zhaoyang and Liu, Libin and Wu, Wayne and Wang, Yizhou},
  title     = {{MotionBERT}: A Unified Perspective on Learning Human Motion Representations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15085--15099},
}
PASTA: Proportional Amplitude Spectrum Training Augmentation for Syn-to-Real Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chattopadhyay_2023_ICCV,
  author    = {Chattopadhyay, Prithvijit and Sarangmath, Kartik and Vijaykumar, Vivek and Hoffman, Judy},
  title     = {{PASTA}: Proportional Amplitude Spectrum Training Augmentation for Syn-to-Real Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19288--19300},
}
EgoPCA: A New Framework for Egocentric Hand-Object Interaction Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yue and Li, Yong-Lu and Huang, Zhemin and Liu, Michael Xu and Lu, Cewu and Tai, Yu-Wing and Tang, Chi-Keung},
  title     = {{EgoPCA}: A New Framework for Egocentric Hand-Object Interaction Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5273--5284},
}
Metric3D: Towards Zero-shot Metric 3D Prediction from A Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Wei and Zhang, Chi and Chen, Hao and Cai, Zhipeng and Yu, Gang and Wang, Kaixuan and Chen, Xiaozhi and Shen, Chunhua},
  title     = {{Metric3D}: Towards Zero-shot Metric {3D} Prediction from A Single Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9043--9053},
}
I Can't Believe There's No Images! Learning Visual Tasks Using only Language Supervision-
[pdf]
[supp]
[bibtex]@InProceedings{Gu_2023_ICCV,
  author    = {Gu, Sophia and Clark, Christopher and Kembhavi, Aniruddha},
  title     = {I Can't Believe There's No Images! Learning Visual Tasks Using only Language Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2672--2683},
}
Lightweight Image Super-Resolution with Superpixel Token Interaction-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Aiping and Ren, Wenqi and Liu, Yi and Cao, Xiaochun},
  title     = {Lightweight Image Super-Resolution with Superpixel Token Interaction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12728--12737},
}
Feature Prediction Diffusion Model for Video Anomaly Detection-
[pdf]
[bibtex]@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Cheng and Zhang, Shiyu and Liu, Yang and Pang, Guansong and Wang, Wenjun},
  title     = {Feature Prediction Diffusion Model for Video Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5527--5537},
}
RANA: Relightable Articulated Neural Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Iqbal_2023_ICCV,
  author    = {Iqbal, Umar and Caliskan, Akin and Nagano, Koki and Khamis, Sameh and Molchanov, Pavlo and Kautz, Jan},
  title     = {{RANA}: Relightable Articulated Neural Avatars},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23142--23153},
}
Iterative Denoiser and Noise Estimator for Self-Supervised Image Denoising-
[pdf]
[bibtex]@InProceedings{Zou_2023_ICCV,
  author    = {Zou, Yunhao and Yan, Chenggang and Fu, Ying},
  title     = {Iterative Denoiser and Noise Estimator for Self-Supervised Image Denoising},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13265--13274},
}
MasQCLIP for Open-Vocabulary Universal Image Segmentation-
[pdf]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Xin and Xiong, Tianyi and Ding, Zheng and Tu, Zhuowen},
  title     = {{MasQCLIP} for Open-Vocabulary Universal Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {887--898},
}
Memory-and-Anticipation Transformer for Online Action Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiahao and Chen, Guo and Huang, Yifei and Wang, Limin and Lu, Tong},
  title     = {Memory-and-Anticipation Transformer for Online Action Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13824--13835},
}
Self-similarity Driven Scale-invariant Learning for Weakly Supervised Person Search-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Benzhi and Yang, Yang and Wu, Jinlin and Qi, Guo-jun and Lei, Zhen},
  title     = {Self-similarity Driven Scale-invariant Learning for Weakly Supervised Person Search},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1813--1822},
}
MODA: Mapping-Once Audio-driven Portrait Animation with Dual Attentions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yunfei and Lin, Lijian and Yu, Fei and Zhou, Changyin and Li, Yu},
  title     = {{MODA}: Mapping-Once Audio-driven Portrait Animation with Dual Attentions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23020--23029},
}
Realistic Full-Body Tracking from Sparse Observations via Joint-Level Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Xiaozheng and Su, Zhuo and Wen, Chao and Xue, Zhou and Jin, Xiaojie},
  title     = {Realistic Full-Body Tracking from Sparse Observations via Joint-Level Modeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14678--14688},
}
MetaF2N: Blind Image Super-Resolution by Learning Efficient Model Adaptation from Faces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Zhicun and Liu, Ming and Li, Xiaoming and Yang, Hui and Xiao, Longan and Zuo, Wangmeng},
  title     = {{MetaF2N}: Blind Image Super-Resolution by Learning Efficient Model Adaptation from Faces},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13033--13044},
}
Lighting up NeRF via Unsupervised Decomposition and Enhancement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Haoyuan and Xu, Xiaogang and Xu, Ke and Lau, Rynson W. H.},
  title     = {Lighting up {NeRF} via Unsupervised Decomposition and Enhancement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12632--12641},
}
ViM: Vision Middleware for Unified Downstream Transferring-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Yutong and Gong, Biao and Jiang, Jianwen and Lv, Yiliang and Shen, Yujun and Zhao, Deli and Zhou, Jingren},
  title     = {{ViM}: Vision Middleware for Unified Downstream Transferring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11696--11707},
}
DIRE for Diffusion-Generated Image Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zhendong and Bao, Jianmin and Zhou, Wengang and Wang, Weilun and Hu, Hezhen and Chen, Hong and Li, Houqiang},
  title     = {{DIRE} for Diffusion-Generated Image Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22445--22455},
}
Ord2Seq: Regarding Ordinal Regression as Label Sequence Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jinhong and Cheng, Yi and Chen, Jintai and Chen, TingTing and Chen, Danny and Wu, Jian},
  title     = {{Ord2Seq}: Regarding Ordinal Regression as Label Sequence Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5865--5875},
}
Bring Clipart to Life-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Nanxuan and Dang, Shengqi and Lin, Hexun and Shi, Yang and Cao, Nan},
  title     = {Bring Clipart to Life},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23341--23350},
}
Co-Evolution of Pose and Mesh for 3D Human Body Estimation from Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{You_2023_ICCV,
  author    = {You, Yingxuan and Liu, Hong and Wang, Ti and Li, Wenhao and Ding, Runwei and Li, Xia},
  title     = {Co-Evolution of Pose and Mesh for {3D} Human Body Estimation from Video},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14963--14973},
}
Noise2Info: Noisy Image to Information of Noise for Self-Supervised Image Denoising-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiachuan and Di, Shimin and Chen, Lei and Ng, Charles Wang Wai},
  title     = {{Noise2Info}: Noisy Image to Information of Noise for Self-Supervised Image Denoising},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16034--16043},
}
Controllable Visual-Tactile Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Ruihan and Yuan, Wenzhen and Zhu, Jun-Yan},
  title     = {Controllable Visual-Tactile Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7040--7052},
}
Keep It SimPool: Who Said Supervised Transformers Suffer from Attention Deficit?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Psomas_2023_ICCV,
  author    = {Psomas, Bill and Kakogeorgiou, Ioannis and Karantzalos, Konstantinos and Avrithis, Yannis},
  title     = {Keep It {SimPool}: Who Said Supervised Transformers Suffer from Attention Deficit?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5350--5360},
}
SynBody: Synthetic Dataset with Layered Human Models for 3D Human Perception and Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Zhitao and Cai, Zhongang and Mei, Haiyi and Liu, Shuai and Chen, Zhaoxi and Xiao, Weiye and Wei, Yukun and Qing, Zhongfei and Wei, Chen and Dai, Bo and Wu, Wayne and Qian, Chen and Lin, Dahua and Liu, Ziwei and Yang, Lei},
  title     = {{SynBody}: Synthetic Dataset with Layered Human Models for {3D} Human Perception and Modeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20282--20292},
}
Viewset Diffusion: (0-)Image-Conditioned 3D Generative Models from 2D Data-
[pdf]
[supp]
[bibtex]@InProceedings{Szymanowicz_2023_ICCV,
  author    = {Szymanowicz, Stanislaw and Rupprecht, Christian and Vedaldi, Andrea},
  title     = {Viewset Diffusion: (0-)Image-Conditioned {3D} Generative Models from {2D} Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8863--8873},
}
LoGoPrompt: Synthetic Text Images Can Be Good Visual Prompts for Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Cheng and Yang, Sibei},
  title     = {{LoGoPrompt}: Synthetic Text Images Can Be Good Visual Prompts for Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2932--2941},
}
EP2P-Loc: End-to-End 3D Point to 2D Pixel Localization for Large-Scale Visual Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Minjung and Koo, Junseo and Kim, Gunhee},
  title     = {{EP2P-Loc}: End-to-End {3D} Point to {2D} Pixel Localization for Large-Scale Visual Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21527--21537},
}
SIRA-PCR: Sim-to-Real Adaptation for 3D Point Cloud Registration-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Suyi and Xu, Hao and Li, Ru and Liu, Guanghui and Fu, Chi-Wing and Liu, Shuaicheng},
  title     = {{SIRA-PCR}: Sim-to-Real Adaptation for {3D} Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14394--14405},
}
FeatEnHancer: Enhancing Hierarchical Features for Object Detection and Beyond Under Low-Light Vision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hashmi_2023_ICCV,
  author    = {Hashmi, Khurram Azeem and Kallempudi, Goutham and Stricker, Didier and Afzal, Muhammad Zeshan},
  title     = {{FeatEnHancer}: Enhancing Hierarchical Features for Object Detection and Beyond Under Low-Light Vision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6725--6735},
}
SOAR: Scene-debiasing Open-set Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV,
  author    = {Zhai, Yuanhao and Liu, Ziyi and Wu, Zhenyu and Wu, Yi and Zhou, Chunluan and Doermann, David and Yuan, Junsong and Hua, Gang},
  title     = {{SOAR}: Scene-debiasing Open-set Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10244--10254},
}
Physics-Augmented Autoencoder for 3D Skeleton-Based Gait Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Hongji and Ji, Qiang},
  title     = {Physics-Augmented Autoencoder for {3D} Skeleton-Based Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19627--19638},
}
Regularized Primitive Graph Learning for Unified Vector Mapping-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Lei and Dai, Min and He, Jianan and Huang, Jingwei},
  title     = {Regularized Primitive Graph Learning for Unified Vector Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16817--16826},
}
Saliency Regularization for Self-Training with Partial Annotations-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Shouwen and Wan, Qian and Xiang, Xiang and Zeng, Zhigang},
  title     = {Saliency Regularization for Self-Training with Partial Annotations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1611--1620},
}
Stabilizing Visual Reinforcement Learning via Asymmetric Interactive Cooperation-
[pdf]
[bibtex]@InProceedings{Zhai_2023_ICCV,
  author    = {Zhai, Yunpeng and Peng, Peixi and Zhao, Yifan and Huang, Yangru and Tian, Yonghong},
  title     = {Stabilizing Visual Reinforcement Learning via Asymmetric Interactive Cooperation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {207--216},
}
FlipNeRF: Flipped Reflection Rays for Few-shot Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Seo_2023_ICCV,
  author    = {Seo, Seunghyeon and Chang, Yeonjin and Kwak, Nojun},
  title     = {{FlipNeRF}: Flipped Reflection Rays for Few-shot Novel View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22883--22893},
}
Discovering Spatio-Temporal Rationales for Video Question Answering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Yicong and Xiao, Junbin and Feng, Chun and Wang, Xiang and Chua, Tat-Seng},
  title     = {Discovering Spatio-Temporal Rationales for Video Question Answering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13869--13878},
}
Iterative Soft Shrinkage Learning for Efficient Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiamian and Wang, Huan and Zhang, Yulun and Fu, Yun and Tao, Zhiqiang},
  title     = {Iterative Soft Shrinkage Learning for Efficient Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12590--12599},
}
Learning Hierarchical Features with Joint Latent Space Energy-Based Prior-
[pdf]
[supp]
[bibtex]@InProceedings{Cui_2023_ICCV,
  author    = {Cui, Jiali and Wu, Ying Nian and Han, Tian},
  title     = {Learning Hierarchical Features with Joint Latent Space Energy-Based Prior},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2218--2227},
}
UniFormerV2: Unlocking the Potential of Image ViTs for Video Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Kunchang and Wang, Yali and He, Yinan and Li, Yizhuo and Wang, Yi and Wang, Limin and Qiao, Yu},
  title     = {{UniFormerV2}: Unlocking the Potential of Image {ViTs} for Video Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1632--1643},
}
G2L: Semantically Aligned and Uniform Video Grounding via Geodesic and Game Theory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Hongxiang and Cao, Meng and Cheng, Xuxin and Li, Yaowei and Zhu, Zhihong and Zou, Yuexian},
  title     = {{G2L}: Semantically Aligned and Uniform Video Grounding via Geodesic and Game Theory},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12032--12042},
}
TARGET: Federated Class-Continual Learning via Exemplar-Free Distillation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jie and Chen, Chen and Zhuang, Weiming and Lyu, Lingjuan},
  title     = {{TARGET}: Federated Class-Continual Learning via Exemplar-Free Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4782--4793},
}
FashionNTM: Multi-turn Fashion Image Retrieval via Cascaded Memory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pal_2023_ICCV,
  author    = {Pal, Anwesan and Wadhwa, Sahil and Jaiswal, Ayush and Zhang, Xu and Wu, Yue and Chada, Rakesh and Natarajan, Pradeep and Christensen, Henrik I.},
  title     = {{FashionNTM}: Multi-turn Fashion Image Retrieval via Cascaded Memory},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11323--11334},
}
MolGrapher: Graph-based Visual Recognition of Chemical Structures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Morin_2023_ICCV,
  author    = {Morin, Lucas and Danelljan, Martin and Agea, Maria Isabel and Nassar, Ahmed and Weber, Valery and Meijer, Ingmar and Staar, Peter and Yu, Fisher},
  title     = {{MolGrapher}: Graph-based Visual Recognition of Chemical Structures},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19552--19561},
}
SAMPLING: Scene-adaptive Hierarchical Multiplane Images Representation for Novel View Synthesis from a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Xiaoyu and Lin, Zhiwei and Shan, Xiaojun and Wang, Yongtao and Sun, Deqing and Yang, Ming-Hsuan},
  title     = {{SAMPLING}: Scene-adaptive Hierarchical Multiplane Images Representation for Novel View Synthesis from a Single Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22830--22840},
}
DiffV2S: Diffusion-Based Video-to-Speech Synthesis with Vision-Guided Speaker Embedding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2023_ICCV,
  author    = {Choi, Jeongsoo and Hong, Joanna and Ro, Yong Man},
  title     = {{DiffV2S}: Diffusion-Based Video-to-Speech Synthesis with Vision-Guided Speaker Embedding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7812--7821},
}
PointOdyssey: A Large-Scale Synthetic Dataset for Long-Term Point Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Yang and Harley, Adam W. and Shen, Bokui and Wetzstein, Gordon and Guibas, Leonidas J.},
  title     = {{PointOdyssey}: A Large-Scale Synthetic Dataset for Long-Term Point Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19855--19865},
}
The Effectiveness of MAE Pre-Pretraining for Billion-Scale Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Singh_2023_ICCV,
  author    = {Singh, Mannat and Duval, Quentin and Alwala, Kalyan Vasudev and Fan, Haoqi and Aggarwal, Vaibhav and Adcock, Aaron and Joulin, Armand and Doll{\'a}r, Piotr and Feichtenhofer, Christoph and Girshick, Ross and Girdhar, Rohit and Misra, Ishan},
  title     = {The Effectiveness of {MAE} Pre-Pretraining for Billion-Scale Pretraining},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5484--5494},
}
Towards Zero Domain Gap: A Comprehensive Study of Realistic LiDAR Simulation for Autonomy Testing-
[pdf]
[supp]
[bibtex]@InProceedings{Manivasagam_2023_ICCV,
  author    = {Manivasagam, Sivabalan and B{\^a}rsan, Ioan Andrei and Wang, Jingkang and Yang, Ze and Urtasun, Raquel},
  title     = {Towards Zero Domain Gap: A Comprehensive Study of Realistic {LiDAR} Simulation for Autonomy Testing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8272--8282},
}
GPA-3D: Geometry-aware Prototype Alignment for Unsupervised Domain Adaptive 3D Object Detection from Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Ziyu and Guo, Jingming and Cao, Tongtong and Liu, Bingbing and Yang, Wankou},
  title     = {{GPA-3D}: Geometry-aware Prototype Alignment for Unsupervised Domain Adaptive {3D} Object Detection from Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6394--6403},
}
TransHuman: A Transformer-based Human Representation for Generalizable Neural Human Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Xiao and Yang, Zongxin and Ma, Jianxin and Zhou, Chang and Yang, Yi},
  title     = {{TransHuman}: A Transformer-based Human Representation for Generalizable Neural Human Rendering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3544--3555},
}
LNPL-MIL: Learning from Noisy Pseudo Labels for Promoting Multiple Instance Learning in Whole Slide Image-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Zhuchen and Wang, Yifeng and Chen, Yang and Bian, Hao and Liu, Shaohui and Wang, Haoqian and Zhang, Yongbing},
  title     = {{LNPL-MIL}: Learning from Noisy Pseudo Labels for Promoting Multiple Instance Learning in Whole Slide Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21495--21505},
}
Few-Shot Dataset Distillation via Translative Pre-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Songhua and Wang, Xinchao},
  title     = {Few-Shot Dataset Distillation via Translative Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18654--18664},
}
Random Sub-Samples Generation for Self-Supervised Real Image Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Yizhong and Liu, Xiao and Liao, Xiangyu and Cao, Yuanzhouhan and Ren, Chao},
  title     = {Random Sub-Samples Generation for Self-Supervised Real Image Denoising},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12150--12159},
}
Waffling Around for Performance: Visual Classification with Random Words and Broad Concepts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roth_2023_ICCV,
  author    = {Roth, Karsten and Kim, Jae Myung and Koepke, A. Sophia and Vinyals, Oriol and Schmid, Cordelia and Akata, Zeynep},
  title     = {Waffling Around for Performance: Visual Classification with Random Words and Broad Concepts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15746--15757},
}
Unsupervised Surface Anomaly Detection with Diffusion Probabilistic Model-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xinyi and Li, Naiqi and Li, Jiawei and Dai, Tao and Jiang, Yong and Xia, Shu-Tao},
  title     = {Unsupervised Surface Anomaly Detection with Diffusion Probabilistic Model},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6782--6791},
}
AutoAD II: The Sequel - Who, When, and What in Movie Audio Description-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2023_ICCV,
  author    = {Han, Tengda and Bain, Max and Nagrani, Arsha and Varol, G{\"u}l and Xie, Weidi and Zisserman, Andrew},
  title     = {{AutoAD} {II}: The Sequel - Who, When, and What in Movie Audio Description},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13645--13655},
}
TinyCLIP: CLIP Distillation via Affinity Mimicking and Weight Inheritance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Kan and Peng, Houwen and Zhou, Zhenghong and Xiao, Bin and Liu, Mengchen and Yuan, Lu and Xuan, Hong and Valenzuela, Michael and Chen, Xi (Stephen) and Wang, Xinggang and Chao, Hongyang and Hu, Han},
  title     = {{TinyCLIP}: {CLIP} Distillation via Affinity Mimicking and Weight Inheritance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21970--21980},
}
Hyperbolic Chamfer Distance for Point Cloud Completion-
[pdf]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Fangzhou and Yue, Yun and Hou, Songlin and Yu, Xuechu and Xu, Yajun and Yamada, Kazunori D. and Zhang, Ziming},
  title     = {Hyperbolic Chamfer Distance for Point Cloud Completion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14595--14606},
}
Democratising 2D Sketch to 3D Shape Retrieval Through Pivoting-
[pdf]
[supp]
[bibtex]@InProceedings{Chowdhury_2023_ICCV,
  author    = {Chowdhury, Pinaki Nath and Bhunia, Ayan Kumar and Sain, Aneeshan and Koley, Subhadeep and Xiang, Tao and Song, Yi-Zhe},
  title     = {Democratising {2D} Sketch to {3D} Shape Retrieval Through Pivoting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23275--23286},
}
Simoun: Synergizing Interactive Motion-appearance Understanding for Vision-based Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Yangru and Peng, Peixi and Zhao, Yifan and Zhai, Yunpeng and Xu, Haoran and Tian, Yonghong},
  title     = {{Simoun}: Synergizing Interactive Motion-appearance Understanding for Vision-based Reinforcement Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {176--185},
}
AG3D: Learning to Generate 3D Avatars from 2D Image Collections-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Zijian and Chen, Xu and Yang, Jinlong and Black, Michael J. and Hilliges, Otmar and Geiger, Andreas},
  title     = {{AG3D}: Learning to Generate {3D} Avatars from {2D} Image Collections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14916--14927},
}
KECOR: Kernel Coding Rate Maximization for Active 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Yadan and Chen, Zhuoxiao and Fang, Zhen and Zhang, Zheng and Baktashmotlagh, Mahsa and Huang, Zi},
  title     = {{KECOR}: Kernel Coding Rate Maximization for Active {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18279--18290},
}
Learned Image Reasoning Prior Penetrates Deep Unfolding Network for Panchromatic and Multi-spectral Image Fusion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Man and Huang, Jie and Zheng, Naishan and Li, Chongyi},
  title     = {Learned Image Reasoning Prior Penetrates Deep Unfolding Network for Panchromatic and Multi-spectral Image Fusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12398--12407},
}
Representation Disparity-aware Distillation for 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Yanjing and Xu, Sheng and Lin, Mingbao and Yin, Jihao and Zhang, Baochang and Cao, Xianbin},
  title     = {Representation Disparity-aware Distillation for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6715--6724},
}
NCHO: Unsupervised Learning for Neural 3D Composition of Humans and Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Taeksoo and Saito, Shunsuke and Joo, Hanbyul},
  title     = {{NCHO}: Unsupervised Learning for Neural {3D} Composition of Humans and Objects},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14817--14828},
}
Breaking The Limits of Text-conditioned 3D Motion Synthesis with Elaborative Descriptions-
[pdf]
[bibtex]@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Yijun and Urbanek, Jack and Hauptmann, Alexander G. and Won, Jungdam},
  title     = {Breaking The Limits of Text-conditioned {3D} Motion Synthesis with Elaborative Descriptions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2306--2316},
}
VL-PET: Vision-and-Language Parameter-Efficient Tuning via Granularity Control-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Zi-Yuan and Li, Yanyang and Lyu, Michael R. and Wang, Liwei}, title = {VL-PET: Vision-and-Language Parameter-Efficient Tuning via Granularity Control}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3010-3020} }
ROME: Robustifying Memory-Efficient NAS via Topology Disentanglement and Gradient Accumulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xiaoxing and Chu, Xiangxiang and Fan, Yuda and Zhang, Zhexi and Zhang, Bo and Yang, Xiaokang and Yan, Junchi}, title = {ROME: Robustifying Memory-Efficient NAS via Topology Disentanglement and Gradient Accumulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5939-5949} }
Toward Multi-Granularity Decision-Making: Explicit Visual Reasoning with Hierarchical Knowledge-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yifeng and Chen, Shi and Zhao, Qi}, title = {Toward Multi-Granularity Decision-Making: Explicit Visual Reasoning with Hierarchical Knowledge}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2573-2583} }
3D-aware Image Generation using 2D Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiang_2023_ICCV, author = {Xiang, Jianfeng and Yang, Jiaolong and Huang, Binbin and Tong, Xin}, title = {3D-aware Image Generation using 2D Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2383-2393} }
Locating Noise is Halfway Denoising for Semi-Supervised Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Fang_2023_ICCV, author = {Fang, Yan and Zhu, Feng and Cheng, Bowen and Liu, Luoqi and Zhao, Yao and Wei, Yunchao}, title = {Locating Noise is Halfway Denoising for Semi-Supervised Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16612-16622} }
Learning Non-Local Spatial-Angular Correlation for Light Field Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Zhengyu and Wang, Yingqian and Wang, Longguang and Yang, Jungang and Zhou, Shilin and Guo, Yulan}, title = {Learning Non-Local Spatial-Angular Correlation for Light Field Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12376-12386} }
ICE-NeRF: Interactive Color Editing of NeRFs via Decomposition-Aware Weight Optimization-
[pdf]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jae-Hyeok and Kim, Dae-Shik}, title = {ICE-NeRF: Interactive Color Editing of NeRFs via Decomposition-Aware Weight Optimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3491-3501} }
SPANet: Frequency-balancing Token Mixer using Spectral Pooling Aggregation Modulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yun_2023_ICCV, author = {Yun, Guhnoo and Yoo, Juhan and Kim, Kijung and Lee, Jeongho and Kim, Dong Hwan}, title = {SPANet: Frequency-balancing Token Mixer using Spectral Pooling Aggregation Modulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6113-6124} }
ASAG: Building Strong One-Decoder-Layer Sparse Detectors via Adaptive Sparse Anchor Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Shenghao and Yan, Junkai and Gao, Yipeng and Xie, Xiaohua and Zheng, Wei-Shi}, title = {ASAG: Building Strong One-Decoder-Layer Sparse Detectors via Adaptive Sparse Anchor Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6328-6338} }
MGMAE: Motion Guided Masking for Video Masked Autoencoding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Bingkun and Zhao, Zhiyu and Zhang, Guozhen and Qiao, Yu and Wang, Limin}, title = {MGMAE: Motion Guided Masking for Video Masked Autoencoding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13493-13504} }
The Perils of Learning From Unlabeled Data: Backdoor Attacks on Semi-supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shejwalkar_2023_ICCV, author = {Shejwalkar, Virat and Lyu, Lingjuan and Houmansadr, Amir}, title = {The Perils of Learning From Unlabeled Data: Backdoor Attacks on Semi-supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4730-4740} }
SSB: Simple but Strong Baseline for Boosting Performance of Open-Set Semi-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Yue and Kukleva, Anna and Dai, Dengxin and Schiele, Bernt}, title = {SSB: Simple but Strong Baseline for Boosting Performance of Open-Set Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16068-16078} }
StyleDiffusion: Controllable Disentangled Style Transfer via Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zhizhong and Zhao, Lei and Xing, Wei}, title = {StyleDiffusion: Controllable Disentangled Style Transfer via Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7677-7689} }
AdvDiffuser: Natural Adversarial Example Synthesis with Diffusion Models-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xinquan and Gao, Xitong and Zhao, Juanjuan and Ye, Kejiang and Xu, Cheng-Zhong}, title = {AdvDiffuser: Natural Adversarial Example Synthesis with Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4562-4572} }
ViewRefer: Grasp the Multi-view Knowledge for 3D Visual Grounding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Zoey and Tang, Yiwen and Zhang, Ray and Wang, Dong and Wang, Zhigang and Zhao, Bin and Li, Xuelong}, title = {ViewRefer: Grasp the Multi-view Knowledge for 3D Visual Grounding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15372-15383} }
CaPhy: Capturing Physical Properties for Animatable Human Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_ICCV, author = {Su, Zhaoqi and Hu, Liangxiao and Lin, Siyou and Zhang, Hongwen and Zhang, Shengping and Thies, Justus and Liu, Yebin}, title = {CaPhy: Capturing Physical Properties for Animatable Human Avatars}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14150-14160} }
DarSwin: Distortion Aware Radial Swin Transformer-
[pdf]
[bibtex]@InProceedings{Athwale_2023_ICCV, author = {Athwale, Akshaya and Afrasiyabi, Arman and Lag{\"u}e, Justin and Shili, Ichrak and Ahmad, Ola and Lalonde, Jean-Fran{\c{c}}ois}, title = {DarSwin: Distortion Aware Radial Swin Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5929-5938} }
Fine-grained Unsupervised Domain Adaptation for Gait Recognition-
[pdf]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Kang and Fu, Ying and Zheng, Dezhi and Peng, Yunjie and Cao, Chunshui and Huang, Yongzhen}, title = {Fine-grained Unsupervised Domain Adaptation for Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11313-11322} }
Cross-Modal Orthogonal High-Rank Augmentation for RGB-Event Transformer-Trackers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Zhiyu and Hou, Junhui and Wu, Dapeng Oliver}, title = {Cross-Modal Orthogonal High-Rank Augmentation for RGB-Event Transformer-Trackers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22045-22055} }
Take-A-Photo: 3D-to-2D Generative Pre-training of Point Cloud Models-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ziyi and Yu, Xumin and Rao, Yongming and Zhou, Jie and Lu, Jiwen}, title = {Take-A-Photo: 3D-to-2D Generative Pre-training of Point Cloud Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5640-5650} }
Open-vocabulary Panoptic Segmentation with Embedding Modulation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xi and Li, Shuang and Lim, Ser-Nam and Torralba, Antonio and Zhao, Hengshuang}, title = {Open-vocabulary Panoptic Segmentation with Embedding Modulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1141-1150} }
Beyond Single Path Integrated Gradients for Reliable Input Attribution via Randomized Path Sampling-
[pdf]
[supp]
[bibtex]@InProceedings{Jeon_2023_ICCV, author = {Jeon, Giyoung and Jeong, Haedong and Choi, Jaesik}, title = {Beyond Single Path Integrated Gradients for Reliable Input Attribution via Randomized Path Sampling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2052-2061} }
Instance-aware Dynamic Prompt Tuning for Pre-trained Point Cloud Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zha_2023_ICCV, author = {Zha, Yaohua and Wang, Jinpeng and Dai, Tao and Chen, Bin and Wang, Zhi and Xia, Shu-Tao}, title = {Instance-aware Dynamic Prompt Tuning for Pre-trained Point Cloud Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14161-14170} }
How to Boost Face Recognition with StyleGAN?-
[pdf]
[supp]
[bibtex]@InProceedings{Sevastopolskiy_2023_ICCV, author = {Sevastopolskiy, Artem and Malkov, Yury and Durasov, Nikita and Verdoliva, Luisa and Nie{\ss}ner, Matthias}, title = {How to Boost Face Recognition with StyleGAN?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20924-20934} }
Text2Tex: Text-driven Texture Synthesis via Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Dave Zhenyu and Siddiqui, Yawar and Lee, Hsin-Ying and Tulyakov, Sergey and Nie{\ss}ner, Matthias}, title = {Text2Tex: Text-driven Texture Synthesis via Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18558-18568} }
MUVA: A New Large-Scale Benchmark for Multi-View Amodal Instance Segmentation in the Shopping Scenario-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhixuan and Ye, Weining and Terven, Juan and Bennett, Zachary and Zheng, Ying and Jiang, Tingting and Huang, Tiejun}, title = {MUVA: A New Large-Scale Benchmark for Multi-View Amodal Instance Segmentation in the Shopping Scenario}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23504-23513} }
Foreground-Background Separation through Concept Distillation from Generative Image Foundation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dombrowski_2023_ICCV, author = {Dombrowski, Mischa and Reynaud, Hadrien and Baugh, Matthew and Kainz, Bernhard}, title = {Foreground-Background Separation through Concept Distillation from Generative Image Foundation Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {988-998} }
ENVIDR: Implicit Differentiable Renderer with Neural Environment Lighting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Ruofan and Chen, Huiting and Li, Chunlin and Chen, Fan and Panneer, Selvakumar and Vijaykumar, Nandita}, title = {ENVIDR: Implicit Differentiable Renderer with Neural Environment Lighting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {79-89} }
Not All Steps are Created Equal: Selective Diffusion Distillation for Image Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Luozhou and Yang, Shuai and Liu, Shu and Chen, Ying-cong}, title = {Not All Steps are Created Equal: Selective Diffusion Distillation for Image Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7472-7481} }
SeiT: Storage-Efficient Vision Training with Tokens Using 1% of Pixel Storage-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Song and Chun, Sanghyuk and Heo, Byeongho and Kim, Wonjae and Yun, Sangdoo}, title = {SeiT: Storage-Efficient Vision Training with Tokens Using 1\% of Pixel Storage}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17248-17259} }
ALIP: Adaptive Language-Image Pre-Training with Synthetic Caption-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Kaicheng and Deng, Jiankang and An, Xiang and Li, Jiawei and Feng, Ziyong and Guo, Jia and Yang, Jing and Liu, Tongliang}, title = {ALIP: Adaptive Language-Image Pre-Training with Synthetic Caption}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2922-2931} }
GeoUDF: Surface Reconstruction from 3D Point Clouds via Geometry-guided Distance Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV, author = {Ren, Siyu and Hou, Junhui and Chen, Xiaodong and He, Ying and Wang, Wenping}, title = {GeoUDF: Surface Reconstruction from 3D Point Clouds via Geometry-guided Distance Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14214-14224} }
LaPE: Layer-adaptive Position Embedding for Vision Transformers with Independent Layer Normalization-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Runyi and Wang, Zhennan and Wang, Yinhuai and Li, Kehan and Liu, Chang and Duan, Haoyi and Ji, Xiangyang and Chen, Jie}, title = {LaPE: Layer-adaptive Position Embedding for Vision Transformers with Independent Layer Normalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5886-5896} }
CLIP2Point: Transfer CLIP to Point Cloud Classification with Image-Depth Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Tianyu and Dong, Bowen and Yang, Yunhan and Huang, Xiaoshui and Lau, Rynson W. H. and Ouyang, Wanli and Zuo, Wangmeng}, title = {CLIP2Point: Transfer CLIP to Point Cloud Classification with Image-Depth Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22157-22167} }
Parametric Classification for Generalized Category Discovery: A Baseline Study-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wen_2023_ICCV, author = {Wen, Xin and Zhao, Bingchen and Qi, Xiaojuan}, title = {Parametric Classification for Generalized Category Discovery: A Baseline Study}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16590-16600} }
MeMOTR: Long-Term Memory-Augmented Transformer for Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Ruopeng and Wang, Limin}, title = {MeMOTR: Long-Term Memory-Augmented Transformer for Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9901-9910} }
RawHDR: High Dynamic Range Image Reconstruction from a Single Raw Image-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zou_2023_ICCV, author = {Zou, Yunhao and Yan, Chenggang and Fu, Ying}, title = {RawHDR: High Dynamic Range Image Reconstruction from a Single Raw Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12334-12344} }
Denoising Diffusion Autoencoders are Unified Self-supervised Learners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiang_2023_ICCV, author = {Xiang, Weilai and Yang, Hongyu and Huang, Di and Wang, Yunhong}, title = {Denoising Diffusion Autoencoders are Unified Self-supervised Learners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15802-15812} }
Robust Object Modeling for Visual Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Yidong and Liu, Jie and Tang, Jie and Wu, Gangshan}, title = {Robust Object Modeling for Visual Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9589-9600} }
FSI: Frequency and Spatial Interactive Learning for Image Restoration in Under-Display Cameras-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Chengxu and Wang, Xuan and Li, Shuai and Wang, Yuzhi and Qian, Xueming}, title = {FSI: Frequency and Spatial Interactive Learning for Image Restoration in Under-Display Cameras}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12537-12546} }
Cross-view Topology Based Consistent and Complementary Information for Deep Multi-view Clustering-
[pdf]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Zhibin and Wang, Siwei and Jin, Jiaqi and Liu, Xinwang and Zhu, En}, title = {Cross-view Topology Based Consistent and Complementary Information for Deep Multi-view Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19440-19451} }
Distribution-Consistent Modal Recovering for Incomplete Multimodal Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yuanzhi and Cui, Zhen and Li, Yong}, title = {Distribution-Consistent Modal Recovering for Incomplete Multimodal Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22025-22034} }
ContactGen: Generative Contact Modeling for Grasp Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Shaowei and Zhou, Yang and Yang, Jimei and Gupta, Saurabh and Wang, Shenlong}, title = {ContactGen: Generative Contact Modeling for Grasp Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20609-20620} }
Temporal Collection and Distribution for Referring Video Object Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Jiajin and Zheng, Ge and Yang, Sibei}, title = {Temporal Collection and Distribution for Referring Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15466-15476} }
SA-BEV: Generating Semantic-Aware Bird's-Eye-View Feature for Multi-view 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jinqing and Zhang, Yanan and Liu, Qingjie and Wang, Yunhong}, title = {SA-BEV: Generating Semantic-Aware Bird's-Eye-View Feature for Multi-view 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3348-3357} }
Variational Degeneration to Structural Refinement: A Unified Framework for Superimposed Image Decomposition-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Wenyu and Xu, Yan and Yang, Yang and Ji, Haoran and Lang, Yue}, title = {Variational Degeneration to Structural Refinement: A Unified Framework for Superimposed Image Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12206-12216} }
Global Knowledge Calibration for Fast Open-Vocabulary Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Kunyang and Liu, Yong and Liew, Jun Hao and Ding, Henghui and Liu, Jiajun and Wang, Yitong and Tang, Yansong and Yang, Yujiu and Feng, Jiashi and Zhao, Yao and Wei, Yunchao}, title = {Global Knowledge Calibration for Fast Open-Vocabulary Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {797-807} }
Ego-Humans: An Ego-Centric 3D Multi-Human Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{Khirodkar_2023_ICCV, author = {Khirodkar, Rawal and Bansal, Aayush and Ma, Lingni and Newcombe, Richard and Vo, Minh and Kitani, Kris}, title = {Ego-Humans: An Ego-Centric 3D Multi-Human Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19807-19819} }
Focal Network for Image Restoration-
[pdf]
[supp]
[bibtex]@InProceedings{Cui_2023_ICCV, author = {Cui, Yuning and Ren, Wenqi and Cao, Xiaochun and Knoll, Alois}, title = {Focal Network for Image Restoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13001-13011} }
Indoor Depth Recovery Based on Deep Unfolding with Non-Local Prior-
[pdf]
[bibtex]@InProceedings{Dai_2023_ICCV, author = {Dai, Yuhui and Zhang, Junkang and Fang, Faming and Zhang, Guixu}, title = {Indoor Depth Recovery Based on Deep Unfolding with Non-Local Prior}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12355-12364} }
Compatibility of Fundamental Matrices for Complete Viewing Graphs-
[pdf]
[supp]
[bibtex]@InProceedings{Bratelund_2023_ICCV, author = {Br{\r{a}}telund, Martin and Rydell, Felix}, title = {Compatibility of Fundamental Matrices for Complete Viewing Graphs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3328-3336} }
GAFlow: Incorporating Gaussian Attention into Optical Flow-
[pdf]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Ao and Yang, Fan and Li, Xin and Nie, Lang and Lin, Chunyu and Fan, Haoqiang and Liu, Shuaicheng}, title = {GAFlow: Incorporating Gaussian Attention into Optical Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9642-9651} }
MAtch, eXpand and Improve: Unsupervised Finetuning for Zero-Shot Action Recognition with Language Knowledge-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Wei and Karlinsky, Leonid and Shvetsova, Nina and Possegger, Horst and Kozinski, Mateusz and Panda, Rameswar and Feris, Rogerio and Kuehne, Hilde and Bischof, Horst}, title = {MAtch, eXpand and Improve: Unsupervised Finetuning for Zero-Shot Action Recognition with Language Knowledge}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2851-2862} }
Space Engage: Collaborative Space Supervision for Contrastive-Based Semi-Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Changqi and Xie, Haoyu and Yuan, Yuhui and Fu, Chong and Yue, Xiangyu}, title = {Space Engage: Collaborative Space Supervision for Contrastive-Based Semi-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {931-942} }
Delving into Motion-Aware Matching for Monocular 3D Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Kuan-Chih and Yang, Ming-Hsuan and Tsai, Yi-Hsuan}, title = {Delving into Motion-Aware Matching for Monocular 3D Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6909-6918} }
SoDaCam: Software-defined Cameras via Single-Photon Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sundar_2023_ICCV, author = {Sundar, Varun and Ardelean, Andrei and Swedish, Tristan and Bruschini, Claudio and Charbon, Edoardo and Gupta, Mohit}, title = {SoDaCam: Software-defined Cameras via Single-Photon Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8165-8176} }
Reference-guided Controllable Inpainting of Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mirzaei_2023_ICCV, author = {Mirzaei, Ashkan and Aumentado-Armstrong, Tristan and Brubaker, Marcus A. and Kelly, Jonathan and Levinshtein, Alex and Derpanis, Konstantinos G. and Gilitschenski, Igor}, title = {Reference-guided Controllable Inpainting of Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17815-17825} }
Diffusion-Guided Reconstruction of Everyday Hand-Object Interaction Clips-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Yufei and Hebbar, Poorvi and Gupta, Abhinav and Tulsiani, Shubham}, title = {Diffusion-Guided Reconstruction of Everyday Hand-Object Interaction Clips}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19717-19728} }
Decoupled Iterative Refinement Framework for Interacting Hands Reconstruction from a Single RGB Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV, author = {Ren, Pengfei and Wen, Chao and Zheng, Xiaozheng and Xue, Zhou and Sun, Haifeng and Qi, Qi and Wang, Jingyu and Liao, Jianxin}, title = {Decoupled Iterative Refinement Framework for Interacting Hands Reconstruction from a Single RGB Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8014-8025} }
Fast Adversarial Training with Smooth Convergence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Mengnan and Zhang, Lihe and Kong, Yuqiu and Yin, Baocai}, title = {Fast Adversarial Training with Smooth Convergence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4720-4729} }
Who Are You Referring To? Coreference Resolution In Image Narrations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Goel_2023_ICCV, author = {Goel, Arushi and Fernando, Basura and Keller, Frank and Bilen, Hakan}, title = {Who Are You Referring To? Coreference Resolution In Image Narrations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15247-15258} }
DVGaze: Dual-View Gaze Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Yihua and Lu, Feng}, title = {DVGaze: Dual-View Gaze Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20632-20641} }
Dynamic Hyperbolic Attention Network for Fine Hand-object Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Leng_2023_ICCV, author = {Leng, Zhiying and Wu, Shun-Cheng and Saleh, Mahdi and Montanaro, Antonio and Yu, Hao and Wang, Yin and Navab, Nassir and Liang, Xiaohui and Tombari, Federico}, title = {Dynamic Hyperbolic Attention Network for Fine Hand-object Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14894-14904} }
A-STAR: Test-time Attention Segregation and Retention for Text-to-image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Agarwal_2023_ICCV, author = {Agarwal, Aishwarya and Karanam, Srikrishna and Joseph, K J and Saxena, Apoorv and Goswami, Koustava and Srinivasan, Balaji Vasan}, title = {A-STAR: Test-time Attention Segregation and Retention for Text-to-image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2283-2293} }
LivePose: Online 3D Reconstruction from Monocular Video with Dynamic Camera Poses-
[pdf]
[arXiv]
[bibtex]@InProceedings{Stier_2023_ICCV, author = {Stier, Noah and Angles, Baptiste and Yang, Liang and Yan, Yajie and Colburn, Alex and Chuang, Ming}, title = {LivePose: Online 3D Reconstruction from Monocular Video with Dynamic Camera Poses}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7921-7930} }
Efficient Joint Optimization of Layer-Adaptive Weight Pruning in Deep Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Kaixin and Wang, Zhe and Geng, Xue and Wu, Min and Li, Xiaoli and Lin, Weisi}, title = {Efficient Joint Optimization of Layer-Adaptive Weight Pruning in Deep Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17447-17457} }
Feature Modulation Transformer: Cross-Refinement of Global Representation via High-Frequency Prior for Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Ao and Zhang, Le and Liu, Yun and Zhu, Ce}, title = {Feature Modulation Transformer: Cross-Refinement of Global Representation via High-Frequency Prior for Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12514-12524} }
Exploring the Sim2Real Gap Using Digital Twins-
[pdf]
[supp]
[bibtex]@InProceedings{Sudhakar_2023_ICCV, author = {Sudhakar, Sruthi and Hanzelka, Jon and Bobillot, Josh and Randhavane, Tanmay and Joshi, Neel and Vineet, Vibhav}, title = {Exploring the Sim2Real Gap Using Digital Twins}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20418-20427} }
MPI-Flow: Learning Realistic Optical Flow with Multiplane Images-
[pdf]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Yingping and Liu, Jiaming and Zhang, Debing and Fu, Ying}, title = {MPI-Flow: Learning Realistic Optical Flow with Multiplane Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13857-13868} }
Re:PolyWorld - A Graph Neural Network for Polygonal Scene Parsing-
[pdf]
[supp]
[bibtex]@InProceedings{Zorzi_2023_ICCV, author = {Zorzi, Stefano and Fraundorfer, Friedrich}, title = {Re:PolyWorld - A Graph Neural Network for Polygonal Scene Parsing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16762-16771} }
FaceCLIPNeRF: Text-driven 3D Face Manipulation using Deformable Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hwang_2023_ICCV, author = {Hwang, Sungwon and Hyung, Junha and Kim, Daejin and Kim, Min-Jung and Choo, Jaegul}, title = {FaceCLIPNeRF: Text-driven 3D Face Manipulation using Deformable Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3469-3479} }
Video State-Changing Object Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Jiangwei and Li, Xiang and Zhao, Xinran and Zhang, Hongming and Wang, Yu-Xiong}, title = {Video State-Changing Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20439-20448} }
Learning Shape Primitives via Implicit Convexity Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Xiaoyang and Zhang, Yi and Chen, Kai and Li, Teng and Zhang, Wenjun and Ni, Bingbing}, title = {Learning Shape Primitives via Implicit Convexity Regularization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3642-3651} }
MonoNeRF: Learning a Generalizable Dynamic Radiance Field from Monocular Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Fengrui and Du, Shaoyi and Duan, Yueqi}, title = {MonoNeRF: Learning a Generalizable Dynamic Radiance Field from Monocular Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17903-17913} }
PG-RCNN: Semantic Surface Point Generation for 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Koo_2023_ICCV, author = {Koo, Inyong and Lee, Inyoung and Kim, Se-Ho and Kim, Hee-Seon and Jeon, Woo-jin and Kim, Changick}, title = {PG-RCNN: Semantic Surface Point Generation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18142-18151} }
ITI-GEN: Inclusive Text-to-Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Cheng and Chen, Xuanbai and Chai, Siqi and Wu, Chen Henry and Lagun, Dmitry and Beeler, Thabo and De la Torre, Fernando}, title = {ITI-GEN: Inclusive Text-to-Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3969-3980} }
Learning Depth Estimation for Transparent and Mirror Surfaces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Costanzino_2023_ICCV, author = {Costanzino, Alex and Ramirez, Pierluigi Zama and Poggi, Matteo and Tosi, Fabio and Mattoccia, Stefano and Di Stefano, Luigi}, title = {Learning Depth Estimation for Transparent and Mirror Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9244-9255} }
Learning Neural Eigenfunctions for Unsupervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deng_2023_ICCV, author = {Deng, Zhijie and Luo, Yucen}, title = {Learning Neural Eigenfunctions for Unsupervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {551-561} }
Shape Analysis of Euclidean Curves under Frenet-Serret Framework-
[pdf]
[supp]
[bibtex]@InProceedings{Chassat_2023_ICCV, author = {Chassat, Perrine and Park, Juhyun and Brunel, Nicolas}, title = {Shape Analysis of Euclidean Curves under Frenet-Serret Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4027-4036} }
Representation Uncertainty in Self-Supervised Learning as Variational Inference-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakamura_2023_ICCV, author = {Nakamura, Hiroki and Okada, Masashi and Taniguchi, Tadahiro}, title = {Representation Uncertainty in Self-Supervised Learning as Variational Inference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16484-16493} }
Efficient Diffusion Training via Min-SNR Weighting Strategy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hang_2023_ICCV, author = {Hang, Tiankai and Gu, Shuyang and Li, Chen and Bao, Jianmin and Chen, Dong and Hu, Han and Geng, Xin and Guo, Baining}, title = {Efficient Diffusion Training via Min-SNR Weighting Strategy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7441-7451} }
Bridging Vision and Language Encoders: Parameter-Efficient Tuning for Referring Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Zunnan and Chen, Zhihong and Zhang, Yong and Song, Yibing and Wan, Xiang and Li, Guanbin}, title = {Bridging Vision and Language Encoders: Parameter-Efficient Tuning for Referring Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17503-17512} }
Towards Zero-Shot Scale-Aware Monocular Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guizilini_2023_ICCV, author = {Guizilini, Vitor and Vasiljevic, Igor and Chen, Dian and Ambruș, Rareș and Gaidon, Adrien}, title = {Towards Zero-Shot Scale-Aware Monocular Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9233-9243} }
ATT3D: Amortized Text-to-3D Object Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lorraine_2023_ICCV, author = {Lorraine, Jonathan and Xie, Kevin and Zeng, Xiaohui and Lin, Chen-Hsuan and Takikawa, Towaki and Sharp, Nicholas and Lin, Tsung-Yi and Liu, Ming-Yu and Fidler, Sanja and Lucas, James}, title = {ATT3D: Amortized Text-to-3D Object Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17946-17956} }
Virtual Try-On with Pose-Garment Keypoints Guided Inpainting-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhi and Wei, Pengfei and Yin, Xiang and Ma, Zejun and Kot, Alex C.}, title = {Virtual Try-On with Pose-Garment Keypoints Guided Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22788-22797} }
Learning by Sorting: Self-supervised Learning with Group Ordering Constraints-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shvetsova_2023_ICCV, author = {Shvetsova, Nina and Petersen, Felix and Kukleva, Anna and Schiele, Bernt and Kuehne, Hilde}, title = {Learning by Sorting: Self-supervised Learning with Group Ordering Constraints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16453-16463} }
Cross Modal Transformer: Towards Fast and Robust 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, Junjie and Liu, Yingfei and Sun, Jianjian and Jia, Fan and Li, Shuailin and Wang, Tiancai and Zhang, Xiangyu}, title = {Cross Modal Transformer: Towards Fast and Robust 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18268-18278} }
Perceptual Grouping in Contrastive Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ranasinghe_2023_ICCV, author = {Ranasinghe, Kanchana and McKinzie, Brandon and Ravi, Sachin and Yang, Yinfei and Toshev, Alexander and Shlens, Jonathon}, title = {Perceptual Grouping in Contrastive Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5571-5584} }
Dynamic Perceiver for Efficient Visual Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Yizeng and Han, Dongchen and Liu, Zeyu and Wang, Yulin and Pan, Xuran and Pu, Yifan and Deng, Chao and Feng, Junlan and Song, Shiji and Huang, Gao}, title = {Dynamic Perceiver for Efficient Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5992-6002} }
MoTIF: Learning Motion Trajectories with Local Implicit Neural Functions for Continuous Space-Time Video Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yi-Hsin and Chen, Si-Cun and Chen, Yi-Hsin and Lin, Yen-Yu and Peng, Wen-Hsiao}, title = {MoTIF: Learning Motion Trajectories with Local Implicit Neural Functions for Continuous Space-Time Video Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23131-23141} }
CRN: Camera Radar Net for Accurate, Robust, Efficient 3D Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Youngseok and Shin, Juyeb and Kim, Sanmin and Lee, In-Jae and Choi, Jun Won and Kum, Dongsuk}, title = {CRN: Camera Radar Net for Accurate, Robust, Efficient 3D Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17615-17626} }
PromptStyler: Prompt-driven Style Generation for Source-free Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Junhyeong and Nam, Gilhyun and Kim, Sungyeon and Yang, Hunmin and Kwak, Suha}, title = {PromptStyler: Prompt-driven Style Generation for Source-free Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15702-15712} }
Phasic Content Fusing Diffusion Model with Directional Distribution Consistency for Few-Shot Model Adaption-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Teng and Zhang, Jiangning and Liu, Liang and Yi, Ran and Kou, Siqi and Zhu, Haokun and Chen, Xu and Wang, Yabiao and Wang, Chengjie and Ma, Lizhuang}, title = {Phasic Content Fusing Diffusion Model with Directional Distribution Consistency for Few-Shot Model Adaption}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2406-2415} }
SVQNet: Sparse Voxel-Adjacent Query Network for 4D Spatio-Temporal LiDAR Semantic Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xuechao and Xu, Shuangjie and Zou, Xiaoyi and Cao, Tongyi and Yeung, Dit-Yan and Fang, Lu}, title = {SVQNet: Sparse Voxel-Adjacent Query Network for 4D Spatio-Temporal LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8569-8578} }
HAL3D: Hierarchical Active Learning for Fine-Grained 3D Part Labeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Fenggen and Qian, Yiming and Gil-Ureta, Francisca and Jackson, Brian and Bennett, Eric and Zhang, Hao}, title = {HAL3D: Hierarchical Active Learning for Fine-Grained 3D Part Labeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {865-875} }
MEFLUT: Unsupervised 1D Lookup Tables for Multi-exposure Image Fusion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Ting and Wang, Chuan and Li, Xinpeng and Li, Ru and Fan, Haoqiang and Liu, Shuaicheng}, title = {MEFLUT: Unsupervised 1D Lookup Tables for Multi-exposure Image Fusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10542-10551} }
FedPerfix: Towards Partial Model Personalization of Vision Transformers in Federated Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Guangyu and Mendieta, Matias and Luo, Jun and Wu, Shandong and Chen, Chen}, title = {FedPerfix: Towards Partial Model Personalization of Vision Transformers in Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4988-4998} }
Conditional 360-degree Image Synthesis for Immersive Indoor Scene Decoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shum_2023_ICCV, author = {Shum, Ka Chun and Pang, Hong-Wing and Hua, Binh-Son and Nguyen, Duc Thanh and Yeung, Sai-Kit}, title = {Conditional 360-degree Image Synthesis for Immersive Indoor Scene Decoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4478-4488} }
The Unreasonable Effectiveness of Large Language-Vision Models for Source-Free Video Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zara_2023_ICCV, author = {Zara, Giacomo and Conti, Alessandro and Roy, Subhankar and Lathuili\`ere, St\'ephane and Rota, Paolo and Ricci, Elisa}, title = {The Unreasonable Effectiveness of Large Language-Vision Models for Source-Free Video Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10307-10317} }
SIDGAN: High-Resolution Dubbed Video Generation via Shift-Invariant Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Muaz_2023_ICCV, author = {Muaz, Urwa and Jang, Wondong and Tripathi, Rohun and Mani, Santhosh and Ouyang, Wenbin and Gadde, Ravi Teja and Gecer, Baris and Elizondo, Sergio and Madad, Reza and Nair, Naveen}, title = {SIDGAN: High-Resolution Dubbed Video Generation via Shift-Invariant Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7833-7842} }
Meta-ZSDETR: Zero-shot DETR with Meta-learning-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Lu and Zhang, Chenbo and Zhao, Jiajia and Guan, Jihong and Zhou, Shuigeng}, title = {Meta-ZSDETR: Zero-shot DETR with Meta-learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6845-6854} }
GaPro: Box-Supervised 3D Point Cloud Instance Segmentation Using Gaussian Processes as Pseudo Labelers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ngo_2023_ICCV, author = {Ngo, Tuan Duc and Hua, Binh-Son and Nguyen, Khoi}, title = {GaPro: Box-Supervised 3D Point Cloud Instance Segmentation Using Gaussian Processes as Pseudo Labelers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17794-17803} }
STPrivacy: Spatio-Temporal Privacy-Preserving Action Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Ming and Xu, Xiangyu and Fan, Hehe and Zhou, Pan and Liu, Jun and Liu, Jia-Wei and Li, Jiahe and Keppo, Jussi and Shou, Mike Zheng and Yan, Shuicheng}, title = {STPrivacy: Spatio-Temporal Privacy-Preserving Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5106-5115} }
Get the Best of Both Worlds: Improving Accuracy and Transferability by Grassmann Class Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Haoqi and Li, Zhizhong and Zhang, Wayne}, title = {Get the Best of Both Worlds: Improving Accuracy and Transferability by Grassmann Class Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22478-22487} }
Computationally-Efficient Neural Image Compression with Shallow Decoders-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yibo and Mandt, Stephan}, title = {Computationally-Efficient Neural Image Compression with Shallow Decoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {530-540} }
ObjectSDF++: Improved Object-Compositional Neural Implicit Surfaces-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Qianyi and Wang, Kaisiyuan and Li, Kejie and Zheng, Jianmin and Cai, Jianfei}, title = {ObjectSDF++: Improved Object-Compositional Neural Implicit Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21764-21774} }
Tracing the Origin of Adversarial Attack for Forensic Investigation and Deterrence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fang_2023_ICCV, author = {Fang, Han and Zhang, Jiyi and Qiu, Yupeng and Liu, Jiayang and Xu, Ke and Fang, Chengfang and Chang, Ee-Chien}, title = {Tracing the Origin of Adversarial Attack for Forensic Investigation and Deterrence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4335-4344} }
Sketch and Text Guided Diffusion Model for Colored Point Cloud Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Zijie and Wang, Yaonan and Feng, Mingtao and Xie, He and Mian, Ajmal}, title = {Sketch and Text Guided Diffusion Model for Colored Point Cloud Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8929-8939} }
Scenimefy: Learning to Craft Anime Scene via Semi-Supervised Image-to-Image Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Yuxin and Jiang, Liming and Yang, Shuai and Loy, Chen Change}, title = {Scenimefy: Learning to Craft Anime Scene via Semi-Supervised Image-to-Image Translation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7357-7367} }
Towards Unsupervised Domain Generalization for Face Anti-Spoofing-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yuchen and Chen, Yabo and Gou, Mengran and Huang, Chun-Ting and Wang, Yaoming and Dai, Wenrui and Xiong, Hongkai}, title = {Towards Unsupervised Domain Generalization for Face Anti-Spoofing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20654-20664} }
DR-Tune: Improving Fine-tuning of Pretrained Visual Models by Distribution Regularization with Semantic Calibration-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Nan and Chen, Jiaxin and Huang, Di}, title = {DR-Tune: Improving Fine-tuning of Pretrained Visual Models by Distribution Regularization with Semantic Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1547-1556} }
MotionDeltaCNN: Sparse CNN Inference of Frame Differences in Moving Camera Videos with Spherical Buffers and Padded Convolutions-
[pdf]
[supp]
[bibtex]@InProceedings{Parger_2023_ICCV, author = {Parger, Mathias and Tang, Chengcheng and Neff, Thomas and Twigg, Christopher D. and Keskin, Cem and Wang, Robert and Steinberger, Markus}, title = {MotionDeltaCNN: Sparse CNN Inference of Frame Differences in Moving Camera Videos with Spherical Buffers and Padded Convolutions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17292-17301} }
General Image-to-Image Translation with One-Shot Image Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Bin and Liu, Zuhao and Peng, Yunbo and Lin, Yue}, title = {General Image-to-Image Translation with One-Shot Image Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22736-22746} }
Dense 2D-3D Indoor Prediction with Sound via Aligned Cross-Modal Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yun_2023_ICCV, author = {Yun, Heeseung and Na, Joonil and Kim, Gunhee}, title = {Dense 2D-3D Indoor Prediction with Sound via Aligned Cross-Modal Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7863-7872} }
Leveraging SE(3) Equivariance for Learning 3D Geometric Shape Assembly-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Ruihai and Tie, Chenrui and Du, Yushi and Zhao, Yan and Dong, Hao}, title = {Leveraging SE(3) Equivariance for Learning 3D Geometric Shape Assembly}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14311-14320} }
Adversarial Bayesian Augmentation for Single-Source Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Sheng and Gokhale, Tejas and Yang, Yezhou}, title = {Adversarial Bayesian Augmentation for Single-Source Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11400-11410} }
Robust Geometry-Preserving Depth Estimation Using Differentiable Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Chi and Yin, Wei and Yu, Gang and Wang, Zhibin and Chen, Tao and Fu, Bin and Zhou, Joey Tianyi and Shen, Chunhua}, title = {Robust Geometry-Preserving Depth Estimation Using Differentiable Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8951-8961} }
Self-regulating Prompts: Foundational Model Adaptation without Forgetting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khattak_2023_ICCV, author = {Khattak, Muhammad Uzair and Wasim, Syed Talal and Naseer, Muzammal and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz}, title = {Self-regulating Prompts: Foundational Model Adaptation without Forgetting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15190-15200} }
ASM: Adaptive Skinning Model for High-Quality 3D Face Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Kai and Shang, Hong and Shi, Tianyang and Chen, Xinghan and Zhou, Jingkai and Sun, Zhongqian and Yang, Wei}, title = {ASM: Adaptive Skinning Model for High-Quality 3D Face Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20708-20717} }
EverLight: Indoor-Outdoor Editable HDR Lighting Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dastjerdi_2023_ICCV, author = {Dastjerdi, Mohammad Reza Karimi and Eisenmann, Jonathan and Hold-Geoffroy, Yannick and Lalonde, Jean-Fran\c{c}ois}, title = {EverLight: Indoor-Outdoor Editable HDR Lighting Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7420-7429} }
MARS: Model-agnostic Biased Object Removal without Additional Supervision for Weakly-Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jo_2023_ICCV, author = {Jo, Sanghyun and Yu, In-Jae and Kim, Kyungsu}, title = {MARS: Model-agnostic Biased Object Removal without Additional Supervision for Weakly-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {614-623} }
CAFA: Class-Aware Feature Alignment for Test-Time Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jung_2023_ICCV, author = {Jung, Sanghun and Lee, Jungsoo and Kim, Nanhee and Shaban, Amirreza and Boots, Byron and Choo, Jaegul}, title = {CAFA: Class-Aware Feature Alignment for Test-Time Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19060-19071} }
Learning Clothing and Pose Invariant 3D Shape Representation for Long-Term Person Re-Identification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Feng and Kim, Minchul and Gu, ZiAng and Jain, Anil and Liu, Xiaoming}, title = {Learning Clothing and Pose Invariant 3D Shape Representation for Long-Term Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19617-19626} }
Agile Modeling: From Concept to Classifier in Minutes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stretcu_2023_ICCV, author = {Stretcu, Otilia and Vendrow, Edward and Hata, Kenji and Viswanathan, Krishnamurthy and Ferrari, Vittorio and Tavakkol, Sasan and Zhou, Wenlei and Avinash, Aditya and Luo, Emming and Alldrin, Neil Gordon and Bateni, MohammadHossein and Berger, Gabriel and Bunner, Andrew and Lu, Chun-Ta and Rey, Javier and DeSalvo, Giulia and Krishna, Ranjay and Fuxman, Ariel}, title = {Agile Modeling: From Concept to Classifier in Minutes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22323-22334} }
Improving Lens Flare Removal with General-Purpose Pipeline and Multiple Light Sources Recovery-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yuyan and Liang, Dong and Chen, Songcan and Huang, Sheng-Jun and Yang, Shuo and Li, Chongyi}, title = {Improving Lens Flare Removal with General-Purpose Pipeline and Multiple Light Sources Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12969-12979} }
FACET: Fairness in Computer Vision Evaluation Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gustafson_2023_ICCV, author = {Gustafson, Laura and Rolland, Chloe and Ravi, Nikhila and Duval, Quentin and Adcock, Aaron and Fu, Cheng-Yang and Hall, Melissa and Ross, Candace}, title = {FACET: Fairness in Computer Vision Evaluation Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20370-20382} }
Few-Shot Physically-Aware Articulated Mesh Generation via Hierarchical Deformation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xueyi and Wang, Bin and Wang, He and Yi, Li}, title = {Few-Shot Physically-Aware Articulated Mesh Generation via Hierarchical Deformation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {854-864} }
Single-Stage Diffusion NeRF: A Unified Approach to 3D Generation and Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Hansheng and Gu, Jiatao and Chen, Anpei and Tian, Wei and Tu, Zhuowen and Liu, Lingjie and Su, Hao}, title = {Single-Stage Diffusion NeRF: A Unified Approach to 3D Generation and Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2416-2425} }
DCPB: Deformable Convolution Based on the Poincare Ball for Top-view Fisheye Cameras-
[pdf]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Xuan and Ran, Zhidan and Lu, Xiaobo}, title = {DCPB: Deformable Convolution Based on the Poincare Ball for Top-view Fisheye Cameras}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13308-13317} }
Integrating Boxes and Masks: A Multi-Object Framework for Unified Visual Tracking and Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yuanyou and Yang, Zongxin and Yang, Yi}, title = {Integrating Boxes and Masks: A Multi-Object Framework for Unified Visual Tracking and Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9738-9751} }
One-Shot Generative Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Ceyuan and Shen, Yujun and Zhang, Zhiyi and Xu, Yinghao and Zhu, Jiapeng and Wu, Zhirong and Zhou, Bolei}, title = {One-Shot Generative Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7733-7742} }
Prototypes-oriented Transductive Few-shot Learning with Conditional Transport-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Long and Feng, Jingyi and Chai, Xiaoqiang and Chen, Wenchao and Wang, Liming and Liu, Xiyang and Chen, Bo}, title = {Prototypes-oriented Transductive Few-shot Learning with Conditional Transport}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16317-16326} }
SparseFusion: Fusing Multi-Modal Sparse Representations for Multi-Sensor 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Yichen and Xu, Chenfeng and Rakotosaona, Marie-Julie and Rim, Patrick and Tombari, Federico and Keutzer, Kurt and Tomizuka, Masayoshi and Zhan, Wei}, title = {SparseFusion: Fusing Multi-Modal Sparse Representations for Multi-Sensor 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17591-17602} }
DetermiNet: A Large-Scale Diagnostic Dataset for Complex Visually-Grounded Referencing using Determiners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Clarence and Kumar, M Ganesh and Tan, Cheston}, title = {DetermiNet: A Large-Scale Diagnostic Dataset for Complex Visually-Grounded Referencing using Determiners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20019-20028} }
3DMOTFormer: Graph Transformer for Online 3D Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV, author = {Ding, Shuxiao and Rehder, Eike and Schneider, Lukas and Cordts, Marius and Gall, Juergen}, title = {3DMOTFormer: Graph Transformer for Online 3D Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9784-9794} }
ReGen: A good Generative Zero-Shot Video Classifier Should be Rewarded-
[pdf]
[supp]
[bibtex]@InProceedings{Bulat_2023_ICCV, author = {Bulat, Adrian and Sanchez, Enrique and Martinez, Brais and Tzimiropoulos, Georgios}, title = {ReGen: A good Generative Zero-Shot Video Classifier Should be Rewarded}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13523-13533} }
Complementary Domain Adaptation and Generalization for Unsupervised Continual Domain Shift Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Wonguk and Park, Jinha and Kim, Taesup}, title = {Complementary Domain Adaptation and Generalization for Unsupervised Continual Domain Shift Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11442-11452} }
RICO: Regularizing the Unobservable for Indoor Compositional Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zizhang and Lyu, Xiaoyang and Ding, Yuanyuan and Wang, Mengmeng and Liao, Yiyi and Liu, Yong}, title = {RICO: Regularizing the Unobservable for Indoor Compositional Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17761-17771} }
Ordered Atomic Activity for Fine-grained Interactive Traffic Scenario Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Agarwal_2023_ICCV, author = {Agarwal, Nakul and Chen, Yi-Ting}, title = {Ordered Atomic Activity for Fine-grained Interactive Traffic Scenario Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8624-8636} }
CO-PILOT: Dynamic Top-Down Point Cloud with Conditional Neighborhood Aggregation for Multi-Gigapixel Histopathology Image Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Nakhli_2023_ICCV, author = {Nakhli, Ramin and Zhang, Allen and Mirabadi, Ali and Rich, Katherine and Asadi, Maryam and Gilks, Blake and Farahani, Hossein and Bashashati, Ali}, title = {CO-PILOT: Dynamic Top-Down Point Cloud with Conditional Neighborhood Aggregation for Multi-Gigapixel Histopathology Image Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21063-21073} }
Troubleshooting Ethnic Quality Bias with Curriculum Domain Adaptation for Face Image Quality Assessment-
[pdf]
[bibtex]@InProceedings{Ou_2023_ICCV, author = {Ou, Fu-Zhao and Chen, Baoliang and Li, Chongyi and Wang, Shiqi and Kwong, Sam}, title = {Troubleshooting Ethnic Quality Bias with Curriculum Domain Adaptation for Face Image Quality Assessment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20718-20729} }
HybridAugment++: Unified Frequency Spectra Perturbations for Model Robustness-
[pdf]
[supp]
[bibtex]@InProceedings{Yucel_2023_ICCV, author = {Yucel, Mehmet Kerim and Cinbis, Ramazan Gokberk and Duygulu, Pinar}, title = {HybridAugment++: Unified Frequency Spectra Perturbations for Model Robustness}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5718-5728} }
CLR: Channel-wise Lightweight Reprogramming for Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Yunhao and Li, Yuecheng and Ni, Shuo and Zhao, Jiaping and Yang, Ming-Hsuan and Itti, Laurent}, title = {CLR: Channel-wise Lightweight Reprogramming for Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18798-18808} }
IOMatch: Simplifying Open-Set Semi-Supervised Learning with Joint Inliers and Outliers Utilization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zekun and Qi, Lei and Shi, Yinghuan and Gao, Yang}, title = {IOMatch: Simplifying Open-Set Semi-Supervised Learning with Joint Inliers and Outliers Utilization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15870-15879} }
Hierarchical Point-based Active Learning for Semi-supervised Point Cloud Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Zongyi and Yuan, Bo and Zhao, Shanshan and Zhang, Qianni and Gao, Xinbo}, title = {Hierarchical Point-based Active Learning for Semi-supervised Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18098-18108} }
Doppelgangers: Learning to Disambiguate Images of Similar Structures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Ruojin and Tung, Joseph and Wang, Qianqian and Averbuch-Elor, Hadar and Hariharan, Bharath and Snavely, Noah}, title = {Doppelgangers: Learning to Disambiguate Images of Similar Structures}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {34-44} }
BEV-DG: Cross-Modal Learning under Bird's-Eye View for Domain Generalization of 3D Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Miaoyu and Zhang, Yachao and Ma, Xu and Qu, Yanyun and Fu, Yun}, title = {BEV-DG: Cross-Modal Learning under Bird's-Eye View for Domain Generalization of 3D Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11632-11642} }
Grounded Entity-Landmark Adaptive Pre-Training for Vision-and-Language Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cui_2023_ICCV, author = {Cui, Yibo and Xie, Liang and Zhang, Yakun and Zhang, Meishan and Yan, Ye and Yin, Erwei}, title = {Grounded Entity-Landmark Adaptive Pre-Training for Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12043-12053} }
Lip Reading for Low-resource Languages by Learning and Combining General Speech Knowledge and Language-specific Knowledge-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Minsu and Yeo, Jeong Hun and Choi, Jeongsoo and Ro, Yong Man}, title = {Lip Reading for Low-resource Languages by Learning and Combining General Speech Knowledge and Language-specific Knowledge}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15359-15371} }
Quality-Agnostic Deepfake Detection with Intra-model Collaborative Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_2023_ICCV, author = {Le, Binh M. and Woo, Simon S.}, title = {Quality-Agnostic Deepfake Detection with Intra-model Collaborative Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22378-22389} }
Object-Centric Multiple Object Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Zixu and Wang, Jiaze and Horn, Max and Ding, Yizhuo and He, Tong and Bai, Zechen and Zietlow, Dominik and Simon-Gabriel, Carl-Johann and Shuai, Bing and Tu, Zhuowen and Brox, Thomas and Schiele, Bernt and Fu, Yanwei and Locatello, Francesco and Zhang, Zheng and Xiao, Tianjun}, title = {Object-Centric Multiple Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16601-16611} }
Point-TTA: Test-Time Adaptation for Point Cloud Registration Using Multitask Meta-Auxiliary Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Hatem_2023_ICCV, author = {Hatem, Ahmed and Qian, Yiming and Wang, Yang}, title = {Point-TTA: Test-Time Adaptation for Point Cloud Registration Using Multitask Meta-Auxiliary Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16494-16504} }
HopFIR: Hop-wise GraphFormer with Intragroup Joint Refinement for 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Kai and Nie, Qiang and Ouyang, Bo and Li, Xiang and Yang, Shanlin}, title = {HopFIR: Hop-wise GraphFormer with Intragroup Joint Refinement for 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14985-14995} }
Improving Generalization of Adversarial Training via Robust Critical Fine-Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Kaijie and Hu, Xixu and Wang, Jindong and Xie, Xing and Yang, Ge}, title = {Improving Generalization of Adversarial Training via Robust Critical Fine-Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4424-4434} }
Minimal Solutions to Generalized Three-View Relative Pose Problem-
[pdf]
[supp]
[bibtex]@InProceedings{Ding_2023_ICCV, author = {Ding, Yaqing and Chien, Chiang-Heng and Larsson, Viktor and \r{A}str\"om, Karl and Kimia, Benjamin}, title = {Minimal Solutions to Generalized Three-View Relative Pose Problem}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8156-8164} }
Trajectory Unified Transformer for Pedestrian Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Liushuai and Wang, Le and Zhou, Sanping and Hua, Gang}, title = {Trajectory Unified Transformer for Pedestrian Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9675-9684} }
Understanding the Feature Norm for Out-of-Distribution Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Jaewoo and Chai, Jacky Chen Long and Yoon, Jaeho and Teoh, Andrew Beng Jin}, title = {Understanding the Feature Norm for Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1557-1567} }
MHEntropy: Entropy Meets Multiple Hypotheses for Pose and Shape Recovery-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Rongyu and Yang, Linlin and Yao, Angela}, title = {MHEntropy: Entropy Meets Multiple Hypotheses for Pose and Shape Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14840-14849} }
uSplit: Image Decomposition for Fluorescence Microscopy-
[pdf]
[supp]
[bibtex]@InProceedings{Ashesh_2023_ICCV, author = {Ashesh, Ashesh and Krull, Alexander and Di Sante, Moises and Pasqualini, Francesco and Jug, Florian}, title = {uSplit: Image Decomposition for Fluorescence Microscopy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21219-21229} }
Modeling the Relative Visual Tempo for Self-supervised Skeleton-based Action Recognition-
[pdf]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Yisheng and Han, Hu and Yu, Zhengtao and Liu, Guangcan}, title = {Modeling the Relative Visual Tempo for Self-supervised Skeleton-based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13913-13922} }
LightGlue: Local Feature Matching at Light Speed-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lindenberger_2023_ICCV, author = {Lindenberger, Philipp and Sarlin, Paul-Edouard and Pollefeys, Marc}, title = {LightGlue: Local Feature Matching at Light Speed}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17627-17638} }
Masked Autoencoders are Efficient Class Incremental Learners-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Jiang-Tian and Liu, Xialei and Bagdanov, Andrew D. and Li, Ke and Cheng, Ming-Ming}, title = {Masked Autoencoders are Efficient Class Incremental Learners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19104-19113} }
Knowledge Proxy Intervention for Deconfounded Video Question Answering-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiangtong and Niu, Li and Zhang, Liqing}, title = {Knowledge Proxy Intervention for Deconfounded Video Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2782-2793} }
Towards Semi-supervised Learning with Non-random Missing Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Duan_2023_ICCV, author = {Duan, Yue and Zhao, Zhen and Qi, Lei and Zhou, Luping and Wang, Lei and Shi, Yinghuan}, title = {Towards Semi-supervised Learning with Non-random Missing Labels}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16121-16131} }
DetZero: Rethinking Offboard 3D Object Detection with Long-term Sequential Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Tao and Yang, Xuemeng and Zhou, Hongbin and Li, Xin and Shi, Botian and Liu, Junjie and Yang, Yuchen and Liu, Zhizheng and He, Liang and Qiao, Yu and Li, Yikang and Li, Hongsheng}, title = {DetZero: Rethinking Offboard 3D Object Detection with Long-term Sequential Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6736-6747} }
ImbSAM: A Closer Look at Sharpness-Aware Minimization in Class-Imbalanced Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yixuan and Qu, Yi and Xu, Xing and Shen, Hengtao}, title = {ImbSAM: A Closer Look at Sharpness-Aware Minimization in Class-Imbalanced Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11345-11355} }
Learning from Noisy Data for Semi-Supervised 3D Object Detection-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zehui and Li, Zhenyu and Wang, Shuo and Fu, Dengpan and Zhao, Feng}, title = {Learning from Noisy Data for Semi-Supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6929-6939} }
NeRFrac: Neural Radiance Fields through Refractive Surface-
[pdf]
[supp]
[bibtex]@InProceedings{Zhan_2023_ICCV, author = {Zhan, Yifan and Nobuhara, Shohei and Nishino, Ko and Zheng, Yinqiang}, title = {NeRFrac: Neural Radiance Fields through Refractive Surface}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18402-18412} }
MonoDETR: Depth-guided Transformer for Monocular 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Renrui and Qiu, Han and Wang, Tai and Guo, Ziyu and Cui, Ziteng and Qiao, Yu and Li, Hongsheng and Gao, Peng}, title = {MonoDETR: Depth-guided Transformer for Monocular 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9155-9166} }
Towards Authentic Face Restoration with Iterative Diffusion Models and Beyond-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Yang and Hou, Tingbo and Su, Yu-Chuan and Jia, Xuhui and Li, Yandong and Grundmann, Matthias}, title = {Towards Authentic Face Restoration with Iterative Diffusion Models and Beyond}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7312-7322} }
LivelySpeaker: Towards Semantic-Aware Co-Speech Gesture Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhi_2023_ICCV, author = {Zhi, Yihao and Cun, Xiaodong and Chen, Xuelin and Shen, Xi and Guo, Wen and Huang, Shaoli and Gao, Shenghua}, title = {LivelySpeaker: Towards Semantic-Aware Co-Speech Gesture Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20807-20817} }
Contrastive Feature Masking Open-Vocabulary Vision Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Dahun and Angelova, Anelia and Kuo, Weicheng}, title = {Contrastive Feature Masking Open-Vocabulary Vision Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15602-15612} }
Group DETR: Fast DETR Training with Group-Wise One-to-Many Assignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Qiang and Chen, Xiaokang and Wang, Jian and Zhang, Shan and Yao, Kun and Feng, Haocheng and Han, Junyu and Ding, Errui and Zeng, Gang and Wang, Jingdong}, title = {Group DETR: Fast DETR Training with Group-Wise One-to-Many Assignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6633-6642} }
Preventing Zero-Shot Transfer Degradation in Continual Learning of Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Zangwei and Ma, Mingyuan and Wang, Kai and Qin, Ziheng and Yue, Xiangyu and You, Yang}, title = {Preventing Zero-Shot Transfer Degradation in Continual Learning of Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19125-19136} }
Personalized Image Generation for Color Vision Deficiency Population-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Shuyi and Liu, Daochang and Li, Dingquan and Xu, Chang}, title = {Personalized Image Generation for Color Vision Deficiency Population}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22571-22580} }
EGC: Image Generation and Classification via a Diffusion Energy-Based Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Qiushan and Ma, Chuofan and Jiang, Yi and Yuan, Zehuan and Yu, Yizhou and Luo, Ping}, title = {EGC: Image Generation and Classification via a Diffusion Energy-Based Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22952-22962} }
OccFormer: Dual-path Transformer for Vision-based 3D Semantic Occupancy Prediction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yunpeng and Zhu, Zheng and Du, Dalong}, title = {OccFormer: Dual-path Transformer for Vision-based 3D Semantic Occupancy Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9433-9443} }
Probabilistic Triangulation for Uncalibrated Multi-View 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Boyuan and Hu, Lei and Xia, Shihong}, title = {Probabilistic Triangulation for Uncalibrated Multi-View 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14850-14860} }
Joint Metrics Matter: A Better Standard for Trajectory Forecasting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Weng_2023_ICCV, author = {Weng, Erica and Hoshino, Hana and Ramanan, Deva and Kitani, Kris}, title = {Joint Metrics Matter: A Better Standard for Trajectory Forecasting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20315-20326} }
TORE: Token Reduction for Efficient Human Mesh Recovery with Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dou_2023_ICCV, author = {Dou, Zhiyang and Wu, Qingxuan and Lin, Cheng and Cao, Zeyu and Wu, Qiangqiang and Wan, Weilin and Komura, Taku and Wang, Wenping}, title = {TORE: Token Reduction for Efficient Human Mesh Recovery with Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15143-15155} }
Test Time Adaptation for Blind Image Quality Assessment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roy_2023_ICCV, author = {Roy, Subhadeep and Mitra, Shankhanil and Biswas, Soma and Soundararajan, Rajiv}, title = {Test Time Adaptation for Blind Image Quality Assessment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16742-16751} }
GeT: Generative Target Structure Debiasing for Domain Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Can and Lee, Gim Hee}, title = {GeT: Generative Target Structure Debiasing for Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23577-23588} }
D3G: Exploring Gaussian Prior for Temporal Sentence Grounding with Glance Annotation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Hanjun and Shu, Xiujun and He, Sunan and Qiao, Ruizhi and Wen, Wei and Guo, Taian and Gan, Bei and Sun, Xing}, title = {D3G: Exploring Gaussian Prior for Temporal Sentence Grounding with Glance Annotation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13734-13746} }
GEDepth: Ground Embedding for Monocular Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xiaodong and Ma, Zhuang and Ji, Zhiyu and Ren, Zhe}, title = {GEDepth: Ground Embedding for Monocular Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12719-12727} }
DETRs with Collaborative Hybrid Assignments Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zong_2023_ICCV, author = {Zong, Zhuofan and Song, Guanglu and Liu, Yu}, title = {DETRs with Collaborative Hybrid Assignments Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6748-6758} }
Animal3D: A Comprehensive Dataset of 3D Animal Pose and Shape-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Jiacong and Zhang, Yi and Peng, Jiawei and Ma, Wufei and Jesslen, Artur and Ji, Pengliang and Hu, Qixin and Zhang, Jiehua and Liu, Qihao and Wang, Jiahao and Ji, Wei and Wang, Chen and Yuan, Xiaoding and Kaushik, Prakhar and Zhang, Guofeng and Liu, Jie and Xie, Yushan and Cui, Yawen and Yuille, Alan and Kortylewski, Adam}, title = {Animal3D: A Comprehensive Dataset of 3D Animal Pose and Shape}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9099-9109} }
Rethinking Video Frame Interpolation from Shutter Mode Induced Degradation-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Xiang and Wang, Zhixiang and Zhong, Zhihang and Zheng, Yinqiang}, title = {Rethinking Video Frame Interpolation from Shutter Mode Induced Degradation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12259-12268} }
Multi-Modal Neural Radiance Field for Monocular Dense SLAM with a Light-Weight ToF Sensor-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xinyang and Li, Yijin and Teng, Yanbin and Bao, Hujun and Zhang, Guofeng and Zhang, Yinda and Cui, Zhaopeng}, title = {Multi-Modal Neural Radiance Field for Monocular Dense SLAM with a Light-Weight ToF Sensor}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1-11} }
MonoNeRD: NeRF-like Representations for Monocular 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Junkai and Peng, Liang and Cheng, Haoran and Li, Hao and Qian, Wei and Li, Ke and Wang, Wenxiao and Cai, Deng}, title = {MonoNeRD: NeRF-like Representations for Monocular 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6814-6824} }
Monocular 3D Object Detection with Bounding Box Denoising in 3D by Perceiver-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xianpeng and Zheng, Ce and Cheng, Kelvin B and Xue, Nan and Qi, Guo-Jun and Wu, Tianfu}, title = {Monocular 3D Object Detection with Bounding Box Denoising in 3D by Perceiver}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6436-6446} }
Point-SLAM: Dense Neural Point Cloud-based SLAM-
[pdf]
[supp]
[bibtex]@InProceedings{Sandstrom_2023_ICCV, author = {Sandstr\"om, Erik and Li, Yue and Van Gool, Luc and Oswald, Martin R.}, title = {Point-SLAM: Dense Neural Point Cloud-based SLAM}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18433-18444} }
TrajectoryFormer: 3D Object Tracking Transformer with Predictive Trajectory Hypotheses-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xuesong and Shi, Shaoshuai and Zhang, Chao and Zhu, Benjin and Wang, Qiang and Cheung, Ka Chun and See, Simon and Li, Hongsheng}, title = {TrajectoryFormer: 3D Object Tracking Transformer with Predictive Trajectory Hypotheses}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18527-18536} }
Semantic-Aware Dynamic Parameter for Video Inpainting Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Eunhye and Yoo, Jinsu and Yang, Yunjeong and Baik, Sungyong and Kim, Tae Hyun}, title = {Semantic-Aware Dynamic Parameter for Video Inpainting Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12949-12958} }
See More and Know More: Zero-shot Point Cloud Segmentation via Multi-modal Visual Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Yuhang and Jiang, Qi and Chen, Runnan and Hou, Yuenan and Zhu, Xinge and Ma, Yuexin}, title = {See More and Know More: Zero-shot Point Cloud Segmentation via Multi-modal Visual Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21674-21684} }
SKED: Sketch-guided Text-based 3D Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mikaeili_2023_ICCV, author = {Mikaeili, Aryan and Perel, Or and Safaee, Mehdi and Cohen-Or, Daniel and Mahdavi-Amiri, Ali}, title = {SKED: Sketch-guided Text-based 3D Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14607-14619} }
WaveIPT: Joint Attention and Flow Alignment in the Wavelet domain for Pose Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Liyuan and Gao, Tingwei and Jiang, Haitian and Shen, Haibin and Huang, Kejie}, title = {WaveIPT: Joint Attention and Flow Alignment in the Wavelet domain for Pose Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7215-7225} }
Editable Image Geometric Abstraction via Neural Primitive Assembly-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Ye and Ni, Bingbing and Chen, Xuanhong and Hu, Zhangli}, title = {Editable Image Geometric Abstraction via Neural Primitive Assembly}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23514-23523} }
Homeomorphism Alignment for Unsupervised Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Lihua and Ye, Mao and Zhu, Xiatian and Xiao, Siying and Fan, Xu-Qian and Neri, Ferrante}, title = {Homeomorphism Alignment for Unsupervised Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18699-18710} }
MBPTrack: Improving 3D Point Cloud Tracking with Memory Networks and Box Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Tian-Xing and Guo, Yuan-Chen and Lai, Yu-Kun and Zhang, Song-Hai}, title = {MBPTrack: Improving 3D Point Cloud Tracking with Memory Networks and Box Priors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9911-9920} }
Novel-View Synthesis and Pose Estimation for Hand-Object Interaction from Sparse Views-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qu_2023_ICCV, author = {Qu, Wentian and Cui, Zhaopeng and Zhang, Yinda and Meng, Chenyu and Ma, Cuixia and Deng, Xiaoming and Wang, Hongan}, title = {Novel-View Synthesis and Pose Estimation for Hand-Object Interaction from Sparse Views}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15100-15111} }
EmoSet: A Large-scale Visual Emotion Dataset with Rich Attributes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Jingyuan and Huang, Qirui and Ding, Tingting and Lischinski, Dani and Cohen-Or, Danny and Huang, Hui}, title = {EmoSet: A Large-scale Visual Emotion Dataset with Rich Attributes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20383-20394} }
Distilling from Similar Tasks for Transfer Learning on a Budget-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Borup_2023_ICCV, author = {Borup, Kenneth and Phoo, Cheng Perng and Hariharan, Bharath}, title = {Distilling from Similar Tasks for Transfer Learning on a Budget}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11431-11441} }
Self-Supervised Burst Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Bhat_2023_ICCV, author = {Bhat, Goutam and Gharbi, Micha\"el and Chen, Jiawen and Van Gool, Luc and Xia, Zhihao}, title = {Self-Supervised Burst Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10605-10614} }
Class-relation Knowledge Distillation for Novel Class Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2023_ICCV, author = {Gu, Peiyan and Zhang, Chuyu and Xu, Ruijie and He, Xuming}, title = {Class-relation Knowledge Distillation for Novel Class Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16474-16483} }
PARTNER: Level up the Polar Representation for LiDAR 3D Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Nie_2023_ICCV, author = {Nie, Ming and Xue, Yujing and Wang, Chunwei and Ye, Chaoqiang and Xu, Hang and Zhu, Xinge and Huang, Qingqiu and Mi, Michael Bi and Wang, Xinchao and Zhang, Li}, title = {PARTNER: Level up the Polar Representation for LiDAR 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3801-3813} }
Data-Free Class-Incremental Hand Gesture Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Aich_2023_ICCV, author = {Aich, Shubhra and Ruiz-Santaquiteria, Jesus and Lu, Zhenyu and Garg, Prachi and Joseph, K J and Garcia, Alvaro Fernandez and Balasubramanian, Vineeth N and Kin, Kenrick and Wan, Chengde and Camgoz, Necati Cihan and Ma, Shugao and {De la Torre}, Fernando}, title = {Data-Free Class-Incremental Hand Gesture Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20958-20967} }
Corrupting Neuron Explanations of Deep Visual Features-
[pdf]
[supp]
[bibtex]@InProceedings{Srivastava_2023_ICCV, author = {Srivastava, Divyansh and Oikarinen, Tuomas and Weng, Tsui-Wei}, title = {Corrupting Neuron Explanations of Deep Visual Features}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1877-1886} }
PNI : Industrial Anomaly Detection using Position and Neighborhood Information-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bae_2023_ICCV, author = {Bae, Jaehyeok and Lee, Jae-Han and Kim, Seyun}, title = {PNI : Industrial Anomaly Detection using Position and Neighborhood Information}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6373-6383} }
PC-Adapter: Topology-Aware Adapter for Efficient Domain Adaption on Point Clouds with Rectified Pseudo-label-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Joonhyung and Seo, Hyunjin and Yang, Eunho}, title = {PC-Adapter: Topology-Aware Adapter for Efficient Domain Adaption on Point Clouds with Rectified Pseudo-label}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11530-11540} }
Cyclic Test-Time Adaptation on Monocular Video for 3D Human Mesh Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nam_2023_ICCV, author = {Nam, Hyeongjin and Jung, Daniel Sungho and Oh, Yeonguk and Lee, Kyoung Mu}, title = {Cyclic Test-Time Adaptation on Monocular Video for 3D Human Mesh Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14829-14839} }
2D3D-MATR: 2D-3D Matching Transformer for Detection-Free Registration Between Images and Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Minhao and Qin, Zheng and Gao, Zhirui and Yi, Renjiao and Zhu, Chenyang and Guo, Yulan and Xu, Kai}, title = {2D3D-MATR: 2D-3D Matching Transformer for Detection-Free Registration Between Images and Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14128-14138} }
Mixed Neural Voxels for Fast Multi-view Video Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Feng and Tan, Sinan and Li, Xinghang and Tian, Zeyue and Song, Yafei and Liu, Huaping}, title = {Mixed Neural Voxels for Fast Multi-view Video Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19706-19716} }
Bidirectionally Deformable Motion Modulation For Video-based Human Pose Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Wing-Yin and Po, Lai-Man and Cheung, Ray C. C. and Zhao, Yuzhi and Xue, Yu and Li, Kun}, title = {Bidirectionally Deformable Motion Modulation For Video-based Human Pose Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7502-7512} }
Harvard Glaucoma Detection and Progression: A Multimodal Multitask Dataset and Generalization-Reinforced Semi-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Yan and Shi, Min and Tian, Yu and Elze, Tobias and Wang, Mengyu}, title = {Harvard Glaucoma Detection and Progression: A Multimodal Multitask Dataset and Generalization-Reinforced Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20471-20482} }
Tracking Everything Everywhere All at Once-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Qianqian and Chang, Yen-Yu and Cai, Ruojin and Li, Zhengqi and Hariharan, Bharath and Holynski, Aleksander and Snavely, Noah}, title = {Tracking Everything Everywhere All at Once}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19795-19806} }
Group Pose: A Simple Baseline for End-to-End Multi-Person Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Huan and Chen, Qiang and Tan, Zichang and Liu, Jiang-Jiang and Wang, Jian and Su, Xiangbo and Li, Xiaolong and Yao, Kun and Han, Junyu and Ding, Errui and Zhao, Yao and Wang, Jingdong}, title = {Group Pose: A Simple Baseline for End-to-End Multi-Person Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15029-15038} }
Objects Do Not Disappear: Video Object Detection by Single-Frame Object Location Anticipation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xin and Nejadasl, Fatemeh Karimi and van Gemert, Jan C. and Booij, Olaf and Pintea, Silvia L.}, title = {Objects Do Not Disappear: Video Object Detection by Single-Frame Object Location Anticipation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6950-6961} }
CauSSL: Causality-inspired Semi-supervised Learning for Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Miao_2023_ICCV, author = {Miao, Juzheng and Chen, Cheng and Liu, Furui and Wei, Hao and Heng, Pheng-Ann}, title = {CauSSL: Causality-inspired Semi-supervised Learning for Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21426-21437} }
ChartReader: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Zhi-Qi and Dai, Qi and Hauptmann, Alexander G.}, title = {ChartReader: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22202-22213} }
Learning from Semantic Alignment between Unpaired Multiviews for Egocentric Video Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Qitong and Zhao, Long and Yuan, Liangzhe and Liu, Ting and Peng, Xi}, title = {Learning from Semantic Alignment between Unpaired Multiviews for Egocentric Video Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3307-3317} }
Neural LiDAR Fields for Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Shengyu and Gojcic, Zan and Wang, Zian and Williams, Francis and Kasten, Yoni and Fidler, Sanja and Schindler, Konrad and Litany, Or}, title = {Neural LiDAR Fields for Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18236-18246} }
Source-free Depth for Object Pop-out-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{WU_2023_ICCV, author = {Wu, Zongwei and Paudel, Danda Pani and Fan, Deng-Ping and Wang, Jingjing and Wang, Shuo and Demonceaux, C{\'e}dric and Timofte, Radu and Van Gool, Luc}, title = {Source-free Depth for Object Pop-out}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1032-1042} }
Token-Label Alignment for Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiao_2023_ICCV, author = {Xiao, Han and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen}, title = {Token-Label Alignment for Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5495-5504} }
Understanding 3D Object Interaction from a Single Image-
[pdf]
[arXiv]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Shengyi and Fouhey, David F.}, title = {Understanding 3D Object Interaction from a Single Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21753-21763} }
SkeleTR: Towards Skeleton-based Action Recognition in the Wild-
[pdf]
[bibtex]@InProceedings{Duan_2023_ICCV, author = {Duan, Haodong and Xu, Mingze and Shuai, Bing and Modolo, Davide and Tu, Zhuowen and Tighe, Joseph and Bergamo, Alessandro}, title = {SkeleTR: Towards Skeleton-based Action Recognition in the Wild}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13634-13644} }
Learning Gabor Texture Features for Fine-Grained Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Lanyun and Chen, Tianrun and Yin, Jianxiong and See, Simon and Liu, Jun}, title = {Learning Gabor Texture Features for Fine-Grained Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1621-1631} }
Weakly-Supervised Action Localization by Hierarchically-Structured Latent Attention Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Guiqin and Zhao, Peng and Zhao, Cong and Yang, Shusen and Cheng, Jie and Leng, Luziwei and Liao, Jianxing and Guo, Qinghai}, title = {Weakly-Supervised Action Localization by Hierarchically-Structured Latent Attention Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10203-10213} }
Get3DHuman: Lifting StyleGAN-Human into a 3D Generative Model Using Pixel-Aligned Reconstruction Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiong_2023_ICCV, author = {Xiong, Zhangyang and Kang, Di and Jin, Derong and Chen, Weikai and Bao, Linchao and Cui, Shuguang and Han, Xiaoguang}, title = {Get3DHuman: Lifting StyleGAN-Human into a 3D Generative Model Using Pixel-Aligned Reconstruction Priors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9287-9297} }
Query6DoF: Learning Sparse Queries as Implicit Shape Prior for Category-Level 6DoF Pose Estimation-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ruiqi and Wang, Xinggang and Li, Te and Yang, Rong and Wan, Minhong and Liu, Wenyu}, title = {Query6DoF: Learning Sparse Queries as Implicit Shape Prior for Category-Level 6DoF Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14055-14064} }
Towards High-Quality Specular Highlight Removal by Leveraging Large-Scale Synthetic Data-
[pdf]
[arXiv]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Gang and Zhang, Qing and Zhu, Lei and Xiao, Chunxia and Li, Ping}, title = {Towards High-Quality Specular Highlight Removal by Leveraging Large-Scale Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12857-12865} }
An Embarrassingly Simple Backdoor Attack on Self-supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Changjiang and Pang, Ren and Xi, Zhaohan and Du, Tianyu and Ji, Shouling and Yao, Yuan and Wang, Ting}, title = {An Embarrassingly Simple Backdoor Attack on Self-supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4367-4378} }
Cross-Modal Translation and Alignment for Survival Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Fengtao and Chen, Hao}, title = {Cross-Modal Translation and Alignment for Survival Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21485-21494} }
Chaotic World: A Large and Challenging Benchmark for Human Behavior Understanding in Chaotic Events-
[pdf]
[supp]
[bibtex]@InProceedings{Ong_2023_ICCV, author = {Ong, Kian Eng and Ng, Xun Long and Li, Yanchao and Ai, Wenjie and Zhao, Kuangyi and Yeo, Si Yong and Liu, Jun}, title = {Chaotic World: A Large and Challenging Benchmark for Human Behavior Understanding in Chaotic Events}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20213-20223} }
Unsupervised 3D Perception with 2D Vision-Language Distillation for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Najibi_2023_ICCV, author = {Najibi, Mahyar and Ji, Jingwei and Zhou, Yin and Qi, Charles R. and Yan, Xinchen and Ettinger, Scott and Anguelov, Dragomir}, title = {Unsupervised 3D Perception with 2D Vision-Language Distillation for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8602-8612} }
Towards Grand Unified Representation Learning for Unsupervised Visible-Infrared Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Bin and Chen, Jun and Ye, Mang}, title = {Towards Grand Unified Representation Learning for Unsupervised Visible-Infrared Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11069-11079} }
Active Stereo Without Pattern Projector-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bartolomei_2023_ICCV, author = {Bartolomei, Luca and Poggi, Matteo and Tosi, Fabio and Conti, Andrea and Mattoccia, Stefano}, title = {Active Stereo Without Pattern Projector}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18470-18482} }
Partition Speeds Up Learning Implicit Neural Representations Based on Exponential-Increase Hypothesis-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Ke and Liu, Feng and Wang, Haishuai and Ma, Ning and Bu, Jiajun and Han, Bo}, title = {Partition Speeds Up Learning Implicit Neural Representations Based on Exponential-Increase Hypothesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5474-5483} }
Uncertainty Guided Adaptive Warping for Robust and Efficient Stereo Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jing_2023_ICCV, author = {Jing, Junpeng and Li, Jiankun and Xiong, Pengfei and Liu, Jiangyu and Liu, Shuaicheng and Guo, Yichen and Deng, Xin and Xu, Mai and Jiang, Lai and Sigal, Leonid}, title = {Uncertainty Guided Adaptive Warping for Robust and Efficient Stereo Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3318-3327} }
ReFit: Recurrent Fitting Network for 3D Human Recovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yufu and Daniilidis, Kostas}, title = {ReFit: Recurrent Fitting Network for 3D Human Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14644-14654} }
Towards Instance-adaptive Inference for Federated Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Chun-Mei and Yu, Kai and Liu, Nian and Xu, Xinxing and Khan, Salman and Zuo, Wangmeng}, title = {Towards Instance-adaptive Inference for Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23287-23296} }
CGBA: Curvature-aware Geometric Black-box Attack-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Reza_2023_ICCV, author = {Reza, Md Farhamdur and Rahmati, Ali and Wu, Tianfu and Dai, Huaiyu}, title = {CGBA: Curvature-aware Geometric Black-box Attack}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {124-133} }
Unsupervised Facial Performance Editing via Vector-Quantized StyleGAN Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Kicanaoglu_2023_ICCV, author = {Kicanaoglu, Berkay and Garrido, Pablo and Bharaj, Gaurav}, title = {Unsupervised Facial Performance Editing via Vector-Quantized StyleGAN Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2371-2382} }
Online Clustered Codebook-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Chuanxia and Vedaldi, Andrea}, title = {Online Clustered Codebook}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22798-22807} }
A Multidimensional Analysis of Social Biases in Vision Transformers-
[pdf]
[arXiv]
[bibtex]@InProceedings{Brinkmann_2023_ICCV, author = {Brinkmann, Jannik and Swoboda, Paul and Bartelt, Christian}, title = {A Multidimensional Analysis of Social Biases in Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4914-4923} }
PGFed: Personalize Each Client's Global Objective for Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Jun and Mendieta, Matias and Chen, Chen and Wu, Shandong}, title = {PGFed: Personalize Each Client's Global Objective for Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3946-3956} }
Verbs in Action: Improving Verb Understanding in Video-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Momeni_2023_ICCV, author = {Momeni, Liliane and Caron, Mathilde and Nagrani, Arsha and Zisserman, Andrew and Schmid, Cordelia}, title = {Verbs in Action: Improving Verb Understanding in Video-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15579-15591} }
Zero-Shot Point Cloud Segmentation by Semantic-Visual Aware Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yuwei and Hayat, Munawar and Jin, Zhao and Zhu, Hongyuan and Lei, Yinjie}, title = {Zero-Shot Point Cloud Segmentation by Semantic-Visual Aware Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11586-11596} }
Exploring Predicate Visual Context in Detecting of Human-Object Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Frederic Z and Yuan, Yuhui and Campbell, Dylan and Zhong, Zhuoyao and Gould, Stephen}, title = {Exploring Predicate Visual Context in Detecting of Human-Object Interactions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10411-10421} }
Robo3D: Towards Robust and Reliable 3D Perception against Corruptions-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kong_2023_ICCV, author = {Kong, Lingdong and Liu, Youquan and Li, Xin and Chen, Runnan and Zhang, Wenwei and Ren, Jiawei and Pan, Liang and Chen, Kai and Liu, Ziwei}, title = {Robo3D: Towards Robust and Reliable 3D Perception against Corruptions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19994-20006} }
Towards Saner Deep Image Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Duan_2023_ICCV, author = {Duan, Bin and Zhong, Ming and Yan, Yan}, title = {Towards Saner Deep Image Registration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12459-12468} }
Instance and Category Supervision are Alternate Learners for Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Xudong and Zhang, Zhizhong and Tan, Xin and Liu, Jun and Wang, Chengjie and Qu, Yanyun and Jiang, Guannan and Xie, Yuan}, title = {Instance and Category Supervision are Alternate Learners for Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5596-5605} }
Diverse Data Augmentation with Diffusions for Effective Test-time Prompt Tuning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Chun-Mei and Yu, Kai and Liu, Yong and Khan, Salman and Zuo, Wangmeng}, title = {Diverse Data Augmentation with Diffusions for Effective Test-time Prompt Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2704-2714} }
Interaction-aware Joint Attention Estimation Using People Attributes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakatani_2023_ICCV, author = {Nakatani, Chihiro and Kawashima, Hiroaki and Ukita, Norimichi}, title = {Interaction-aware Joint Attention Estimation Using People Attributes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10224-10233} }
GePSAn: Generative Procedure Step Anticipation in Cooking Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Abdelsalam_2023_ICCV, author = {Abdelsalam, Mohamed A. and Rangrej, Samrudhdhi B. and Hadji, Isma and Dvornik, Nikita and Derpanis, Konstantinos G. and Fazly, Afsaneh}, title = {GePSAn: Generative Procedure Step Anticipation in Cooking Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2988-2997} }
Gradient-based Sampling for Class Imbalanced Semi-supervised Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiaming and Lin, Xiangru and Zhang, Wei and Tan, Xiao and Li, Yingying and Han, Junyu and Ding, Errui and Wang, Jingdong and Li, Guanbin}, title = {Gradient-based Sampling for Class Imbalanced Semi-supervised Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16390-16400} }
SLCA: Slow Learner with Classifier Alignment for Continual Learning on a Pre-trained Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Gengwei and Wang, Liyuan and Kang, Guoliang and Chen, Ling and Wei, Yunchao}, title = {SLCA: Slow Learner with Classifier Alignment for Continual Learning on a Pre-trained Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19148-19158} }
Implicit Temporal Modeling with Learnable Alignment for Video Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tu_2023_ICCV, author = {Tu, Shuyuan and Dai, Qi and Wu, Zuxuan and Cheng, Zhi-Qi and Hu, Han and Jiang, Yu-Gang}, title = {Implicit Temporal Modeling with Learnable Alignment for Video Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19936-19947} }
Non-Coaxial Event-Guided Motion Deblurring with Spatial Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Hoonhee and Jeong, Yuhwan and Kim, Taewoo and Yoon, Kuk-Jin}, title = {Non-Coaxial Event-Guided Motion Deblurring with Spatial Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12492-12503} }
Fingerprinting Deep Image Restoration Models-
[pdf]
[supp]
[bibtex]@InProceedings{Quan_2023_ICCV, author = {Quan, Yuhui and Teng, Huan and Xu, Ruotao and Huang, Jun and Ji, Hui}, title = {Fingerprinting Deep Image Restoration Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13285-13295} }
AutoDiffusion: Training-Free Optimization of Time Steps and Architectures for Automated Diffusion Model Acceleration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Lijiang and Li, Huixia and Zheng, Xiawu and Wu, Jie and Xiao, Xuefeng and Wang, Rui and Zheng, Min and Pan, Xin and Chao, Fei and Ji, Rongrong}, title = {AutoDiffusion: Training-Free Optimization of Time Steps and Architectures for Automated Diffusion Model Acceleration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7105-7114} }
SportsMOT: A Large Multi-Object Tracking Dataset in Multiple Sports Scenes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cui_2023_ICCV, author = {Cui, Yutao and Zeng, Chenkai and Zhao, Xiaoyu and Yang, Yichun and Wu, Gangshan and Wang, Limin}, title = {SportsMOT: A Large Multi-Object Tracking Dataset in Multiple Sports Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9921-9931} }
Localizing Moments in Long Video Via Multimodal Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Barrios_2023_ICCV, author = {Barrios, Wayner and Soldan, Mattia and Ceballos-Arroyo, Alberto Mario and Heilbron, Fabian Caba and Ghanem, Bernard}, title = {Localizing Moments in Long Video Via Multimodal Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13667-13678} }
Pixel-Aligned Recurrent Queries for Multi-View 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Yiming and Jiang, Huaizu and Gkioxari, Georgia and Straub, Julian}, title = {Pixel-Aligned Recurrent Queries for Multi-View 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18370-18380} }
Towards Universal Image Embeddings: A Large-Scale Dataset and Challenge for Generic Image Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ypsilantis_2023_ICCV, author = {Ypsilantis, Nikolaos-Antonios and Chen, Kaifeng and Cao, Bingyi and Lipovsk{\'y}, M{\'a}rio and Dogan-Sch{\"o}nberger, Pelin and Makosa, Grzegorz and Bluntschli, Boris and Seyedhosseini, Mojtaba and Chum, Ond{\v{r}}ej and Araujo, Andr{\'e}}, title = {Towards Universal Image Embeddings: A Large-Scale Dataset and Challenge for Generic Image Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11290-11301} }
SemARFlow: Injecting Semantics into Unsupervised Optical Flow Estimation for Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV, author = {Yuan, Shuai and Yu, Shuzhi and Kim, Hannah and Tomasi, Carlo}, title = {SemARFlow: Injecting Semantics into Unsupervised Optical Flow Estimation for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9566-9577} }
TiDAL: Learning Training Dynamics for Active Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kye_2023_ICCV, author = {Kye, Seong Min and Choi, Kwanghee and Byun, Hyeongmin and Chang, Buru}, title = {TiDAL: Learning Training Dynamics for Active Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22335-22345} }
Uncertainty-aware Unsupervised Multi-Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Kai and Jin, Sheng and Fu, Zhihang and Chen, Ze and Jiang, Rongxin and Ye, Jieping}, title = {Uncertainty-aware Unsupervised Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9996-10005} }
DPS-Net: Deep Polarimetric Stereo Depth Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Chaoran and Pan, Weihong and Wang, Zimo and Mao, Mao and Zhang, Guofeng and Bao, Hujun and Tan, Ping and Cui, Zhaopeng}, title = {DPS-Net: Deep Polarimetric Stereo Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3569-3579} }
Designing Phase Masks for Under-Display Cameras-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Anqi and Kang, Eunhee and Lee, Hyong-Euk and Sankaranarayanan, Aswin C.}, title = {Designing Phase Masks for Under-Display Cameras}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10637-10645} }
Can Language Models Learn to Listen?-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ng_2023_ICCV, author = {Ng, Evonne and Subramanian, Sanjay and Klein, Dan and Kanazawa, Angjoo and Darrell, Trevor and Ginosar, Shiry}, title = {Can Language Models Learn to Listen?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10083-10093} }
SpaceEvo: Hardware-Friendly Search Space Design for Efficient INT8 Inference-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xudong and Zhang, Li Lyna and Xu, Jiahang and Zhang, Quanlu and Wang, Yujing and Yang, Yuqing and Zheng, Ningxin and Cao, Ting and Yang, Mao}, title = {SpaceEvo: Hardware-Friendly Search Space Design for Efficient INT8 Inference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5819-5828} }
How Far Pre-trained Models Are from Neural Collapse on the Target Dataset Informs their Transferability-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zijian and Luo, Yadan and Zheng, Liang and Huang, Zi and Baktashmotlagh, Mahsa}, title = {How Far Pre-trained Models Are from Neural Collapse on the Target Dataset Informs their Transferability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5549-5558} }
SurfsUP: Learning Fluid Simulation for Novel Surfaces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mani_2023_ICCV, author = {Mani, Arjun and Chandratreya, Ishaan Preetam and Creager, Elliot and Vondrick, Carl and Zemel, Richard}, title = {SurfsUP: Learning Fluid Simulation for Novel Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14225-14235} }
Convolutional Networks with Oriented 1D Kernels-
[pdf]
[supp]
[bibtex]@InProceedings{Kirchmeyer_2023_ICCV, author = {Kirchmeyer, Alexandre and Deng, Jia}, title = {Convolutional Networks with Oriented 1D Kernels}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6222-6232} }
Regularized Mask Tuning: Uncovering Hidden Knowledge in Pre-Trained Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Kecheng and Wu, Wei and Feng, Ruili and Zhu, Kai and Liu, Jiawei and Zhao, Deli and Zha, Zheng-Jun and Chen, Wei and Shen, Yujun}, title = {Regularized Mask Tuning: Uncovering Hidden Knowledge in Pre-Trained Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11663-11673} }
Skill Transformer: A Monolithic Policy for Mobile Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Xiaoyu and Batra, Dhruv and Rai, Akshara and Szot, Andrew}, title = {Skill Transformer: A Monolithic Policy for Mobile Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10852-10862} }
Adaptive and Background-Aware Vision Transformer for Real-Time UAV Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Shuiwang and Yang, Yangxiang and Zeng, Dan and Wang, Xucheng}, title = {Adaptive and Background-Aware Vision Transformer for Real-Time UAV Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13989-14000} }
Improving Pixel-based MIM by Reducing Wasted Modeling Capability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yuan and Zhang, Songyang and Chen, Jiacheng and Yu, Zhaohui and Chen, Kai and Lin, Dahua}, title = {Improving Pixel-based MIM by Reducing Wasted Modeling Capability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5361-5372} }
Towards Memory- and Time-Efficient Backpropagation for Training Spiking Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Meng_2023_ICCV, author = {Meng, Qingyan and Xiao, Mingqing and Yan, Shen and Wang, Yisen and Lin, Zhouchen and Luo, Zhi-Quan}, title = {Towards Memory- and Time-Efficient Backpropagation for Training Spiking Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6166-6176} }
Persistent-Transient Duality: A Multi-Mechanism Approach for Modeling Human-Object Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tran_2023_ICCV, author = {Tran, Hung and Le, Vuong and Venkatesh, Svetha and Tran, Truyen}, title = {Persistent-Transient Duality: A Multi-Mechanism Approach for Modeling Human-Object Interaction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9858-9867} }
When to Learn What: Model-Adaptive Data Augmentation Curriculum-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hou_2023_ICCV, author = {Hou, Chengkai and Zhang, Jieyu and Zhou, Tianyi}, title = {When to Learn What: Model-Adaptive Data Augmentation Curriculum}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1717-1728} }
DiffPose: Multi-hypothesis Human Pose Estimation using Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Holmquist_2023_ICCV, author = {Holmquist, Karl and Wandt, Bastian}, title = {DiffPose: Multi-hypothesis Human Pose Estimation using Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15977-15987} }
AesPA-Net: Aesthetic Pattern-Aware Style Transfer Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Kibeom and Jeon, Seogkyu and Lee, Junsoo and Ahn, Namhyuk and Kim, Kunhee and Lee, Pilhyeon and Kim, Daesik and Uh, Youngjung and Byun, Hyeran}, title = {AesPA-Net: Aesthetic Pattern-Aware Style Transfer Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22758-22767} }
COPILOT: Human-Environment Collision Prediction and Localization from Egocentric Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV, author = {Pan, Boxiao and Shen, Bokui and Rempe, Davis and Paschalidou, Despoina and Mo, Kaichun and Yang, Yanchao and Guibas, Leonidas J.}, title = {COPILOT: Human-Environment Collision Prediction and Localization from Egocentric Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5262-5272} }
EGformer: Equirectangular Geometry-biased Transformer for 360 Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yun_2023_ICCV, author = {Yun, Ilwi and Shin, Chanyong and Lee, Hyunku and Lee, Hyuk-Jae and Rhee, Chae Eun}, title = {EGformer: Equirectangular Geometry-biased Transformer for 360 Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6101-6112} }
Size Does Matter: Size-aware Virtual Try-on via Clothing-oriented Transformation Try-on Network-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Chieh-Yun and Chen, Yi-Chung and Shuai, Hong-Han and Cheng, Wen-Huang}, title = {Size Does Matter: Size-aware Virtual Try-on via Clothing-oriented Transformation Try-on Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7513-7522} }
Generating Realistic Images from In-the-wild Sounds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Taegyeong and Kang, Jeonghun and Kim, Hyeonyu and Kim, Taehwan}, title = {Generating Realistic Images from In-the-wild Sounds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7160-7170} }
DDS2M: Self-Supervised Denoising Diffusion Spatio-Spectral Model for Hyperspectral Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Miao_2023_ICCV, author = {Miao, Yuchun and Zhang, Lefei and Zhang, Liangpei and Tao, Dacheng}, title = {DDS2M: Self-Supervised Denoising Diffusion Spatio-Spectral Model for Hyperspectral Image Restoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12086-12096} }
Candidate-aware Selective Disambiguation Based On Normalized Entropy for Instance-dependent Partial-label Learning-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Shuo and Yang, Guowu and Feng, Lei}, title = {Candidate-aware Selective Disambiguation Based On Normalized Entropy for Instance-dependent Partial-label Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1792-1801} }
Open-vocabulary Video Question Answering: A New Benchmark for Evaluating the Generalizability of Video Question Answering Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ko_2023_ICCV, author = {Ko, Dohwan and Lee, Ji Soo and Choi, Miso and Chu, Jaewon and Park, Jihwan and Kim, Hyunwoo J.}, title = {Open-vocabulary Video Question Answering: A New Benchmark for Evaluating the Generalizability of Video Question Answering Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3101-3112} }
Using a Waffle Iron for Automotive Point Cloud Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Puy_2023_ICCV, author = {Puy, Gilles and Boulch, Alexandre and Marlet, Renaud}, title = {Using a Waffle Iron for Automotive Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3379-3389} }
AutoReP: Automatic ReLU Replacement for Fast Private Network Inference-
[pdf]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Hongwu and Huang, Shaoyi and Zhou, Tong and Luo, Yukui and Wang, Chenghong and Wang, Zigeng and Zhao, Jiahui and Xie, Xi and Li, Ang and Geng, Tony and Mahmood, Kaleel and Wen, Wujie and Xu, Xiaolin and Ding, Caiwen}, title = {AutoReP: Automatic ReLU Replacement for Fast Private Network Inference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5178-5188} }
MotionLM: Multi-Agent Motion Forecasting as Language Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Seff_2023_ICCV, author = {Seff, Ari and Cera, Brian and Chen, Dian and Ng, Mason and Zhou, Aurick and Nayakanti, Nigamaa and Refaat, Khaled S. and Al-Rfou, Rami and Sapp, Benjamin}, title = {MotionLM: Multi-Agent Motion Forecasting as Language Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8579-8590} }
Black Box Few-Shot Adaptation for Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Ouali_2023_ICCV, author = {Ouali, Yassine and Bulat, Adrian and Martinez, Brais and Tzimiropoulos, Georgios}, title = {Black Box Few-Shot Adaptation for Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15534-15546} }
Center-Based Decoupled Point-cloud Registration for 6D Object Pose Estimation-
[pdf]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Haobo and Dang, Zheng and Gu, Shuo and Xie, Jin and Salzmann, Mathieu and Yang, Jian}, title = {Center-Based Decoupled Point-cloud Registration for 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3427-3437} }
Self-Ordering Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Pengwan and Snoek, Cees G. M. and Asano, Yuki M.}, title = {Self-Ordering Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15813-15822} }
Continual Segment: Towards a Single, Unified and Non-forgetting Continual Segmentation Model of 143 Whole-body Organs in CT Scans-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Zhanghexuan and Guo, Dazhou and Wang, Puyang and Yan, Ke and Lu, Le and Xu, Minfeng and Wang, Qifeng and Ge, Jia and Gao, Mingchen and Ye, Xianghua and Jin, Dakai}, title = {Continual Segment: Towards a Single, Unified and Non-forgetting Continual Segmentation Model of 143 Whole-body Organs in CT Scans}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21140-21151} }
Enhancing Modality-Agnostic Representations via Meta-Learning for Brain Tumor Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Konwer_2023_ICCV, author = {Konwer, Aishik and Hu, Xiaoling and Bae, Joseph and Xu, Xuan and Chen, Chao and Prasanna, Prateek}, title = {Enhancing Modality-Agnostic Representations via Meta-Learning for Brain Tumor Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21415-21425} }
Zero-1-to-3: Zero-shot One Image to 3D Object-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Ruoshi and Wu, Rundi and Van Hoorick, Basile and Tokmakov, Pavel and Zakharov, Sergey and Vondrick, Carl}, title = {Zero-1-to-3: Zero-shot One Image to 3D Object}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9298-9309} }
3D Distillation: Improving Self-Supervised Monocular Depth Estimation on Reflective Surfaces-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Xuepeng and Dikov, Georgi and Reitmayr, Gerhard and Kim, Tae-Kyun and Ghafoorian, Mohsen}, title = {3D Distillation: Improving Self-Supervised Monocular Depth Estimation on Reflective Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9133-9143} }
GAIT: Generating Aesthetic Indoor Tours with Deep Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Desai and Hu, Ping and Sun, Xin and Pirk, Soren and Zhang, Jianming and Mech, Radomir and Kaufman, Arie E.}, title = {GAIT: Generating Aesthetic Indoor Tours with Deep Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7409-7419} }
Low-Light Image Enhancement with Multi-Stage Residue Quantization and Brightness-Aware Attention-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yunlong and Huang, Tao and Dong, Weisheng and Wu, Fangfang and Li, Xin and Shi, Guangming}, title = {Low-Light Image Enhancement with Multi-Stage Residue Quantization and Brightness-Aware Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12140-12149} }
Hierarchically Decomposed Graph Convolutional Networks for Skeleton-Based Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jungho and Lee, Minhyeok and Lee, Dogyoon and Lee, Sangyoun}, title = {Hierarchically Decomposed Graph Convolutional Networks for Skeleton-Based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10444-10453} }
LIST: Learning Implicitly from Spatial Transformers for Single-View 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Arshad_2023_ICCV, author = {Arshad, Mohammad Samiul and Beksi, William J.}, title = {LIST: Learning Implicitly from Spatial Transformers for Single-View 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9321-9330} }
Rethinking Mobile Block for Efficient Attention-based Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jiangning and Li, Xiangtai and Li, Jian and Liu, Liang and Xue, Zhucun and Zhang, Boshen and Jiang, Zhengkai and Huang, Tianxin and Wang, Yabiao and Wang, Chengjie}, title = {Rethinking Mobile Block for Efficient Attention-based Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1389-1400} }
REAP: A Large-Scale Realistic Adversarial Patch Benchmark-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hingun_2023_ICCV, author = {Hingun, Nabeel and Sitawarin, Chawin and Li, Jerry and Wagner, David}, title = {REAP: A Large-Scale Realistic Adversarial Patch Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4640-4651} }
LRRU: Long-short Range Recurrent Updating Networks for Depth Completion-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yufei and Li, Bo and Zhang, Ge and Liu, Qi and Gao, Tao and Dai, Yuchao}, title = {LRRU: Long-short Range Recurrent Updating Networks for Depth Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9422-9432} }
MetaBEV: Solving Sensor Failures for 3D Detection and Map Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Chongjian and Chen, Junsong and Xie, Enze and Wang, Zhongdao and Hong, Lanqing and Lu, Huchuan and Li, Zhenguo and Luo, Ping}, title = {MetaBEV: Solving Sensor Failures for 3D Detection and Map Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8721-8731} }
DNA-Rendering: A Diverse Neural Actor Repository for High-Fidelity Human-Centric Rendering-
[pdf]
[supp]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Wei and Chen, Ruixiang and Fan, Siming and Yin, Wanqi and Chen, Keyu and Cai, Zhongang and Wang, Jingbo and Gao, Yang and Yu, Zhengming and Lin, Zhengyu and Ren, Daxuan and Yang, Lei and Liu, Ziwei and Loy, Chen Change and Qian, Chen and Wu, Wayne and Lin, Dahua and Dai, Bo and Lin, Kwan-Yee}, title = {DNA-Rendering: A Diverse Neural Actor Repository for High-Fidelity Human-Centric Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19982-19993} }
Exploring Temporal Concurrency for Video-Language Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Heng and Liu, Daqing and Lv, Zezhong and Su, Bing and Tao, Dacheng}, title = {Exploring Temporal Concurrency for Video-Language Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15568-15578} }
StegaNeRF: Embedding Invisible Information within Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Chenxin and Feng, Brandon Y. and Fan, Zhiwen and Pan, Panwang and Wang, Zhangyang}, title = {StegaNeRF: Embedding Invisible Information within Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {441-453} }
DynamicISP: Dynamically Controlled Image Signal Processor for Image Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yoshimura_2023_ICCV, author = {Yoshimura, Masakazu and Otsuka, Junji and Irie, Atsushi and Ohashi, Takeshi}, title = {DynamicISP: Dynamically Controlled Image Signal Processor for Image Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12866-12876} }
R-Pred: Two-Stage Motion Prediction Via Tube-Query Attention-Based Trajectory Refinement-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_ICCV, author = {Choi, Sehwan and Kim, Jungho and Yun, Junyong and Choi, Jun Won}, title = {R-Pred: Two-Stage Motion Prediction Via Tube-Query Attention-Based Trajectory Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8525-8535} }
A step towards understanding why classification helps regression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pintea_2023_ICCV, author = {Pintea, Silvia L. and Lin, Yancong and Dijkstra, Jouke and van Gemert, Jan C.}, title = {A step towards understanding why classification helps regression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19972-19981} }
Robust Evaluation of Diffusion-Based Adversarial Purification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Minjong and Kim, Dongwoo}, title = {Robust Evaluation of Diffusion-Based Adversarial Purification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {134-144} }
Hyperbolic Audio-visual Zero-shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Jie and Hayder, Zeeshan and Han, Junlin and Fang, Pengfei and Harandi, Mehrtash and Petersson, Lars}, title = {Hyperbolic Audio-visual Zero-shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7873-7883} }
CTP: Towards Vision-Language Continual Pretraining via Compatible Momentum Contrast and Topology Preservation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Hongguang and Wei, Yunchao and Liang, Xiaodan and Zhang, Chunjie and Zhao, Yao}, title = {CTP: Towards Vision-Language Continual Pretraining via Compatible Momentum Contrast and Topology Preservation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22257-22267} }
Aggregating Feature Point Cloud for Depth Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Zhu and Sheng, Zehua and Zhou, Zili and Luo, Lun and Cao, Si-Yuan and Gu, Hong and Zhang, Huaqi and Shen, Hui-Liang}, title = {Aggregating Feature Point Cloud for Depth Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8732-8743} }
FLIP: Cross-domain Face Anti-spoofing with Language Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Srivatsan_2023_ICCV, author = {Srivatsan, Koushik and Naseer, Muzammal and Nandakumar, Karthik}, title = {FLIP: Cross-domain Face Anti-spoofing with Language Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19685-19696} }
Distribution Shift Matters for Knowledge Distillation with Webly Collected Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Jialiang and Chen, Shuo and Niu, Gang and Sugiyama, Masashi and Gong, Chen}, title = {Distribution Shift Matters for Knowledge Distillation with Webly Collected Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17470-17480} }
Reconstructed Convolution Module Based Look-Up Tables for Efficient Image Super-Resolution-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Guandu and Ding, Yukang and Li, Mading and Sun, Ming and Wen, Xing and Wang, Bin}, title = {Reconstructed Convolution Module Based Look-Up Tables for Efficient Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12217-12226} }
Action Sensitivity Learning for Temporal Action Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Jiayi and Wang, Xiaohan and Quan, Ruijie and Zheng, Junjun and Yang, Jiang and Yang, Yi}, title = {Action Sensitivity Learning for Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13457-13469} }
Gram-based Attentive Neural Ordinary Differential Equations Network for Video Nystagmography Classification-
[pdf]
[bibtex]@InProceedings{Qiu_2023_ICCV, author = {Qiu, Xihe and Shi, Shaojie and Tan, Xiaoyu and Qu, Chao and Fang, Zhijun and Wang, Hailing and Gao, Yongbin and Wu, Peixia and Li, Huawei}, title = {Gram-based Attentive Neural Ordinary Differential Equations Network for Video Nystagmography Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21339-21348} }
PEANUT: Predicting and Navigating to Unseen Targets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Albert J. and Wang, Shenlong}, title = {PEANUT: Predicting and Navigating to Unseen Targets}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10926-10935} }
Pluralistic Aging Diffusion Autoencoder-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Peipei and Wang, Rui and Huang, Huaibo and He, Ran and He, Zhaofeng}, title = {Pluralistic Aging Diffusion Autoencoder}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22613-22623} }
ModelGiF: Gradient Fields for Model Functional Distance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Jie and Xu, Zhengqi and Wu, Sai and Chen, Gang and Song, Mingli}, title = {ModelGiF: Gradient Fields for Model Functional Distance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6125-6135} }
PoseDiffusion: Solving Pose Estimation via Diffusion-aided Bundle Adjustment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jianyuan and Rupprecht, Christian and Novotny, David}, title = {PoseDiffusion: Solving Pose Estimation via Diffusion-aided Bundle Adjustment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9773-9783} }
TIFA: Accurate and Interpretable Text-to-Image Faithfulness Evaluation with Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Yushi and Liu, Benlin and Kasai, Jungo and Wang, Yizhong and Ostendorf, Mari and Krishna, Ranjay and Smith, Noah A.}, title = {TIFA: Accurate and Interpretable Text-to-Image Faithfulness Evaluation with Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20406-20417} }
SIGMA: Scale-Invariant Global Sparse Shape Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Maolin and Roetzer, Paul and Eisenberger, Marvin and L\"ahner, Zorah and Moeller, Michael and Cremers, Daniel and Bernard, Florian}, title = {SIGMA: Scale-Invariant Global Sparse Shape Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {645-654} }
CORE: Cooperative Reconstruction for Multi-Agent Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Binglu and Zhang, Lei and Wang, Zhaozhong and Zhao, Yongqiang and Zhou, Tianfei}, title = {CORE: Cooperative Reconstruction for Multi-Agent Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8710-8720} }
VidStyleODE: Disentangled Video Editing via StyleGAN and NeuralODEs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ali_2023_ICCV, author = {Ali, Moayed Haji and Bond, Andrew and Birdal, Tolga and Ceylan, Duygu and Karacan, Levent and Erdem, Erkut and Erdem, Aykut}, title = {VidStyleODE: Disentangled Video Editing via StyleGAN and NeuralODEs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7523-7534} }
SEFD: Learning to Distill Complex Pose and Occlusion-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, ChangHee and Kong, Kyeongbo and Min, SungJun and Wee, Dongyoon and Jang, Ho-Deok and Cha, Geonho and Kang, SukJu}, title = {SEFD: Learning to Distill Complex Pose and Occlusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14941-14952} }
CiT: Curation in Training for Effective Vision-Language Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Hu and Xie, Saining and Huang, Po-Yao and Yu, Licheng and Howes, Russell and Ghosh, Gargi and Zettlemoyer, Luke and Feichtenhofer, Christoph}, title = {CiT: Curation in Training for Effective Vision-Language Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15180-15189} }
SparseNeRF: Distilling Depth Ranking for Few-shot Novel View Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Guangcong and Chen, Zhaoxi and Loy, Chen Change and Liu, Ziwei}, title = {SparseNeRF: Distilling Depth Ranking for Few-shot Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9065-9076} }
Towards Models that Can See and Read-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ganz_2023_ICCV, author = {Ganz, Roy and Nuriel, Oren and Aberdam, Aviad and Kittenplon, Yair and Mazor, Shai and Litman, Ron}, title = {Towards Models that Can See and Read}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21718-21728} }
ProPainter: Improving Propagation and Transformer for Video Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Shangchen and Li, Chongyi and Chan, Kelvin C. K. and Loy, Chen Change}, title = {ProPainter: Improving Propagation and Transformer for Video Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10477-10486} }
Query Refinement Transformer for 3D Instance Segmentation-
[pdf]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Jiahao and Deng, Jiacheng and Wang, Chuxin and He, Jianfeng and Zhang, Tianzhu}, title = {Query Refinement Transformer for 3D Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18516-18526} }
Root Pose Decomposition Towards Generic Non-rigid 3D Reconstruction with Monocular Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yikai and Dong, Yinpeng and Sun, Fuchun and Yang, Xiao}, title = {Root Pose Decomposition Towards Generic Non-rigid 3D Reconstruction with Monocular Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13890-13900} }
3DHumanGAN: 3D-Aware Human Image Generation with 3D Pose Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Zhuoqian and Li, Shikai and Wu, Wayne and Dai, Bo}, title = {3DHumanGAN: 3D-Aware Human Image Generation with 3D Pose Mapping}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23008-23019} }
LeaF: Learning Frames for 4D Point Cloud Sequence Understanding-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yunze and Chen, Junyu and Zhang, Zekai and Huang, Jingwei and Yi, Li}, title = {LeaF: Learning Frames for 4D Point Cloud Sequence Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {604-613} }
GLA-GCN: Global-local Adaptive Graph Convolutional Network for 3D Human Pose Estimation from Monocular Video-
[pdf]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Bruce X. B. and Zhang, Zhi and Liu, Yongxu and Zhong, Sheng-hua and Liu, Yan and Chen, Chang Wen}, title = {GLA-GCN: Global-local Adaptive Graph Convolutional Network for 3D Human Pose Estimation from Monocular Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8818-8829} }
Snow Removal in Video: A New Dataset and A Novel Method-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Haoyu and Ren, Jingjing and Gu, Jinjin and Wu, Hongtao and Lu, Xuequan and Cai, Haoming and Zhu, Lei},
  title     = {Snow Removal in Video: A New Dataset and A Novel Method},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13211--13222},
}
Degradation-Resistant Unfolding Network for Heterogeneous Image Fusion-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_ICCV,
  author    = {He, Chunming and Li, Kai and Xu, Guoxia and Zhang, Yulun and Hu, Runze and Guo, Zhenhua and Li, Xiu},
  title     = {Degradation-Resistant Unfolding Network for Heterogeneous Image Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12611--12621},
}
Priority-Centric Human Motion Generation in Discrete Latent Space-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kong_2023_ICCV,
  author    = {Kong, Hanyang and Gong, Kehong and Lian, Dongze and Mi, Michael Bi and Wang, Xinchao},
  title     = {Priority-Centric Human Motion Generation in Discrete Latent Space},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14806--14816},
}
Domain-Specificity Inducing Transformers for Source-Free Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sanyal_2023_ICCV,
  author    = {Sanyal, Sunandini and Asokan, Ashish Ramayee and Bhambri, Suvaansh and Kulkarni, Akshay and Kundu, Jogendra Nath and Babu, R Venkatesh},
  title     = {Domain-Specificity Inducing Transformers for Source-Free Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18928--18937},
}
Towards Improved Input Masking for Convolutional Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Balasubramanian_2023_ICCV,
  author    = {Balasubramanian, Sriram and Feizi, Soheil},
  title     = {Towards Improved Input Masking for Convolutional Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1855--1865},
}
3DHacker: Spectrum-based Decision Boundary Generation for Hard-label 3D Point Cloud Attack-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tao_2023_ICCV,
  author    = {Tao, Yunbo and Liu, Daizong and Zhou, Pan and Xie, Yulai and Du, Wei and Hu, Wei},
  title     = {{3DHacker}: Spectrum-based Decision Boundary Generation for Hard-label {3D} Point Cloud Attack},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14340--14350},
}
Exploring Lightweight Hierarchical Vision Transformers for Efficient Visual Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kang_2023_ICCV,
  author    = {Kang, Ben and Chen, Xin and Wang, Dong and Peng, Houwen and Lu, Huchuan},
  title     = {Exploring Lightweight Hierarchical Vision Transformers for Efficient Visual Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9612--9621},
}
MiniROAD: Minimal RNN Framework for Online Action Detection-
[pdf]
[supp]
[bibtex]@InProceedings{An_2023_ICCV,
  author    = {An, Joungbin and Kang, Hyolim and Han, Su Ho and Yang, Ming-Hsuan and Kim, Seon Joo},
  title     = {{MiniROAD}: Minimal {RNN} Framework for Online Action Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10341--10350},
}
Efficient Emotional Adaptation for Audio-Driven Talking-Head Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gan_2023_ICCV,
  author    = {Gan, Yuan and Yang, Zongxin and Yue, Xihang and Sun, Lingyun and Yang, Yi},
  title     = {Efficient Emotional Adaptation for Audio-Driven Talking-Head Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22634--22645},
}
Object-aware Gaze Target Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tonini_2023_ICCV,
  author    = {Tonini, Francesco and Dall'Asen, Nicola and Beyan, Cigdem and Ricci, Elisa},
  title     = {Object-aware Gaze Target Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21860--21869},
}
Gramian Attention Heads are Strong yet Efficient Vision Learners-
[pdf]
[supp]
[bibtex]@InProceedings{Ryu_2023_ICCV,
  author    = {Ryu, Jongbin and Han, Dongyoon and Lim, Jongwoo},
  title     = {Gramian Attention Heads are Strong yet Efficient Vision Learners},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5841--5851},
}
VADER: Video Alignment Differencing and Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Black_2023_ICCV,
  author    = {Black, Alexander and Jenni, Simon and Bui, Tu and Tanjim, Md. Mehrab and Petrangeli, Stefano and Sinha, Ritwik and Swaminathan, Viswanathan and Collomosse, John},
  title     = {{VADER}: Video Alignment Differencing and Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22357--22367},
}
MI-GAN: A Simple Baseline for Image Inpainting on Mobile Devices-
[pdf]
[supp]
[bibtex]@InProceedings{Sargsyan_2023_ICCV,
  author    = {Sargsyan, Andranik and Navasardyan, Shant and Xu, Xingqian and Shi, Humphrey},
  title     = {{MI-GAN}: A Simple Baseline for Image Inpainting on Mobile Devices},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7335--7345},
}
HiLo: Exploiting High Low Frequency Relations for Unbiased Panoptic Scene Graph Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Zijian and Shi, Miaojing and Caesar, Holger},
  title     = {{HiLo}: Exploiting High Low Frequency Relations for Unbiased Panoptic Scene Graph Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21637--21648},
}
Chop & Learn: Recognizing and Generating Object-State Compositions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saini_2023_ICCV,
  author    = {Saini, Nirat and Wang, Hanyu and Swaminathan, Archana and Jayasundara, Vinoj and He, Bo and Gupta, Kamal and Shrivastava, Abhinav},
  title     = {{Chop \& Learn}: Recognizing and Generating Object-State Compositions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20247--20258},
}
Automatic Animation of Hair Blowing in Still Portrait Photos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiao_2023_ICCV,
  author    = {Xiao, Wenpeng and Liu, Wentao and Wang, Yitong and Ghanem, Bernard and Li, Bing},
  title     = {Automatic Animation of Hair Blowing in Still Portrait Photos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22963--22975},
}
A Large-Scale Outdoor Multi-Modal Dataset and Benchmark for Novel View Synthesis and Implicit Scene Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Chongshan and Yin, Fukun and Chen, Xin and Liu, Wen and Chen, Tao and Yu, Gang and Fan, Jiayuan},
  title     = {A Large-Scale Outdoor Multi-Modal Dataset and Benchmark for Novel View Synthesis and Implicit Scene Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7557--7567},
}
4D Panoptic Segmentation as Invariant and Equivariant Field Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Minghan and Han, Shizhong and Cai, Hong and Borse, Shubhankar and Ghaffari, Maani and Porikli, Fatih},
  title     = {{4D} Panoptic Segmentation as Invariant and Equivariant Field Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22488--22498},
}
Unleashing Vanilla Vision Transformer with Masked Image Modeling for Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Yuxin and Yang, Shusheng and Wang, Shijie and Ge, Yixiao and Shan, Ying and Wang, Xinggang},
  title     = {Unleashing Vanilla Vision Transformer with Masked Image Modeling for Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6244--6253},
}
NDC-Scene: Boost Monocular 3D Semantic Scene Completion in Normalized Device Coordinates Space-
[pdf]
[supp]
[bibtex]@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Jiawei and Li, Chuming and Sun, Keqiang and Cai, Yingjie and Li, Hao and Ouyang, Wanli and Li, Hongsheng},
  title     = {{NDC-Scene}: Boost Monocular {3D} Semantic Scene Completion in Normalized Device Coordinates Space},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9455--9465},
}
Spatio-Temporal Crop Aggregation for Video Representation Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sameni_2023_ICCV,
  author    = {Sameni, Sepehr and Jenni, Simon and Favaro, Paolo},
  title     = {Spatio-Temporal Crop Aggregation for Video Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5664--5674},
}
Zip-NeRF: Anti-Aliased Grid-Based Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Barron_2023_ICCV,
  author    = {Barron, Jonathan T. and Mildenhall, Ben and Verbin, Dor and Srinivasan, Pratul P. and Hedman, Peter},
  title     = {{Zip-NeRF}: Anti-Aliased Grid-Based Neural Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19697--19705},
}
Neural-PBIR Reconstruction of Shape, Material, and Illumination-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Cheng and Cai, Guangyan and Li, Zhengqin and Yan, Kai and Zhang, Cheng and Marshall, Carl and Huang, Jia-Bin and Zhao, Shuang and Dong, Zhao},
  title     = {{Neural-PBIR} Reconstruction of Shape, Material, and Illumination},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18046--18056},
}
Fg-T2M: Fine-Grained Text-Driven Human Motion Generation via Diffusion Model-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yin and Leng, Zhiying and Li, Frederick W. B. and Wu, Shun-Cheng and Liang, Xiaohui},
  title     = {{Fg-T2M}: Fine-Grained Text-Driven Human Motion Generation via Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22035--22044},
}
BlindHarmony: "Blind" Harmonization for MR Images via Flow Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeong_2023_ICCV,
  author    = {Jeong, Hwihun and Byun, Heejoon and Kang, Dong Un and Lee, Jongho},
  title     = {{BlindHarmony}: {``Blind''} Harmonization for {MR} Images via Flow Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21129--21139},
}
Zero-guidance Segmentation Using Zero Segment Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rewatbowornwong_2023_ICCV,
  author    = {Rewatbowornwong, Pitchaporn and Chatthee, Nattanat and Chuangsuwanich, Ekapol and Suwajanakorn, Supasorn},
  title     = {Zero-guidance Segmentation Using Zero Segment Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1162--1172},
}
Efficient LiDAR Point Cloud Oversegmentation Network-
[pdf]
[supp]
[bibtex]@InProceedings{Hui_2023_ICCV,
  author    = {Hui, Le and Tang, Linghua and Dai, Yuchao and Xie, Jin and Yang, Jian},
  title     = {Efficient {LiDAR} Point Cloud Oversegmentation Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18003--18012},
}
Communication-efficient Federated Learning with Single-Step Synthetic Features Compressor for Faster Convergence-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yuhao and Shi, Mingjia and Li, Yuanxi and Sun, Yanan and Ye, Qing and Lv, Jiancheng},
  title     = {Communication-efficient Federated Learning with Single-Step Synthetic Features Compressor for Faster Convergence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5031--5040},
}
SVDFormer: Complementing Point Cloud via Self-view Augmentation and Self-structure Dual-generator-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zhe and Chen, Honghua and He, Xing and Wang, Weiming and Qin, Jing and Wei, Mingqiang},
  title     = {{SVDFormer}: Complementing Point Cloud via Self-view Augmentation and Self-structure Dual-generator},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14508--14518},
}
Few-Shot Video Classification via Representation Fusion and Promotion Learning-
[pdf]
[bibtex]@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Haifeng and Li, Kai and Min, Martin Renqiang and Ding, Zhengming},
  title     = {Few-Shot Video Classification via Representation Fusion and Promotion Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19311--19320},
}
E3Sym: Leveraging E(3) Invariance for Unsupervised 3D Planar Reflective Symmetry Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Ren-Wu and Zhang, Ling-Xiao and Li, Chunpeng and Lai, Yu-Kun and Gao, Lin},
  title     = {{E3Sym}: Leveraging {E(3)} Invariance for Unsupervised {3D} Planar Reflective Symmetry Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14543--14553},
}
CTVIS: Consistent Training for Online Video Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ying_2023_ICCV,
  author    = {Ying, Kaining and Zhong, Qing and Mao, Weian and Wang, Zhenhua and Chen, Hao and Wu, Lin Yuanbo and Liu, Yifan and Fan, Chengxiang and Zhuge, Yunzhi and Shen, Chunhua},
  title     = {{CTVIS}: Consistent Training for Online Video Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {899--908},
}
Unsupervised Video Object Segmentation with Online Adversarial Self-Tuning-
[pdf]
[bibtex]@InProceedings{Su_2023_ICCV,
  author    = {Su, Tiankang and Song, Huihui and Liu, Dong and Liu, Bo and Liu, Qingshan},
  title     = {Unsupervised Video Object Segmentation with Online Adversarial Self-Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {688--698},
}
Hallucination Improves the Performance of Unsupervised Visual Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jing and Hobbs, Jennifer and Hovakimyan, Naira},
  title     = {Hallucination Improves the Performance of Unsupervised Visual Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16132--16143},
}
S3IM: Stochastic Structural SIMilarity and Its Unreasonable Effectiveness for Neural Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Zeke and Yang, Xindi and Yang, Yujie and Sun, Qi and Jiang, Yixiang and Wang, Haoran and Cai, Yunfeng and Sun, Mingming},
  title     = {{S3IM}: Stochastic Structural {SIMilarity} and Its Unreasonable Effectiveness for Neural Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18024--18034},
}
GlobalMapper: Arbitrary-Shaped Urban Layout Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_ICCV,
  author    = {He, Liu and Aliaga, Daniel},
  title     = {{GlobalMapper}: Arbitrary-Shaped Urban Layout Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {454--464},
}
Membrane Potential Batch Normalization for Spiking Neural Networks-
[pdf]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yufei and Zhang, Yuhan and Chen, Yuanpei and Peng, Weihang and Liu, Xiaode and Zhang, Liwen and Huang, Xuhui and Ma, Zhe},
  title     = {Membrane Potential Batch Normalization for Spiking Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19420--19430},
}
Enhancing Sample Utilization through Sample Adaptive Augmentation in Semi-Supervised Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gui_2023_ICCV,
  author    = {Gui, Guan and Zhao, Zhen and Qi, Lei and Zhou, Luping and Wang, Lei and Shi, Yinghuan},
  title     = {Enhancing Sample Utilization through Sample Adaptive Augmentation in Semi-Supervised Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15880--15889},
}
Imitator: Personalized Speech-driven 3D Facial Animation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thambiraja_2023_ICCV,
  author    = {Thambiraja, Balamurugan and Habibie, Ikhsanul and Aliakbarian, Sadegh and Cosker, Darren and Theobalt, Christian and Thies, Justus},
  title     = {Imitator: Personalized Speech-driven {3D} Facial Animation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20621--20631},
}
Unified Coarse-to-Fine Alignment for Video-Text Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ziyang and Sung, Yi-Lin and Cheng, Feng and Bertasius, Gedas and Bansal, Mohit},
  title     = {Unified Coarse-to-Fine Alignment for Video-Text Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2816--2827},
}
Seeing Beyond the Patch: Scale-Adaptive Semantic Segmentation of High-resolution Remote Sensing Imagery based on Reinforcement Learning-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yinhe and Shi, Sunan and Wang, Junjue and Zhong, Yanfei},
  title     = {Seeing Beyond the Patch: Scale-Adaptive Semantic Segmentation of High-resolution Remote Sensing Imagery based on Reinforcement Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16868--16878},
}
Gradient-Regulated Meta-Prompt Learning for Generalizable Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Juncheng and Gao, Minghe and Wei, Longhui and Tang, Siliang and Zhang, Wenqiao and Li, Mengze and Ji, Wei and Tian, Qi and Chua, Tat-Seng and Zhuang, Yueting},
  title     = {Gradient-Regulated Meta-Prompt Learning for Generalizable Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2551--2562},
}
Zero-Shot Composed Image Retrieval with Textual Inversion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Baldrati_2023_ICCV,
  author    = {Baldrati, Alberto and Agnolucci, Lorenzo and Bertini, Marco and Del Bimbo, Alberto},
  title     = {Zero-Shot Composed Image Retrieval with Textual Inversion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15338--15347},
}
MUter: Machine Unlearning on Adversarially Trained Models-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Junxu and Xue, Mingsheng and Lou, Jian and Zhang, Xiaoyu and Xiong, Li and Qin, Zhan},
  title     = {{MUter}: Machine Unlearning on Adversarially Trained Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4892--4902},
}
WALDO: Future Video Synthesis Using Object Layer Decomposition and Parametric Flow Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_Moing_2023_ICCV,
  author    = {Le Moing, Guillaume and Ponce, Jean and Schmid, Cordelia},
  title     = {{WALDO}: Future Video Synthesis Using Object Layer Decomposition and Parametric Flow Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23229--23241},
}
ParCNetV2: Oversized Kernel with Enhanced Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Ruihan and Zhang, Haokui and Hu, Wenze and Zhang, Shiliang and Wang, Xiaoyu},
  title     = {{ParCNetV2}: Oversized Kernel with Enhanced Attention},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5752--5762},
}
BiFF: Bi-level Future Fusion with Polyline-based Coordinate for Interactive Trajectory Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Yiyao and Luan, Di and Shen, Shaojie},
  title     = {{BiFF}: Bi-level Future Fusion with Polyline-based Coordinate for Interactive Trajectory Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8260--8271},
}
RealGraph: A Multiview Dataset for 4D Real-world Context Graph Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Haozhe and Chen, Zequn and Zhang, Jinzhi and Bai, Bing and Wang, Yu and Huang, Ruqi and Fang, Lu},
  title     = {{RealGraph}: A Multiview Dataset for {4D} Real-world Context Graph Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3758--3768},
}
COOL-CHIC: Coordinate-based Low Complexity Hierarchical Image Codec-
[pdf]
[bibtex]@InProceedings{Ladune_2023_ICCV,
  author    = {Ladune, Th{\'e}o and Philippe, Pierrick and Henry, F{\'e}lix and Clare, Gordon and Leguay, Thomas},
  title     = {{COOL-CHIC}: Coordinate-based Low Complexity Hierarchical Image Codec},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13515--13522},
}
Normalizing Flows for Human Pose Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hirschorn_2023_ICCV,
  author    = {Hirschorn, Or and Avidan, Shai},
  title     = {Normalizing Flows for Human Pose Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13545--13554},
}
Reconstructing Groups of People with Hypergraph Relational Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Buzhen and Ju, Jingyi and Li, Zhihao and Wang, Yangang},
  title     = {Reconstructing Groups of People with Hypergraph Relational Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14873--14883},
}
PivotNet: Vectorized Pivot Learning for End-to-end HD Map Construction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Wenjie and Qiao, Limeng and Qiu, Xi and Zhang, Chi},
  title     = {{PivotNet}: Vectorized Pivot Learning for End-to-end {HD} Map Construction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3672--3682},
}
Universal Domain Adaptation via Compressive Attention Matching-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Didi and Li, Yinchuan and Yuan, Junkun and Li, Zexi and Kuang, Kun and Wu, Chao},
  title     = {Universal Domain Adaptation via Compressive Attention Matching},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6974--6985},
}
Contactless Pulse Estimation Leveraging Pseudo Labels and Self-Supervision-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Zhihua and Yin, Lijun},
  title     = {Contactless Pulse Estimation Leveraging Pseudo Labels and Self-Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20588--20597},
}
Instruct-NeRF2NeRF: Editing 3D Scenes with Instructions-
[pdf]
[supp]
[bibtex]@InProceedings{Haque_2023_ICCV,
  author    = {Haque, Ayaan and Tancik, Matthew and Efros, Alexei A. and Holynski, Aleksander and Kanazawa, Angjoo},
  title     = {{Instruct-NeRF2NeRF}: Editing {3D} Scenes with Instructions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19740--19750},
}
Point2Mask: Point-supervised Panoptic Segmentation via Optimal Transport-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Wentong and Yuan, Yuqian and Wang, Song and Zhu, Jianke and Li, Jianshu and Liu, Jian and Zhang, Lei},
  title     = {{Point2Mask}: Point-supervised Panoptic Segmentation via Optimal Transport},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {572--581},
}
Multi-Task Learning with Knowledge Distillation for Dense Prediction-
[pdf]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yangyang and Yang, Yibo and Zhang, Lefei},
  title     = {Multi-Task Learning with Knowledge Distillation for Dense Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21550--21559},
}
What Does a Platypus Look Like? Generating Customized Prompts for Zero-Shot Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pratt_2023_ICCV,
  author    = {Pratt, Sarah and Covert, Ian and Liu, Rosanne and Farhadi, Ali},
  title     = {What Does a Platypus Look Like? {Generating} Customized Prompts for Zero-Shot Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15691--15701},
}
Scene as Occupancy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tong_2023_ICCV,
  author    = {Tong, Wenwen and Sima, Chonghao and Wang, Tai and Chen, Li and Wu, Silei and Deng, Hanming and Gu, Yi and Lu, Lewei and Luo, Ping and Lin, Dahua and Li, Hongyang},
  title     = {Scene as Occupancy},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8406--8415},
}
U-RED: Unsupervised 3D Shape Retrieval and Deformation for Partial Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Di_2023_ICCV,
  author    = {Di, Yan and Zhang, Chenyangguang and Zhang, Ruida and Manhardt, Fabian and Su, Yongzhi and Rambach, Jason and Stricker, Didier and Ji, Xiangyang and Tombari, Federico},
  title     = {{U-RED}: Unsupervised {3D} Shape Retrieval and Deformation for Partial Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8884--8895},
}
RFLA: A Stealthy Reflected Light Adversarial Attack in the Physical World-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Donghua and Yao, Wen and Jiang, Tingsong and Li, Chao and Chen, Xiaoqian},
  title     = {{RFLA}: A Stealthy Reflected Light Adversarial Attack in the Physical World},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4455--4465},
}
Nearest Neighbor Guidance for Out-of-Distribution Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2023_ICCV,
  author    = {Park, Jaewoo and Jung, Yoon Gyo and Teoh, Andrew Beng Jin},
  title     = {Nearest Neighbor Guidance for Out-of-Distribution Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1686--1695},
}
PatchCT: Aligning Patch Set and Label Set with Conditional Transport for Multi-Label Image Classification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Miaoge and Wang, Dongsheng and Liu, Xinyang and Zeng, Zequn and Lu, Ruiying and Chen, Bo and Zhou, Mingyuan},
  title     = {{PatchCT}: Aligning Patch Set and Label Set with Conditional Transport for Multi-Label Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15348--15358},
}
VI-Net: Boosting Category-level 6D Object Pose Estimation via Learning Decoupled Rotations on the Spherical Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Jiehong and Wei, Zewei and Zhang, Yabin and Jia, Kui},
  title     = {{VI-Net}: Boosting Category-level {6D} Object Pose Estimation via Learning Decoupled Rotations on the Spherical Representations},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14001--14011},
}
ICD-Face: Intra-class Compactness Distillation for Face Recognition-
[pdf]
[bibtex]@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Zhipeng and Liu, Jiaheng and Qin, Haoyu and Wu, Yichao and Hu, Kun and Tian, Jiayi and Liang, Ding},
  title     = {{ICD-Face}: Intra-class Compactness Distillation for Face Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21042--21052},
}
Diffusion-SDF: Conditional Generative Modeling of Signed Distance Functions-
[pdf]
[bibtex]@InProceedings{Chou_2023_ICCV,
  author    = {Chou, Gene and Bahat, Yuval and Heide, Felix},
  title     = {{Diffusion-SDF}: Conditional Generative Modeling of Signed Distance Functions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2262--2272},
}
Open-Vocabulary Object Detection With an Open Corpus-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiong and Zhang, Huiming and Hong, Haiwen and Jin, Xuan and He, Yuan and Xue, Hui and Zhao, Zhou},
  title     = {Open-Vocabulary Object Detection With an Open Corpus},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6759--6769},
}
Long-range Multimodal Pretraining for Movie Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Argaw_2023_ICCV,
  author    = {Argaw, Dawit Mureja and Lee, Joon-Young and Woodson, Markus and Kweon, In So and Heilbron, Fabian Caba},
  title     = {Long-range Multimodal Pretraining for Movie Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13392--13403},
}
MRM: Masked Relation Modeling for Medical Image Pre-Training with Genetics-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Qiushi and Li, Wuyang and Li, Baopu and Yuan, Yixuan},
  title     = {{MRM}: Masked Relation Modeling for Medical Image Pre-Training with Genetics},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21452--21462},
}
Adverse Weather Removal with Codebook Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Tian and Chen, Sixiang and Bai, Jinbin and Shi, Jun and Xue, Chenghao and Jiang, Jingxia and Yin, Junjie and Chen, Erkang and Liu, Yun}, title = {Adverse Weather Removal with Codebook Priors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12653-12664} }
Spectrum-guided Multi-granularity Referring Video Object Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Miao_2023_ICCV, author = {Miao, Bo and Bennamoun, Mohammed and Gao, Yongsheng and Mian, Ajmal}, title = {Spectrum-guided Multi-granularity Referring Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {920-930} }
Sound Source Localization is All about Cross-Modal Alignment-
[pdf]
[arXiv]
[bibtex]@InProceedings{Senocak_2023_ICCV, author = {Senocak, Arda and Ryu, Hyeonggon and Kim, Junsik and Oh, Tae-Hyun and Pfister, Hanspeter and Chung, Joon Son}, title = {Sound Source Localization is All about Cross-Modal Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7777-7787} }
MAP: Towards Balanced Generalization of IID and OOD through Model-Agnostic Adapters-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Min and Yuan, Junkun and He, Yue and Li, Wenbin and Chen, Zhengyu and Kuang, Kun}, title = {MAP: Towards Balanced Generalization of IID and OOD through Model-Agnostic Adapters}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11921-11931} }
Exploring Group Video Captioning with Efficient Relational Approximation-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Wang and Jin, Tao and Wang, Ye and Pan, Wenwen and Li, Linjun and Cheng, Xize and Zhao, Zhou}, title = {Exploring Group Video Captioning with Efficient Relational Approximation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15281-15290} }
ADAPT: Efficient Multi-Agent Trajectory Prediction with Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Aydemir_2023_ICCV, author = {Aydemir, G\"orkay and Akan, Adil Kaan and G\"uney, Fatma}, title = {ADAPT: Efficient Multi-Agent Trajectory Prediction with Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8295-8305} }
TaskExpert: Dynamically Assembling Multi-Task Representations with Memorial Mixture-of-Experts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Hanrong and Xu, Dan}, title = {TaskExpert: Dynamically Assembling Multi-Task Representations with Memorial Mixture-of-Experts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21828-21837} }
Meta OOD Learning For Continuously Adaptive OOD Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Xinheng and Lu, Jie and Fang, Zhen and Zhang, Guangquan}, title = {Meta OOD Learning For Continuously Adaptive OOD Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19353-19364} }
MAPConNet: Self-supervised 3D Pose Transfer with Mesh and Point Contrastive Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Jiaze and Chen, Zhixiang and Kim, Tae-Kyun}, title = {MAPConNet: Self-supervised 3D Pose Transfer with Mesh and Point Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14452-14462} }
BlendFace: Re-designing Identity Encoders for Face-Swapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shiohara_2023_ICCV, author = {Shiohara, Kaede and Yang, Xingchao and Taketomi, Takafumi}, title = {BlendFace: Re-designing Identity Encoders for Face-Swapping}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7634-7644} }
Test-time Personalizable Forecasting of 3D Human Poses-
[pdf]
[supp]
[bibtex]@InProceedings{Cui_2023_ICCV, author = {Cui, Qiongjie and Sun, Huaijiang and Lu, Jianfeng and Li, Weiqing and Li, Bin and Yi, Hongwei and Wang, Haofan}, title = {Test-time Personalizable Forecasting of 3D Human Poses}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {274-283} }
Few-shot Continual Infomax Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Gu_2023_ICCV, author = {Gu, Ziqi and Xu, Chunyan and Yang, Jian and Cui, Zhen}, title = {Few-shot Continual Infomax Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19224-19233} }
A Parse-Then-Place Approach for Generating Graphic Layouts from Textual Descriptions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Jiawei and Guo, Jiaqi and Sun, Shizhao and Xu, Weijiang and Liu, Ting and Lou, Jian-Guang and Zhang, Dongmei}, title = {A Parse-Then-Place Approach for Generating Graphic Layouts from Textual Descriptions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23622-23631} }
DreamBooth3D: Subject-Driven Text-to-3D Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Raj_2023_ICCV, author = {Raj, Amit and Kaza, Srinivas and Poole, Ben and Niemeyer, Michael and Ruiz, Nataniel and Mildenhall, Ben and Zada, Shiran and Aberman, Kfir and Rubinstein, Michael and Barron, Jonathan and Li, Yuanzhen and Jampani, Varun}, title = {DreamBooth3D: Subject-Driven Text-to-3D Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2349-2359} }
DARTH: Holistic Test-time Adaptation for Multiple Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Segu_2023_ICCV, author = {Segu, Mattia and Schiele, Bernt and Yu, Fisher}, title = {DARTH: Holistic Test-time Adaptation for Multiple Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9717-9727} }
Multi-interactive Feature Learning and a Full-time Multi-modality Benchmark for Image Fusion and Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jinyuan and Liu, Zhu and Wu, Guanyao and Ma, Long and Liu, Risheng and Zhong, Wei and Luo, Zhongxuan and Fan, Xin}, title = {Multi-interactive Feature Learning and a Full-time Multi-modality Benchmark for Image Fusion and Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8115-8124} }
BaRe-ESA: A Riemannian Framework for Unregistered Human Body Shapes-
[pdf]
[supp]
[bibtex]@InProceedings{Hartman_2023_ICCV, author = {Hartman, Emmanuel and Pierson, Emery and Bauer, Martin and Charon, Nicolas and Daoudi, Mohamed}, title = {BaRe-ESA: A Riemannian Framework for Unregistered Human Body Shapes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14181-14191} }
Skip-Plan: Procedure Planning in Instructional Videos via Condensed Action Space Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhiheng and Geng, Wenjia and Li, Muheng and Chen, Lei and Tang, Yansong and Lu, Jiwen and Zhou, Jie}, title = {Skip-Plan: Procedure Planning in Instructional Videos via Condensed Action Space Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10297-10306} }
A Retrospect to Multi-prompt Learning across Vision and Language-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Ziliang and Huang, Xin and Guan, Quanlong and Lin, Liang and Luo, Weiqi}, title = {A Retrospect to Multi-prompt Learning across Vision and Language}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22190-22201} }
Sparse Instance Conditioned Multimodal Trajectory Prediction-
[pdf]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Yonghao and Wang, Le and Zhou, Sanping and Hua, Gang}, title = {Sparse Instance Conditioned Multimodal Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9763-9772} }
Label Shift Adapter for Test-Time Adaptation under Covariate and Label Shifts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Sunghyun and Yang, Seunghan and Choo, Jaegul and Yun, Sungrack}, title = {Label Shift Adapter for Test-Time Adaptation under Covariate and Label Shifts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16421-16431} }
NAPA-VQ: Neighborhood-Aware Prototype Augmentation with Vector Quantization for Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Malepathirana_2023_ICCV, author = {Malepathirana, Tamasha and Senanayake, Damith and Halgamuge, Saman}, title = {NAPA-VQ: Neighborhood-Aware Prototype Augmentation with Vector Quantization for Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11674-11684} }
Dynamic Snake Convolution Based on Topological Geometric Constraints for Tubular Structure Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qi_2023_ICCV, author = {Qi, Yaolei and He, Yuting and Qi, Xiaoming and Zhang, Yuan and Yang, Guanyu}, title = {Dynamic Snake Convolution Based on Topological Geometric Constraints for Tubular Structure Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6070-6079} }
Unsupervised Open-Vocabulary Object Localization in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Ke and Bai, Zechen and Xiao, Tianjun and Zietlow, Dominik and Horn, Max and Zhao, Zixu and Simon-Gabriel, Carl-Johann and Shou, Mike Zheng and Locatello, Francesco and Schiele, Bernt and Brox, Thomas and Zhang, Zheng and Fu, Yanwei and He, Tong}, title = {Unsupervised Open-Vocabulary Object Localization in Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13747-13755} }
Dataset Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Daquan and Wang, Kai and Gu, Jianyang and Peng, Xiangyu and Lian, Dongze and Zhang, Yifan and You, Yang and Feng, Jiashi}, title = {Dataset Quantization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17205-17216} }
Unsupervised Video Deraining with An Event Camera-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jin and Weng, Wenming and Zhang, Yueyi and Xiong, Zhiwei}, title = {Unsupervised Video Deraining with An Event Camera}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10831-10840} }
Overcoming Forgetting Catastrophe in Quantization-Aware Training-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Ting-An and Yang, De-Nian and Chen, Ming-Syan}, title = {Overcoming Forgetting Catastrophe in Quantization-Aware Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17358-17367} }
DIME-FM : DIstilling Multimodal and Efficient Foundation Models-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Ximeng and Zhang, Pengchuan and Zhang, Peizhao and Shah, Hardik and Saenko, Kate and Xia, Xide}, title = {DIME-FM : DIstilling Multimodal and Efficient Foundation Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15521-15533} }
Boosting Single Image Super-Resolution via Partial Channel Shifting-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Xiaoming and Li, Tianrui and Zhao, Xiaole}, title = {Boosting Single Image Super-Resolution via Partial Channel Shifting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13223-13232} }
Learning to Upsample by Learning to Sample-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Wenze and Lu, Hao and Fu, Hongtao and Cao, Zhiguo}, title = {Learning to Upsample by Learning to Sample}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6027-6037} }
LayoutDiffusion: Improving Graphic Layout Generation by Discrete Diffusion Probabilistic Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Junyi and Guo, Jiaqi and Sun, Shizhao and Lou, Jian-Guang and Zhang, Dongmei}, title = {LayoutDiffusion: Improving Graphic Layout Generation by Discrete Diffusion Probabilistic Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7226-7236} }
Efficiently Robustify Pre-Trained Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jain_2023_ICCV, author = {Jain, Nishant and Behl, Harkirat and Rawat, Yogesh Singh and Vineet, Vibhav}, title = {Efficiently Robustify Pre-Trained Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5505-5515} }
Efficient Video Prediction via Sparsely Conditioned Flow Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Davtyan_2023_ICCV, author = {Davtyan, Aram and Sameni, Sepehr and Favaro, Paolo}, title = {Efficient Video Prediction via Sparsely Conditioned Flow Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23263-23274} }
Surface Normal Clustering for Implicit Representation of Manhattan Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Popovic_2023_ICCV, author = {Popovic, Nikola and Paudel, Danda Pani and Van Gool, Luc}, title = {Surface Normal Clustering for Implicit Representation of Manhattan Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17860-17870} }
Distracting Downpour: Adversarial Weather Attacks for Motion Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Schmalfuss_2023_ICCV, author = {Schmalfuss, Jenny and Mehl, Lukas and Bruhn, Andr\'es}, title = {Distracting Downpour: Adversarial Weather Attacks for Motion Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10106-10116} }
Adaptive Similarity Bootstrapping for Self-Distillation Based Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Lebailly_2023_ICCV, author = {Lebailly, Tim and Stegm\"uller, Thomas and Bozorgtabar, Behzad and Thiran, Jean-Philippe and Tuytelaars, Tinne}, title = {Adaptive Similarity Bootstrapping for Self-Distillation Based Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16505-16514} }
Generalized Differentiable RANSAC-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Tong and Patel, Yash and Shekhovtsov, Alexander and Matas, Jiri and Barath, Daniel}, title = {Generalized Differentiable RANSAC}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17649-17660} }
Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Siming and Yuan, Xin}, title = {Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12738-12749} }
Non-Semantics Suppressed Mask Learning for Unsupervised Video Semantic Compression-
[pdf]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Yuan and Lu, Guo and Zhai, Guangtao and Gao, Zhiyong}, title = {Non-Semantics Suppressed Mask Learning for Unsupervised Video Semantic Compression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13610-13622} }
ResQ: Residual Quantization for Video Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Abati_2023_ICCV, author = {Abati, Davide and Ben Yahia, Haitam and Nagel, Markus and Habibian, Amirhossein}, title = {ResQ: Residual Quantization for Video Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17119-17129} }
Inverse Compositional Learning for Weakly-supervised Relation Grounding-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Huan and Wei, Ping and Ma, Zeyu and Zheng, Nanning}, title = {Inverse Compositional Learning for Weakly-supervised Relation Grounding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15477-15487} }
XMem++: Production-level Video Segmentation From Few Annotated Frames-
[pdf]
[supp]
[bibtex]@InProceedings{Bekuzarov_2023_ICCV, author = {Bekuzarov, Maksym and Bermudez, Ariana and Lee, Joon-Young and Li, Hao}, title = {XMem++: Production-level Video Segmentation From Few Annotated Frames}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {635-644} }
MHCN: A Hyperbolic Neural Network Model for Multi-view Hierarchical Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Fangfei and Bai, Bing and Guo, Yiwen and Chen, Hao and Ren, Yazhou and Xu, Zenglin}, title = {MHCN: A Hyperbolic Neural Network Model for Multi-view Hierarchical Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16525-16535} }
End-to-End Diffusion Latent Optimization Improves Classifier Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wallace_2023_ICCV, author = {Wallace, Bram and Gokul, Akash and Ermon, Stefano and Naik, Nikhil}, title = {End-to-End Diffusion Latent Optimization Improves Classifier Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7280-7290} }
FineRecon: Depth-aware Feed-forward Network for Detailed 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stier_2023_ICCV, author = {Stier, Noah and Ranjan, Anurag and Colburn, Alex and Yan, Yajie and Yang, Liang and Ma, Fangchang and Angles, Baptiste}, title = {FineRecon: Depth-aware Feed-forward Network for Detailed 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18423-18432} }
Navigating to Objects Specified by Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Krantz_2023_ICCV, author = {Krantz, Jacob and Gervet, Theophile and Yadav, Karmesh and Wang, Austin and Paxton, Chris and Mottaghi, Roozbeh and Batra, Dhruv and Malik, Jitendra and Lee, Stefan and Chaplot, Devendra Singh}, title = {Navigating to Objects Specified by Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10916-10925} }
TRM-UAP: Enhancing the Transferability of Data-Free Universal Adversarial Perturbation via Truncated Ratio Maximization-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yiran and Feng, Xin and Wang, Yunlong and Yang, Wu and Ming, Di}, title = {TRM-UAP: Enhancing the Transferability of Data-Free Universal Adversarial Perturbation via Truncated Ratio Maximization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4762-4771} }
LATR: 3D Lane Detection from Monocular Images with Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Yueru and Zheng, Chaoda and Yan, Xu and Kun, Tang and Zheng, Chao and Cui, Shuguang and Li, Zhen}, title = {LATR: 3D Lane Detection from Monocular Images with Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7941-7952} }
Scratching Visual Transformer's Back with Uniform Attention-
[pdf]
[supp]
[bibtex]@InProceedings{Hyeon-Woo_2023_ICCV, author = {Hyeon-Woo, Nam and Yu-Ji, Kim and Heo, Byeongho and Han, Dongyoon and Oh, Seong Joon and Oh, Tae-Hyun}, title = {Scratching Visual Transformer's Back with Uniform Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5807-5818} }
Tune-A-Video: One-Shot Tuning of Image Diffusion Models for Text-to-Video Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Jay Zhangjie and Ge, Yixiao and Wang, Xintao and Lei, Stan Weixian and Gu, Yuchao and Shi, Yufei and Hsu, Wynne and Shan, Ying and Qie, Xiaohu and Shou, Mike Zheng}, title = {Tune-A-Video: One-Shot Tuning of Image Diffusion Models for Text-to-Video Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7623-7633} }
Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection-
[pdf]
[bibtex]@InProceedings{Lv_2023_ICCV, author = {Lv, Yilong and Li, Min and He, Yujie and Li, Shaopeng and He, Zhuzhen and Yang, Aitao}, title = {Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6275-6284} }
Environment-Invariant Curriculum Relation Learning for Fine-Grained Scene Graph Generation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Min_2023_ICCV, author = {Min, Yukuan and Wu, Aming and Deng, Cheng}, title = {Environment-Invariant Curriculum Relation Learning for Fine-Grained Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13296-13307} }
Extensible and Efficient Proxy for Neural Architecture Search-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yuhong and Li, Jiajie and Hao, Cong and Li, Pan and Xiong, Jinjun and Chen, Deming}, title = {Extensible and Efficient Proxy for Neural Architecture Search}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6199-6210} }
Zenseact Open Dataset: A Large-Scale and Diverse Multimodal Dataset for Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alibeigi_2023_ICCV, author = {Alibeigi, Mina and Ljungbergh, William and Tonderski, Adam and Hess, Georg and Lilja, Adam and Lindstr\"om, Carl and Motorniuk, Daria and Fu, Junsheng and Widahl, Jenny and Petersson, Christoffer}, title = {Zenseact Open Dataset: A Large-Scale and Diverse Multimodal Dataset for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20178-20188} }
MAAL: Multimodality-Aware Autoencoder-Based Affordance Learning for 3D Articulated Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Yuanzhi and Wang, Xiaohan and Zhu, Linchao and Yang, Yi}, title = {MAAL: Multimodality-Aware Autoencoder-Based Affordance Learning for 3D Articulated Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {217-227} }
Generalizable Decision Boundaries: Dualistic Meta-Learning for Open Set Domain Generalization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xiran and Zhang, Jian and Qi, Lei and Shi, Yinghuan}, title = {Generalizable Decision Boundaries: Dualistic Meta-Learning for Open Set Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11564-11573} }
Benchmarking and Analyzing Robust Point Cloud Recognition: Bag of Tricks for Defending Adversarial Examples-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Qiufan and Wang, Lin and Shi, Cong and Hu, Shengshan and Chen, Yingying and Sun, Lichao}, title = {Benchmarking and Analyzing Robust Point Cloud Recognition: Bag of Tricks for Defending Adversarial Examples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4295-4304} }
Weakly Supervised Referring Image Segmentation with Intra-Chunk and Inter-Chunk Consistency-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jungbeom and Lee, Sungjin and Nam, Jinseok and Yu, Seunghak and Do, Jaeyoung and Taghavi, Tara}, title = {Weakly Supervised Referring Image Segmentation with Intra-Chunk and Inter-Chunk Consistency}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21870-21881} }
Poincare ResNet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{van_Spengler_2023_ICCV, author = {van Spengler, Max and Berkhout, Erwin and Mettes, Pascal}, title = {Poincare ResNet}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5419-5428} }
Parameterized Cost Volume for Stereo Matching-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2023_ICCV, author = {Zeng, Jiaxi and Yao, Chengtang and Yu, Lidong and Wu, Yuwei and Jia, Yunde}, title = {Parameterized Cost Volume for Stereo Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18347-18357} }
SAFE: Sensitivity-Aware Features for Out-of-Distribution Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wilson_2023_ICCV, author = {Wilson, Samuel and Fischer, Tobias and Dayoub, Feras and Miller, Dimity and S\"underhauf, Niko}, title = {SAFE: Sensitivity-Aware Features for Out-of-Distribution Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23565-23576} }
SimFIR: A Simple Framework for Fisheye Image Rectification with Self-supervised Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Hao and Wang, Wendi and Deng, Jiajun and Zhou, Wengang and Li, Li and Li, Houqiang}, title = {SimFIR: A Simple Framework for Fisheye Image Rectification with Self-supervised Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12418-12427} }
Subclass-balancing Contrastive Learning for Long-tailed Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hou_2023_ICCV, author = {Hou, Chengkai and Zhang, Jieyu and Wang, Haonan and Zhou, Tianyi}, title = {Subclass-balancing Contrastive Learning for Long-tailed Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5395-5407} }
Generalized Lightness Adaptation with Channel Selective Normalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yao_2023_ICCV, author = {Yao, Mingde and Huang, Jie and Jin, Xin and Xu, Ruikang and Zhou, Shenglong and Zhou, Man and Xiong, Zhiwei}, title = {Generalized Lightness Adaptation with Channel Selective Normalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10668-10679} }
Omnidirectional Information Gathering for Knowledge Transfer-Based Audio-Visual Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Jinyu and Wang, Wenguan and Liu, Si and Li, Hongsheng and Yang, Yi}, title = {Omnidirectional Information Gathering for Knowledge Transfer-Based Audio-Visual Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10993-11003} }
Multi-Scale Bidirectional Recurrent Network with Hybrid Correlation for Point Cloud Based Scene Flow Estimation-
[pdf]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Wencan and Ko, Jong Hwan}, title = {Multi-Scale Bidirectional Recurrent Network with Hybrid Correlation for Point Cloud Based Scene Flow Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10041-10050} }
Dynamic Mesh-Aware Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qiao_2023_ICCV, author = {Qiao, Yi-Ling and Gao, Alexander and Xu, Yiran and Feng, Yue and Huang, Jia-Bin and Lin, Ming C.}, title = {Dynamic Mesh-Aware Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {385-396} }
Learning Support and Trivial Prototypes for Interpretable Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Chong and Liu, Yuyuan and Chen, Yuanhong and Liu, Fengbei and Tian, Yu and McCarthy, Davis and Frazer, Helen and Carneiro, Gustavo}, title = {Learning Support and Trivial Prototypes for Interpretable Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2062-2072} }
Decoupled DETR: Spatially Disentangling Localization and Classification for Improved End-to-End Object Detection-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Manyuan and Song, Guanglu and Liu, Yu and Li, Hongsheng}, title = {Decoupled DETR: Spatially Disentangling Localization and Classification for Improved End-to-End Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6601-6610} }
GIFD: A Generative Gradient Inversion Method with Feature Domain Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Hao and Chen, Bin and Wang, Xuan and Wang, Zhi and Xia, Shu-Tao},
  title     = {{GIFD}: A Generative Gradient Inversion Method with Feature Domain Optimization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4967--4976}
}
VLN-PETL: Parameter-Efficient Transfer Learning for Vision-and-Language Navigation-
[pdf]
[supp]
[bibtex]@InProceedings{Qiao_2023_ICCV,
  author    = {Qiao, Yanyuan and Yu, Zheng and Wu, Qi},
  title     = {{VLN-PETL}: Parameter-Efficient Transfer Learning for Vision-and-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15443--15452}
}
Generalized Sum Pooling for Metric Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Gurbuz_2023_ICCV,
  author    = {G{\"u}rb{\"u}z, Yeti Z. and Sener, Ozan and Alatan, A. Aydin},
  title     = {Generalized Sum Pooling for Metric Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5462--5473}
}
AlignDet: Aligning Pre-training and Fine-tuning in Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Ming and Wu, Jie and Wang, Xionghui and Chen, Chen and Qin, Jie and Xiao, Xuefeng and Wang, Rui and Zheng, Min and Pan, Xin},
  title     = {{AlignDet}: Aligning Pre-training and Fine-tuning in Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6866--6876}
}
Learning Continuous Exposure Value Representations for Single-Image HDR Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Su-Kai and Yen, Hung-Lin and Liu, Yu-Lun and Chen, Min-Hung and Hu, Hou-Ning and Peng, Wen-Hsiao and Lin, Yen-Yu},
  title     = {Learning Continuous Exposure Value Representations for Single-Image {HDR} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12990--13000}
}
DREAM: Efficient Dataset Distillation by Representative Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yanqing and Gu, Jianyang and Wang, Kai and Zhu, Zheng and Jiang, Wei and You, Yang},
  title     = {{DREAM}: Efficient Dataset Distillation by Representative Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17314--17324}
}
MixSynthFormer: A Transformer Encoder-like Structure with Mixed Synthetic Self-attention for Efficient Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Yuran and Dougherty, Alan William and Zhang, Zhuoying and Choi, Yi King and Wu, Chuan},
  title     = {{MixSynthFormer}: A Transformer Encoder-like Structure with Mixed Synthetic Self-attention for Efficient Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14884--14893}
}
Focus on Your Target: A Dual Teacher-Student Framework for Domain-Adaptive Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huo_2023_ICCV,
  author    = {Huo, Xinyue and Xie, Lingxi and Zhou, Wengang and Li, Houqiang and Tian, Qi},
  title     = {Focus on Your Target: A Dual Teacher-Student Framework for Domain-Adaptive Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19027--19038}
}
Enhanced Meta Label Correction for Coping with Label Corruption-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Taraday_2023_ICCV,
  author    = {Taraday, Mitchell Keren and Baskin, Chaim},
  title     = {Enhanced Meta Label Correction for Coping with Label Corruption},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16295--16304}
}
Dense Text-to-Image Generation with Attention Modulation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Yunji and Lee, Jiyoung and Kim, Jin-Hwa and Ha, Jung-Woo and Zhu, Jun-Yan},
  title     = {Dense Text-to-Image Generation with Attention Modulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7701--7711}
}
HumanMAC: Masked Motion Completion for Human Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ling-Hao and Zhang, JiaWei and Li, Yewen and Pang, Yiren and Xia, Xiaobo and Liu, Tongliang},
  title     = {{HumanMAC}: Masked Motion Completion for Human Motion Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9544--9555}
}
Will Large-scale Generative Models Corrupt Future Datasets?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hataya_2023_ICCV,
  author    = {Hataya, Ryuichiro and Bao, Han and Arai, Hiromi},
  title     = {Will Large-scale Generative Models Corrupt Future Datasets?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20555--20565}
}
SHACIRA: Scalable HAsh-grid Compression for Implicit Neural Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Girish_2023_ICCV,
  author    = {Girish, Sharath and Shrivastava, Abhinav and Gupta, Kamal},
  title     = {{SHACIRA}: Scalable {HAsh-grid} Compression for Implicit Neural Representations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17513--17524}
}
Prompt Switch: Efficient CLIP Adaptation for Text-Video Retrieval-
[pdf]
[arXiv]
[bibtex]@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Chaorui and Chen, Qi and Qin, Pengda and Chen, Da and Wu, Qi},
  title     = {Prompt Switch: Efficient {CLIP} Adaptation for Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15648--15658}
}
Video Action Recognition with Attentive Semantic Units-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yifei and Chen, Dapeng and Liu, Ruijin and Li, Hao and Peng, Wei},
  title     = {Video Action Recognition with Attentive Semantic Units},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10170--10180}
}
Sentence Attention Blocks for Answer Grounding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Khoshsirat_2023_ICCV,
  author    = {Khoshsirat, Seyedalireza and Kambhamettu, Chandra},
  title     = {Sentence Attention Blocks for Answer Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6080--6090}
}
Scanning Only Once: An End-to-end Framework for Fast Temporal Grounding in Long Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Yulin and He, Xiangteng and Gong, Biao and Lv, Yiliang and Shen, Yujun and Peng, Yuxin and Zhao, Deli},
  title     = {Scanning Only Once: An End-to-end Framework for Fast Temporal Grounding in Long Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13767--13777}
}
A Low-Shot Object Counting Network With Iterative Prototype Adaptation-
[pdf]
[bibtex]@InProceedings{Dukic_2023_ICCV,
  author    = {{\DJ}uki{\'c}, Nikola and Luke{\v{z}}i{\v{c}}, Alan and Zavrtanik, Vitjan and Kristan, Matej},
  title     = {A Low-Shot Object Counting Network With Iterative Prototype Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18872--18881}
}
Towards Fairness-aware Adversarial Network Pruning-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Lei and Wang, Zhibo and Dong, Xiaowei and Feng, Yunhe and Pang, Xiaoyi and Zhang, Zhifei and Ren, Kui},
  title     = {Towards Fairness-aware Adversarial Network Pruning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5168--5177}
}
VoroMesh: Learning Watertight Surface Meshes with Voronoi Diagrams-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Maruani_2023_ICCV,
  author    = {Maruani, Nissim and Klokov, Roman and Ovsjanikov, Maks and Alliez, Pierre and Desbrun, Mathieu},
  title     = {{VoroMesh}: Learning Watertight Surface Meshes with {Voronoi} Diagrams},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14565--14574}
}
Breaking Temporal Consistency: Generating Video Universal Adversarial Perturbations Using Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hee-Seon and Son, Minji and Kim, Minbeom and Kwon, Myung-Joon and Kim, Changick},
  title     = {Breaking Temporal Consistency: Generating Video Universal Adversarial Perturbations Using Image Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4325--4334}
}
Smoothness Similarity Regularization for Few-Shot GAN Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sushko_2023_ICCV,
  author    = {Sushko, Vadim and Wang, Ruyu and Gall, Juergen},
  title     = {Smoothness Similarity Regularization for Few-Shot {GAN} Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7073--7082}
}
Distilling Coarse-to-Fine Semantic Matching Knowledge for Weakly Supervised 3D Visual Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zehan and Huang, Haifeng and Zhao, Yang and Li, Linjun and Cheng, Xize and Zhu, Yichen and Yin, Aoxiong and Zhao, Zhou},
  title     = {Distilling Coarse-to-Fine Semantic Matching Knowledge for Weakly Supervised {3D} Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2662--2671}
}
What does CLIP know about a red circle? Visual prompt engineering for VLMs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shtedritski_2023_ICCV,
  author    = {Shtedritski, Aleksandar and Rupprecht, Christian and Vedaldi, Andrea},
  title     = {What does {CLIP} know about a red circle? Visual prompt engineering for {VLMs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11987--11997}
}
MEGA: Multimodal Alignment Aggregation and Distillation For Cinematic Video Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sadoughi_2023_ICCV,
  author    = {Sadoughi, Najmeh and Li, Xinyu and Vajpayee, Avijit and Fan, David and Shuai, Bing and Santos-Villalobos, Hector and Bhat, Vimal and MV, Rohith},
  title     = {{MEGA}: Multimodal Alignment Aggregation and Distillation For Cinematic Video Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23331--23340}
}
DiffRate : Differentiable Compression Rate for Efficient Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Mengzhao and Shao, Wenqi and Xu, Peng and Lin, Mingbao and Zhang, Kaipeng and Chao, Fei and Ji, Rongrong and Qiao, Yu and Luo, Ping},
  title     = {{DiffRate} : Differentiable Compression Rate for Efficient Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17164--17174}
}
zPROBE: Zero Peek Robustness Checks for Federated Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghodsi_2023_ICCV,
  author    = {Ghodsi, Zahra and Javaheripi, Mojan and Sheybani, Nojan and Zhang, Xinqiao and Huang, Ke and Koushanfar, Farinaz},
  title     = {{zPROBE}: Zero Peek Robustness Checks for Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4860--4870}
}
LoLep: Single-View View Synthesis with Locally-Learned Planes and Self-Attention Occlusion Inference-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Cong and Wang, Yu-Ping and Manocha, Dinesh},
  title     = {{LoLep}: Single-View View Synthesis with Locally-Learned Planes and Self-Attention Occlusion Inference},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10841--10851}
}
Multi-Modal Continual Test-Time Adaptation for 3D Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Haozhi and Xu, Yuecong and Yang, Jianfei and Yin, Pengyu and Yuan, Shenghai and Xie, Lihua},
  title     = {Multi-Modal Continual Test-Time Adaptation for {3D} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18809--18819}
}
Exploring Positional Characteristics of Dual-Pixel Data for Camera Autofocus-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_ICCV,
  author    = {Choi, Myungsub and Lee, Hana and Lee, Hyong-euk},
  title     = {Exploring Positional Characteristics of Dual-Pixel Data for Camera Autofocus},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13158--13168}
}
Heterogeneous Forgetting Compensation for Class-Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Jiahua and Liang, Wenqi and Cong, Yang and Sun, Gan},
  title     = {Heterogeneous Forgetting Compensation for Class-Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11742--11751}
}
FemtoDet: An Object Detection Baseline for Energy Versus Performance Tradeoffs-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tu_2023_ICCV,
  author    = {Tu, Peng and Xie, Xu and Ai, Guo and Li, Yuexiang and Huang, Yawen and Zheng, Yefeng},
  title     = {{FemtoDet}: An Object Detection Baseline for Energy Versus Performance Tradeoffs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13318--13327}
}
Generative Prompt Model for Weakly Supervised Object Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Yuzhong and Ye, Qixiang and Wu, Weijia and Shen, Chunhua and Wan, Fang},
  title     = {Generative Prompt Model for Weakly Supervised Object Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6351--6361}
}
ActFormer: A GAN-based Transformer towards General Action-Conditioned 3D Human Motion Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Liang and Song, Ziyang and Wang, Dongliang and Su, Jing and Fang, Zhicheng and Ding, Chenjing and Gan, Weihao and Yan, Yichao and Jin, Xin and Yang, Xiaokang and Zeng, Wenjun and Wu, Wei},
  title     = {{ActFormer}: A {GAN}-based Transformer towards General Action-Conditioned {3D} Human Motion Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2228--2238}
}
Hiding Visual Information via Obfuscating Adversarial Perturbations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_ICCV,
  author    = {Su, Zhigang and Zhou, Dawei and Wang, Nannan and Liu, Decheng and Wang, Zhen and Gao, Xinbo},
  title     = {Hiding Visual Information via Obfuscating Adversarial Perturbations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4356--4366}
}
Category-aware Allocation Transformer for Weakly Supervised Object Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhiwei and Ding, Jinren and Cao, Liujuan and Shen, Yunhang and Zhang, Shengchuan and Jiang, Guannan and Ji, Rongrong},
  title     = {Category-aware Allocation Transformer for Weakly Supervised Object Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6643--6652}
}
Domain Specified Optimization for Deployment Authorization-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Haotian and Chi, Haoang and Yang, Wenjing and Lin, Zhipeng and Geng, Mingyang and Lan, Long and Zhang, Jing and Tao, Dacheng},
  title     = {Domain Specified Optimization for Deployment Authorization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5095--5105}
}
Iterative Prompt Learning for Unsupervised Backlit Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Zhexin and Li, Chongyi and Zhou, Shangchen and Feng, Ruicheng and Loy, Chen Change},
  title     = {Iterative Prompt Learning for Unsupervised Backlit Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8094--8103}
}
UMIFormer: Mining the Correlations between Similar Tokens for Multi-View 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zhenwei and Yang, Liying and Li, Ning and Jiang, Chaohao and Liang, Yanyan},
  title     = {{UMIFormer}: Mining the Correlations between Similar Tokens for Multi-View {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18226--18235}
}
Improved Knowledge Transfer for Semi-Supervised Domain Adaptation via Trico Training Strategy-
[pdf]
[supp]
[bibtex]@InProceedings{Ngo_2023_ICCV,
  author    = {Ngo, Ba Hung and Chae, Yeon Jeong and Kwon, Jung Eun and Park, Jae Hyeon and Cho, Sung In},
  title     = {Improved Knowledge Transfer for Semi-Supervised Domain Adaptation via {Trico} Training Strategy},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19214--19223}
}
Locally Stylized Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pang_2023_ICCV,
  author    = {Pang, Hong-Wing and Hua, Binh-Son and Yeung, Sai-Kit},
  title     = {Locally Stylized Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {307--316}
}
InterFormer: Real-time Interactive Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, You and Yang, Hao and Sun, Ke and Zhang, Shengchuan and Cao, Liujuan and Jiang, Guannan and Ji, Rongrong},
  title     = {{InterFormer}: Real-time Interactive Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22301--22311}
}
Confidence-aware Pseudo-label Learning for Weakly Supervised Visual Grounding-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yang and Zhang, Jiahua and Chen, Qingchao and Peng, Yuxin},
  title     = {Confidence-aware Pseudo-label Learning for Weakly Supervised Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2828--2838}
}
Luminance-aware Color Transform for Multiple Exposure Correction-
[pdf]
[supp]
[bibtex]@InProceedings{Baek_2023_ICCV,
  author    = {Baek, Jong-Hyeon and Kim, DaeHyun and Choi, Su-Min and Lee, Hyo-jun and Kim, Hanul and Koh, Yeong Jun},
  title     = {Luminance-aware Color Transform for Multiple Exposure Correction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6156--6165}
}
A Simple Framework for Open-Vocabulary Segmentation and Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Hao and Li, Feng and Zou, Xueyan and Liu, Shilong and Li, Chunyuan and Yang, Jianwei and Zhang, Lei},
  title     = {A Simple Framework for Open-Vocabulary Segmentation and Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1020--1031}
}
Alignment Before Aggregation: Trajectory Memory Retrieval Network for Video Object Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Rui and Wang, Yuan and Mai, Huayu and Zhang, Tianzhu and Wu, Feng},
  title     = {Alignment Before Aggregation: Trajectory Memory Retrieval Network for Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1218--1228}
}
UATVR: Uncertainty-Adaptive Text-Video Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Bo and Wu, Wenhao and Liu, Chang and Zhou, Yu and Song, Yuxin and Wang, Weiping and Shu, Xiangbo and Ji, Xiangyang and Wang, Jingdong},
  title     = {{UATVR}: Uncertainty-Adaptive Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13723--13733}
}
Deep Directly-Trained Spiking Neural Networks for Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_ICCV,
  author    = {Su, Qiaoyi and Chou, Yuhong and Hu, Yifan and Li, Jianing and Mei, Shijie and Zhang, Ziyang and Li, Guoqi},
  title     = {Deep Directly-Trained Spiking Neural Networks for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6555--6565}
}
Online Prototype Learning for Online Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yujie and Ye, Jiaxin and Huang, Zhizhong and Zhang, Junping and Shan, Hongming},
  title     = {Online Prototype Learning for Online Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18764--18774}
}
Robust e-NeRF: NeRF from Sparse & Noisy Events under Non-Uniform Motion-
[pdf]
[supp]
[bibtex]@InProceedings{Low_2023_ICCV,
  author    = {Low, Weng Fei and Lee, Gim Hee},
  title     = {Robust {e-NeRF}: {NeRF} from Sparse \& Noisy Events under Non-Uniform Motion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18335--18346}
}
ActorsNeRF: Animatable Few-shot Human Rendering with Generalizable NeRFs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mu_2023_ICCV,
  author    = {Mu, Jiteng and Sang, Shen and Vasconcelos, Nuno and Wang, Xiaolong},
  title     = {{ActorsNeRF}: Animatable Few-shot Human Rendering with Generalizable {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18391--18401}
}
SALAD: Part-Level Latent Diffusion for 3D Shape Generation and Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Koo_2023_ICCV,
  author    = {Koo, Juil and Yoo, Seungwoo and Nguyen, Minh Hieu and Sung, Minhyuk},
  title     = {{SALAD}: Part-Level Latent Diffusion for {3D} Shape Generation and Manipulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14441--14451}
}
COMPASS: High-Efficiency Deep Image Compression with Arbitrary-scale Spatial Scalability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV,
  author    = {Park, Jongmin and Lee, Jooyoung and Kim, Munchurl},
  title     = {{COMPASS}: High-Efficiency Deep Image Compression with Arbitrary-scale Spatial Scalability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12826--12835}
}
Masked Autoencoders Are Stronger Knowledge Distillers-
[pdf]
[supp]
[bibtex]@InProceedings{Lao_2023_ICCV,
  author    = {Lao, Shanshan and Song, Guanglu and Liu, Boxiao and Liu, Yu and Yang, Yujiu},
  title     = {Masked Autoencoders Are Stronger Knowledge Distillers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6384--6393}
}
Score-Based Diffusion Models as Principled Priors for Inverse Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Berthy T. and Smith, Jamie and Rubinstein, Michael and Chang, Huiwen and Bouman, Katherine L. and Freeman, William T.},
  title     = {Score-Based Diffusion Models as Principled Priors for Inverse Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10520--10531}
}
Multiscale Structure Guided Diffusion for Image Deblurring-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Mengwei and Delbracio, Mauricio and Talebi, Hossein and Gerig, Guido and Milanfar, Peyman},
  title     = {Multiscale Structure Guided Diffusion for Image Deblurring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10721--10733}
}
Multiple Planar Object Tracking-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zhicheng and Liu, Shengzhe and Yang, Jufeng},
  title     = {Multiple Planar Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23460--23470}
}
CheckerPose: Progressive Dense Keypoint Localization for Object Pose Estimation with Graph Neural Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lian_2023_ICCV,
  author    = {Lian, Ruyi and Ling, Haibin},
  title     = {{CheckerPose}: Progressive Dense Keypoint Localization for Object Pose Estimation with Graph Neural Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14022--14033}
}
ASIC: Aligning Sparse in-the-wild Image Collections-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2023_ICCV,
  author    = {Gupta, Kamal and Jampani, Varun and Esteves, Carlos and Shrivastava, Abhinav and Makadia, Ameesh and Snavely, Noah and Kar, Abhishek},
  title     = {{ASIC}: Aligning Sparse in-the-wild Image Collections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4134--4145}
}
Residual Pattern Learning for Pixel-Wise Out-of-Distribution Detection in Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yuyuan and Ding, Choubo and Tian, Yu and Pang, Guansong and Belagiannis, Vasileios and Reid, Ian and Carneiro, Gustavo},
  title     = {Residual Pattern Learning for Pixel-Wise Out-of-Distribution Detection in Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1151--1161}
}
Hierarchical Visual Primitive Experts for Compositional Zero-Shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hanjae and Lee, Jiyoung and Park, Seongheon and Sohn, Kwanghoon},
  title     = {Hierarchical Visual Primitive Experts for Compositional Zero-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5675--5685}
}
Event Camera Data Pre-training-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yan and Pan, Liyuan and Liu, Liu},
  title     = {Event Camera Data Pre-training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10699--10709}
}
Segment Every Reference Object in Spatial and Temporal Spaces-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jiannan and Jiang, Yi and Yan, Bin and Lu, Huchuan and Yuan, Zehuan and Luo, Ping},
  title     = {Segment Every Reference Object in Spatial and Temporal Spaces},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2538--2550}
}
Unified Out-Of-Distribution Detection: A Model-Specific Perspective-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Averly_2023_ICCV,
  author    = {Averly, Reza and Chao, Wei-Lun},
  title     = {Unified Out-Of-Distribution Detection: A Model-Specific Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1453--1463}
}
One-shot Implicit Animatable Avatars with Model-based Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Yangyi and Yi, Hongwei and Liu, Weiyang and Wang, Haofan and Wu, Boxi and Wang, Wenxiao and Lin, Binbin and Zhang, Debing and Cai, Deng},
  title     = {One-shot Implicit Animatable Avatars with Model-based Priors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8974--8985}
}
Unsupervised Feature Representation Learning for Domain-generalized Cross-domain Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Conghui and Zhang, Can and Lee, Gim Hee},
  title     = {Unsupervised Feature Representation Learning for Domain-generalized Cross-domain Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11016--11025}
}
RankMatch: Fostering Confidence and Consistency in Learning with Noisy Labels-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Ziyi and Chen, Weikai and Fang, Chaowei and Li, Zhen and Chen, Lechao and Lin, Liang and Li, Guanbin},
  title     = {{RankMatch}: Fostering Confidence and Consistency in Learning with Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1644--1654}
}
Dec-Adapter: Exploring Efficient Decoder-Side Adapter for Bridging Screen Content and Natural Image Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Sheng and Yue, Huanjing and Yang, Jingyu},
  title     = {{Dec-Adapter}: Exploring Efficient Decoder-Side Adapter for Bridging Screen Content and Natural Image Compression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12887--12896}
}
MixReorg: Cross-Modal Mixed Patch Reorganization is a Good Mask Learner for Open-World Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Kaixin and Ren, Pengzhen and Zhu, Yi and Xu, Hang and Liu, Jianzhuang and Li, Changlin and Wang, Guangrun and Liang, Xiaodan},
  title     = {{MixReorg}: Cross-Modal Mixed Patch Reorganization is a Good Mask Learner for Open-World Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1196--1205}
}
Preface: A Data-driven Volumetric Prior for Few-shot Ultra High-resolution Face Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Buhler_2023_ICCV, author = {B{\"u}hler, Marcel C. and Sarkar, Kripasindhu and Shah, Tanmay and Li, Gengyan and Wang, Daoye and Helminger, Leonhard and Orts-Escolano, Sergio and Lagun, Dmitry and Hilliges, Otmar and Beeler, Thabo and Meka, Abhimitra}, title = {Preface: A Data-driven Volumetric Prior for Few-shot Ultra High-resolution Face Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3402-3413} }
Label-Guided Knowledge Distillation for Continual Semantic Segmentation on 2D Images and 3D Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Ze and Li, Ruibo and Ling, Evan and Zhang, Chi and Wang, Yiming and Huang, Dezhao and Ma, Keng Teck and Hur, Minhoe and Lin, Guosheng}, title = {Label-Guided Knowledge Distillation for Continual Semantic Segmentation on 2D Images and 3D Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18601-18612} }
Under-Display Camera Image Restoration with Scattering Effect-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Binbin and Chen, Xiangyu and Xu, Shuning and Zhou, Jiantao}, title = {Under-Display Camera Image Restoration with Scattering Effect}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12580-12589} }
PRANC: Pseudo RAndom Networks for Compacting Deep Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nooralinejad_2023_ICCV, author = {Nooralinejad, Parsa and Abbasi, Ali and Koohpayegani, Soroush Abbasi and Meibodi, Kossar Pourahmadi and Khan, Rana Muhammad Shahroz and Kolouri, Soheil and Pirsiavash, Hamed}, title = {PRANC: Pseudo RAndom Networks for Compacting Deep Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17021-17031} }
ICICLE: Interpretable Class Incremental Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Rymarczyk_2023_ICCV, author = {Rymarczyk, Dawid and van de Weijer, Joost and Zieli{\'n}ski, Bartosz and Twardowski, Bartlomiej}, title = {ICICLE: Interpretable Class Incremental Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1887-1898} }
Clutter Detection and Removal in 3D Scenes with View-Consistent Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Fangyin and Funkhouser, Thomas and Rusinkiewicz, Szymon}, title = {Clutter Detection and Removal in 3D Scenes with View-Consistent Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18131-18141} }
PointCLIP V2: Prompting CLIP and GPT for Powerful 3D Open-world Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Xiangyang and Zhang, Renrui and He, Bowei and Guo, Ziyu and Zeng, Ziyao and Qin, Zipeng and Zhang, Shanghang and Gao, Peng}, title = {PointCLIP V2: Prompting CLIP and GPT for Powerful 3D Open-world Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2639-2650} }
VideoFlow: Exploiting Temporal Cues for Multi-frame Optical Flow Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Xiaoyu and Huang, Zhaoyang and Bian, Weikang and Li, Dasong and Zhang, Manyuan and Cheung, Ka Chun and See, Simon and Qin, Hongwei and Dai, Jifeng and Li, Hongsheng}, title = {VideoFlow: Exploiting Temporal Cues for Multi-frame Optical Flow Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12469-12480} }
3DMiner: Discovering Shapes from Large-Scale Unannotated Image Datasets-
[pdf]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Ta-Ying and Gadelha, Matheus and Pirk, S{\"o}ren and Groueix, Thibault and M{\v{e}}ch, Radom{\'\i}r and Markham, Andrew and Trigoni, Niki}, title = {3DMiner: Discovering Shapes from Large-Scale Unannotated Image Datasets}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9331-9341} }
Identification of Systematic Errors of Image Classifiers on Rare Subgroups-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Metzen_2023_ICCV, author = {Metzen, Jan Hendrik and Hutmacher, Robin and Hua, N. Grace and Boreiko, Valentyn and Zhang, Dan}, title = {Identification of Systematic Errors of Image Classifiers on Rare Subgroups}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5064-5073} }
Hierarchical Spatio-Temporal Representation Learning for Gait Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Lei and Liu, Bo and Liang, Fangfang and Wang, Bincheng}, title = {Hierarchical Spatio-Temporal Representation Learning for Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19639-19649} }
Order-Prompted Tag Sequence Generation for Video Tagging-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Zongyang and Zhang, Ziqi and Chen, Yuxin and Qi, Zhongang and Luo, Yingmin and Li, Zekun and Yuan, Chunfeng and Li, Bing and Qie, Xiaohu and Shan, Ying and Hu, Weiming}, title = {Order-Prompted Tag Sequence Generation for Video Tagging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15681-15690} }
XVO: Generalized Visual Odometry via Cross-Modal Self-Training-
[pdf]
[bibtex]@InProceedings{Lai_2023_ICCV, author = {Lai, Lei and Shangguan, Zhongkai and Zhang, Jimuyang and Ohn-Bar, Eshed}, title = {XVO: Generalized Visual Odometry via Cross-Modal Self-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10094-10105} }
Weakly Supervised Learning of Semantic Correspondence through Cascaded Online Correspondence Refinement-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Yiwen and Sun, Yixuan and Lai, Chenghang and Xu, Qing and Wang, Xiaomei and Shen, Xuli and Ge, Weifeng}, title = {Weakly Supervised Learning of Semantic Correspondence through Cascaded Online Correspondence Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16254-16263} }
Clusterformer: Cluster-based Transformer for 3D Object Detection in Point Clouds-
[pdf]
[bibtex]@InProceedings{Pei_2023_ICCV, author = {Pei, Yu and Zhao, Xian and Li, Hao and Ma, Jingyuan and Zhang, Jingwei and Pu, Shiliang}, title = {Clusterformer: Cluster-based Transformer for 3D Object Detection in Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6664-6673} }
HMD-NeMo: Online 3D Avatar Motion Generation From Sparse Observations-
[pdf]
[supp]
[bibtex]@InProceedings{Aliakbarian_2023_ICCV, author = {Aliakbarian, Sadegh and Saleh, Fatemeh and Collier, David and Cameron, Pashmina and Cosker, Darren}, title = {HMD-NeMo: Online 3D Avatar Motion Generation From Sparse Observations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9622-9631} }
NaviNeRF: NeRF-based 3D Representation Disentanglement by Latent Semantic Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Baao and Li, Bohan and Zhang, Zequn and Dong, Junting and Jin, Xin and Yang, Jingyu and Zeng, Wenjun}, title = {NaviNeRF: NeRF-based 3D Representation Disentanglement by Latent Semantic Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17992-18002} }
Adaptive Illumination Mapping for Shadow Detection in Raw Images-
[pdf]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Jiayu and Xu, Ke and Pang, Youwei and Zhang, Lihe and Lu, Huchuan and Hancke, Gerhard and Lau, Rynson}, title = {Adaptive Illumination Mapping for Shadow Detection in Raw Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12709-12718} }
CDUL: CLIP-Driven Unsupervised Learning for Multi-Label Image Classification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Abdelfattah_2023_ICCV, author = {Abdelfattah, Rabab and Guo, Qing and Li, Xiaoguang and Wang, Xiaofeng and Wang, Song}, title = {CDUL: CLIP-Driven Unsupervised Learning for Multi-Label Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1348-1357} }
Your Diffusion Model is Secretly a Zero-Shot Classifier-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Alexander C. and Prabhudesai, Mihir and Duggal, Shivam and Brown, Ellis and Pathak, Deepak}, title = {Your Diffusion Model is Secretly a Zero-Shot Classifier}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2206-2217} }
Backpropagation Path Search On Adversarial Transferability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Zhuoer and Gu, Zhangxuan and Zhang, Jianping and Cui, Shiwen and Meng, Changhua and Wang, Weiqiang}, title = {Backpropagation Path Search On Adversarial Transferability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4663-4673} }
Boosting Adversarial Transferability via Gradient Relevance Attack-
[pdf]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Hegui and Ren, Yuchen and Sui, Xiaoyan and Yang, Lianping and Jiang, Wuming}, title = {Boosting Adversarial Transferability via Gradient Relevance Attack}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4741-4750} }
Image-Free Classifier Injection for Zero-Shot Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Christensen_2023_ICCV, author = {Christensen, Anders and Mancini, Massimiliano and Koepke, A. Sophia and Winther, Ole and Akata, Zeynep}, title = {Image-Free Classifier Injection for Zero-Shot Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19072-19081} }
CLIPN for Zero-Shot OOD Detection: Teaching CLIP to Say No-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Hualiang and Li, Yi and Yao, Huifeng and Li, Xiaomeng}, title = {CLIPN for Zero-Shot OOD Detection: Teaching CLIP to Say No}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1802-1812} }
CO-Net: Learning Multiple Point Cloud Tasks at Once with A Cohesive Network-
[pdf]
[supp]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Tao and Wang, Ke and Lu, Siyi and Zhang, Yukun and Dai, Kun and Li, Xiaoyu and Xu, Jie and Wang, Li and Zhao, Lijun and Zhang, Xinyu and Li, Ruifeng}, title = {CO-Net: Learning Multiple Point Cloud Tasks at Once with A Cohesive Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3523-3533} }
Quality Diversity for Visual Pre-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Chavhan_2023_ICCV, author = {Chavhan, Ruchika and Gouk, Henry and Li, Da and Hospedales, Timothy}, title = {Quality Diversity for Visual Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5384-5394} }
UniDexGrasp++: Improving Dexterous Grasping Policy Learning via Geometry-Aware Curriculum and Iterative Generalist-Specialist Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Wan_2023_ICCV, author = {Wan, Weikang and Geng, Haoran and Liu, Yun and Shan, Zikang and Yang, Yaodong and Yi, Li and Wang, He}, title = {UniDexGrasp++: Improving Dexterous Grasping Policy Learning via Geometry-Aware Curriculum and Iterative Generalist-Specialist Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3891-3902} }
Multi-Scale Residual Low-Pass Filter Network for Image Deblurring-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Jiangxin and Pan, Jinshan and Yang, Zhongbao and Tang, Jinhui}, title = {Multi-Scale Residual Low-Pass Filter Network for Image Deblurring}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12345-12354} }
FerKD: Surgical Label Adaptation for Efficient Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Shen_2023_ICCV, author = {Shen, Zhiqiang}, title = {FerKD: Surgical Label Adaptation for Efficient Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1666-1675} }
Neural Fields for Structured Lighting-
[pdf]
[supp]
[bibtex]@InProceedings{Shandilya_2023_ICCV, author = {Shandilya, Aarrushi and Attal, Benjamin and Richardt, Christian and Tompkin, James and O'Toole, Matthew}, title = {Neural Fields for Structured Lighting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3512-3522} }
ClothPose: A Real-world Benchmark for Visual Analysis of Garment Pose via An Indirect Recording Solution-
[pdf]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Wenqiang and Du, Wenxin and Xue, Han and Li, Yutong and Ye, Ruolin and Wang, Yan-Feng and Lu, Cewu}, title = {ClothPose: A Real-world Benchmark for Visual Analysis of Garment Pose via An Indirect Recording Solution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {58-68} }
Semantically Structured Image Compression via Irregular Group-Based Decoupling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Ruoyu and Gao, Yixin and Jin, Xin and Feng, Runsen and Chen, Zhibo}, title = {Semantically Structured Image Compression via Irregular Group-Based Decoupling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17237-17247} }
PhaseMP: Robust 3D Pose Estimation via Phase-conditioned Human Motion Prior-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Mingyi and Starke, Sebastian and Ye, Yuting and Komura, Taku and Won, Jungdam}, title = {PhaseMP: Robust 3D Pose Estimation via Phase-conditioned Human Motion Prior}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14725-14737} }
NLOS-NeuS: Non-line-of-sight Neural Implicit Surface-
[pdf]
[supp]
[bibtex]@InProceedings{Fujimura_2023_ICCV, author = {Fujimura, Yuki and Kushida, Takahiro and Funatomi, Takuya and Mukaigawa, Yasuhiro}, title = {NLOS-NeuS: Non-line-of-sight Neural Implicit Surface}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10532-10541} }
Unsupervised Object Localization with Representer Point Selection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Yeonghwan and Jang, Seokwoo and Katabi, Dina and Son, Jeany}, title = {Unsupervised Object Localization with Representer Point Selection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6534-6544} }
SEMPART: Self-supervised Multi-resolution Partitioning of Image Semantics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ravindran_2023_ICCV, author = {Ravindran, Sriram and Basu, Debraj}, title = {SEMPART: Self-supervised Multi-resolution Partitioning of Image Semantics}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {723-733} }
Flatness-Aware Minimization for Domain Generalization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Xingxuan and Xu, Renzhe and Yu, Han and Dong, Yancheng and Tian, Pengfei and Cui, Peng}, title = {Flatness-Aware Minimization for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5189-5202} }
ProtoFL: Unsupervised Federated Learning via Prototypical Distillation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Hansol and Kwak, Youngjun and Jung, Minyoung and Shin, Jinho and Kim, Youngsung and Kim, Changick}, title = {ProtoFL: Unsupervised Federated Learning via Prototypical Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6470-6479} }
Augmenting and Aligning Snippets for Few-Shot Video Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yuecong and Yang, Jianfei and Zhou, Yunjiao and Chen, Zhenghua and Wu, Min and Li, Xiaoli}, title = {Augmenting and Aligning Snippets for Few-Shot Video Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13445-13456} }
Self-Organizing Pathway Expansion for Non-Exemplar Class-Incremental Learning-
[pdf]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Kai and Zheng, Kecheng and Feng, Ruili and Zhao, Deli and Cao, Yang and Zha, Zheng-Jun}, title = {Self-Organizing Pathway Expansion for Non-Exemplar Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19204-19213} }
Preserving Tumor Volumes for Unsupervised Medical Image Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Qihua and Du, Hao and Song, Ying and Xu, Yan and Liao, Jing}, title = {Preserving Tumor Volumes for Unsupervised Medical Image Registration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21208-21218} }
Multi-label Affordance Mapping from Egocentric Vision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mur-Labadia_2023_ICCV, author = {Mur-Labadia, Lorenzo and Guerrero, Jose J. and Martinez-Cantin, Ruben}, title = {Multi-label Affordance Mapping from Egocentric Vision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5238-5249} }
Towards Real-World Burst Image Super-Resolution: Benchmark and Method-
[pdf]
[supp]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Pengxu and Sun, Yujing and Guo, Xingbei and Liu, Chang and Li, Guanbin and Chen, Jie and Ji, Xiangyang and Lin, Liang}, title = {Towards Real-World Burst Image Super-Resolution: Benchmark and Method}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13233-13242} }
Unified Adversarial Patch for Cross-Modal Attacks in the Physical World-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Xingxing and Huang, Yao and Sun, Yitong and Yu, Jie}, title = {Unified Adversarial Patch for Cross-Modal Attacks in the Physical World}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4445-4454} }
Unsupervised Accuracy Estimation of Deep Visual Models using Domain-Adaptive Adversarial Perturbation without Source Samples-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, JoonHo and Woo, Jae Oh and Moon, Hankyu and Lee, Kwonho}, title = {Unsupervised Accuracy Estimation of Deep Visual Models using Domain-Adaptive Adversarial Perturbation without Source Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16443-16452} }
Misalign, Contrast then Distill: Rethinking Misalignments in Language-Image Pre-training-
[pdf]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Bumsoo and Jo, Yeonsik and Kim, Jinhyung and Kim, Seunghwan}, title = {Misalign, Contrast then Distill: Rethinking Misalignments in Language-Image Pre-training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2563-2572} }
SYENet: A Simple Yet Effective Network for Multiple Low-Level Vision Tasks with Real-Time Performance on Mobile Device-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gou_2023_ICCV, author = {Gou, Weiran and Yi, Ziyao and Xiang, Yan and Li, Shaoqing and Liu, Zibin and Kong, Dehui and Xu, Ke}, title = {SYENet: A Simple Yet Effective Network for Multiple Low-Level Vision Tasks with Real-Time Performance on Mobile Device}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12182-12195} }
MATE: Masked Autoencoders are Online 3D Test-Time Learners-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mirza_2023_ICCV, author = {Mirza, M. Jehanzeb and Shin, Inkyu and Lin, Wei and Schriebl, Andreas and Sun, Kunyang and Choe, Jaesung and Kozinski, Mateusz and Possegger, Horst and Kweon, In So and Yoon, Kuk-Jin and Bischof, Horst}, title = {MATE: Masked Autoencoders are Online 3D Test-Time Learners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16709-16718} }
EdaDet: Open-Vocabulary Object Detection Using Early Dense Alignment-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Cheng and Yang, Sibei}, title = {EdaDet: Open-Vocabulary Object Detection Using Early Dense Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15724-15734} }
MixPath: A Unified Approach for One-shot Neural Architecture Search-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chu_2023_ICCV, author = {Chu, Xiangxiang and Lu, Shun and Li, Xudong and Zhang, Bo}, title = {MixPath: A Unified Approach for One-shot Neural Architecture Search}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5972-5981} }
Enhancing NeRF akin to Enhancing LLMs: Generalizable NeRF Transformer with Mixture-of-View-Experts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cong_2023_ICCV, author = {Cong, Wenyan and Liang, Hanxue and Wang, Peihao and Fan, Zhiwen and Chen, Tianlong and Varma, Mukund and Wang, Yi and Wang, Zhangyang}, title = {Enhancing NeRF akin to Enhancing LLMs: Generalizable NeRF Transformer with Mixture-of-View-Experts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3193-3204} }
Task-aware Adaptive Learning for Cross-domain Few-shot Learning-
[pdf]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Yurong and Du, Ruoyi and Dong, Yuan and Hospedales, Timothy and Song, Yi-Zhe and Ma, Zhanyu}, title = {Task-aware Adaptive Learning for Cross-domain Few-shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1590-1599} }
Two Birds, One Stone: A Unified Framework for Joint Learning of Image and Video Style Transfers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2023_ICCV, author = {Gu, Bohai and Fan, Heng and Zhang, Libo}, title = {Two Birds, One Stone: A Unified Framework for Joint Learning of Image and Video Style Transfers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23545-23554} }
Revisiting Domain-Adaptive 3D Object Detection by Reliable, Diverse and Class-balanced Pseudo-Labeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zhuoxiao and Luo, Yadan and Wang, Zheng and Baktashmotlagh, Mahsa and Huang, Zi}, title = {Revisiting Domain-Adaptive 3D Object Detection by Reliable, Diverse and Class-balanced Pseudo-Labeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3714-3726} }
Task-Oriented Multi-Modal Mutual Leaning for Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Long_2023_ICCV, author = {Long, Sifan and Zhao, Zhen and Yuan, Junkun and Tan, Zichang and Liu, Jiangjiang and Zhou, Luping and Wang, Shengsheng and Wang, Jingdong}, title = {Task-Oriented Multi-Modal Mutual Leaning for Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21959-21969} }
Efficient Adaptive Human-Object Interaction Detection with Concept-guided Memory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lei_2023_ICCV, author = {Lei, Ting and Caba, Fabian and Chen, Qingchao and Jin, Hailin and Peng, Yuxin and Liu, Yang}, title = {Efficient Adaptive Human-Object Interaction Detection with Concept-guided Memory}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6480-6490} }
NeMF: Inverse Volume Rendering with Neural Microflake Field-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Youjia and Xu, Teng and Yu, Junqing and Ye, Yuteng and Jing, Yanqing and Wang, Junle and Yu, Jingyi and Yang, Wei}, title = {NeMF: Inverse Volume Rendering with Neural Microflake Field}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22919-22929} }
Attentive Mask CLIP-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yifan and Huang, Weiquan and Wei, Yixuan and Peng, Houwen and Jiang, Xinyang and Jiang, Huiqiang and Wei, Fangyun and Wang, Yin and Hu, Han and Qiu, Lili and Yang, Yuqing}, title = {Attentive Mask CLIP}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2771-2781} }
DOLCE: A Model-Based Probabilistic Diffusion Framework for Limited-Angle CT Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jiaming and Anirudh, Rushil and Thiagarajan, Jayaraman J. and He, Stewart and Mohan, K. Aditya and Kamilov, Ulugbek S. and Kim, Hyojin}, title = {DOLCE: A Model-Based Probabilistic Diffusion Framework for Limited-Angle CT Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10498-10508} }
Beyond Image Borders: Learning Feature Extrapolation for Unbounded Image Composition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xiaoyu and Liu, Ming and Li, Junyi and Liu, Shuai and Wang, Xiaotao and Lei, Lei and Zuo, Wangmeng}, title = {Beyond Image Borders: Learning Feature Extrapolation for Unbounded Image Composition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13023-13032} }
MasaCtrl: Tuning-Free Mutual Self-Attention Control for Consistent Image Synthesis and Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Mingdeng and Wang, Xintao and Qi, Zhongang and Shan, Ying and Qie, Xiaohu and Zheng, Yinqiang}, title = {MasaCtrl: Tuning-Free Mutual Self-Attention Control for Consistent Image Synthesis and Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22560-22570} }
Understanding Hessian Alignment for Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hemati_2023_ICCV, author = {Hemati, Sobhan and Zhang, Guojun and Estiri, Amir and Chen, Xi}, title = {Understanding Hessian Alignment for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19004-19014} }
DeepChange: A Long-Term Person Re-Identification Benchmark with Clothes Change-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Peng and Zhu, Xiatian}, title = {DeepChange: A Long-Term Person Re-Identification Benchmark with Clothes Change}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11196-11205} }
Preserve Your Own Correlation: A Noise Prior for Video Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Songwei and Nah, Seungjun and Liu, Guilin and Poon, Tyler and Tao, Andrew and Catanzaro, Bryan and Jacobs, David and Huang, Jia-Bin and Liu, Ming-Yu and Balaji, Yogesh}, title = {Preserve Your Own Correlation: A Noise Prior for Video Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22930-22941} }
Discrepant and Multi-Instance Proxies for Unsupervised Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Zou_2023_ICCV, author = {Zou, Chang and Chen, Zeqi and Cui, Zhichao and Liu, Yuehu and Zhang, Chi}, title = {Discrepant and Multi-Instance Proxies for Unsupervised Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11058-11068} }
Joint-Relation Transformer for Multi-Person Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Qingyao and Mao, Weibo and Gong, Jingze and Xu, Chenxin and Chen, Siheng and Xie, Weidi and Zhang, Ya and Wang, Yanfeng}, title = {Joint-Relation Transformer for Multi-Person Motion Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9816-9826} }
Revisiting Vision Transformer from the View of Path Ensemble-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chang_2023_ICCV, author = {Chang, Shuning and Wang, Pichao and Luo, Hao and Wang, Fan and Shou, Mike Zheng}, title = {Revisiting Vision Transformer from the View of Path Ensemble}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19889-19899} }
Tetra-NeRF: Representing Neural Radiance Fields Using Tetrahedra-
[pdf]
[supp]
[bibtex]@InProceedings{Kulhanek_2023_ICCV, author = {Kulhanek, Jonas and Sattler, Torsten}, title = {Tetra-NeRF: Representing Neural Radiance Fields Using Tetrahedra}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18458-18469} }
TMA: Temporal Motion Aggregation for Event-based Optical Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Haotian and Chen, Guang and Qu, Sanqing and Zhang, Yanping and Li, Zhijun and Knoll, Alois and Jiang, Changjun}, title = {TMA: Temporal Motion Aggregation for Event-based Optical Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9685-9694} }
Ablating Concepts in Text-to-Image Diffusion Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kumari_2023_ICCV, author = {Kumari, Nupur and Zhang, Bingliang and Wang, Sheng-Yu and Shechtman, Eli and Zhang, Richard and Zhu, Jun-Yan}, title = {Ablating Concepts in Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22691-22702} }
Motion-Guided Masking for Spatiotemporal Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, David and Wang, Jue and Liao, Shuai and Zhu, Yi and Bhat, Vimal and Santos-Villalobos, Hector and MV, Rohith and Li, Xinyu}, title = {Motion-Guided Masking for Spatiotemporal Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5619-5629} }
MapFormer: Boosting Change Detection by Using Pre-change Information-
[pdf]
[supp]
[bibtex]@InProceedings{Bernhard_2023_ICCV, author = {Bernhard, Maximilian and Strau{\ss}, Niklas and Schubert, Matthias}, title = {MapFormer: Boosting Change Detection by Using Pre-change Information}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16837-16846} }
Masked Diffusion Transformer is a Strong Image Synthesizer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Shanghua and Zhou, Pan and Cheng, Ming-Ming and Yan, Shuicheng}, title = {Masked Diffusion Transformer is a Strong Image Synthesizer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23164-23173} }
LightDepth: Single-View Depth Self-Supervision from Illumination Decline-
[pdf]
[supp]
[bibtex]@InProceedings{Rodriguez-Puigvert_2023_ICCV, author = {Rodr{\'\i}guez-Puigvert, Javier and Batlle, V{\'\i}ctor M. and Montiel, J.M.M. and Martinez-Cantin, Ruben and Fua, Pascal and Tard\'os, Juan D. and Civera, Javier}, title = {LightDepth: Single-View Depth Self-Supervision from Illumination Decline}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21273-21283} }
Urban Radiance Field Representation with Deformable Neural Mesh Primitives-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Fan and Xu, Yan and Chen, Guang and Li, Hongsheng and Lin, Kwan-Yee and Jiang, Changjun}, title = {Urban Radiance Field Representation with Deformable Neural Mesh Primitives}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {465-476} }
Adaptive Frequency Filters As Efficient Global Token Mixers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zhipeng and Zhang, Zhizheng and Lan, Cuiling and Zha, Zheng-Jun and Lu, Yan and Guo, Baining}, title = {Adaptive Frequency Filters As Efficient Global Token Mixers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6049-6059} }
Referring Image Segmentation Using Text Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Fang and Liu, Yuhao and Kong, Yuqiu and Xu, Ke and Zhang, Lihe and Yin, Baocai and Hancke, Gerhard and Lau, Rynson}, title = {Referring Image Segmentation Using Text Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22124-22134} }
Zolly: Zoom Focal Length Correctly for Perspective-Distorted Human Mesh Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Wenjia and Ge, Yongtao and Mei, Haiyi and Cai, Zhongang and Sun, Qingping and Wang, Yanjun and Shen, Chunhua and Yang, Lei and Komura, Taku}, title = {Zolly: Zoom Focal Length Correctly for Perspective-Distorted Human Mesh Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3925-3935} }
Once Detected, Never Lost: Surpassing Human Performance in Offline LiDAR based 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Lue and Yang, Yuxue and Mao, Yiming and Wang, Feng and Chen, Yuntao and Wang, Naiyan and Zhang, Zhaoxiang}, title = {Once Detected, Never Lost: Surpassing Human Performance in Offline LiDAR based 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19820-19829} }
Building a Winning Team: Selecting Source Model Ensembles using a Submodular Transferability Estimation Approach-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{B_2023_ICCV, author = {B, Vimal K and Bachu, Saketh and Garg, Tanmay and Narasimhan, Niveditha Lakshmi and Konuru, Raghavan and Balasubramanian, Vineeth N}, title = {Building a Winning Team: Selecting Source Model Ensembles using a Submodular Transferability Estimation Approach}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11609-11620} }
Eventful Transformers: Leveraging Temporal Redundancy in Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dutson_2023_ICCV, author = {Dutson, Matthew and Li, Yin and Gupta, Mohit}, title = {Eventful Transformers: Leveraging Temporal Redundancy in Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16911-16923} }
Plausible Uncertainties for Human Pose Regression-
[pdf]
[supp]
[bibtex]@InProceedings{Bramlage_2023_ICCV, author = {Bramlage, Lennart and Karg, Michelle and Curio, Crist\'obal}, title = {Plausible Uncertainties for Human Pose Regression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15133-15142} }
Beyond One-to-One: Rethinking the Referring Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Yutao and Wang, Qixiong and Shao, Wenqi and Xie, Enze and Li, Zhenguo and Han, Jungong and Luo, Ping}, title = {Beyond One-to-One: Rethinking the Referring Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4067-4077} }
Robust Referring Video Object Segmentation with Cyclic Structural Consensus-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiang and Wang, Jinglu and Xu, Xiaohao and Li, Xiao and Raj, Bhiksha and Lu, Yan}, title = {Robust Referring Video Object Segmentation with Cyclic Structural Consensus}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22236-22245} }
DiffIR: Efficient Diffusion Model for Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Bin and Zhang, Yulun and Wang, Shiyin and Wang, Yitong and Wu, Xinglong and Tian, Yapeng and Yang, Wenming and Van Gool, Luc}, title = {DiffIR: Efficient Diffusion Model for Image Restoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13095-13105} }
MoreauGrad: Sparse and Robust Interpretation of Neural Networks via Moreau Envelope-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jingwei and Farnia, Farzan}, title = {MoreauGrad: Sparse and Robust Interpretation of Neural Networks via Moreau Envelope}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2021-2030} }
Building Bridge Across the Time: Disruption and Restoration of Murals In the Wild-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Huiyang and Xu, Qianqian and Wen, Peisong and Gao, Peifeng and Yang, Zhiyong and Huang, Qingming}, title = {Building Bridge Across the Time: Disruption and Restoration of Murals In the Wild}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20259-20269} }
Class-Incremental Grouping Network for Continual Audio-Visual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mo_2023_ICCV, author = {Mo, Shentong and Pian, Weiguo and Tian, Yapeng}, title = {Class-Incremental Grouping Network for Continual Audio-Visual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7788-7798} }
Neural Haircut: Prior-Guided Strand-Based Hair Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sklyarova_2023_ICCV, author = {Sklyarova, Vanessa and Chelishev, Jenya and Dogaru, Andreea and Medvedev, Igor and Lempitsky, Victor and Zakharov, Egor}, title = {Neural Haircut: Prior-Guided Strand-Based Hair Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19762-19773} }
Improving Sample Quality of Diffusion Models Using Self-Attention Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Susung and Lee, Gyuseong and Jang, Wooseok and Kim, Seungryong}, title = {Improving Sample Quality of Diffusion Models Using Self-Attention Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7462-7471} }
Evaluating Data Attribution for Text-to-Image Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Sheng-Yu and Efros, Alexei A. and Zhu, Jun-Yan and Zhang, Richard}, title = {Evaluating Data Attribution for Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7192-7203} }
Delta Denoising Score-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hertz_2023_ICCV, author = {Hertz, Amir and Aberman, Kfir and Cohen-Or, Daniel}, title = {Delta Denoising Score}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2328-2337} }
Hierarchical Prior Mining for Non-local Multi-View Stereo-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV, author = {Ren, Chunlin and Xu, Qingshan and Zhang, Shikun and Yang, Jiaqi}, title = {Hierarchical Prior Mining for Non-local Multi-View Stereo}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3611-3620} }
Generative Multiplane Neural Radiance for 3D-Aware Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kumar_2023_ICCV, author = {Kumar, Amandeep and Bhunia, Ankan Kumar and Narayan, Sanath and Cholakkal, Hisham and Anwer, Rao Muhammad and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz}, title = {Generative Multiplane Neural Radiance for 3D-Aware Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7388-7398} }
DG-Recon: Depth-Guided Neural 3D Scene Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Ju_2023_ICCV, author = {Ju, Jihong and Tseng, Ching Wei and Bailo, Oleksandr and Dikov, Georgi and Ghafoorian, Mohsen}, title = {DG-Recon: Depth-Guided Neural 3D Scene Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18184-18194} }
Simple Baselines for Interactive Video Retrieval with Questions and Answers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Kaiqu and Albanie, Samuel}, title = {Simple Baselines for Interactive Video Retrieval with Questions and Answers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11091-11101} }
The Stable Signature: Rooting Watermarks in Latent Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Fernandez_2023_ICCV, author = {Fernandez, Pierre and Couairon, Guillaume and J\'egou, Herv\'e and Douze, Matthijs and Furon, Teddy}, title = {The Stable Signature: Rooting Watermarks in Latent Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22466-22477} }
Boosting Semantic Segmentation from the Perspective of Explicit Class Embeddings-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yuhe and Liu, Chuanjian and Han, Kai and Tang, Quan and Qin, Zengchang}, title = {Boosting Semantic Segmentation from the Perspective of Explicit Class Embeddings}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {821-831} }
Going Denser with Open-Vocabulary Part Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Peize and Chen, Shoufa and Zhu, Chenchen and Xiao, Fanyi and Luo, Ping and Xie, Saining and Yan, Zhicheng}, title = {Going Denser with Open-Vocabulary Part Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15453-15465} }
Learning to Identify Critical States for Reinforcement Learning from Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Haozhe and Zhuge, Mingchen and Li, Bing and Wang, Yuhui and Faccio, Francesco and Ghanem, Bernard and Schmidhuber, J\"urgen}, title = {Learning to Identify Critical States for Reinforcement Learning from Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1955-1965} }
Editing Implicit Assumptions in Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Orgad_2023_ICCV, author = {Orgad, Hadas and Kawar, Bahjat and Belinkov, Yonatan}, title = {Editing Implicit Assumptions in Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7053-7061} }
OCHID-Fi: Occlusion-Robust Hand Pose Estimation in 3D via RF-Vision-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Shujie and Zheng, Tianyue and Chen, Zhe and Hu, Jingzhi and Khamis, Abdelwahed and Liu, Jiajun and Luo, Jun}, title = {OCHID-Fi: Occlusion-Robust Hand Pose Estimation in 3D via RF-Vision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15112-15121} }
Conceptual and Hierarchical Latent Space Decomposition for Face Editing-
[pdf]
[supp]
[bibtex]@InProceedings{Ozkan_2023_ICCV, author = {Ozkan, Savas and Ozay, Mete and Robinson, Tom}, title = {Conceptual and Hierarchical Latent Space Decomposition for Face Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7248-7257} }
VL-Match: Enhancing Vision-Language Pretraining with Token-Level and Instance-Level Matching-
[pdf]
[bibtex]@InProceedings{Bi_2023_ICCV, author = {Bi, Junyu and Cheng, Daixuan and Yao, Ping and Pang, Bochen and Zhan, Yuefeng and Yang, Chuanguang and Wang, Yujing and Sun, Hao and Deng, Weiwei and Zhang, Qi}, title = {VL-Match: Enhancing Vision-Language Pretraining with Token-Level and Instance-Level Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2584-2593} }
Reconstructing Interacting Hands with Interaction Prior from Monocular Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zuo_2023_ICCV, author = {Zuo, Binghui and Zhao, Zimeng and Sun, Wenqian and Xie, Wei and Xue, Zhou and Wang, Yangang}, title = {Reconstructing Interacting Hands with Interaction Prior from Monocular Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9054-9064} }
Towards Realistic Evaluation of Industrial Continual Learning Scenarios with an Emphasis on Energy Consumption and Computational Footprint-
[pdf]
[supp]
[bibtex]@InProceedings{Chavan_2023_ICCV, author = {Chavan, Vivek and Koch, Paul and Schl\"uter, Marian and Briese, Clemens}, title = {Towards Realistic Evaluation of Industrial Continual Learning Scenarios with an Emphasis on Energy Consumption and Computational Footprint}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11506-11518} }
Translating Images to Road Network: A Non-Autoregressive Sequence-to-Sequence Approach-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Jiachen and Peng, Renyuan and Cai, Xinyue and Xu, Hang and Li, Hongyang and Wen, Feng and Zhang, Wei and Zhang, Li}, title = {Translating Images to Road Network: A Non-Autoregressive Sequence-to-Sequence Approach}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23-33} }
How Much Temporal Long-Term Context is Needed for Action Segmentation?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bahrami_2023_ICCV, author = {Bahrami, Emad and Francesca, Gianpiero and Gall, Juergen}, title = {How Much Temporal Long-Term Context is Needed for Action Segmentation?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10351-10361} }
3D VR Sketch Guided 3D Shape Prototyping and Exploration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Ling and Chowdhury, Pinaki Nath and Xiang, Tao and Song, Yi-Zhe and Gryaditskaya, Yulia}, title = {3D VR Sketch Guided 3D Shape Prototyping and Exploration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9267-9276} }
Seal-3D: Interactive Pixel-Level Editing for Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xiangyu and Zhu, Jingsen and Ye, Qi and Huo, Yuchi and Ran, Yunlong and Zhong, Zhihua and Chen, Jiming}, title = {Seal-3D: Interactive Pixel-Level Editing for Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17683-17693} }
Generative Novel View Synthesis with 3D-Aware Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chan_2023_ICCV, author = {Chan, Eric R. and Nagano, Koki and Chan, Matthew A. and Bergman, Alexander W. and Park, Jeong Joon and Levy, Axel and Aittala, Miika and De Mello, Shalini and Karras, Tero and Wetzstein, Gordon}, title = {Generative Novel View Synthesis with 3D-Aware Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4217-4229} }
MDCS: More Diverse Experts with Consistency Self-distillation for Long-tailed Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Qihao and Jiang, Chen and Hu, Wei and Zhang, Fan and Liu, Jun}, title = {MDCS: More Diverse Experts with Consistency Self-distillation for Long-tailed Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11597-11608} }
Similarity Min-Max: Zero-Shot Day-Night Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Rundong and Wang, Wenjing and Yang, Wenhan and Liu, Jiaying}, title = {Similarity Min-Max: Zero-Shot Day-Night Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8104-8114} }
Dark Side Augmentation: Generating Diverse Night Examples for Metric Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Mohwald_2023_ICCV, author = {Mohwald, Albert and Jenicek, Tomas and Chum, Ond\v{r}ej}, title = {Dark Side Augmentation: Generating Diverse Night Examples for Metric Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11153-11163} }
NeRF-MS: Neural Radiance Fields with Multi-Sequence-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Peihao and Wang, Shaohui and Yang, Chen and Liu, Bingbing and Qiu, Weichao and Wang, Haoqian}, title = {NeRF-MS: Neural Radiance Fields with Multi-Sequence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18591-18600} }
LVOS: A Benchmark for Long-term Video Object Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Lingyi and Chen, Wenchao and Liu, Zhongying and Zhang, Wei and Guo, Pinxue and Chen, Zhaoyu and Zhang, Wenqiang}, title = {LVOS: A Benchmark for Long-term Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13480-13492} }
Diffusion Model as Representation Learner-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xingyi and Wang, Xinchao}, title = {Diffusion Model as Representation Learner}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18938-18949} }
Nerfbusters: Removing Ghostly Artifacts from Casually Captured NeRFs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Warburg_2023_ICCV, author = {Warburg, Frederik and Weber, Ethan and Tancik, Matthew and Holynski, Aleksander and Kanazawa, Angjoo}, title = {Nerfbusters: Removing Ghostly Artifacts from Casually Captured NeRFs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18120-18130} }
Document Understanding Dataset and Evaluation (DUDE)-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Van_Landeghem_2023_ICCV, author = {Van Landeghem, Jordy and Tito, Rub\`en and Borchmann, {\L}ukasz and Pietruszka, Micha{\l} and Joziak, Pawel and Powalski, Rafal and Jurkiewicz, Dawid and Coustaty, Mickael and Anckaert, Bertrand and Valveny, Ernest and Blaschko, Matthew and Moens, Sien and Stanislawek, Tomasz}, title = {Document Understanding Dataset and Evaluation (DUDE)}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19528-19540} }
ALWOD: Active Learning for Weakly-Supervised Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yuting and Ilic, Velibor and Li, Jiatong and Kisa\v{c}anin, Branislav and Pavlovic, Vladimir}, title = {ALWOD: Active Learning for Weakly-Supervised Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6459-6469} }
Prototypical Kernel Learning and Open-set Foreground Perception for Generalized Few-shot Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Kai and Wang, Feigege and Xi, Ye and Gao, Yutao}, title = {Prototypical Kernel Learning and Open-set Foreground Perception for Generalized Few-shot Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19256-19265} }
Simple and Effective Out-of-Distribution Detection via Cosine-based Softmax Loss-
[pdf]
[supp]
[bibtex]@InProceedings{Noh_2023_ICCV, author = {Noh, SoonCheol and Jeong, DongEon and Lee, Jee-Hyong}, title = {Simple and Effective Out-of-Distribution Detection via Cosine-based Softmax Loss}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16560-16569} }
CFCG: Semi-Supervised Semantic Segmentation via Cross-Fusion and Contour Guidance Supervision-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Shuo and He, Yue and Zhang, Weiming and Zhang, Wei and Tan, Xiao and Han, Junyu and Ding, Errui and Wang, Jingdong}, title = {CFCG: Semi-Supervised Semantic Segmentation via Cross-Fusion and Contour Guidance Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16348-16358} }
CHAMPAGNE: Learning Real-world Conversation from Large-Scale Web Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Seungju and Hessel, Jack and Dziri, Nouha and Choi, Yejin and Yu, Youngjae}, title = {CHAMPAGNE: Learning Real-world Conversation from Large-Scale Web Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15498-15509} }
SLAN: Self-Locator Aided Network for Vision-Language Understanding-
[pdf]
[bibtex]@InProceedings{Zhai_2023_ICCV, author = {Zhai, Jiang-Tian and Zhang, Qi and Wu, Tong and Chen, Xing-Yu and Liu, Jiang-Jiang and Cheng, Ming-Ming}, title = {SLAN: Self-Locator Aided Network for Vision-Language Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21949-21958} }
S-VolSDF: Sparse Multi-View Stereo Regularization of Neural Implicit Surfaces-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Haoyu and Graikos, Alexandros and Samaras, Dimitris}, title = {S-VolSDF: Sparse Multi-View Stereo Regularization of Neural Implicit Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3556-3568} }
Anomaly Detection using Score-based Perturbation Resilience-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2023_ICCV, author = {Shin, Woosang and Lee, Jonghyeon and Lee, Taehan and Lee, Sangmoon and Yun, Jong Pil}, title = {Anomaly Detection using Score-based Perturbation Resilience}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23372-23382} }
Generating Visual Scenes from Touch-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Fengyu and Zhang, Jiacheng and Owens, Andrew}, title = {Generating Visual Scenes from Touch}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22070-22080} }
DeformToon3D: Deformable Neural Radiance Fields for 3D Toonification-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Junzhe and Lan, Yushi and Yang, Shuai and Hong, Fangzhou and Wang, Quan and Yeo, Chai Kiat and Liu, Ziwei and Loy, Chen Change}, title = {DeformToon3D: Deformable Neural Radiance Fields for 3D Toonification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9144-9154} }
SatlasPretrain: A Large-Scale Dataset for Remote Sensing Image Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bastani_2023_ICCV, author = {Bastani, Favyen and Wolters, Piper and Gupta, Ritwik and Ferdinando, Joe and Kembhavi, Aniruddha}, title = {SatlasPretrain: A Large-Scale Dataset for Remote Sensing Image Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16772-16782} }
Empowering Low-Light Image Enhancer through Customized Learnable Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Naishan and Zhou, Man and Dong, Yanmeng and Rui, Xiangyu and Huang, Jie and Li, Chongyi and Zhao, Feng}, title = {Empowering Low-Light Image Enhancer through Customized Learnable Priors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12559-12569} }
TextManiA: Enriching Visual Feature by Text-driven Manifold Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye-Bin_2023_ICCV, author = {Ye-Bin, Moon and Kim, Jisoo and Kim, Hongyeob and Son, Kilho and Oh, Tae-Hyun}, title = {TextManiA: Enriching Visual Feature by Text-driven Manifold Augmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2526-2537} }
Guiding Image Captioning Models Toward More Specific Captions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kornblith_2023_ICCV, author = {Kornblith, Simon and Li, Lala and Wang, Zirui and Nguyen, Thao}, title = {Guiding Image Captioning Models Toward More Specific Captions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15259-15269} }
Breaking Common Sense: WHOOPS! A Vision-and-Language Benchmark of Synthetic and Compositional Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bitton-Guetta_2023_ICCV, author = {Bitton-Guetta, Nitzan and Bitton, Yonatan and Hessel, Jack and Schmidt, Ludwig and Elovici, Yuval and Stanovsky, Gabriel and Schwartz, Roy}, title = {Breaking Common Sense: WHOOPS! A Vision-and-Language Benchmark of Synthetic and Compositional Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2616-2627} }
Consistent Depth Prediction for Transparent Object Reconstruction from RGB-D Camera-
[pdf]
[supp]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Yuxiang and Zhu, Yifan and Zhang, Haiwei and Ren, Bo}, title = {Consistent Depth Prediction for Transparent Object Reconstruction from RGB-D Camera}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3459-3468} }
DReg-NeRF: Deep Registration for Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yu and Lee, Gim Hee}, title = {DReg-NeRF: Deep Registration for Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22703-22713} }
DETR Does Not Need Multi-Scale or Locality Design-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Yutong and Yuan, Yuhui and Zhang, Zheng and Li, Chen and Zheng, Nanning and Hu, Han}, title = {DETR Does Not Need Multi-Scale or Locality Design}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6545-6554} }
Towards Effective Instance Discrimination Contrastive Loss for Unsupervised Domain Adaptation-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yixin and Wang, Zilei and Li, Junjie and Zhuang, Jiafan and Lin, Zihan},
  title     = {Towards Effective Instance Discrimination Contrastive Loss for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11388--11399},
}
ClusT3: Information Invariant Test-Time Training-
[pdf]
[supp]
[bibtex]@InProceedings{Hakim_2023_ICCV,
  author    = {Hakim, Gustavo A. Vargas and Osowiechi, David and Noori, Mehrdad and Cheraghalikhani, Milad and Bahri, Ali and Ben Ayed, Ismail and Desrosiers, Christian},
  title     = {{ClusT3}: Information Invariant Test-Time Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6136--6145},
}
FrozenRecon: Pose-free 3D Scene Reconstruction with Frozen Depth Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Guangkai and Yin, Wei and Chen, Hao and Shen, Chunhua and Cheng, Kai and Zhao, Feng},
  title     = {{FrozenRecon}: Pose-free {3D} Scene Reconstruction with Frozen Depth Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9310--9320},
}
Affective Image Filter: Reflecting Emotions from Text to Images-
[pdf]
[supp]
[bibtex]@InProceedings{Weng_2023_ICCV,
  author    = {Weng, Shuchen and Zhang, Peixuan and Chang, Zheng and Wang, Xinlong and Li, Si and Shi, Boxin},
  title     = {Affective Image Filter: Reflecting Emotions from Text to Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10810--10819},
}
Content-Aware Local GAN for Photo-Realistic Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2023_ICCV,
  author    = {Park, JoonKyu and Son, Sanghyun and Lee, Kyoung Mu},
  title     = {Content-Aware Local {GAN} for Photo-Realistic Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10585--10594},
}
Structure-Aware Surface Reconstruction via Primitive Assembly-
[pdf]
[bibtex]@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Jingen and Zhao, Mingyang and Xin, Shiqing and Yang, Yanchao and Wang, Hanxiao and Jia, Xiaohong and Yan, Dong-Ming},
  title     = {Structure-Aware Surface Reconstruction via Primitive Assembly},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14171--14180},
}
FineDance: A Fine-grained Choreography Dataset for 3D Full Body Dance Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Ronghui and Zhao, Junfan and Zhang, Yachao and Su, Mingyang and Ren, Zeping and Zhang, Han and Tang, Yansong and Li, Xiu},
  title     = {{FineDance}: A Fine-grained Choreography Dataset for {3D} Full Body Dance Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10234--10243},
}
AssetField: Assets Mining and Reconfiguration in Ground Feature Plane Representation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xiangli_2023_ICCV,
  author    = {Xiangli, Yuanbo and Xu, Linning and Pan, Xingang and Zhao, Nanxuan and Dai, Bo and Lin, Dahua},
  title     = {{AssetField}: Assets Mining and Reconfiguration in Ground Feature Plane Representation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3251--3261},
}
Improving Online Lane Graph Extraction by Object-Lane Clustering-
[pdf]
[arXiv]
[bibtex]@InProceedings{Can_2023_ICCV,
  author    = {Can, Yigit Baran and Liniger, Alexander and Paudel, Danda Pani and Van Gool, Luc},
  title     = {Improving Online Lane Graph Extraction by Object-Lane Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8591--8601},
}
SAGA: Spectral Adversarial Geometric Attack on 3D Meshes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stolik_2023_ICCV,
  author    = {Stolik, Tomer and Lang, Itai and Avidan, Shai},
  title     = {{SAGA}: Spectral Adversarial Geometric Attack on {3D} Meshes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4284--4294},
}
All in Tokens: Unifying Output Space of Visual Tasks via Soft Token-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ning_2023_ICCV,
  author    = {Ning, Jia and Li, Chen and Zhang, Zheng and Wang, Chunyu and Geng, Zigang and Dai, Qi and He, Kun and Hu, Han},
  title     = {All in Tokens: Unifying Output Space of Visual Tasks via Soft Token},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19900--19910},
}
Learning Navigational Visual Representations with Semantic Map Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Yicong and Zhou, Yang and Zhang, Ruiyi and Dernoncourt, Franck and Bui, Trung and Gould, Stephen and Tan, Hao},
  title     = {Learning Navigational Visual Representations with Semantic Map Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3055--3067},
}
LDL: Line Distance Functions for Panoramic Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Junho and Choi, Changwoon and Jang, Hojun and Kim, Young Min},
  title     = {{LDL}: Line Distance Functions for Panoramic Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17882--17892},
}
TransTIC: Transferring Transformer-based Image Compression from Human Perception to Machine Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yi-Hsin and Weng, Ying-Chieh and Kao, Chia-Hao and Chien, Cheng and Chiu, Wei-Chen and Peng, Wen-Hsiao},
  title     = {{TransTIC}: Transferring Transformer-based Image Compression from Human Perception to Machine Perception},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23297--23307},
}
CHORUS : Learning Canonicalized 3D Human-Object Spatial Relations from Unbounded Synthesized Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV,
  author    = {Han, Sookwan and Joo, Hanbyul},
  title     = {{CHORUS} : Learning Canonicalized {3D} Human-Object Spatial Relations from Unbounded Synthesized Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15835--15846},
}
Shortcut-V2V: Compression Framework for Video-to-Video Translation Based on Temporal Redundancy Reduction-
[pdf]
[supp]
[bibtex]@InProceedings{Chung_2023_ICCV,
  author    = {Chung, Chaeyeon and Park, Yeojeong and Choi, Seunghwan and Ganbat, Munkhsoyol and Choo, Jaegul},
  title     = {{Shortcut-V2V}: Compression Framework for Video-to-Video Translation Based on Temporal Redundancy Reduction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7612--7622},
}
ViLLA: Fine-Grained Vision-Language Representation Learning from Real-World Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Varma_2023_ICCV,
  author    = {Varma, Maya and Delbrouck, Jean-Benoit and Hooper, Sarah and Chaudhari, Akshay and Langlotz, Curtis},
  title     = {{ViLLA}: Fine-Grained Vision-Language Representation Learning from Real-World Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22225--22235},
}
SG-Former: Self-guided Transformer with Evolving Token Reallocation-
[pdf]
[bibtex]@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Sucheng and Yang, Xingyi and Liu, Songhua and Wang, Xinchao},
  title     = {{SG-Former}: Self-guided Transformer with Evolving Token Reallocation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6003--6014},
}
Towards Unifying Medical Vision-and-Language Pre-Training via Soft Prompts-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhihong and Diao, Shizhe and Wang, Benyou and Li, Guanbin and Wan, Xiang},
  title     = {Towards Unifying Medical Vision-and-Language Pre-Training via Soft Prompts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23403--23413},
}
A Large-scale Study of Spatiotemporal Representation Learning with a New Benchmark on Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Andong and Yang, Taojiannan and Chen, Chen},
  title     = {A Large-scale Study of Spatiotemporal Representation Learning with a New Benchmark on Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20519--20531},
}
Video Background Music Generation: Dataset, Method and Evaluation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhuo_2023_ICCV,
  author    = {Zhuo, Le and Wang, Zhaokai and Wang, Baisen and Liao, Yue and Bao, Chenxi and Peng, Stanley and Han, Songhao and Zhang, Aixi and Fang, Fei and Liu, Si},
  title     = {Video Background Music Generation: Dataset, Method and Evaluation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15637--15647},
}
HoloFusion: Towards Photo-realistic 3D Generative Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Karnewar_2023_ICCV,
  author    = {Karnewar, Animesh and Mitra, Niloy J. and Vedaldi, Andrea and Novotny, David},
  title     = {{HoloFusion}: Towards Photo-realistic {3D} Generative Modeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22976--22985},
}
ProtoTransfer: Cross-Modal Prototype Transfer for Point Cloud Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Pin and Xu, Hai-Ming and Ma, Chao},
  title     = {{ProtoTransfer}: Cross-Modal Prototype Transfer for Point Cloud Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3337--3347},
}
Improving Continuous Sign Language Recognition with Cross-Lingual Signs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Fangyun and Chen, Yutong},
  title     = {Improving Continuous Sign Language Recognition with Cross-Lingual Signs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23612--23621},
}
Markov Game Video Augmentation for Action Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Aziere_2023_ICCV,
  author    = {Aziere, Nicolas and Todorovic, Sinisa},
  title     = {{Markov} Game Video Augmentation for Action Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13505--13514},
}
Deep Image Harmonization with Globally Guided Feature Transformation and Relation Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Li and Tan, Linfeng and Tao, Xinhao and Cao, Junyan and Guo, Fengjun and Long, Teng and Zhang, Liqing},
  title     = {Deep Image Harmonization with Globally Guided Feature Transformation and Relation Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7723--7732},
}
TransIFF: An Instance-Level Feature Fusion Framework for Vehicle-Infrastructure Cooperative 3D Detection with Transformers-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ziming and Shi, Yifeng and Jia, Jinrang},
  title     = {{TransIFF}: An Instance-Level Feature Fusion Framework for Vehicle-Infrastructure Cooperative {3D} Detection with Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18205--18214},
}
RegFormer: An Efficient Projection-Aware Transformer Network for Large-Scale Point Cloud Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jiuming and Wang, Guangming and Liu, Zhe and Jiang, Chaokang and Pollefeys, Marc and Wang, Hesheng},
  title     = {{RegFormer}: An Efficient Projection-Aware Transformer Network for Large-Scale Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8451--8460},
}
Masked Retraining Teacher-Student Framework for Domain Adaptive Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Zijing and Wei, Sitong and Chen, Qingchao and Li, Dehui and Yang, Yifan and Peng, Yuxin and Liu, Yang},
  title     = {Masked Retraining Teacher-Student Framework for Domain Adaptive Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19039--19049},
}
Prune Spatio-temporal Tokens by Semantic-aware Temporal Accumulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Shuangrui and Zhao, Peisen and Zhang, Xiaopeng and Qian, Rui and Xiong, Hongkai and Tian, Qi},
  title     = {Prune Spatio-temporal Tokens by Semantic-aware Temporal Accumulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16945--16956},
}
VQ3D: Learning a 3D-Aware Generative Model on ImageNet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sargent_2023_ICCV,
  author    = {Sargent, Kyle and Koh, Jing Yu and Zhang, Han and Chang, Huiwen and Herrmann, Charles and Srinivasan, Pratul and Wu, Jiajun and Sun, Deqing},
  title     = {{VQ3D}: Learning a {3D}-Aware Generative Model on {ImageNet}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4240--4250},
}
Growing a Brain with Sparsity-Inducing Generation for Continual Learning-
[pdf]
[bibtex]@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Hyundong and Kim, Gyeong-hyeon and Ahn, Chanho and Kim, Eunwoo},
  title     = {Growing a Brain with Sparsity-Inducing Generation for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18961--18970},
}
Cross-Ray Neural Radiance Fields for Novel-View Synthesis from Unconstrained Image Collections-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yifan and Zhang, Shuhai and Huang, Zixiong and Zhang, Yubing and Tan, Mingkui},
  title     = {Cross-Ray Neural Radiance Fields for Novel-View Synthesis from Unconstrained Image Collections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15901--15911},
}
Graphics2RAW: Mapping Computer Graphics Images to Sensor RAW Images-
[pdf]
[supp]
[bibtex]@InProceedings{Seo_2023_ICCV,
  author    = {Seo, Donghwan and Punnappurath, Abhijith and Zhao, Luxi and Abdelhamed, Abdelrahman and Tedla, Sai Kiran and Park, Sanguk and Choe, Jihwan and Brown, Michael S.},
  title     = {{Graphics2RAW}: Mapping Computer Graphics Images to Sensor {RAW} Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12622--12631},
}
SPACE: Speech-driven Portrait Animation with Controllable Expression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gururani_2023_ICCV,
  author    = {Gururani, Siddharth and Mallya, Arun and Wang, Ting-Chun and Valle, Rafael and Liu, Ming-Yu},
  title     = {{SPACE}: Speech-driven Portrait Animation with Controllable Expression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20914--20923},
}
2D-3D Interlaced Transformer for Point Cloud Segmentation with Scene-Level Supervision-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Cheng-Kun and Chen, Min-Hung and Chuang, Yung-Yu and Lin, Yen-Yu},
  title     = {{2D-3D} Interlaced Transformer for Point Cloud Segmentation with Scene-Level Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {977--987},
}
Collecting The Puzzle Pieces: Disentangled Self-Driven Human Pose Transfer by Permuting Textures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Nannan and Shih, Kevin J and Plummer, Bryan A.},
  title     = {Collecting The Puzzle Pieces: Disentangled Self-Driven Human Pose Transfer by Permuting Textures},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7126--7137},
}
VAD: Vectorized Scene Representation for Efficient Autonomous Driving-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Bo and Chen, Shaoyu and Xu, Qing and Liao, Bencheng and Chen, Jiajie and Zhou, Helong and Zhang, Qian and Liu, Wenyu and Huang, Chang and Wang, Xinggang},
  title     = {{VAD}: Vectorized Scene Representation for Efficient Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8340--8350},
}
End-to-end 3D Tracking with Decoupled Queries-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Yanwei and Yu, Zhiding and Philion, Jonah and Anandkumar, Anima and Fidler, Sanja and Jia, Jiaya and Alvarez, Jose},
  title     = {End-to-end {3D} Tracking with Decoupled Queries},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18302--18311},
}
Sound Localization from Motion: Jointly Learning Sound Direction and Camera Rotation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ziyang and Qian, Shengyi and Owens, Andrew},
  title     = {Sound Localization from Motion: Jointly Learning Sound Direction and Camera Rotation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7897--7908},
}
Batch-based Model Registration for Fast 3D Sherd Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiepeng and Zhang, Congyi and Wang, Peng and Li, Xin and Cobb, Peter J. and Theobalt, Christian and Wang, Wenping},
  title     = {Batch-based Model Registration for Fast {3D} Sherd Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14519--14529},
}
HiFace: High-Fidelity 3D Face Reconstruction by Learning Static and Dynamic Details-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chai_2023_ICCV,
  author    = {Chai, Zenghao and Zhang, Tianke and He, Tianyu and Tan, Xu and Baltrusaitis, Tadas and Wu, HsiangTao and Li, Runnan and Zhao, Sheng and Yuan, Chun and Bian, Jiang},
  title     = {{HiFace}: High-Fidelity {3D} Face Reconstruction by Learning Static and Dynamic Details},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9087--9098},
}
Fast and Accurate Transferability Measurement by Evaluating Intra-class Feature Variance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Huiwen and Kang, U},
  title     = {Fast and Accurate Transferability Measurement by Evaluating Intra-class Feature Variance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11474--11482},
}
Deformable Model-Driven Neural Rendering for High-Fidelity 3D Reconstruction of Human Heads Under Low-View Settings-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Baixin and Zhang, Jiarui and Lin, Kwan-Yee and Qian, Chen and He, Ying},
  title     = {Deformable Model-Driven Neural Rendering for High-Fidelity {3D} Reconstruction of Human Heads Under Low-View Settings},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17924--17934},
}
Algebraically Rigorous Quaternion Framework for the Neural Network Pose Estimation Problem-
[pdf]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Chen and Hanson, Andrew J. and Hanson, Sonya M.},
  title     = {Algebraically Rigorous Quaternion Framework for the Neural Network Pose Estimation Problem},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14097--14106},
}
Prompt Tuning Inversion for Text-driven Image Editing Using Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Wenkai and Xue, Song and Duan, Xiaoyue and Han, Shumin},
  title     = {Prompt Tuning Inversion for Text-driven Image Editing Using Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7430--7440},
}
CVSformer: Cross-View Synthesis Transformer for Semantic Scene Completion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Haotian and Ma, Enhui and Wang, Lubo and Wang, Miaohui and Xie, Wuyuan and Guo, Qing and Li, Ping and Liang, Lingyu and Yang, Kairui and Lin, Di},
  title     = {{CVSformer}: Cross-View Synthesis Transformer for Semantic Scene Completion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8874--8883},
}
UrbanGIRAFFE: Representing Urban Scenes as Compositional Generative Neural Feature Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yuanbo and Yang, Yifei and Guo, Hanlei and Xiong, Rong and Wang, Yue and Liao, Yiyi},
  title     = {{UrbanGIRAFFE}: Representing Urban Scenes as Compositional Generative Neural Feature Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9199--9210},
}
UnitedHuman: Harnessing Multi-Source Data for High-Resolution Human Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Jianglin and Li, Shikai and Jiang, Yuming and Lin, Kwan-Yee and Wu, Wayne and Liu, Ziwei},
  title     = {{UnitedHuman}: Harnessing Multi-Source Data for High-Resolution Human Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7301--7311},
}
Active Neural Mapping-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Zike and Yang, Haoxiang and Zha, Hongbin},
  title     = {Active Neural Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10981--10992},
}
Density-invariant Features for Distant Point Cloud Registration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Quan and Zhu, Hongzi and Zhou, Yunsong and Li, Hongyang and Chang, Shan and Guo, Minyi},
  title     = {Density-invariant Features for Distant Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18215--18225},
}
UniverSeg: Universal Medical Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Butoi_2023_ICCV,
  author    = {Butoi, Victor Ion and Ortiz, Jose Javier Gonzalez and Ma, Tianyu and Sabuncu, Mert R. and Guttag, John and Dalca, Adrian V.},
  title     = {{UniverSeg}: Universal Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21438--21451},
}
RecRecNet: Rectangling Rectified Wide-Angle Images by Thin-Plate Spline Model and DoF-based Curriculum Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2023_ICCV,
  author    = {Liao, Kang and Nie, Lang and Lin, Chunyu and Zheng, Zishuo and Zhao, Yao},
  title     = {{RecRecNet}: Rectangling Rectified Wide-Angle Images by Thin-Plate Spline Model and {DoF}-based Curriculum Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10800--10809},
}
Neural Microfacet Fields for Inverse Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mai_2023_ICCV,
  author    = {Mai, Alexander and Verbin, Dor and Kuester, Falko and Fridovich-Keil, Sara},
  title     = {Neural Microfacet Fields for Inverse Rendering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {408--418},
}
Understanding Self-attention Mechanism via Dynamical System Perspective-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhongzhan and Liang, Mingfu and Qin, Jinghui and Zhong, Shanshan and Lin, Liang},
  title     = {Understanding Self-attention Mechanism via Dynamical System Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1412--1422},
}
Learning Versatile 3D Shape Generation with Improved Auto-regressive Models-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Simian and Qian, Xuelin and Fu, Yanwei and Zhang, Yinda and Tai, Ying and Zhang, Zhenyu and Wang, Chengjie and Xue, Xiangyang},
  title     = {Learning Versatile {3D} Shape Generation with Improved Auto-regressive Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14139--14149},
}
DETA: Denoised Task Adaptation for Few-Shot Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Ji and Gao, Lianli and Luo, Xu and Shen, Hengtao and Song, Jingkuan},
  title     = {{DETA}: Denoised Task Adaptation for Few-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11541--11551},
}
DDG-Net: Discriminability-Driven Graph Network for Weakly-supervised Temporal Action Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Xiaojun and Fan, Junsong and Luo, Chuanchen and Zhang, Zhaoxiang and Zhang, Man and Yang, Zongyuan},
  title     = {{DDG-Net}: Discriminability-Driven Graph Network for Weakly-supervised Temporal Action Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6622--6632},
}
Diffusion Models as Masked Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Chen and Mangalam, Karttikeya and Huang, Po-Yao and Li, Yanghao and Fan, Haoqi and Xu, Hu and Wang, Huiyu and Xie, Cihang and Yuille, Alan and Feichtenhofer, Christoph},
  title     = {Diffusion Models as Masked Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16284--16294},
}
Robust Frame-to-Frame Camera Rotation Estimation in Crowded Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Delattre_2023_ICCV,
  author    = {Delattre, Fabien and Dirnfeld, David and Nguyen, Phat and Scarano, Stephen K and Jones, Michael J and Miraldo, Pedro and Learned-Miller, Erik},
  title     = {Robust Frame-to-Frame Camera Rotation Estimation in Crowded Scenes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9752--9762},
}
Bayesian Prompt Learning for Image-Language Model Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Derakhshani_2023_ICCV,
  author    = {Derakhshani, Mohammad Mahdi and Sanchez, Enrique and Bulat, Adrian and da Costa, Victor G. Turrisi and Snoek, Cees G. M. and Tzimiropoulos, Georgios and Martinez, Brais},
  title     = {{Bayesian} Prompt Learning for Image-Language Model Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15237--15246},
}
One-Shot Recognition of Any Material Anywhere Using Contrastive Learning with Physics-Based Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Drehwald_2023_ICCV,
  author    = {Drehwald, Manuel S. and Eppel, Sagi and Li, Jolina and Hao, Han and Aspuru-Guzik, Alan},
  title     = {One-Shot Recognition of Any Material Anywhere Using Contrastive Learning with Physics-Based Rendering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23524--23533},
}
DiLiGenT-Pi: Photometric Stereo for Planar Surfaces with Rich Details - Benchmark Dataset and Beyond-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Feishi and Ren, Jieji and Guo, Heng and Ren, Mingjun and Shi, Boxin},
  title     = {{DiLiGenT-Pi}: Photometric Stereo for Planar Surfaces with Rich Details - Benchmark Dataset and Beyond},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9477--9487},
}
Rethinking Data Distillation: Do Not Overlook Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Dongyao and Lei, Bowen and Zhang, Jie and Fang, Yanbo and Xie, Yiqun and Zhang, Ruqi and Xu, Dongkuan},
  title     = {Rethinking Data Distillation: Do Not Overlook Calibration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4935--4945},
}
Accurate and Fast Compressed Video Captioning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Yaojie and Gu, Xin and Xu, Kai and Fan, Heng and Wen, Longyin and Zhang, Libo},
  title     = {Accurate and Fast Compressed Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15558--15567},
}
Building Vision Transformers with Hierarchy Aware Feature Aggregation-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yongjie and Liu, Hongmin and Yin, Haoran and Fan, Bin},
  title     = {Building Vision Transformers with Hierarchy Aware Feature Aggregation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5908--5918},
}
Visible-Infrared Person Re-Identification via Semantic Alignment and Affinity Inference-
[pdf]
[supp]
[bibtex]@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Xingye and Yang, Yang and Fu, Ying},
  title     = {Visible-Infrared Person Re-Identification via Semantic Alignment and Affinity Inference},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11270--11279},
}
SAL-ViT: Towards Latency Efficient Private Inference on ViT using Selective Attention Search with a Learnable Softmax Approximation-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yuke and Chen, Dake and Kundu, Souvik and Li, Chenghao and Beerel, Peter A.},
  title     = {{SAL-ViT}: Towards Latency Efficient Private Inference on {ViT} using Selective Attention Search with a Learnable Softmax Approximation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5116--5125},
}
TIJO: Trigger Inversion with Joint Optimization for Defending Multimodal Backdoored Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sur_2023_ICCV, author = {Sur, Indranil and Sikka, Karan and Walmer, Matthew and Koneripalli, Kaushik and Roy, Anirban and Lin, Xiao and Divakaran, Ajay and Jha, Susmit}, title = {TIJO: Trigger Inversion with Joint Optimization for Defending Multimodal Backdoored Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {165-175} }
DG3D: Generating High Quality 3D Textured Shapes by Learning to Discriminate Multi-Modal Diffusion-Renderings-
[pdf]
[supp]
[bibtex]@InProceedings{Zuo_2023_ICCV, author = {Zuo, Qi and Song, Yafei and Li, Jianfang and Liu, Lin and Bo, Liefeng}, title = {DG3D: Generating High Quality 3D Textured Shapes by Learning to Discriminate Multi-Modal Diffusion-Renderings}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14575-14584} }
Improving Adversarial Robustness of Masked Autoencoders via Test-time Frequency-domain Prompting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Qidong and Dong, Xiaoyi and Chen, Dongdong and Chen, Yinpeng and Yuan, Lu and Hua, Gang and Zhang, Weiming and Yu, Nenghai}, title = {Improving Adversarial Robustness of Masked Autoencoders via Test-time Frequency-domain Prompting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1600-1610} }
HairCLIPv2: Unifying Hair Editing via Proxy Feature Blending-
[pdf]
[supp]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Tianyi and Chen, Dongdong and Zhou, Wenbo and Liao, Jing and Zhang, Weiming and Hua, Gang and Yu, Nenghai}, title = {HairCLIPv2: Unifying Hair Editing via Proxy Feature Blending}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23589-23599} }
VLSlice: Interactive Vision-and-Language Slice Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Slyman_2023_ICCV, author = {Slyman, Eric and Kahng, Minsuk and Lee, Stefan}, title = {VLSlice: Interactive Vision-and-Language Slice Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15291-15301} }
Learning to Ground Instructional Articles in Videos through Narrations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mavroudi_2023_ICCV, author = {Mavroudi, Effrosyni and Afouras, Triantafyllos and Torresani, Lorenzo}, title = {Learning to Ground Instructional Articles in Videos through Narrations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15201-15213} }
DocTr: Document Transformer for Structured Information Extraction in Documents-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2023_ICCV, author = {Liao, Haofu and RoyChowdhury, Aruni and Li, Weijian and Bansal, Ankan and Zhang, Yuting and Tu, Zhuowen and Satzoda, Ravi Kumar and Manmatha, R. and Mahadevan, Vijay}, title = {DocTr: Document Transformer for Structured Information Extraction in Documents}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19584-19594} }
The Making and Breaking of Camouflage-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lamdouar_2023_ICCV, author = {Lamdouar, Hala and Xie, Weidi and Zisserman, Andrew}, title = {The Making and Breaking of Camouflage}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {832-842} }
Role-Aware Interaction Generation from Textual Description-
[pdf]
[supp]
[bibtex]@InProceedings{Tanaka_2023_ICCV, author = {Tanaka, Mikihiro and Fujiwara, Kent}, title = {Role-Aware Interaction Generation from Textual Description}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15999-16009} }
MAMo: Leveraging Memory and Attention for Monocular Video Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yasarla_2023_ICCV, author = {Yasarla, Rajeev and Cai, Hong and Jeong, Jisoo and Shi, Yunxiao and Garrepalli, Risheek and Porikli, Fatih}, title = {MAMo: Leveraging Memory and Attention for Monocular Video Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8754-8764} }
Continual Learning for Personalized Co-speech Gesture Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Ahuja_2023_ICCV, author = {Ahuja, Chaitanya and Joshi, Pratik and Ishii, Ryo and Morency, Louis-Philippe}, title = {Continual Learning for Personalized Co-speech Gesture Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20893-20903} }
Object as Query: Lifting Any 2D Object Detector to 3D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zitian and Huang, Zehao and Fu, Jiahui and Wang, Naiyan and Liu, Si}, title = {Object as Query: Lifting Any 2D Object Detector to 3D Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3791-3800} }
HDG-ODE: A Hierarchical Continuous-Time Model for Human Pose Forecasting-
[pdf]
[bibtex]@InProceedings{Xing_2023_ICCV, author = {Xing, Yucheng and Wang, Xin}, title = {HDG-ODE: A Hierarchical Continuous-Time Model for Human Pose Forecasting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14700-14712} }
Versatile Diffusion: Text, Images and Variations All in One Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Xingqian and Wang, Zhangyang and Zhang, Gong and Wang, Kai and Shi, Humphrey}, title = {Versatile Diffusion: Text, Images and Variations All in One Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7754-7765} }
DreamTeacher: Pretraining Image Backbones with Deep Generative Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Daiqing and Ling, Huan and Kar, Amlan and Acuna, David and Kim, Seung Wook and Kreis, Karsten and Torralba, Antonio and Fidler, Sanja}, title = {DreamTeacher: Pretraining Image Backbones with Deep Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16698-16708} }
Decomposition-Based Variational Network for Multi-Contrast MRI Super-Resolution and Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Lei_2023_ICCV, author = {Lei, Pengcheng and Fang, Faming and Zhang, Guixu and Zeng, Tieyong}, title = {Decomposition-Based Variational Network for Multi-Contrast MRI Super-Resolution and Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21296-21306} }
Self-supervised Monocular Underwater Depth Recovery, Image Restoration, and a Real-sea Video Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Varghese_2023_ICCV, author = {Varghese, Nisha and Kumar, Ashish and Rajagopalan, A. N.}, title = {Self-supervised Monocular Underwater Depth Recovery, Image Restoration, and a Real-sea Video Dataset}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12248-12258} }
Geometrized Transformer for Self-Supervised Homography Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jiazhen and Li, Xirong}, title = {Geometrized Transformer for Self-Supervised Homography Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9556-9565} }
Sat2Density: Faithful Density Learning from Satellite-Ground Image Pairs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Ming and Xiong, Jincheng and Xia, Gui-Song and Xue, Nan}, title = {Sat2Density: Faithful Density Learning from Satellite-Ground Image Pairs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3683-3692} }
TiDy-PSFs: Computational Imaging with Time-Averaged Dynamic Point-Spread-Functions-
[pdf]
[supp]
[bibtex]@InProceedings{Shah_2023_ICCV, author = {Shah, Sachin and Kulshrestha, Sakshum and Metzler, Christopher A.}, title = {TiDy-PSFs: Computational Imaging with Time-Averaged Dynamic Point-Spread-Functions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10657-10667} }
Expressive Text-to-Image Generation with Rich Text-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Songwei and Park, Taesung and Zhu, Jun-Yan and Huang, Jia-Bin}, title = {Expressive Text-to-Image Generation with Rich Text}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7545-7556} }
Learning Fine-Grained Features for Pixel-Wise Video Correspondences-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Rui and Zhou, Shenglong and Liu, Dong}, title = {Learning Fine-Grained Features for Pixel-Wise Video Correspondences}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9632-9641} }
FS-DETR: Few-Shot DEtection TRansformer with Prompting and without Re-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Bulat_2023_ICCV, author = {Bulat, Adrian and Guerrero, Ricardo and Martinez, Brais and Tzimiropoulos, Georgios}, title = {FS-DETR: Few-Shot DEtection TRansformer with Prompting and without Re-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11793-11802} }
Semi-supervised Speech-driven 3D Facial Animation via Cross-modal Encoding-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Peiji and Wei, Huawei and Zhong, Yicheng and Wang, Zhisheng}, title = {Semi-supervised Speech-driven 3D Facial Animation via Cross-modal Encoding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21032-21041} }
Learning to Learn: How to Continuously Teach Humans and Machines-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Singh_2023_ICCV, author = {Singh, Parantak and Li, You and Sikarwar, Ankur and Lei, Stan Weixian and Gao, Difei and Talbot, Morgan B. and Sun, Ying and Shou, Mike Zheng and Kreiman, Gabriel and Zhang, Mengmi}, title = {Learning to Learn: How to Continuously Teach Humans and Machines}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11708-11719} }
Text-Driven Generative Domain Adaptation with Spectral Consistency Regularization-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Zhenhuan and Li, Liang and Xiao, Jiayu and Zha, Zheng-Jun and Huang, Qingming}, title = {Text-Driven Generative Domain Adaptation with Spectral Consistency Regularization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7019-7029} }
A 5-Point Minimal Solver for Event Camera Relative Motion Estimation-
[pdf]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Ling and Su, Hang and Gehrig, Daniel and Cannici, Marco and Scaramuzza, Davide and Kneip, Laurent}, title = {A 5-Point Minimal Solver for Event Camera Relative Motion Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8049-8059} }
TM2D: Bimodality Driven 3D Dance Generation via Music-Text Integration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gong_2023_ICCV, author = {Gong, Kehong and Lian, Dongze and Chang, Heng and Guo, Chuan and Jiang, Zihang and Zuo, Xinxin and Mi, Michael Bi and Wang, Xinchao}, title = {TM2D: Bimodality Driven 3D Dance Generation via Music-Text Integration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9942-9952} }
Bootstrap Motion Forecasting With Self-Consistent Constraints-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Maosheng and Xu, Jiamiao and Xu, Xunnong and Wang, Tengfei and Cao, Tongyi and Chen, Qifeng}, title = {Bootstrap Motion Forecasting With Self-Consistent Constraints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8504-8514} }
CDAC: Cross-domain Attention Consistency in Transformer for Domain Adaptive Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Kaihong and Kim, Donghyun and Feris, Rogerio and Betke, Margrit}, title = {CDAC: Cross-domain Attention Consistency in Transformer for Domain Adaptive Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11519-11529} }
WaveNeRF: Wavelet-based Generalizable Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Muyu and Zhan, Fangneng and Zhang, Jiahui and Yu, Yingchen and Zhang, Xiaoqin and Theobalt, Christian and Shao, Ling and Lu, Shijian}, title = {WaveNeRF: Wavelet-based Generalizable Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18195-18204} }
LoCUS: Learning Multiscale 3D-consistent Features from Posed Images-
[pdf]
[supp]
[bibtex]@InProceedings{Kloepfer_2023_ICCV, author = {Kloepfer, Dominik A. and Campbell, Dylan and Henriques, Jo\~ao F.}, title = {LoCUS: Learning Multiscale 3D-consistent Features from Posed Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16634-16644} }
Neural Reconstruction of Relightable Human Model from Monocular Video-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Wenzhang and Che, Yunlong and Huang, Han and Guo, Yandong}, title = {Neural Reconstruction of Relightable Human Model from Monocular Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {397-407} }
FB-BEV: BEV Representation from Forward-Backward View Transformations-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhiqi and Yu, Zhiding and Wang, Wenhai and Anandkumar, Anima and Lu, Tong and Alvarez, Jose M.}, title = {FB-BEV: BEV Representation from Forward-Backward View Transformations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6919-6928} }
BoxSnake: Polygonal Instance Segmentation with Box Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Rui and Song, Lin and Ge, Yixiao and Li, Xiu}, title = {BoxSnake: Polygonal Instance Segmentation with Box Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {766-776} }
Confidence-based Visual Dispersal for Few-shot Unsupervised Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Xiong_2023_ICCV, author = {Xiong, Yizhe and Chen, Hui and Lin, Zijia and Zhao, Sicheng and Ding, Guiguang}, title = {Confidence-based Visual Dispersal for Few-shot Unsupervised Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11621-11631} }
Event-Guided Procedure Planning from Instructional Videos with Text Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, An-Lan and Lin, Kun-Yu and Du, Jia-Run and Meng, Jingke and Zheng, Wei-Shi}, title = {Event-Guided Procedure Planning from Instructional Videos with Text Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13565-13575} }
Foreground Object Search by Distilling Composite Image Feature-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Bo and Sui, Jiacheng and Niu, Li}, title = {Foreground Object Search by Distilling Composite Image Feature}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22986-22995} }
Multimodal Motion Conditioned Diffusion Model for Skeleton-based Video Anomaly Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Flaborea_2023_ICCV, author = {Flaborea, Alessandro and Collorone, Luca and di Melendugno, Guido Maria D'Amely and D'Arrigo, Stefano and Prenkaj, Bardh and Galasso, Fabio}, title = {Multimodal Motion Conditioned Diffusion Model for Skeleton-based Video Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10318-10329} }
ClimateNeRF: Extreme Weather Synthesis in Neural Radiance Field-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yuan and Lin, Zhi-Hao and Forsyth, David and Huang, Jia-Bin and Wang, Shenlong}, title = {ClimateNeRF: Extreme Weather Synthesis in Neural Radiance Field}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3227-3238} }
CDFSL-V: Cross-Domain Few-Shot Learning for Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Samarasinghe_2023_ICCV, author = {Samarasinghe, Sarinda and Rizve, Mamshad Nayeem and Kardan, Navid and Shah, Mubarak}, title = {CDFSL-V: Cross-Domain Few-Shot Learning for Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11643-11652} }
Generalized Few-Shot Point Cloud Segmentation via Geometric Words-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yating and Hu, Conghui and Zhao, Na and Lee, Gim Hee}, title = {Generalized Few-Shot Point Cloud Segmentation via Geometric Words}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21506-21515} }
Monte Carlo Linear Clustering with Single-Point Supervision is Enough for Infrared Small Target Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Boyang and Wang, Yingqian and Wang, Longguang and Zhang, Fei and Liu, Ting and Lin, Zaiping and An, Wei and Guo, Yulan}, title = {Monte Carlo Linear Clustering with Single-Point Supervision is Enough for Infrared Small Target Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1009-1019} }
Practical Membership Inference Attacks Against Large-Scale Multi-Modal Models: A Pilot Study-
[pdf]
[supp]
[bibtex]@InProceedings{Ko_2023_ICCV, author = {Ko, Myeongseob and Jin, Ming and Wang, Chenguang and Jia, Ruoxi}, title = {Practical Membership Inference Attacks Against Large-Scale Multi-Modal Models: A Pilot Study}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4871-4881} }
TCOVIS: Temporally Consistent Online Video Instance Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Junlong and Yu, Bingyao and Rao, Yongming and Zhou, Jie and Lu, Jiwen}, title = {TCOVIS: Temporally Consistent Online Video Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1097-1107} }
Towards Viewpoint Robustness in Bird's Eye View Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Klinghoffer_2023_ICCV, author = {Klinghoffer, Tzofi and Philion, Jonah and Chen, Wenzheng and Litany, Or and Gojcic, Zan and Joo, Jungseock and Raskar, Ramesh and Fidler, Sanja and Alvarez, Jose M.}, title = {Towards Viewpoint Robustness in Bird's Eye View Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8515-8524} }
Long-Term Photometric Consistent Novel View Synthesis with Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Jason J. and Forghani, Fereshteh and Derpanis, Konstantinos G. and Brubaker, Marcus A.}, title = {Long-Term Photometric Consistent Novel View Synthesis with Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7094-7104} }
What Can a Cook in Italy Teach a Mechanic in India? Action Recognition Generalisation Over Scenarios and Locations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Plizzari_2023_ICCV, author = {Plizzari, Chiara and Perrett, Toby and Caputo, Barbara and Damen, Dima}, title = {What Can a Cook in Italy Teach a Mechanic in India? Action Recognition Generalisation Over Scenarios and Locations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13656-13666} }
EMDB: The Electromagnetic Database of Global 3D Human Pose and Shape in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kaufmann_2023_ICCV, author = {Kaufmann, Manuel and Song, Jie and Guo, Chen and Shen, Kaiyue and Jiang, Tianjian and Tang, Chengcheng and Z\'arate, Juan Jos\'e and Hilliges, Otmar}, title = {EMDB: The Electromagnetic Database of Global 3D Human Pose and Shape in the Wild}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14632-14643} }
STEERER: Resolving Scale Variations for Counting and Localization via Selective Inheritance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Tao and Bai, Lei and Liu, Lingbo and Ouyang, Wanli}, title = {STEERER: Resolving Scale Variations for Counting and Localization via Selective Inheritance Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21848-21859} }
Benchmarking Algorithmic Bias in Face Recognition: An Experimental Approach Using Synthetic Faces and Human Evaluation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Hao and Perona, Pietro and Balakrishnan, Guha}, title = {Benchmarking Algorithmic Bias in Face Recognition: An Experimental Approach Using Synthetic Faces and Human Evaluation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4977-4987} }
Spatial-Aware Token for Weakly Supervised Object Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Pingyu and Zhai, Wei and Cao, Yang and Luo, Jiebo and Zha, Zheng-Jun}, title = {Spatial-Aware Token for Weakly Supervised Object Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1844-1854} }
Harnessing the Spatial-Temporal Attention of Diffusion Models for High-Fidelity Text-to-Image Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Qiucheng and Liu, Yujian and Zhao, Handong and Bui, Trung and Lin, Zhe and Zhang, Yang and Chang, Shiyu}, title = {Harnessing the Spatial-Temporal Attention of Diffusion Models for High-Fidelity Text-to-Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7766-7776} }
GraphAlign: Enhancing Accurate Feature Alignment by Graph matching for Multi-Modal 3D Object Detection-
[pdf]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Ziying and Wei, Haiyue and Bai, Lin and Yang, Lei and Jia, Caiyan}, title = {GraphAlign: Enhancing Accurate Feature Alignment by Graph matching for Multi-Modal 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3358-3369} }
Weakly-Supervised Action Segmentation and Unseen Error Detection in Anomalous Instructional Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Ghoddoosian_2023_ICCV, author = {Ghoddoosian, Reza and Dwivedi, Isht and Agarwal, Nakul and Dariush, Behzad}, title = {Weakly-Supervised Action Segmentation and Unseen Error Detection in Anomalous Instructional Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10128-10138} }
NEMTO: Neural Environment Matting for Novel View and Relighting Synthesis of Transparent Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Dongqing and Zhang, Tong and S\"usstrunk, Sabine}, title = {NEMTO: Neural Environment Matting for Novel View and Relighting Synthesis of Transparent Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {317-327} }
Geometric Viewpoint Learning with Hyper-Rays and Harmonics Encoding-
[pdf]
[supp]
[bibtex]@InProceedings{Min_2023_ICCV, author = {Min, Zhixiang and Dibene, Juan Carlos and Dunn, Enrique}, title = {Geometric Viewpoint Learning with Hyper-Rays and Harmonics Encoding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22520-22530} }
C2F2NeUS: Cascade Cost Frustum Fusion for High Fidelity and Generalizable Neural Surface Reconstruction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Luoyuan and Guan, Tao and Wang, Yuesong and Liu, Wenkai and Zeng, Zhaojie and Wang, Junle and Yang, Wei}, title = {C2F2NeUS: Cascade Cost Frustum Fusion for High Fidelity and Generalizable Neural Surface Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18291-18301} }
Mesh2Tex: Generating Mesh Textures from Image Queries-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bokhovkin_2023_ICCV, author = {Bokhovkin, Alexey and Tulsiani, Shubham and Dai, Angela}, title = {Mesh2Tex: Generating Mesh Textures from Image Queries}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8918-8928} }
USAGE: A Unified Seed Area Generation Paradigm for Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Zelin and Wang, Guanchun and Xie, Lingxi and Jiang, Dongsheng and Shen, Wei and Tian, Qi}, title = {USAGE: A Unified Seed Area Generation Paradigm for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {624-634} }
NeuS2: Fast Learning of Neural Implicit Surfaces for Multi-view Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yiming and Han, Qin and Habermann, Marc and Daniilidis, Kostas and Theobalt, Christian and Liu, Lingjie}, title = {NeuS2: Fast Learning of Neural Implicit Surfaces for Multi-view Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3295-3306} }
Deep Feature Deblurring Diffusion for Detecting Out-of-Distribution Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Aming and Chen, Da and Deng, Cheng}, title = {Deep Feature Deblurring Diffusion for Detecting Out-of-Distribution Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13381-13391} }
Fast Full-frame Video Stabilization with Iterative Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Weiyue and Li, Xin and Peng, Zhan and Luo, Xianrui and Ye, Xinyi and Lu, Hao and Cao, Zhiguo}, title = {Fast Full-frame Video Stabilization with Iterative Optimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23534-23544} }
Gender Artifacts in Visual Datasets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meister_2023_ICCV, author = {Meister, Nicole and Zhao, Dora and Wang, Angelina and Ramaswamy, Vikram V. and Fong, Ruth and Russakovsky, Olga}, title = {Gender Artifacts in Visual Datasets}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4837-4848} }
Learning Semi-supervised Gaussian Mixture Models for Generalized Category Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Bingchen and Wen, Xin and Han, Kai}, title = {Learning Semi-supervised Gaussian Mixture Models for Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16623-16633} }
SuS-X: Training-Free Name-Only Transfer of Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Udandarao_2023_ICCV, author = {Udandarao, Vishaal and Gupta, Ankush and Albanie, Samuel}, title = {SuS-X: Training-Free Name-Only Transfer of Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2725-2736} }
Rethinking Point Cloud Registration as Masking and Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Guangyan and Wang, Meiling and Yuan, Li and Yang, Yi and Yue, Yufeng}, title = {Rethinking Point Cloud Registration as Masking and Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17717-17727} }
Beating Backdoor Attack at Its Own Game-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Min and Sangiovanni-Vincentelli, Alberto and Yue, Xiangyu}, title = {Beating Backdoor Attack at Its Own Game}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4620-4629} }
Introducing Language Guidance in Prompt-based Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khan_2023_ICCV, author = {Khan, Muhammad Gul Zain Ali and Naeem, Muhammad Ferjad and Van Gool, Luc and Stricker, Didier and Tombari, Federico and Afzal, Muhammad Zeshan}, title = {Introducing Language Guidance in Prompt-based Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11463-11473} }
Invariant Training 2D-3D Joint Hard Samples for Few-Shot Point Cloud Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yi_2023_ICCV, author = {Yi, Xuanyu and Deng, Jiajun and Sun, Qianru and Hua, Xian-Sheng and Lim, Joo-Hwee and Zhang, Hanwang}, title = {Invariant Training 2D-3D Joint Hard Samples for Few-Shot Point Cloud Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14463-14474} }
EigenPlaces: Training Viewpoint Robust Models for Visual Place Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Berton_2023_ICCV, author = {Berton, Gabriele and Trivigno, Gabriele and Caputo, Barbara and Masone, Carlo}, title = {EigenPlaces: Training Viewpoint Robust Models for Visual Place Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11080-11090} }
Do DALL-E and Flamingo Understand Each Other?-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Hang and Gu, Jindong and Koner, Rajat and Sharifzadeh, Sahand and Tresp, Volker}, title = {Do DALL-E and Flamingo Understand Each Other?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1999-2010} }
CIRI: Curricular Inactivation for Residue-aware One-shot Video Inpainting-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Weiying and Xu, Cheng and Xu, Xuemiao and Liu, Wenxi and He, Shengfeng}, title = {CIRI: Curricular Inactivation for Residue-aware One-shot Video Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13012-13022} }
Prototype-based Dataset Comparison-
[pdf]
[supp]
[bibtex]@InProceedings{van_Noord_2023_ICCV, author = {van Noord, Nanne}, title = {Prototype-based Dataset Comparison}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1944-1954} }
FreeCOS: Self-Supervised Learning from Fractals and Unlabeled Images for Curvilinear Object Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Tianyi and Ding, Xiaohuan and Zhang, Liang and Yang, Xin}, title = {FreeCOS: Self-Supervised Learning from Fractals and Unlabeled Images for Curvilinear Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {876-886} }
Generating Dynamic Kernels via Transformers for Lane Detection-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Ziye and Liu, Yu and Gong, Mingming and Du, Bo and Qian, Guoqi and Smith-Miles, Kate}, title = {Generating Dynamic Kernels via Transformers for Lane Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6835-6844} }
RSFNet: A White-Box Image Retouching Approach using Region-Specific Color Filters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ouyang_2023_ICCV, author = {Ouyang, Wenqi and Dong, Yi and Kang, Xiaoyang and Ren, Peiran and Xu, Xin and Xie, Xuansong}, title = {RSFNet: A White-Box Image Retouching Approach using Region-Specific Color Filters}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12160-12169} }
Tem-Adapter: Adapting Image-Text Pretraining for Video Question Answer-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Guangyi and Liu, Xiao and Wang, Guangrun and Zhang, Kun and Torr, Philip H. S. and Zhang, Xiao-Ping and Tang, Yansong}, title = {Tem-Adapter: Adapting Image-Text Pretraining for Video Question Answer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13945-13955} }
Boosting Long-tailed Object Detection via Step-wise Learning on Smooth-tail Data-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Na and Zhang, Yongqiang and Ding, Mingli and Lee, Gim Hee}, title = {Boosting Long-tailed Object Detection via Step-wise Learning on Smooth-tail Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6940-6949} }
Talking Head Generation with Probabilistic Audio-to-Visual Diffusion Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Zhentao and Yin, Zixin and Zhou, Deyu and Wang, Duomin and Wong, Finn and Wang, Baoyuan}, title = {Talking Head Generation with Probabilistic Audio-to-Visual Diffusion Priors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7645-7655} }
Learning Cross-Modal Affinity for Referring Video Object Segmentation Targeting Limited Samples-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Guanghui and Gao, Mingqi and Liu, Heng and Zhen, Xiantong and Zheng, Feng}, title = {Learning Cross-Modal Affinity for Referring Video Object Segmentation Targeting Limited Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2684-2693} }
Human Part-wise 3D Motion Context Learning for Sign Language Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Taeryung and Oh, Yeonguk and Lee, Kyoung Mu}, title = {Human Part-wise 3D Motion Context Learning for Sign Language Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20740-20750} }
Remembering Normality: Memory-guided Knowledge Distillation for Unsupervised Anomaly Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Gu_2023_ICCV, author = {Gu, Zhihao and Liu, Liang and Chen, Xu and Yi, Ran and Zhang, Jiangning and Wang, Yabiao and Wang, Chengjie and Shu, Annan and Jiang, Guannan and Ma, Lizhuang}, title = {Remembering Normality: Memory-guided Knowledge Distillation for Unsupervised Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16401-16409} }
Coordinate Quantized Neural Implicit Representations for Multi-view Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Sijia and Hua, Jing and Han, Zhizhong}, title = {Coordinate Quantized Neural Implicit Representations for Multi-view Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18358-18369} }
Unleashing the Potential of Spiking Neural Networks with Dynamic Confidence-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Chen and Jones, Edward G. and Furber, Steve}, title = {Unleashing the Potential of Spiking Neural Networks with Dynamic Confidence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13350-13360} }
TeD-SPAD: Temporal Distinctiveness for Self-Supervised Privacy-Preservation for Video Anomaly Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Fioresi_2023_ICCV, author = {Fioresi, Joseph and Dave, Ishan Rajendrakumar and Shah, Mubarak}, title = {TeD-SPAD: Temporal Distinctiveness for Self-Supervised Privacy-Preservation for Video Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13598-13609} }
MAS: Towards Resource-Efficient Federated Multiple-Task Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhuang_2023_ICCV, author = {Zhuang, Weiming and Wen, Yonggang and Lyu, Lingjuan and Zhang, Shuai}, title = {MAS: Towards Resource-Efficient Federated Multiple-Task Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23414-23424} }
Bridging Cross-task Protocol Inconsistency for Distillation in Dense Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Longrong and Zhou, Xianpan and Li, Xuewei and Qiao, Liang and Li, Zheyang and Yang, Ziwei and Wang, Gaoang and Li, Xi}, title = {Bridging Cross-task Protocol Inconsistency for Distillation in Dense Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17175-17184} }
Divide and Conquer: a Two-Step Method for High Quality Face De-identification with Model Explainability-
[pdf]
[bibtex]@InProceedings{Wen_2023_ICCV, author = {Wen, Yunqian and Liu, Bo and Cao, Jingyi and Xie, Rong and Song, Li}, title = {Divide and Conquer: a Two-Step Method for High Quality Face De-identification with Model Explainability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5148-5157} }
HiTeA: Hierarchical Temporal-Aware Video-Language Pre-training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Qinghao and Xu, Guohai and Yan, Ming and Xu, Haiyang and Qian, Qi and Zhang, Ji and Huang, Fei}, title = {HiTeA: Hierarchical Temporal-Aware Video-Language Pre-training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15405-15416} }
VAPCNet: Viewpoint-Aware 3D Point Cloud Completion-
[pdf]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Zhiheng and Wang, Longguang and Xu, Lian and Wang, Zhiyong and Laga, Hamid and Guo, Yulan and Boussaid, Farid and Bennamoun, Mohammed}, title = {VAPCNet: Viewpoint-Aware 3D Point Cloud Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12108-12118} }
Set-level Guidance Attack: Boosting Adversarial Transferability of Vision-Language Pre-training Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Dong and Wang, Zhiqiang and Wang, Teng and Guan, Weili and Gao, Hongchang and Zheng, Feng}, title = {Set-level Guidance Attack: Boosting Adversarial Transferability of Vision-Language Pre-training Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {102-111} }
AutoSynth: Learning to Generate 3D Training Data for Object Point Cloud Registration-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dang_2023_ICCV, author = {Dang, Zheng and Salzmann, Mathieu}, title = {AutoSynth: Learning to Generate 3D Training Data for Object Point Cloud Registration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9009-9019} }
Multimodal Distillation for Egocentric Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Radevski_2023_ICCV, author = {Radevski, Gorjan and Grujicic, Dusan and Blaschko, Matthew and Moens, Marie-Francine and Tuytelaars, Tinne}, title = {Multimodal Distillation for Egocentric Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5213-5224} }
Self-supervised Learning of Implicit Shape Representation with Dense Correspondence for Deformable Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Baowen and Li, Jiahe and Deng, Xiaoming and Zhang, Yinda and Ma, Cuixia and Wang, Hongan}, title = {Self-supervised Learning of Implicit Shape Representation with Dense Correspondence for Deformable Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14268-14278} }
Perceptual Artifacts Localization for Image Synthesis Tasks-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Lingzhi and Xu, Zhengjie and Barnes, Connelly and Zhou, Yuqian and Liu, Qing and Zhang, He and Amirghodsi, Sohrab and Lin, Zhe and Shechtman, Eli and Shi, Jianbo}, title = {Perceptual Artifacts Localization for Image Synthesis Tasks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7579-7590} }
Narrator: Towards Natural Control of Human-Scene Interaction Generation via Relationship Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xuan_2023_ICCV, author = {Xuan, Haibiao and Li, Xiongzheng and Zhang, Jinsong and Zhang, Hongwen and Liu, Yebin and Li, Kun}, title = {Narrator: Towards Natural Control of Human-Scene Interaction Generation via Relationship Reasoning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22268-22278} }
Vision Relation Transformer for Unbiased Scene Graph Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sudhakaran_2023_ICCV, author = {Sudhakaran, Gopika and Dhami, Devendra Singh and Kersting, Kristian and Roth, Stefan}, title = {Vision Relation Transformer for Unbiased Scene Graph Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21882-21893} }
Scaling Data Generation in Vision-and-Language Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zun and Li, Jialu and Hong, Yicong and Wang, Yi and Wu, Qi and Bansal, Mohit and Gould, Stephen and Tan, Hao and Qiao, Yu}, title = {Scaling Data Generation in Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12009-12020} }
Better May Not Be Fairer: A Study on Subgroup Discrepancy in Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chiu_2023_ICCV, author = {Chiu, Ming-Chang and Chen, Pin-Yu and Ma, Xuezhe}, title = {Better May Not Be Fairer: A Study on Subgroup Discrepancy in Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4956-4966} }
3D Implicit Transporter for Temporally Consistent Keypoint Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2023_ICCV, author = {Zhong, Chengliang and Zheng, Yuhang and Zheng, Yupeng and Zhao, Hao and Yi, Li and Mu, Xiaodong and Wang, Ling and Li, Pengfei and Zhou, Guyue and Yang, Chao and Zhang, Xinliang and Zhao, Jian}, title = {3D Implicit Transporter for Temporally Consistent Keypoint Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3869-3880} }
Adaptive Rotated Convolution for Rotated Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pu_2023_ICCV, author = {Pu, Yifan and Wang, Yiru and Xia, Zhuofan and Han, Yizeng and Wang, Yulin and Gan, Weihao and Wang, Zidong and Song, Shiji and Huang, Gao}, title = {Adaptive Rotated Convolution for Rotated Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6589-6600} }
Revisit PCA-based Technique for Out-of-Distribution Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Guan_2023_ICCV, author = {Guan, Xiaoyuan and Liu, Zhouwu and Zheng, Wei-Shi and Zhou, Yuren and Wang, Ruixuan}, title = {Revisit PCA-based Technique for Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19431-19439} }
Visually-Prompted Language Model for Fine-Grained Scene Graph Generation in an Open World-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Qifan and Li, Juncheng and Wu, Yu and Tang, Siliang and Ji, Wei and Zhuang, Yueting}, title = {Visually-Prompted Language Model for Fine-Grained Scene Graph Generation in an Open World}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21560-21571} }
FishNet: A Large-scale Dataset and Benchmark for Fish Recognition, Detection, and Functional Trait Prediction-
[pdf]
[bibtex]@InProceedings{Khan_2023_ICCV, author = {Khan, Faizan Farooq and Li, Xiang and Temple, Andrew J. and Elhoseiny, Mohamed}, title = {FishNet: A Large-scale Dataset and Benchmark for Fish Recognition, Detection, and Functional Trait Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20496-20506} }
Dual Learning with Dynamic Knowledge Distillation for Partially Relevant Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Jianfeng and Zhang, Minsong and Zhang, Zheng and Chen, Xianke and Liu, Daizong and Qu, Xiaoye and Wang, Xun and Liu, Baolong}, title = {Dual Learning with Dynamic Knowledge Distillation for Partially Relevant Video Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11302-11312} }
UniVTG: Towards Unified Video-Language Temporal Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Kevin Qinghong and Zhang, Pengchuan and Chen, Joya and Pramanick, Shraman and Gao, Difei and Wang, Alex Jinpeng and Yan, Rui and Shou, Mike Zheng}, title = {UniVTG: Towards Unified Video-Language Temporal Grounding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2794-2804} }
Disposable Transfer Learning for Selective Source Task Unlearning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Koh_2023_ICCV, author = {Koh, Seunghee and Shon, Hyounguk and Lee, Janghyeon and Hong, Hyeong Gwon and Kim, Junmo}, title = {Disposable Transfer Learning for Selective Source Task Unlearning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11752-11760} }
Grounding 3D Object Affordance from 2D Interactions in Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yuhang and Zhai, Wei and Luo, Hongchen and Cao, Yang and Luo, Jiebo and Zha, Zheng-Jun}, title = {Grounding 3D Object Affordance from 2D Interactions in Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10905-10915} }
Fast Globally Optimal Surface Normal Estimation from an Affine Correspondence-
[pdf]
[supp]
[bibtex]@InProceedings{Hajder_2023_ICCV, author = {Hajder, Levente and L\'oczi, Lajos and Barath, Daniel}, title = {Fast Globally Optimal Surface Normal Estimation from an Affine Correspondence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3390-3401} }
Masked Spatio-Temporal Structure Prediction for Self-supervised Learning on Point Cloud Videos-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shen_2023_ICCV, author = {Shen, Zhiqiang and Sheng, Xiaoxiao and Fan, Hehe and Wang, Longguang and Guo, Yulan and Liu, Qiong and Wen, Hao and Zhou, Xi}, title = {Masked Spatio-Temporal Structure Prediction for Self-supervised Learning on Point Cloud Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16580-16589} }
Frequency-aware GAN for Adversarial Manipulation Generation-
[pdf]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Peifei and Osada, Genki and Kataoka, Hirokatsu and Takahashi, Tsubasa}, title = {Frequency-aware GAN for Adversarial Manipulation Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4315-4324} }
DreamPose: Fashion Video Synthesis with Stable Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Karras_2023_ICCV, author = {Karras, Johanna and Holynski, Aleksander and Wang, Ting-Chun and Kemelmacher-Shlizerman, Ira}, title = {DreamPose: Fashion Video Synthesis with Stable Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22680-22690} }
Tube-Link: A Flexible Cross Tube Framework for Universal Video Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiangtai and Yuan, Haobo and Zhang, Wenwei and Cheng, Guangliang and Pang, Jiangmiao and Loy, Chen Change}, title = {Tube-Link: A Flexible Cross Tube Framework for Universal Video Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13923-13933} }
Hybrid Spectral Denoising Transformer with Guided Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lai_2023_ICCV, author = {Lai, Zeqiang and Yan, Chenggang and Fu, Ying}, title = {Hybrid Spectral Denoising Transformer with Guided Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13065-13075} }
HiVLP: Hierarchical Interactive Video-Language Pre-Training-
[pdf]
[supp]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Bin and Liu, Jianzhuang and Pei, Renjing and Xu, Songcen and Dai, Peng and Lu, Juwei and Li, Weimian and Yan, Youliang}, title = {HiVLP: Hierarchical Interactive Video-Language Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13756-13766} }
Learning Concordant Attention via Target-aware Alignment for Visible-Infrared Person Re-identification-
[pdf]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Jianbing and Liu, Hong and Su, Yuxin and Shi, Wei and Tang, Hao}, title = {Learning Concordant Attention via Target-aware Alignment for Visible-Infrared Person Re-identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11122-11131} }
PhysDiff: Physics-Guided Human Motion Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV, author = {Yuan, Ye and Song, Jiaming and Iqbal, Umar and Vahdat, Arash and Kautz, Jan}, title = {PhysDiff: Physics-Guided Human Motion Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16010-16021} }
Masked Motion Predictors are Strong 3D Action Representation Learners-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mao_2023_ICCV, author = {Mao, Yunyao and Deng, Jiajun and Zhou, Wengang and Fang, Yao and Ouyang, Wanli and Li, Houqiang}, title = {Masked Motion Predictors are Strong 3D Action Representation Learners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10181-10191} }
Template-guided Hierarchical Feature Restoration for Anomaly Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Hewei and Ren, Liping and Fu, Jingjing and Wang, Yuwang and Zhang, Zhizheng and Lan, Cuiling and Wang, Haoqian and Hou, Xinwen}, title = {Template-guided Hierarchical Feature Restoration for Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6447-6458} }
SwiftFormer: Efficient Additive Attention for Transformer-based Real-time Mobile Vision Applications-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shaker_2023_ICCV, author = {Shaker, Abdelrahman and Maaz, Muhammad and Rasheed, Hanoona and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz}, title = {SwiftFormer: Efficient Additive Attention for Transformer-based Real-time Mobile Vision Applications}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17425-17436} }
UpCycling: Semi-supervised 3D Object Detection without Sharing Raw-level Unlabeled Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hwang_2023_ICCV, author = {Hwang, Sunwook and Kim, Youngseok and Kim, Seongwon and Bahk, Saewoong and Kim, Hyung-Sin}, title = {UpCycling: Semi-supervised 3D Object Detection without Sharing Raw-level Unlabeled Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23351-23361} }
RIGID: Recurrent GAN Inversion and Editing of Real Face Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yangyang and He, Shengfeng and Wong, Kwan-Yee K. and Luo, Ping}, title = {RIGID: Recurrent GAN Inversion and Editing of Real Face Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13691-13701} }
PourIt!: Weakly-Supervised Liquid Perception from a Single Image for Visual Closed-Loop Robotic Pouring-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Haitao and Fu, Yanwei and Xue, Xiangyang}, title = {PourIt!: Weakly-Supervised Liquid Perception from a Single Image for Visual Closed-Loop Robotic Pouring}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {241-251} }
CSDA: Learning Category-Scale Joint Feature for Domain Adaptive Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Changlong and Liu, Chengxu and Dun, Yujie and Qian, Xueming}, title = {CSDA: Learning Category-Scale Joint Feature for Domain Adaptive Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11421-11430} }
A Latent Space of Stochastic Diffusion Models for Zero-Shot Image Editing and Guidance-
[pdf]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Chen Henry and De la Torre, Fernando}, title = {A Latent Space of Stochastic Diffusion Models for Zero-Shot Image Editing and Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7378-7387} }
Single Image Defocus Deblurring via Implicit Neural Inverse Kernels-
[pdf]
[supp]
[bibtex]@InProceedings{Quan_2023_ICCV, author = {Quan, Yuhui and Yao, Xin and Ji, Hui}, title = {Single Image Defocus Deblurring via Implicit Neural Inverse Kernels}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12600-12610} }
Open Set Video HOI detection from Action-Centric Chain-of-Look Prompting-
[pdf]
[supp]
[bibtex]@InProceedings{Xi_2023_ICCV, author = {Xi, Nan and Meng, Jingjing and Yuan, Junsong}, title = {Open Set Video HOI detection from Action-Centric Chain-of-Look Prompting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3079-3089} }
Robust Mixture-of-Expert Training for Convolutional Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yihua and Cai, Ruisi and Chen, Tianlong and Zhang, Guanhua and Zhang, Huan and Chen, Pin-Yu and Chang, Shiyu and Wang, Zhangyang and Liu, Sijia}, title = {Robust Mixture-of-Expert Training for Convolutional Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {90-101} }
AvatarCraft: Transforming Text into Neural Human Avatars with Parameterized Shape and Pose Control-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Ruixiang and Wang, Can and Zhang, Jingbo and Chai, Menglei and He, Mingming and Chen, Dongdong and Liao, Jing}, title = {AvatarCraft: Transforming Text into Neural Human Avatars with Parameterized Shape and Pose Control}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14371-14382} }
σ-Adaptive Decoupled Prototype for Few-Shot Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Du_2023_ICCV, author = {Du, Jinhao and Zhang, Shan and Chen, Qiang and Le, Haifeng and Sun, Yanpeng and Ni, Yao and Wang, Jian and He, Bin and Wang, Jingdong}, title = {{$\sigma$}-Adaptive Decoupled Prototype for Few-Shot Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18950-18960} }
Why Is Prompt Tuning for Vision-Language Models Robust to Noisy Labels?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Cheng-En and Tian, Yu and Yu, Haichao and Wang, Heng and Morgado, Pedro and Hu, Yu Hen and Yang, Linjie}, title = {Why Is Prompt Tuning for Vision-Language Models Robust to Noisy Labels?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15488-15497} }
Unified Pre-Training with Pseudo Texts for Text-To-Image Person Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Zhiyin and Zhang, Xinyu and Ding, Changxing and Wang, Jian and Wang, Jingdong}, title = {Unified Pre-Training with Pseudo Texts for Text-To-Image Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11174-11184} }
Semantics Meets Temporal Correspondence: Self-supervised Object-centric Learning in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Rui and Ding, Shuangrui and Liu, Xian and Lin, Dahua}, title = {Semantics Meets Temporal Correspondence: Self-supervised Object-centric Learning in Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16675-16687} }
UniTR: A Unified and Efficient Multi-Modal Transformer for Bird's-Eye-View Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Haiyang and Tang, Hao and Shi, Shaoshuai and Li, Aoxue and Li, Zhenguo and Schiele, Bernt and Wang, Liwei}, title = {UniTR: A Unified and Efficient Multi-Modal Transformer for Bird's-Eye-View Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6792-6802} }
Traj-MAE: Masked Autoencoders for Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Hao and Wang, Jiaze and Shao, Kun and Liu, Furui and Hao, Jianye and Guan, Chenyong and Chen, Guangyong and Heng, Pheng-Ann}, title = {Traj-MAE: Masked Autoencoders for Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8351-8362} }
First Session Adaptation: A Strong Replay-Free Baseline for Class-Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Panos_2023_ICCV, author = {Panos, Aristeidis and Kobe, Yuriko and Reino, Daniel Olmeda and Aljundi, Rahaf and Turner, Richard E.}, title = {First Session Adaptation: A Strong Replay-Free Baseline for Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18820-18830} }
Ada3D : Exploiting the Spatial Redundancy with Adaptive Inference for Efficient 3D Object Detection-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Tianchen and Ning, Xuefei and Hong, Ke and Qiu, Zhongyuan and Lu, Pu and Zhao, Yali and Zhang, Linfeng and Zhou, Lipu and Dai, Guohao and Yang, Huazhong and Wang, Yu},
  title     = {{Ada3D} : Exploiting the Spatial Redundancy with Adaptive Inference for Efficient {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17728--17738},
}
R3D3: Dense 3D Reconstruction of Dynamic Scenes from Multiple Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Schmied_2023_ICCV,
  author    = {Schmied, Aron and Fischer, Tobias and Danelljan, Martin and Pollefeys, Marc and Yu, Fisher},
  title     = {{R3D3}: Dense {3D} Reconstruction of Dynamic Scenes from Multiple Cameras},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3216--3226},
}
UniFusion: Unified Multi-View Fusion Transformer for Spatial-Temporal Representation in Bird's-Eye-View-
[pdf]
[supp]
[bibtex]
@InProceedings{Qin_2023_ICCV,
  author    = {Qin, Zequn and Chen, Jingyu and Chen, Chao and Chen, Xiaozhi and Li, Xi},
  title     = {{UniFusion}: Unified Multi-View Fusion Transformer for Spatial-Temporal Representation in Bird's-Eye-View},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8690--8699},
}
Point Contrastive Prediction with Semantic Clustering for Self-Supervised Learning on Point Cloud Videos-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Sheng_2023_ICCV,
  author    = {Sheng, Xiaoxiao and Shen, Zhiqiang and Xiao, Gang and Wang, Longguang and Guo, Yulan and Fan, Hehe},
  title     = {Point Contrastive Prediction with Semantic Clustering for Self-Supervised Learning on Point Cloud Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16515--16524},
}
Preserving Modality Structure Improves Multi-Modal Learning-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Swetha_2023_ICCV,
  author    = {Swetha, Sirnam and Rizve, Mamshad Nayeem and Shvetsova, Nina and Kuehne, Hilde and Shah, Mubarak},
  title     = {Preserving Modality Structure Improves Multi-Modal Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21993--22003},
}
Focus the Discrepancy: Intra- and Inter-Correlation Learning for Image Anomaly Detection-
[pdf]
[supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Xincheng and Li, Ruoqi and Qian, Zefeng and Luo, Yan and Zhang, Chongyang},
  title     = {Focus the Discrepancy: Intra- and Inter-Correlation Learning for Image Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6803--6813},
}
Pre-training Vision Transformers with Very Limited Synthesized Images-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Nakamura_2023_ICCV,
  author    = {Nakamura, Ryo and Kataoka, Hirokatsu and Takashima, Sora and Noriega, Edgar Josafat Martinez and Yokota, Rio and Inoue, Nakamasa},
  title     = {Pre-training Vision Transformers with Very Limited Synthesized Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20360--20369},
}
Sample-adaptive Augmentation for Point Cloud Recognition Against Real-world Corruptions-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jie and Ding, Lihe and Xu, Tingfa and Dong, Shaocong and Xu, Xinli and Bai, Long and Li, Jianan},
  title     = {Sample-adaptive Augmentation for Point Cloud Recognition Against Real-world Corruptions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14330--14339},
}
Make Encoder Great Again in 3D GAN Inversion through Geometry and Occlusion-Aware Encoding-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Ziyang and Zhu, Yiming and Li, Yu and Liu, Hongyu and Yuan, Chun},
  title     = {Make Encoder Great Again in {3D} {GAN} Inversion through Geometry and Occlusion-Aware Encoding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2437--2447},
}
Modality Unifying Network for Visible-Infrared Person Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Hao and Cheng, Xu and Peng, Wei and Liu, Weihao and Zhao, Guoying},
  title     = {Modality Unifying Network for Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11185--11195},
}
DLT: Conditioned layout generation with Joint Discrete-Continuous Diffusion Layout Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Levi_2023_ICCV,
  author    = {Levi, Elad and Brosh, Eli and Mykhailych, Mykola and Perez, Meir},
  title     = {{DLT}: Conditioned layout generation with Joint Discrete-Continuous Diffusion Layout Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2106--2115},
}
PADDLES: Phase-Amplitude Spectrum Disentangled Early Stopping for Learning with Noisy Labels-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Huaxi and Kang, Hui and Liu, Sheng and Salvado, Olivier and Rakotoarivelo, Thierry and Wang, Dadong and Liu, Tongliang},
  title     = {{PADDLES}: Phase-Amplitude Spectrum Disentangled Early Stopping for Learning with Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16719--16730},
}
Taming Contrast Maximization for Learning Sequential, Low-latency, Event-based Optical Flow-
[pdf]
[supp]
[bibtex]
@InProceedings{Paredes-Valles_2023_ICCV,
  author    = {Paredes-Vall{\'e}s, Federico and Scheper, Kirk Y. W. and De Wagter, Christophe and de Croon, Guido C. H. E.},
  title     = {Taming Contrast Maximization for Learning Sequential, Low-latency, Event-based Optical Flow},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9695--9705},
}
CLIP-Cluster: CLIP-Guided Attribute Hallucination for Face Clustering-
[pdf]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Shuai and Li, Wanhua and Wang, Xiaobing and Zhang, Dafeng and Jin, Zhezhu and Zhou, Jie and Lu, Jiwen},
  title     = {{CLIP-Cluster}: {CLIP}-Guided Attribute Hallucination for Face Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20786--20795},
}
CASSPR: Cross Attention Single Scan Place Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Yan and Gladkova, Mariia and Wang, Rui and Li, Qianyun and Stilla, Uwe and Henriques, Jo{\~a}o F and Cremers, Daniel},
  title     = {{CASSPR}: Cross Attention Single Scan Place Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8461--8472},
}
DDFM: Denoising Diffusion Model for Multi-Modality Image Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Zixiang and Bai, Haowen and Zhu, Yuanzhi and Zhang, Jiangshe and Xu, Shuang and Zhang, Yulun and Zhang, Kai and Meng, Deyu and Timofte, Radu and Van Gool, Luc},
  title     = {{DDFM}: Denoising Diffusion Model for Multi-Modality Image Fusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8082--8093},
}
A Unified Continual Learning Framework with General Parameter-Efficient Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Qiankun and Zhao, Chen and Sun, Yifan and Xi, Teng and Zhang, Gang and Ghanem, Bernard and Zhang, Jian},
  title     = {A Unified Continual Learning Framework with General Parameter-Efficient Tuning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11483--11493},
}
Hierarchical Generation of Human-Object Interactions with Diffusion Probabilistic Models-
[pdf]
[bibtex]
@InProceedings{Pi_2023_ICCV,
  author    = {Pi, Huaijin and Peng, Sida and Yang, Minghui and Zhou, Xiaowei and Bao, Hujun},
  title     = {Hierarchical Generation of Human-Object Interactions with Diffusion Probabilistic Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15061--15073},
}
Learning Data-Driven Vector-Quantized Degradation Model for Animation Video Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Tuo_2023_ICCV,
  author    = {Tuo, Zixi and Yang, Huan and Fu, Jianlong and Dun, Yujie and Qian, Xueming},
  title     = {Learning Data-Driven Vector-Quantized Degradation Model for Animation Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13179--13189},
}
Compositional Feature Augmentation for Unbiased Scene Graph Generation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Lin and Chen, Guikun and Xiao, Jun and Yang, Yi and Wang, Chunping and Chen, Long},
  title     = {Compositional Feature Augmentation for Unbiased Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21685--21695},
}
Foreground and Text-lines Aware Document Image Rectification-
[pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Heng and Wu, Xiangping and Chen, Qingcai and Xiang, Qianjin},
  title     = {Foreground and Text-lines Aware Document Image Rectification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19574--19583},
}
Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Cong and Zhong, Yujie and Li, Dengjie and Han, Kai and Ma, Lin},
  title     = {Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1086--1096},
}
INSTA-BNN: Binary Neural Network with INSTAnce-aware Threshold-
[pdf]
[supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Changhun and Kim, Hyungjun and Park, Eunhyeok and Kim, Jae-Joon},
  title     = {{INSTA-BNN}: Binary Neural Network with {INSTAnce-aware} Threshold},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17325--17334},
}
Human-Inspired Facial Sketch Synthesis with Dynamic Adaptation-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Fei and Zhu, Yifan and Jiang, Chang and Wang, Nannan},
  title     = {Human-Inspired Facial Sketch Synthesis with Dynamic Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7237--7247},
}
When Epipolar Constraint Meets Non-Local Operators in Multi-View Stereo-
[pdf]
[supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Tianqi and Ye, Xinyi and Zhao, Weiyue and Pan, Zhiyu and Shi, Min and Cao, Zhiguo},
  title     = {When Epipolar Constraint Meets Non-Local Operators in Multi-View Stereo},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18088--18097},
}
LU-NeRF: Scene and Pose Estimation by Synchronizing Local Unposed NeRFs-
[pdf]
[supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Zezhou and Esteves, Carlos and Jampani, Varun and Kar, Abhishek and Maji, Subhransu and Makadia, Ameesh},
  title     = {{LU-NeRF}: Scene and Pose Estimation by Synchronizing Local Unposed {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18312--18321},
}
Calibrating Panoramic Depth Estimation for Practical Localization and Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Junho and Lee, Eun Sun and Kim, Young Min},
  title     = {Calibrating Panoramic Depth Estimation for Practical Localization and Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8830--8840},
}
DiffDis: Empowering Generative Diffusion Model with Cross-Modal Discrimination Capability-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Runhui and Han, Jianhua and Lu, Guansong and Liang, Xiaodan and Zeng, Yihan and Zhang, Wei and Xu, Hang},
  title     = {{DiffDis}: Empowering Generative Diffusion Model with Cross-Modal Discrimination Capability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15713--15723},
}
DS-Fusion: Artistic Typography via Discriminated and Stylized Diffusion-
[pdf]
[supp]
[bibtex]
@InProceedings{Tanveer_2023_ICCV,
  author    = {Tanveer, Maham and Wang, Yizhi and Mahdavi-Amiri, Ali and Zhang, Hao},
  title     = {{DS-Fusion}: Artistic Typography via Discriminated and Stylized Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {374--384},
}
Distilling DETR with Visual-Linguistic Knowledge for Open-Vocabulary Object Detection-
[pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Liangqi and Miao, Jiaxu and Shi, Dahu and Tan, Wenming and Ren, Ye and Yang, Yi and Pu, Shiliang},
  title     = {Distilling {DETR} with Visual-Linguistic Knowledge for Open-Vocabulary Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6501--6510},
}
Scale-MAE: A Scale-Aware Masked Autoencoder for Multiscale Geospatial Representation Learning-
[pdf]
[supp]
[bibtex]
@InProceedings{Reed_2023_ICCV,
  author    = {Reed, Colorado J and Gupta, Ritwik and Li, Shufan and Brockman, Sarah and Funk, Christopher and Clipp, Brian and Keutzer, Kurt and Candido, Salvatore and Uyttendaele, Matt and Darrell, Trevor},
  title     = {{Scale-MAE}: A Scale-Aware Masked Autoencoder for Multiscale Geospatial Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4088--4099},
}
View Consistent Purification for Accurate Cross-View Localization-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Shan and Zhang, Yanhao and Perincherry, Akhil and Vora, Ankit and Li, Hongdong},
  title     = {View Consistent Purification for Accurate Cross-View Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8197--8206},
}
A Unified Framework for Robustness on Diverse Sampling Errors-
[pdf]
[supp]
[bibtex]
@InProceedings{Jeon_2023_ICCV,
  author    = {Jeon, Myeongho and Kang, Myungjoo and Lee, Joonseok},
  title     = {A Unified Framework for Robustness on Diverse Sampling Errors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1464--1472},
}
Efficient Video Action Detection with Token Dropout and Context Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Lei and Tong, Zhan and Song, Yibing and Wu, Gangshan and Wang, Limin},
  title     = {Efficient Video Action Detection with Token Dropout and Context Refinement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10388--10399},
}
Explicit Motion Disentangling for Efficient Optical Flow Estimation-
[pdf]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Changxing and Luo, Ao and Huang, Haibin and Ma, Shaodan and Liu, Jiangyu and Liu, Shuaicheng},
  title     = {Explicit Motion Disentangling for Efficient Optical Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9521--9530},
}
LiDAR-Camera Panoptic Segmentation via Geometry-Consistent and Semantic-Aware Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zhiwei and Zhang, Zhizhong and Yu, Qian and Yi, Ran and Xie, Yuan and Ma, Lizhuang},
  title     = {{LiDAR}-Camera Panoptic Segmentation via Geometry-Consistent and Semantic-Aware Alignment},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3662--3671},
}
GrowCLIP: Data-Aware Automatic Model Growing for Large-scale Contrastive Language-Image Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Xinchi and Shi, Han and Huang, Runhui and Li, Changlin and Xu, Hang and Han, Jianhua and Kwok, James and Zhao, Shen and Zhang, Wei and Liang, Xiaodan},
  title     = {{GrowCLIP}: Data-Aware Automatic Model Growing for Large-scale Contrastive Language-Image Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22178--22189},
}
From Chaos Comes Order: Ordering Event Representations for Object Recognition and Detection-
[pdf]
[supp]
[bibtex]
@InProceedings{Zubic_2023_ICCV,
  author    = {Zubi{\'c}, Nikola and Gehrig, Daniel and Gehrig, Mathias and Scaramuzza, Davide},
  title     = {From Chaos Comes Order: Ordering Event Representations for Object Recognition and Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12846--12856},
}
LA-Net: Landmark-Aware Learning for Reliable Facial Expression Recognition under Label Noise-
[pdf]
[supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Zhiyu and Cui, Jinshi},
  title     = {{LA-Net}: Landmark-Aware Learning for Reliable Facial Expression Recognition under Label Noise},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20698--20707},
}
Identity-Consistent Aggregation for Video Object Detection-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Chaorui and Chen, Da and Wu, Qi},
  title     = {Identity-Consistent Aggregation for Video Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13434--13444},
}
Scene-Aware Label Graph Learning for Multi-Label Image Classification-
[pdf]
[supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Xuelin and Liu, Jian and Liu, Weijia and Ge, Jiawei and Liu, Bo and Cao, Jiuxin},
  title     = {Scene-Aware Label Graph Learning for Multi-Label Image Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1473--1482},
}
Relightify: Relightable 3D Faces from a Single Image via Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Papantoniou_2023_ICCV,
  author    = {Papantoniou, Foivos Paraperas and Lattas, Alexandros and Moschoglou, Stylianos and Zafeiriou, Stefanos},
  title     = {Relightify: Relightable {3D} Faces from a Single Image via Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8806--8817},
}
Fcaformer: Forward Cross Attention in Hybrid Vision Transformer-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Haokui and Hu, Wenze and Wang, Xiaoyu},
  title     = {Fcaformer: Forward Cross Attention in Hybrid Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6060--6069},
}
Progressive Spatio-Temporal Prototype Matching for Text-Video Retrieval-
[pdf]
[supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Pandeng and Xie, Chen-Wei and Zhao, Liming and Xie, Hongtao and Ge, Jiannan and Zheng, Yun and Zhao, Deli and Zhang, Yongdong},
  title     = {Progressive Spatio-Temporal Prototype Matching for Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4100--4110},
}
Leveraging Spatio-Temporal Dependency for Skeleton-Based Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jungho and Lee, Minhyeok and Cho, Suhwan and Woo, Sungmin and Jang, Sungjun and Lee, Sangyoun},
  title     = {Leveraging Spatio-Temporal Dependency for Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10255--10264},
}
Data Augmented Flatness-aware Gradient Projection for Continual Learning-
[pdf]
[supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Enneng and Shen, Li and Wang, Zhenyi and Liu, Shiwei and Guo, Guibing and Wang, Xingwei},
  title     = {Data Augmented Flatness-aware Gradient Projection for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5630--5639},
}
Camera-Driven Representation Learning for Unsupervised Domain Adaptive Person Re-identification-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Geon and Lee, Sanghoon and Kim, Dohyung and Shin, Younghoon and Yoon, Yongsang and Ham, Bumsub},
  title     = {Camera-Driven Representation Learning for Unsupervised Domain Adaptive Person Re-identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11453--11462},
}
Sample-wise Label Confidence Incorporation for Learning with Noisy Labels-
[pdf]
[supp]
[bibtex]
@InProceedings{Ahn_2023_ICCV,
  author    = {Ahn, Chanho and Kim, Kikyung and Baek, Ji-won and Lim, Jongin and Han, Seungju},
  title     = {Sample-wise Label Confidence Incorporation for Learning with Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1823--1832},
}
CLIPTrans: Transferring Visual Knowledge with Pre-trained Models for Multimodal Machine Translation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Gupta_2023_ICCV,
  author    = {Gupta, Devaansh and Kharbanda, Siddhant and Zhou, Jiawei and Li, Wanhua and Pfister, Hanspeter and Wei, Donglai},
  title     = {{CLIPTrans}: Transferring Visual Knowledge with Pre-trained Models for Multimodal Machine Translation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2875--2886},
}
SGAligner: 3D Scene Alignment with Scene Graphs-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Sarkar_2023_ICCV,
  author    = {Sarkar, Sayan Deb and Miksik, Ondrej and Pollefeys, Marc and Barath, Daniel and Armeni, Iro},
  title     = {{SGAligner}: {3D} Scene Alignment with Scene Graphs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21927--21937},
}
Name Your Colour For the Task: Artificially Discover Colour Naming via Colour Quantisation Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Shenghan and Gu, Lin and Yang, Yue and Zhang, Zenghui and Harada, Tatsuya},
  title     = {Name Your Colour For the Task: Artificially Discover Colour Naming via Colour Quantisation Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12021--12031},
}
FSAR: Federated Skeleton-based Action Recognition with Adaptive Topology Structure and Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Jingwen and Liu, Hong and Sun, Shitong and Guo, Tianyu and Zhang, Min and Si, Chenyang},
  title     = {{FSAR}: Federated Skeleton-based Action Recognition with Adaptive Topology Structure and Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10400--10410},
}
Video Adverse-Weather-Component Suppression Network via Weather Messenger and Adversarial Backpropagation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yijun and Aviles-Rivero, Angelica I. and Fu, Huazhu and Liu, Ye and Wang, Weiming and Zhu, Lei},
  title     = {Video Adverse-Weather-Component Suppression Network via Weather Messenger and Adversarial Backpropagation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13200--13210},
}
Efficient Discovery and Effective Evaluation of Visual Perceptual Similarity: A Benchmark and Beyond-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Barkan_2023_ICCV,
  author    = {Barkan, Oren and Reiss, Tal and Weill, Jonathan and Katz, Ori and Hirsch, Roy and Malkiel, Itzik and Koenigstein, Noam},
  title     = {Efficient Discovery and Effective Evaluation of Visual Perceptual Similarity: A Benchmark and Beyond},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20007--20018},
}
Ego-Only: Egocentric Action Detection without Exocentric Transferring-
[pdf]
[supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Huiyu and Singh, Mitesh Kumar and Torresani, Lorenzo},
  title     = {Ego-Only: Egocentric Action Detection without Exocentric Transferring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5250--5261},
}
CoinSeg: Contrast Inter- and Intra- Class Representations for Incremental Segmentation-
[pdf]
[supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zekang and Gao, Guangyu and Jiao, Jianbo and Liu, Chi Harold and Wei, Yunchao},
  title     = {{CoinSeg}: Contrast Inter- and Intra- Class Representations for Incremental Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {843--853},
}
Multi-View Active Fine-Grained Visual Recognition-
[pdf]
[bibtex]
@InProceedings{Du_2023_ICCV,
  author    = {Du, Ruoyi and Yu, Wenqing and Wang, Heqing and Lin, Ting-En and Chang, Dongliang and Ma, Zhanyu},
  title     = {Multi-View Active Fine-Grained Visual Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1568--1578},
}
Part-Aware Transformer for Generalizable Person Re-identification-
[pdf]
[arXiv]
[bibtex]
@InProceedings{Ni_2023_ICCV,
  author    = {Ni, Hao and Li, Yuke and Gao, Lianli and Shen, Heng Tao and Song, Jingkuan},
  title     = {Part-Aware Transformer for Generalizable Person Re-identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11280--11289},
}
Variational Causal Inference Network for Explanatory Visual Question Answering-
[pdf]
[supp]
[bibtex]
@InProceedings{Xue_2023_ICCV,
  author    = {Xue, Dizhan and Qian, Shengsheng and Xu, Changsheng},
  title     = {Variational Causal Inference Network for Explanatory Visual Question Answering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2515--2525},
}
Improving Representation Learning for Histopathologic Images with Cluster Constraints-
[pdf]
[supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Weiyi and Gao, Chongyang and DiPalma, Joseph and Vosoughi, Soroush and Hassanpour, Saeed},
  title     = {Improving Representation Learning for Histopathologic Images with Cluster Constraints},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21404--21414},
}
Blending-NeRF: Text-Driven Localized Editing in Neural Radiance Fields-
[pdf]
[supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Hyeonseop and Choi, Seokhun and Do, Hoseok and Lee, Chul and Kim, Taehyeong},
  title     = {{Blending-NeRF}: Text-Driven Localized Editing in Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14383--14393},
}
Panoramas from Photons-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Jungerman_2023_ICCV,
  author    = {Jungerman, Sacha and Ingle, Atul and Gupta, Mohit},
  title     = {Panoramas from Photons},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10626--10636},
}
Global Adaptation Meets Local Generalization: Unsupervised Domain Adaptation for 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Chai_2023_ICCV,
  author    = {Chai, Wenhao and Jiang, Zhongyu and Hwang, Jenq-Neng and Wang, Gaoang},
  title     = {Global Adaptation Meets Local Generalization: Unsupervised Domain Adaptation for {3D} Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14655--14665},
}
Learning Neural Implicit Surfaces with Object-Aware Radiance Fields-
[pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yiheng and Qiu, Zhaofan and Pan, Yingwei and Yao, Ting and Mei, Tao},
  title     = {Learning Neural Implicit Surfaces with Object-Aware Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17893--17902},
}
PADCLIP: Pseudo-labeling with Adaptive Debiasing in CLIP for Unsupervised Domain Adaptation-
[pdf]
[supp]
[bibtex]
@InProceedings{Lai_2023_ICCV,
  author    = {Lai, Zhengfeng and Vesdapunt, Noranart and Zhou, Ning and Wu, Jun and Huynh, Cong Phuoc and Li, Xuelu and Fu, Kah Kuen and Chuah, Chen-Nee},
  title     = {{PADCLIP}: Pseudo-labeling with Adaptive Debiasing in {CLIP} for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16155--16165},
}
Causal-DFQ: Causality Guided Data-Free Network Quantization-
[pdf]
[bibtex]
@InProceedings{Shang_2023_ICCV,
  author    = {Shang, Yuzhang and Xu, Bingxin and Liu, Gaowen and Kompella, Ramana Rao and Yan, Yan},
  title     = {{Causal-DFQ}: Causality Guided Data-Free Network Quantization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17437--17446},
}
Enhancing Generalization of Universal Adversarial Perturbation through Gradient Aggregation-
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xuannan and Zhong, Yaoyao and Zhang, Yuhang and Qin, Lixiong and Deng, Weihong},
  title     = {Enhancing Generalization of Universal Adversarial Perturbation through Gradient Aggregation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4435--4444},
}
CancerUniT: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of CT Scans-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Jieneng and Xia, Yingda and Yao, Jiawen and Yan, Ke and Zhang, Jianpeng and Lu, Le and Wang, Fakai and Zhou, Bo and Qiu, Mingyan and Yu, Qihang and Yuan, Mingze and Fang, Wei and Tang, Yuxing and Xu, Minfeng and Zhou, Jian and Zhao, Yuqian and Wang, Qifeng and Ye, Xianghua and Yin, Xiaoli and Shi, Yu and Chen, Xin and Zhou, Jingren and Yuille, Alan and Liu, Zaiyi and Zhang, Ling}, title = {CancerUniT: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of CT Scans}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21327-21338} }
Dual Meta-Learning with Longitudinally Consistent Regularization for One-Shot Brain Tissue Segmentation Across the Human Lifespan-
[pdf]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Yongheng and Wang, Fan and Shu, Jun and Wang, Haifeng and Wang, Li and Meng, Deyu and Lian, Chunfeng}, title = {Dual Meta-Learning with Longitudinally Consistent Regularization for One-Shot Brain Tissue Segmentation Across the Human Lifespan}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21118-21128} }
DeFormer: Integrating Transformers with Deformable Models for 3D Shape Abstraction from a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Di and Yu, Xiang and Ye, Meng and Zhangli, Qilong and Li, Zhuowei and Zhang, Zhixing and Metaxas, Dimitris N.}, title = {DeFormer: Integrating Transformers with Deformable Models for 3D Shape Abstraction from a Single Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14236-14246} }
Parallel Attention Interaction Network for Few-Shot Skeleton-Based Action Recognition-
[pdf]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xingyu and Zhou, Sanping and Wang, Le and Hua, Gang}, title = {Parallel Attention Interaction Network for Few-Shot Skeleton-Based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1379-1388} }
Cross-view Semantic Alignment for Livestreaming Product Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Wenjie and Chen, Yiyi and Li, Yan and Cheng, Yanhua and Liu, Xudong and Chen, Quan and Li, Han}, title = {Cross-view Semantic Alignment for Livestreaming Product Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13404-13413} }
Continuously Masked Transformer for Image Inpainting-
[pdf]
[supp]
[bibtex]@InProceedings{Ko_2023_ICCV, author = {Ko, Keunsoo and Kim, Chang-Su}, title = {Continuously Masked Transformer for Image Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13169-13178} }
Vanishing Point Estimation in Uncalibrated Images with Prior Gravity Direction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pautrat_2023_ICCV, author = {Pautrat, R\'emi and Liu, Shaohui and Hruby, Petr and Pollefeys, Marc and Barath, Daniel}, title = {Vanishing Point Estimation in Uncalibrated Images with Prior Gravity Direction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14118-14127} }
Learn TAROT with MENTOR: A Meta-Learned Self-Supervised Approach for Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Pourkeshavarz_2023_ICCV, author = {Pourkeshavarz, Mozhgan and Chen, Changhe and Rasouli, Amir}, title = {Learn TAROT with MENTOR: A Meta-Learned Self-Supervised Approach for Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8384-8393} }
MatrixVT: Efficient Multi-Camera to BEV Transformation for 3D Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Hongyu and Ge, Zheng and Li, Zeming and Zhang, Xiangyu}, title = {MatrixVT: Efficient Multi-Camera to BEV Transformation for 3D Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8548-8557} }
Local and Global Logit Adjustments for Long-Tailed Learning-
[pdf]
[bibtex]@InProceedings{Tao_2023_ICCV, author = {Tao, Yingfan and Sun, Jingna and Yang, Hao and Chen, Li and Wang, Xu and Yang, Wenming and Du, Daniel and Zheng, Min}, title = {Local and Global Logit Adjustments for Long-Tailed Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11783-11792} }
Active Self-Supervised Learning: A Few Low-Cost Relationships Are All You Need-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cabannes_2023_ICCV, author = {Cabannes, Vivien and Bottou, Leon and Lecun, Yann and Balestriero, Randall}, title = {Active Self-Supervised Learning: A Few Low-Cost Relationships Are All You Need}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16274-16283} }
Wasserstein Expansible Variational Autoencoder for Discriminative and Generative Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Fei and Bors, Adrian G.}, title = {Wasserstein Expansible Variational Autoencoder for Discriminative and Generative Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18665-18675} }
Sensitivity-Aware Visual Parameter-Efficient Fine-Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Haoyu and Cai, Jianfei and Zhang, Jing and Tao, Dacheng and Zhuang, Bohan}, title = {Sensitivity-Aware Visual Parameter-Efficient Fine-Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11825-11835} }
Label-Free Event-based Object Recognition via Joint Learning with Image Reconstruction from Events-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Hoonhee and Kim, Hyeonseong and Chae, Yujeong and Yoon, Kuk-Jin}, title = {Label-Free Event-based Object Recognition via Joint Learning with Image Reconstruction from Events}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19866-19877} }
Gloss-Free Sign Language Translation: Improving from Visual-Language Pretraining-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Benjia and Chen, Zhigang and Clap\'es, Albert and Wan, Jun and Liang, Yanyan and Escalera, Sergio and Lei, Zhen and Zhang, Du}, title = {Gloss-Free Sign Language Translation: Improving from Visual-Language Pretraining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20871-20881} }
Weakly-supervised 3D Pose Transfer with Keypoints-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Jinnan and Li, Chen and Lee, Gim Hee}, title = {Weakly-supervised 3D Pose Transfer with Keypoints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15156-15165} }
Not All Features Matter: Enhancing Few-shot CLIP with Adaptive Prior Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Xiangyang and Zhang, Renrui and He, Bowei and Zhou, Aojun and Wang, Dong and Zhao, Bin and Gao, Peng}, title = {Not All Features Matter: Enhancing Few-shot CLIP with Adaptive Prior Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2605-2615} }
EgoVLPv2: Egocentric Video-Language Pre-training with Fusion in the Backbone-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pramanick_2023_ICCV, author = {Pramanick, Shraman and Song, Yale and Nag, Sayan and Lin, Kevin Qinghong and Shah, Hardik and Shou, Mike Zheng and Chellappa, Rama and Zhang, Pengchuan}, title = {EgoVLPv2: Egocentric Video-Language Pre-training with Fusion in the Backbone}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5285-5297} }
On the Effectiveness of Spectral Discriminators for Perceptual Quality Improvement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Xin and Zhu, Yunan and Xu, Shunxin and Liu, Dong}, title = {On the Effectiveness of Spectral Discriminators for Perceptual Quality Improvement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13243-13253} }
Shrinking Class Space for Enhanced Certainty in Semi-Supervised Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Lihe and Zhao, Zhen and Qi, Lei and Qiao, Yu and Shi, Yinghuan and Zhao, Hengshuang}, title = {Shrinking Class Space for Enhanced Certainty in Semi-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16187-16196} }
Deep Equilibrium Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Shuai and Teng, Yao and Wang, Limin}, title = {Deep Equilibrium Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6296-6306} }
Diffusion-Based 3D Human Pose Estimation with Multi-Hypothesis Aggregation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shan_2023_ICCV, author = {Shan, Wenkang and Liu, Zhenhua and Zhang, Xinfeng and Wang, Zhao and Han, Kai and Wang, Shanshe and Ma, Siwei and Gao, Wen}, title = {Diffusion-Based 3D Human Pose Estimation with Multi-Hypothesis Aggregation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14761-14771} }
RPEFlow: Multimodal Fusion of RGB-PointCloud-Event for Joint Optical Flow and Scene Flow Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Wan_2023_ICCV, author = {Wan, Zhexiong and Mao, Yuxin and Zhang, Jing and Dai, Yuchao}, title = {RPEFlow: Multimodal Fusion of RGB-PointCloud-Event for Joint Optical Flow and Scene Flow Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10030-10040} }
SMAUG: Sparse Masked Autoencoder for Efficient Video-Language Pre-Training-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Yuanze and Wei, Chen and Wang, Huiyu and Yuille, Alan and Xie, Cihang}, title = {SMAUG: Sparse Masked Autoencoder for Efficient Video-Language Pre-Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2459-2469} }
eP-ALM: Efficient Perceptual Augmentation of Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Shukor_2023_ICCV, author = {Shukor, Mustafa and Dancette, Corentin and Cord, Matthieu}, title = {eP-ALM: Efficient Perceptual Augmentation of Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22056-22069} }
Multimodal Optimal Transport-based Co-Attention Transformer with Global Structure Consistency for Survival Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yingxue and Chen, Hao}, title = {Multimodal Optimal Transport-based Co-Attention Transformer with Global Structure Consistency for Survival Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21241-21251} }
Communication-Efficient Vertical Federated Learning with Limited Overlapping Samples-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Jingwei and Xu, Ziyue and Yang, Dong and Nath, Vishwesh and Li, Wenqi and Zhao, Can and Xu, Daguang and Chen, Yiran and Roth, Holger R.}, title = {Communication-Efficient Vertical Federated Learning with Limited Overlapping Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5203-5212} }
On the Audio-visual Synchronization for Lip-to-Speech Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Niu_2023_ICCV, author = {Niu, Zhe and Mak, Brian}, title = {On the Audio-visual Synchronization for Lip-to-Speech Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7843-7852} }
Robust One-Shot Face Video Re-enactment using Hybrid Latent Spaces of StyleGAN2-
[pdf]
[supp]
[bibtex]@InProceedings{Oorloff_2023_ICCV, author = {Oorloff, Trevine and Yacoob, Yaser}, title = {Robust One-Shot Face Video Re-enactment using Hybrid Latent Spaces of StyleGAN2}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20947-20957} }
BallGAN: 3D-aware Image Synthesis with a Spherical Background-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shin_2023_ICCV, author = {Shin, Minjung and Seo, Yunji and Bae, Jeongmin and Choi, Young Sun and Kim, Hyunsu and Byun, Hyeran and Uh, Youngjung}, title = {BallGAN: 3D-aware Image Synthesis with a Spherical Background}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7268-7279} }
RPG-Palm: Realistic Pseudo-data Generation for Palmprint Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Shen_2023_ICCV, author = {Shen, Lei and Jin, Jianlong and Zhang, Ruixin and Li, Huaen and Zhao, Kai and Zhang, Yingyi and Zhang, Jingyun and Ding, Shouhong and Zhao, Yang and Jia, Wei}, title = {RPG-Palm: Realistic Pseudo-data Generation for Palmprint Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19605-19616} }
Lecture Presentations Multimodal Dataset: Towards Understanding Multimodality in Educational Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Dong Won and Ahuja, Chaitanya and Liang, Paul Pu and Natu, Sanika and Morency, Louis-Philippe}, title = {Lecture Presentations Multimodal Dataset: Towards Understanding Multimodality in Educational Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20087-20098} }
Window-Based Early-Exit Cascades for Uncertainty Estimation: When Deep Ensembles are More Efficient than Single Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Guoxuan and Bouganis, Christos-Savvas}, title = {Window-Based Early-Exit Cascades for Uncertainty Estimation: When Deep Ensembles are More Efficient than Single Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17368-17380} }
AttT2M: Text-Driven Human Motion Generation with Multi-Perspective Attention Mechanism-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2023_ICCV, author = {Zhong, Chongyang and Hu, Lei and Zhang, Zihao and Xia, Shihong}, title = {AttT2M: Text-Driven Human Motion Generation with Multi-Perspective Attention Mechanism}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {509-519} }
A Theory of Topological Derivatives for Inverse Rendering of Geometry-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehta_2023_ICCV, author = {Mehta, Ishit and Chandraker, Manmohan and Ramamoorthi, Ravi}, title = {A Theory of Topological Derivatives for Inverse Rendering of Geometry}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {419-429} }
Canonical Factors for Hybrid Neural Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yi_2023_ICCV, author = {Yi, Brent and Zeng, Weijia and Buchanan, Sam and Ma, Yi}, title = {Canonical Factors for Hybrid Neural Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3414-3426} }
XNet: Wavelet-Based Low and High Frequency Fusion Networks for Fully- and Semi-Supervised Semantic Segmentation of Biomedical Images-
[pdf]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yanfeng and Huang, Jiaxing and Wang, Chenlong and Song, Le and Yang, Ge}, title = {XNet: Wavelet-Based Low and High Frequency Fusion Networks for Fully- and Semi-Supervised Semantic Segmentation of Biomedical Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21085-21096} }
Betrayed by Captions: Joint Caption Grounding and Generation for Open Vocabulary Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Jianzong and Li, Xiangtai and Ding, Henghui and Li, Xia and Cheng, Guangliang and Tong, Yunhai and Loy, Chen Change}, title = {Betrayed by Captions: Joint Caption Grounding and Generation for Open Vocabulary Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21938-21948} }
StyleGANEX: StyleGAN-Based Manipulation Beyond Cropped Aligned Faces-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Shuai and Jiang, Liming and Liu, Ziwei and Loy, Chen Change}, title = {StyleGANEX: StyleGAN-Based Manipulation Beyond Cropped Aligned Faces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21000-21010} }
HandR2N2: Iterative 3D Hand Pose Estimation Using a Residual Recurrent Neural Network-
[pdf]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Wencan and Ko, Jong Hwan}, title = {HandR2N2: Iterative 3D Hand Pose Estimation Using a Residual Recurrent Neural Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20904-20913} }
GET: Group Event Transformer for Event-Based Vision-
[pdf]
[supp]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Yansong and Zhang, Yueyi and Xiong, Zhiwei and Sun, Xiaoyan and Wu, Feng}, title = {GET: Group Event Transformer for Event-Based Vision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6038-6048} }
Unsupervised Learning of Object-Centric Embeddings for Cell Instance Segmentation in Microscopy Images-
[pdf]
[supp]
[bibtex]@InProceedings{Wolf_2023_ICCV, author = {Wolf, Steffen and Lalit, Manan and McDole, Katie and Funke, Jan}, title = {Unsupervised Learning of Object-Centric Embeddings for Cell Instance Segmentation in Microscopy Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21263-21272} }
DyGait: Exploiting Dynamic Representations for High-performance Gait Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ming and Guo, Xianda and Lin, Beibei and Yang, Tian and Zhu, Zheng and Li, Lincheng and Zhang, Shunli and Yu, Xin}, title = {DyGait: Exploiting Dynamic Representations for High-performance Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13424-13433} }
When Do Curricula Work in Federated Learning?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vahidian_2023_ICCV, author = {Vahidian, Saeed and Kadaveru, Sreevatsank and Baek, Woonjoon and Wang, Weijia and Kungurtsev, Vyacheslav and Chen, Chen and Shah, Mubarak and Lin, Bill}, title = {When Do Curricula Work in Federated Learning?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5084-5094} }
XiNet: Efficient Neural Networks for tinyML-
[pdf]
[supp]
[bibtex]@InProceedings{Ancilotto_2023_ICCV, author = {Ancilotto, Alberto and Paissan, Francesco and Farella, Elisabetta}, title = {XiNet: Efficient Neural Networks for tinyML}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16968-16977} }
GridPull: Towards Scalability in Learning Implicit Representations from 3D Point Clouds-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Chao and Liu, Yu-Shen and Han, Zhizhong}, title = {GridPull: Towards Scalability in Learning Implicit Representations from 3D Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18322-18334} }
Audio-Visual Class-Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pian_2023_ICCV, author = {Pian, Weiguo and Mo, Shentong and Guo, Yunhui and Tian, Yapeng}, title = {Audio-Visual Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7799-7811} }
GeoMIM: Towards Better 3D Knowledge Transfer via Masked Image Modeling for Multi-view 3D Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jihao and Wang, Tai and Liu, Boxiao and Zhang, Qihang and Liu, Yu and Li, Hongsheng}, title = {GeoMIM: Towards Better 3D Knowledge Transfer via Masked Image Modeling for Multi-view 3D Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17839-17849} }
Towards Viewpoint-Invariant Visual Recognition via Adversarial Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ruan_2023_ICCV, author = {Ruan, Shouwei and Dong, Yinpeng and Su, Hang and Peng, Jianteng and Chen, Ning and Wei, Xingxing}, title = {Towards Viewpoint-Invariant Visual Recognition via Adversarial Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4709-4719} }
Helping Hands: An Object-Aware Ego-Centric Video Recognition Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Chuhan and Gupta, Ankush and Zisserman, Andrew}, title = {Helping Hands: An Object-Aware Ego-Centric Video Recognition Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13901-13912} }
RenderIH: A Large-Scale Synthetic Dataset for 3D Interacting Hand Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Lijun and Tian, Linrui and Zhang, Xindi and Wang, Qi and Zhang, Bang and Bo, Liefeng and Liu, Mengyuan and Chen, Chen}, title = {RenderIH: A Large-Scale Synthetic Dataset for 3D Interacting Hand Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20395-20405} }
Multi-Metrics Adaptively Identifies Backdoors in Federated Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Siquan and Li, Yijiang and Chen, Chong and Shi, Leyu and Gao, Ying}, title = {Multi-Metrics Adaptively Identifies Backdoors in Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4652-4662} }
SpinCam: High-Speed Imaging via a Rotating Point-Spread Function-
[pdf]
[supp]
[bibtex]@InProceedings{Chan_2023_ICCV, author = {Chan, Dorian and Sheinin, Mark and O'Toole, Matthew}, title = {SpinCam: High-Speed Imaging via a Rotating Point-Spread Function}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10789-10799} }
FPR: False Positive Rectification for Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Liyi and Lei, Chenyang and Li, Ruihuang and Li, Shuai and Zhang, Zhaoxiang and Zhang, Lei}, title = {FPR: False Positive Rectification for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1108-1118} }
Cross-modal Scalable Hyperbolic Hierarchical Clustering-
[pdf]
[bibtex]@InProceedings{Long_2023_ICCV, author = {Long, Teng and van Noord, Nanne}, title = {Cross-modal Scalable Hyperbolic Hierarchical Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16655-16664} }
DETRDistill: A Universal Knowledge Distillation Framework for DETR-families-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chang_2023_ICCV, author = {Chang, Jiahao and Wang, Shuo and Xu, Hai-Ming and Chen, Zehui and Yang, Chenhongyi and Zhao, Feng}, title = {DETRDistill: A Universal Knowledge Distillation Framework for DETR-families}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6898-6908} }
F&F Attack: Adversarial Attack against Multiple Object Trackers by Inducing False Negatives and False Positives-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Tao and Ye, Qi and Luo, Wenhan and Zhang, Kaihao and Shi, Zhiguo and Chen, Jiming}, title = {F\&F Attack: Adversarial Attack against Multiple Object Trackers by Inducing False Negatives and False Positives}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4573-4583} }
Transferable Decoding with Visual Entities for Zero-Shot Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fei_2023_ICCV, author = {Fei, Junjie and Wang, Teng and Zhang, Jinrui and He, Zhenyu and Wang, Chengjie and Zheng, Feng}, title = {Transferable Decoding with Visual Entities for Zero-Shot Image Captioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3136-3146} }
ReMoDiffuse: Retrieval-Augmented Motion Diffusion Model-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Mingyuan and Guo, Xinying and Pan, Liang and Cai, Zhongang and Hong, Fangzhou and Li, Huirong and Yang, Lei and Liu, Ziwei}, title = {ReMoDiffuse: Retrieval-Augmented Motion Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {364-373} }
GlueStick: Robust Image Matching by Sticking Points and Lines Together-
[pdf]
[supp]
[bibtex]@InProceedings{Pautrat_2023_ICCV, author = {Pautrat, R\'emi and Su\'arez, Iago and Yu, Yifan and Pollefeys, Marc and Larsson, Viktor}, title = {GlueStick: Robust Image Matching by Sticking Points and Lines Together}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9706-9716} }
Computational 3D Imaging with Position Sensors-
[pdf]
[supp]
[bibtex]@InProceedings{Klotz_2023_ICCV, author = {Klotz, Jeremy and Gupta, Mohit and Sankaranarayanan, Aswin C.}, title = {Computational 3D Imaging with Position Sensors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8125-8134} }
PointMBF: A Multi-scale Bidirectional Fusion Network for Unsupervised RGB-D Point Cloud Registration-
[pdf]
[supp]
[bibtex]@InProceedings{Yuan_2023_ICCV, author = {Yuan, Mingzhi and Fu, Kexue and Li, Zhihao and Meng, Yucong and Wang, Manning}, title = {PointMBF: A Multi-scale Bidirectional Fusion Network for Unsupervised RGB-D Point Cloud Registration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17694-17705} }
Towards Multi-Layered 3D Garments Animation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Yidi and Loy, Chen Change and Dai, Bo}, title = {Towards Multi-Layered 3D Garments Animation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14361-14370} }
LiveHand: Real-time and Photorealistic Neural Hand Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mundra_2023_ICCV, author = {Mundra, Akshay and R, Mallikarjun B and Wang, Jiayi and Habermann, Marc and Theobalt, Christian and Elgharib, Mohamed}, title = {LiveHand: Real-time and Photorealistic Neural Hand Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18035-18045} }
Advancing Referring Expression Segmentation Beyond Single Image-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Yixuan and Zhang, Zhao and Xie, Chi and Zhu, Feng and Zhao, Rui}, title = {Advancing Referring Expression Segmentation Beyond Single Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2628-2638} }
Learning Image Harmonization in the Linear Color Space-
[pdf]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Ke and Hancke, Gerhard Petrus and Lau, Rynson W.H.}, title = {Learning Image Harmonization in the Linear Color Space}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12570-12579} }
Chasing Clouds: Differentiable Volumetric Rasterisation of Point Clouds as a Highly Efficient and Accurate Loss for Large-Scale Deformable 3D Registration-
[pdf]
[supp]
[bibtex]@InProceedings{Heinrich_2023_ICCV, author = {Heinrich, Mattias P. and Bigalke, Alexander and Gro{\ss}br\"ohmer, Christoph and Hansen, Lasse}, title = {Chasing Clouds: Differentiable Volumetric Rasterisation of Point Clouds as a Highly Efficient and Accurate Loss for Large-Scale Deformable 3D Registration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8026-8036} }
TripLe: Revisiting Pretrained Model Reuse and Progressive Learning for Efficient Vision Transformer Scaling and Searching-
[pdf]
[supp]
[bibtex]@InProceedings{Fu_2023_ICCV, author = {Fu, Cheng and Huang, Hanxian and Jiang, Zixuan and Ni, Yun and Nai, Lifeng and Wu, Gang and Cheng, Liqun and Zhou, Yanqi and Li, Sheng and Li, Andrew and Zhao, Jishen}, title = {TripLe: Revisiting Pretrained Model Reuse and Progressive Learning for Efficient Vision Transformer Scaling and Searching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17153-17163} }
LogicSeg: Parsing Visual Semantics with Neural Logic Learning and Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Liulei and Wang, Wenguan and Yang, Yi}, title = {LogicSeg: Parsing Visual Semantics with Neural Logic Learning and Reasoning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4122-4133} }
The Devil is in the Upsampling: Architectural Decisions Made Simpler for Denoising with Deep Image Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yilin and Li, Jiang and Pang, Yunkui and Nie, Dong and Yap, Pew-Thian}, title = {The Devil is in the Upsampling: Architectural Decisions Made Simpler for Denoising with Deep Image Prior}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12408-12417} }
Video Object Segmentation-aware Video Frame Interpolation-
[pdf]
[supp]
[bibtex]@InProceedings{Yoo_2023_ICCV, author = {Yoo, Jun-Sang and Lee, Hongjae and Jung, Seung-Won}, title = {Video Object Segmentation-aware Video Frame Interpolation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12322-12333} }
Coherent Event Guided Low-Light Video Enhancement-
[pdf]
[supp]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Jinxiu and Yang, Yixin and Li, Boyu and Duan, Peiqi and Xu, Yong and Shi, Boxin}, title = {Coherent Event Guided Low-Light Video Enhancement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10615-10625} }
Texture Learning Domain Randomization for Domain Generalized Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Sunghwan and Kim, Dae-hwan and Kim, Hoseong}, title = {Texture Learning Domain Randomization for Domain Generalized Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {677-687} }
FCCNs: Fully Complex-valued Convolutional Networks using Complex-valued Color Model and Loss Function-
[pdf]
[supp]
[bibtex]@InProceedings{Yadav_2023_ICCV, author = {Yadav, Saurabh and Jerripothula, Koteswar Rao}, title = {FCCNs: Fully Complex-valued Convolutional Networks using Complex-valued Color Model and Loss Function}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10689-10698} }
Learning Concise and Descriptive Attributes for Visual Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, An and Wang, Yu and Zhong, Yiwu and Dong, Chengyu and He, Zexue and Lu, Yujie and Wang, William Yang and Shang, Jingbo and McAuley, Julian}, title = {Learning Concise and Descriptive Attributes for Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3090-3100} }
Learning Unified Decompositional and Compositional NeRF for Editable Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yuxin and Wu, Wayne and Xu, Dan}, title = {Learning Unified Decompositional and Compositional NeRF for Editable Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18247-18256} }
Label-Noise Learning with Intrinsically Long-Tailed Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Yang and Zhang, Yiliang and Han, Bo and Cheung, Yiu-ming and Wang, Hanzi}, title = {Label-Noise Learning with Intrinsically Long-Tailed Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1369-1378} }
SeeABLE: Soft Discrepancies and Bounded Contrastive Learning for Exposing Deepfakes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Larue_2023_ICCV, author = {Larue, Nicolas and Vu, Ngoc-Son and {\v{S}}truc, Vitomir and Peer, Peter and Christophides, Vassilis}, title = {SeeABLE: Soft Discrepancies and Bounded Contrastive Learning for Exposing Deepfakes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21011-21021} }
Semi-Supervised Learning via Weight-Aware Distillation under Class Distribution Mismatch-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_2023_ICCV, author = {Du, Pan and Zhao, Suyun and Sheng, Zisen and Li, Cuiping and Chen, Hong}, title = {Semi-Supervised Learning via Weight-Aware Distillation under Class Distribution Mismatch}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16410-16420} }
ELFNet: Evidential Local-global Fusion for Stereo Matching-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lou_2023_ICCV, author = {Lou, Jieming and Liu, Weide and Chen, Zhuo and Liu, Fayao and Cheng, Jun}, title = {ELFNet: Evidential Local-global Fusion for Stereo Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17784-17793} }
SimpleClick: Interactive Image Segmentation with Simple Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Qin and Xu, Zhenlin and Bertasius, Gedas and Niethammer, Marc}, title = {SimpleClick: Interactive Image Segmentation with Simple Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22290-22300} }
Towards Content-based Pixel Retrieval in Revisited Oxford and Paris-
[pdf]
[arXiv]
[bibtex]@InProceedings{An_2023_ICCV, author = {An, Guoyuan and Kim, Woo Jae and Yang, Saelyne and Li, Rong and Huo, Yuchi and Yoon, Sun-Eui}, title = {Towards Content-based Pixel Retrieval in Revisited Oxford and Paris}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20507-20518} }
S-TREK: Sequential Translation and Rotation Equivariant Keypoints for Local Feature Extraction-
[pdf]
[supp]
[bibtex]@InProceedings{Santellani_2023_ICCV, author = {Santellani, Emanuele and Sormann, Christian and Rossi, Mattia and Kuhn, Andreas and Fraundorfer, Friedrich}, title = {S-TREK: Sequential Translation and Rotation Equivariant Keypoints for Local Feature Extraction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9728-9737} }
Retro-FPN: Retrospective Feature Pyramid Network for Point Cloud Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Xiang_2023_ICCV, author = {Xiang, Peng and Wen, Xin and Liu, Yu-Shen and Zhang, Hui and Fang, Yi and Han, Zhizhong}, title = {Retro-FPN: Retrospective Feature Pyramid Network for Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17826-17838} }
Rethinking Range View Representation for LiDAR Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kong_2023_ICCV, author = {Kong, Lingdong and Liu, Youquan and Chen, Runnan and Ma, Yuexin and Zhu, Xinge and Li, Yikang and Hou, Yuenan and Qiao, Yu and Liu, Ziwei}, title = {Rethinking Range View Representation for LiDAR Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {228-240} }
Divide and Conquer: 3D Point Cloud Instance Segmentation With Point-Wise Binarization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Weiguang and Yan, Yuyao and Yang, Chaolong and Ye, Jianan and Yang, Xi and Huang, Kaizhu}, title = {Divide and Conquer: 3D Point Cloud Instance Segmentation With Point-Wise Binarization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {562-571} }
BANSAC: A Dynamic BAyesian Network for Adaptive SAmple Consensus-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Piedade_2023_ICCV, author = {Piedade, Valter and Miraldo, Pedro}, title = {BANSAC: A Dynamic BAyesian Network for Adaptive SAmple Consensus}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3738-3747} }
ShapeScaffolder: Structure-Aware 3D Shape Generation from Text-
[pdf]
[supp]
[bibtex]@InProceedings{Tian_2023_ICCV, author = {Tian, Xi and Yang, Yong-Liang and Wu, Qi}, title = {ShapeScaffolder: Structure-Aware 3D Shape Generation from Text}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2715-2724} }
Read-only Prompt Optimization for Vision-Language Few-shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Dongjun and Song, Seokwon and Suh, Jihee and Choi, Joonmyeong and Lee, Sanghyeok and Kim, Hyunwoo J.}, title = {Read-only Prompt Optimization for Vision-Language Few-shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1401-1411} }
COCO-O: A Benchmark for Object Detectors under Natural Distribution Shifts-
[pdf]
[supp]
[bibtex]@InProceedings{Mao_2023_ICCV, author = {Mao, Xiaofeng and Chen, Yuefeng and Zhu, Yao and Chen, Da and Su, Hang and Zhang, Rong and Xue, Hui}, title = {COCO-O: A Benchmark for Object Detectors under Natural Distribution Shifts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6339-6350} }
E2NeRF: Event Enhanced Neural Radiance Fields from Blurry Images-
[pdf]
[supp]
[bibtex]@InProceedings{Qi_2023_ICCV, author = {Qi, Yunshan and Zhu, Lin and Zhang, Yu and Li, Jia}, title = {E2NeRF: Event Enhanced Neural Radiance Fields from Blurry Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13254-13264} }
EgoTV: Egocentric Task Verification from Natural Language Task Descriptions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hazra_2023_ICCV, author = {Hazra, Rishi and Chen, Brian and Rai, Akshara and Kamra, Nitin and Desai, Ruta}, title = {EgoTV: Egocentric Task Verification from Natural Language Task Descriptions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15417-15429} }
Benchmarking Low-Shot Robustness to Natural Distribution Shifts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Singh_2023_ICCV, author = {Singh, Aaditya and Sarangmath, Kartik and Chattopadhyay, Prithvijit and Hoffman, Judy}, title = {Benchmarking Low-Shot Robustness to Natural Distribution Shifts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16232-16242} }
StageInteractor: Query-based Object Detector with Cross-stage Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Teng_2023_ICCV, author = {Teng, Yao and Liu, Haisong and Guo, Sheng and Wang, Limin}, title = {StageInteractor: Query-based Object Detector with Cross-stage Interaction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6577-6588} }
DeLiRa: Self-Supervised Depth, Light, and Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guizilini_2023_ICCV, author = {Guizilini, Vitor and Vasiljevic, Igor and Fang, Jiading and Ambrus, Rares and Zakharov, Sergey and Sitzmann, Vincent and Gaidon, Adrien}, title = {DeLiRa: Self-Supervised Depth, Light, and Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17935-17945} }
Moment Detection in Long Tutorial Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Croitoru_2023_ICCV, author = {Croitoru, Ioana and Bogolin, Simion-Vlad and Albanie, Samuel and Liu, Yang and Wang, Zhaowen and Yoon, Seunghyun and Dernoncourt, Franck and Jin, Hailin and Bui, Trung}, title = {Moment Detection in Long Tutorial Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2594-2604} }
Stable Cluster Discrimination for Deep Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{Qian_2023_ICCV, author = {Qian, Qi}, title = {Stable Cluster Discrimination for Deep Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16645-16654} }
Pix2Video: Video Editing using Image Diffusion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ceylan_2023_ICCV, author = {Ceylan, Duygu and Huang, Chun-Hao P. and Mitra, Niloy J.}, title = {Pix2Video: Video Editing using Image Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23206-23217} }
DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Hongyang and Zhang, Hao and Zeng, Zhaoyang and Liu, Shilong and Li, Feng and Ren, Tianhe and Zhang, Lei}, title = {DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6684-6693} }
Holistic Geometric Feature Learning for Structured Reconstruction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Ziqiong and Huan, Linxi and Ma, Qiyuan and Zheng, Xianwei}, title = {Holistic Geometric Feature Learning for Structured Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21807-21817} }
FateZero: Fusing Attentions for Zero-shot Text-based Video Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{QI_2023_ICCV, author = {Qi, Chenyang and Cun, Xiaodong and Zhang, Yong and Lei, Chenyang and Wang, Xintao and Shan, Ying and Chen, Qifeng}, title = {FateZero: Fusing Attentions for Zero-shot Text-based Video Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15932-15942} }
Uncertainty-guided Learning for Improving Image Manipulation Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Kaixiang and Chen, Feng and Guo, Xin and Xu, Yadong and Wang, Jian and Chen, Jingdong}, title = {Uncertainty-guided Learning for Improving Image Manipulation Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22456-22465} }
LMR: A Large-Scale Multi-Reference Dataset for Reference-Based Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Lin and Li, Xin and He, Dongliang and Li, Fu and Ding, Errui and Zhang, Zhaoxiang}, title = {LMR: A Large-Scale Multi-Reference Dataset for Reference-Based Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13118-13127} }
Neural Implicit Surface Evolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Novello_2023_ICCV, author = {Novello, Tiago and da Silva, Vinicius and Schardong, Guilherme and Schirmer, Luiz and Lopes, Helio and Velho, Luiz}, title = {Neural Implicit Surface Evolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14279-14289} }
Distribution-Aligned Diffusion for Human Mesh Recovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Foo_2023_ICCV, author = {Foo, Lin Geng and Gong, Jia and Rahmani, Hossein and Liu, Jun}, title = {Distribution-Aligned Diffusion for Human Mesh Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9221-9232} }
Rosetta Neurons: Mining the Common Units in a Model Zoo-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dravid_2023_ICCV, author = {Dravid, Amil and Gandelsman, Yossi and Efros, Alexei A. and Shocher, Assaf}, title = {Rosetta Neurons: Mining the Common Units in a Model Zoo}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1934-1943} }
Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Peixia and Purkait, Pulak and Ajanthan, Thalaiyasingam and Abdolshah, Majid and Garg, Ravi and Husain, Hisham and Xu, Chenchen and Gould, Stephen and Ouyang, Wanli and van den Hengel, Anton}, title = {Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1229-1238} }
AdaMV-MoE: Adaptive Multi-Task Vision Mixture-of-Experts-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Tianlong and Chen, Xuxi and Du, Xianzhi and Rashwan, Abdullah and Yang, Fan and Chen, Huizhong and Wang, Zhangyang and Li, Yeqing}, title = {AdaMV-MoE: Adaptive Multi-Task Vision Mixture-of-Experts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17346-17357} }
Hierarchical Visual Categories Modeling: A Joint Representation Learning and Density Estimation Framework for Out-of-Distribution Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jinglun and Zhou, Xinyu and Guo, Pinxue and Sun, Yixuan and Huang, Yiwen and Ge, Weifeng and Zhang, Wenqiang}, title = {Hierarchical Visual Categories Modeling: A Joint Representation Learning and Density Estimation Framework for Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23425-23435} }
Diffuse3D: Wide-Angle 3D Photography via Bilateral Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Yutao and Zhou, Yang and Liang, Yuan and Liu, Wenxi and Jiao, Jianbo and Quan, Yuhui and He, Shengfeng}, title = {Diffuse3D: Wide-Angle 3D Photography via Bilateral Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8998-9008} }
ReNeRF: Relightable Neural Radiance Fields with Nearfield Lighting-
[pdf]
[supp]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yingyan and Zoss, Gaspard and Chandran, Prashanth and Gross, Markus and Bradley, Derek and Gotardo, Paulo}, title = {ReNeRF: Relightable Neural Radiance Fields with Nearfield Lighting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22581-22591} }
Segment Anything-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kirillov_2023_ICCV, author = {Kirillov, Alexander and Mintun, Eric and Ravi, Nikhila and Mao, Hanzi and Rolland, Chloe and Gustafson, Laura and Xiao, Tete and Whitehead, Spencer and Berg, Alexander C. and Lo, Wan-Yen and Doll{\'a}r, Piotr and Girshick, Ross}, title = {Segment Anything}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4015-4026} }
Unsupervised Prompt Tuning for Text-Driven Object Detection-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Weizhen and Chen, Weijie and Chen, Binbin and Yang, Shicai and Xie, Di and Lin, Luojun and Qi, Donglian and Zhuang, Yueting}, title = {Unsupervised Prompt Tuning for Text-Driven Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2651-2661} }
Tubelet-Contrastive Self-Supervision for Video-Efficient Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thoker_2023_ICCV, author = {Thoker, Fida Mohammad and Doughty, Hazel and Snoek, Cees G. M.}, title = {Tubelet-Contrastive Self-Supervision for Video-Efficient Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13812-13823} }
Re-ReND: Real-Time Rendering of NeRFs across Devices-
[pdf]
[supp]
[bibtex]@InProceedings{Rojas_2023_ICCV, author = {Rojas, Sara and Zarzar, Jesus and P{\'e}rez, Juan C. and Sanakoyeu, Artsiom and Thabet, Ali and Pumarola, Albert and Ghanem, Bernard}, title = {Re-ReND: Real-Time Rendering of NeRFs across Devices}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3632-3641} }
360VOT: A New Benchmark Dataset for Omnidirectional Visual Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Huajian and Xu, Yinzhe and Chen, Yingshu and Yeung, Sai-Kit}, title = {360VOT: A New Benchmark Dataset for Omnidirectional Visual Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20566-20576} }
Is Imitation All You Need? Generalized Decision-Making with Dual-Phase Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Yao and Sun, Yanchao and Zheng, Ruijie and Vemprala, Sai and Bonatti, Rogerio and Chen, Shuhang and Madaan, Ratnesh and Ba, Zhongjie and Kapoor, Ashish and Ma, Shuang}, title = {Is Imitation All You Need? Generalized Decision-Making with Dual-Phase Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16221-16231} }
Generalizing Event-Based Motion Deblurring in Real-World Scenarios-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Xiang and Yu, Lei and Yang, Wen and Liu, Jianzhuang and Xia, Gui-Song}, title = {Generalizing Event-Based Motion Deblurring in Real-World Scenarios}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10734-10744} }
Handwritten and Printed Text Segmentation: A Signature Case Study-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gholamian_2023_ICCV, author = {Gholamian, Sina and Vahdat, Ali}, title = {Handwritten and Printed Text Segmentation: A Signature Case Study}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {582-592} }
LERF: Language Embedded Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kerr_2023_ICCV, author = {Kerr, Justin and Kim, Chung Min and Goldberg, Ken and Kanazawa, Angjoo and Tancik, Matthew}, title = {LERF: Language Embedded Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19729-19739} }
DomainAdaptor: A Novel Approach to Test-time Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jian and Qi, Lei and Shi, Yinghuan and Gao, Yang}, title = {DomainAdaptor: A Novel Approach to Test-time Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18971-18981} }
RCA-NOC: Relative Contrastive Alignment for Novel Object Captioning-
[pdf]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Jiashuo and Liang, Yaoyuan and Liu, Leyao and Huang, Shaolun and Zhang, Lei}, title = {RCA-NOC: Relative Contrastive Alignment for Novel Object Captioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15510-15520} }
Mitigating and Evaluating Static Bias of Action Representations in the Background and the Foreground-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Haoxin and Liu, Yuan and Zhang, Hanwang and Li, Boyang}, title = {Mitigating and Evaluating Static Bias of Action Representations in the Background and the Foreground}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19911-19923} }
RbA: Segmenting Unknown Regions Rejected by All-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nayal_2023_ICCV, author = {Nayal, Nazir and Yavuz, Misra and Henriques, Jo{\~a}o F. and G{\"u}ney, Fatma}, title = {RbA: Segmenting Unknown Regions Rejected by All}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {711-722} }
CuNeRF: Cube-Based Neural Radiance Field for Zero-Shot Medical Image Arbitrary-Scale Super Resolution-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zixuan and Yang, Lingxiao and Lai, Jian-Huang and Xie, Xiaohua}, title = {CuNeRF: Cube-Based Neural Radiance Field for Zero-Shot Medical Image Arbitrary-Scale Super Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21185-21195} }
Beyond Object Recognition: A New Benchmark towards Object Concept Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yong-Lu and Xu, Yue and Xu, Xinyu and Mao, Xiaohan and Yao, Yuan and Liu, Siqi and Lu, Cewu}, title = {Beyond Object Recognition: A New Benchmark towards Object Concept Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20029-20040} }
Towards Open-Vocabulary Video Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Haochen and Yan, Cilin and Wang, Shuai and Jiang, Xiaolong and Tang, Xu and Hu, Yao and Xie, Weidi and Gavves, Efstratios}, title = {Towards Open-Vocabulary Video Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4057-4066} }
Unleashing the Power of Gradient Signal-to-Noise Ratio for Zero-Shot NAS-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Zihao and Sun, Yu and Yang, Longxing and Lu, Shun and Mei, Jilin and Zhao, Wenxiao and Hu, Yu}, title = {Unleashing the Power of Gradient Signal-to-Noise Ratio for Zero-Shot NAS}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5763-5773} }
EgoObjects: A Large-Scale Egocentric Dataset for Fine-Grained Object Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Chenchen and Xiao, Fanyi and Alvarado, Andres and Babaei, Yasmine and Hu, Jiabo and El-Mohri, Hichem and Culatana, Sean and Sumbaly, Roshan and Yan, Zhicheng}, title = {EgoObjects: A Large-Scale Egocentric Dataset for Fine-Grained Object Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20110-20120} }
What Can Simple Arithmetic Operations Do for Temporal Modeling?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Wenhao and Song, Yuxin and Sun, Zhun and Wang, Jingdong and Xu, Chang and Ouyang, Wanli}, title = {What Can Simple Arithmetic Operations Do for Temporal Modeling?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13712-13722} }
Pixel Adaptive Deep Unfolding Transformer for Hyperspectral Image Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Miaoyu and Fu, Ying and Liu, Ji and Zhang, Yulun}, title = {Pixel Adaptive Deep Unfolding Transformer for Hyperspectral Image Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12959-12968} }
BiViT: Extremely Compressed Binary Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Yefei and Lou, Zhenyu and Zhang, Luoming and Liu, Jing and Wu, Weijia and Zhou, Hong and Zhuang, Bohan}, title = {BiViT: Extremely Compressed Binary Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5651-5663} }
Dynamic PlenOctree for Adaptive Sampling Refinement in Explicit NeRF-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2023_ICCV, author = {Bai, Haotian and Lin, Yiqi and Chen, Yize and Wang, Lin}, title = {Dynamic PlenOctree for Adaptive Sampling Refinement in Explicit NeRF}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8785-8795} }
Scene Matters: Model-based Deep Video Compression-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Lv and Zhang, Xinfeng and Zhang, Gai and Ma, Xiaoqi}, title = {Scene Matters: Model-based Deep Video Compression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12481-12491} }
Tree-Structured Shading Decomposition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Geng_2023_ICCV, author = {Geng, Chen and Yu, Hong-Xing and Zhang, Sharon and Agrawala, Maneesh and Wu, Jiajun}, title = {Tree-Structured Shading Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {488-498} }
EfficientTrain: Exploring Generalized Curriculum Learning for Training Visual Backbones-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yulin and Yue, Yang and Lu, Rui and Liu, Tianjiao and Zhong, Zhao and Song, Shiji and Huang, Gao}, title = {EfficientTrain: Exploring Generalized Curriculum Learning for Training Visual Backbones}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5852-5864} }
Simulating Fluids in Real-World Still Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fan_2023_ICCV, author = {Fan, Siming and Piao, Jingtan and Qian, Chen and Li, Hongsheng and Lin, Kwan-Yee}, title = {Simulating Fluids in Real-World Still Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15922-15931} }
SC3K: Self-supervised and Coherent 3D Keypoints Estimation from Rotated, Noisy, and Decimated Point Cloud Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zohaib_2023_ICCV, author = {Zohaib, Mohammad and Del Bue, Alessio}, title = {SC3K: Self-supervised and Coherent 3D Keypoints Estimation from Rotated, Noisy, and Decimated Point Cloud Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22509-22519} }
IntrinsicNeRF: Learning Intrinsic Neural Radiance Fields for Editable Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Weicai and Chen, Shuo and Bao, Chong and Bao, Hujun and Pollefeys, Marc and Cui, Zhaopeng and Zhang, Guofeng}, title = {{IntrinsicNeRF}: Learning Intrinsic Neural Radiance Fields for Editable Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {339--351} }
Segmenting Known Objects and Unseen Unknowns without Prior Knowledge-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gasperini_2023_ICCV, author = {Gasperini, Stefano and Marcos-Ramiro, Alvaro and Schmidt, Michael and Navab, Nassir and Busam, Benjamin and Tombari, Federico}, title = {Segmenting Known Objects and Unseen Unknowns without Prior Knowledge}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19321--19332} }
A Good Student is Cooperative and Reliable: CNN-Transformer Collaborative Learning for Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Jinjing and Luo, Yunhao and Zheng, Xu and Wang, Hao and Wang, Lin}, title = {A Good Student is Cooperative and Reliable: {CNN}-Transformer Collaborative Learning for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11720--11730} }
CMDA: Cross-Modality Domain Adaptation for Nighttime Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Ruihao and Zhao, Chaoqiang and Zheng, Meng and Wu, Ziyan and Sun, Qiyu and Tang, Yang}, title = {{CMDA}: Cross-Modality Domain Adaptation for Nighttime Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21572--21581} }
Learning with Diversity: Self-Expanded Equalization for Better Generalized Deep Metric Learning-
[pdf]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, Jiexi and Yin, Zhihui and Yang, Erkun and Yang, Yanhua and Huang, Heng}, title = {Learning with Diversity: Self-Expanded Equalization for Better Generalized Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19365--19374} }
Fan-Beam Binarization Difference Projection (FB-BDP): A Novel Local Object Descriptor for Fine-Grained Leaf Image Retrieval-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xin and Wang, Bin and Gao, Yongsheng}, title = {Fan-Beam Binarization Difference Projection ({FB-BDP}): A Novel Local Object Descriptor for Fine-Grained Leaf Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11102--11111} }
Dynamic Residual Classifier for Class Incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xiuwei and Chang, Xiaobin}, title = {Dynamic Residual Classifier for Class Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18743--18752} }
Optimizing the Placement of Roadside LiDARs for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Wentao and Xiang, Hao and Cai, Xinyu and Xu, Runsheng and Ma, Jiaqi and Li, Yikang and Lee, Gim Hee and Liu, Si}, title = {Optimizing the Placement of Roadside {LiDARs} for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18381--18390} }
Diverse Inpainting and Editing with GAN Inversion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yildirim_2023_ICCV, author = {Yildirim, Ahmet Burak and Pehlivan, Hamza and Bilecen, Bahri Batuhan and Dundar, Aysegul}, title = {Diverse Inpainting and Editing with {GAN} Inversion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {23120--23130} }
InterDiff: Generating 3D Human-Object Interactions with Physics-Informed Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Sirui and Li, Zhengyuan and Wang, Yu-Xiong and Gui, Liang-Yan}, title = {{InterDiff}: Generating {3D} Human-Object Interactions with Physics-Informed Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {14928--14940} }
DiFaReli: Diffusion Face Relighting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ponglertnapakorn_2023_ICCV, author = {Ponglertnapakorn, Puntawat and Tritrong, Nontawat and Suwajanakorn, Supasorn}, title = {{DiFaReli}: Diffusion Face Relighting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22646--22657} }
IST-Net: Prior-Free Category-Level Pose Estimation with Implicit Space Transformation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jianhui and Chen, Yukang and Ye, Xiaoqing and Qi, Xiaojuan}, title = {{IST-Net}: Prior-Free Category-Level Pose Estimation with Implicit Space Transformation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13978--13988} }
Building3D: A Urban-Scale Dataset and Benchmarks for Learning Roof Structures from Point Clouds-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ruisheng and Huang, Shangfeng and Yang, Hongxin}, title = {{Building3D}: A Urban-Scale Dataset and Benchmarks for Learning Roof Structures from Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20076--20086} }
Multi-Object Discovery by Low-Dimensional Object Motion-
[pdf]
[supp]
[bibtex]@InProceedings{Safadoust_2023_ICCV, author = {Safadoust, Sadra and G{\"u}ney, Fatma}, title = {Multi-Object Discovery by Low-Dimensional Object Motion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {734--744} }
Localizing Object-Level Shape Variations with Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Patashnik_2023_ICCV, author = {Patashnik, Or and Garibi, Daniel and Azuri, Idan and Averbuch-Elor, Hadar and Cohen-Or, Daniel}, title = {Localizing Object-Level Shape Variations with Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {23051--23061} }
CoSign: Exploring Co-occurrence Signals in Skeleton-based Continuous Sign Language Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Jiao_2023_ICCV, author = {Jiao, Peiqi and Min, Yuecong and Li, Yanan and Wang, Xiaotao and Lei, Lei and Chen, Xilin}, title = {{CoSign}: Exploring Co-occurrence Signals in Skeleton-based Continuous Sign Language Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20676--20686} }
GACE: Geometry Aware Confidence Enhancement for Black-Box 3D Object Detectors on LiDAR-Data-
[pdf]
[supp]
[bibtex]@InProceedings{Schinagl_2023_ICCV, author = {Schinagl, David and Krispel, Georg and Fruhwirth-Reisinger, Christian and Possegger, Horst and Bischof, Horst}, title = {{GACE}: Geometry Aware Confidence Enhancement for Black-Box {3D} Object Detectors on {LiDAR}-Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6566--6576} }
Curvature-Aware Training for Coordinate Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saratchandran_2023_ICCV, author = {Saratchandran, Hemanth and Chng, Shin-Fang and Ramasinghe, Sameera and MacDonald, Lachlan and Lucey, Simon}, title = {Curvature-Aware Training for Coordinate Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13328--13338} }
Disentangle then Parse: Night-time Semantic Segmentation with Illumination Disentanglement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Zhixiang and Chen, Lin and Tu, Tao and Ling, Pengyang and Chen, Huaian and Jin, Yi}, title = {Disentangle then Parse: Night-time Semantic Segmentation with Illumination Disentanglement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21593--21603} }
Large-Scale Land Cover Mapping with Fine-Grained Classes via Class-Aware Semi-Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Runmin and Mou, Lichao and Chen, Mengxuan and Li, Weijia and Tong, Xin-Yi and Yuan, Shuai and Zhang, Lixian and Zheng, Juepeng and Zhu, Xiaoxiang and Fu, Haohuan}, title = {Large-Scale Land Cover Mapping with Fine-Grained Classes via Class-Aware Semi-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16783--16793} }
ToonTalker: Cross-Domain Face Reenactment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gong_2023_ICCV, author = {Gong, Yuan and Zhang, Yong and Cun, Xiaodong and Yin, Fei and Fan, Yanbo and Wang, Xuan and Wu, Baoyuan and Yang, Yujiu}, title = {{ToonTalker}: Cross-Domain Face Reenactment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7690--7700} }
LISTER: Neighbor Decoding for Length-Insensitive Scene Text Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Changxu and Wang, Peng and Da, Cheng and Zheng, Qi and Yao, Cong}, title = {{LISTER}: Neighbor Decoding for Length-Insensitive Scene Text Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19541--19551} }
Proxy Anchor-based Unsupervised Learning for Continuous Generalized Category Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Hyungmin and Suh, Sungho and Kim, Daehwan and Jeong, Daun and Cho, Hansang and Kim, Junmo}, title = {Proxy Anchor-based Unsupervised Learning for Continuous Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16688--16697} }
Distribution-Aware Prompt Tuning for Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Eulrang and Kim, Jooyeon and Kim, Hyunwoo J.}, title = {Distribution-Aware Prompt Tuning for Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22004--22013} }
Learning Rain Location Prior for Nighttime Deraining-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Fan and You, Shaodi and Li, Yu and Fu, Ying}, title = {Learning Rain Location Prior for Nighttime Deraining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13148--13157} }
FBLNet: FeedBack Loop Network for Driver Attention Prediction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yilong and Nan, Zhixiong and Xiang, Tao}, title = {{FBLNet}: FeedBack Loop Network for Driver Attention Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13371--13380} }
Source-free Domain Adaptive Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Qucheng and Zheng, Ce and Chen, Chen}, title = {Source-free Domain Adaptive Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4826--4836} }
Video Anomaly Detection via Sequentially Learning Multiple Pretext Tasks-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Chenrui and Sun, Che and Wu, Yuwei and Jia, Yunde}, title = {Video Anomaly Detection via Sequentially Learning Multiple Pretext Tasks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {10330--10340} }
SlaBins: Fisheye Depth Estimation using Slanted Bins on Road Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Jongsung and Cho, Gyeongsu and Park, Jeongin and Kim, Kyongjun and Lee, Seongoh and Kim, Jung-Hee and Jeong, Seong-Gyun and Joo, Kyungdon}, title = {{SlaBins}: Fisheye Depth Estimation using Slanted Bins on Road Environments}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8765--8774} }
DOT: A Distillation-Oriented Trainer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Borui and Cui, Quan and Song, Renjie and Liang, Jiajun}, title = {{DOT}: A Distillation-Oriented Trainer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6189--6198} }
Neural Collage Transfer: Artistic Reconstruction via Material Manipulation-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Ganghun and Kim, Minji and Lee, Yunsu and Lee, Minsu and Zhang, Byoung-Tak}, title = {Neural Collage Transfer: Artistic Reconstruction via Material Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2394--2405} }
Fantasia3D: Disentangling Geometry and Appearance for High-quality Text-to-3D Content Creation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Rui and Chen, Yongwei and Jiao, Ningxin and Jia, Kui}, title = {{Fantasia3D}: Disentangling Geometry and Appearance for High-quality Text-to-{3D} Content Creation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22246--22256} }
MagicFusion: Boosting Text-to-Image Generation Performance by Fusing Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Jing and Zheng, Heliang and Wang, Chaoyue and Lan, Long and Yang, Wenjing}, title = {{MagicFusion}: Boosting Text-to-Image Generation Performance by Fusing Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22592--22602} }
UCF: Uncovering Common Features for Generalizable Deepfake Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, Zhiyuan and Zhang, Yong and Fan, Yanbo and Wu, Baoyuan}, title = {{UCF}: Uncovering Common Features for Generalizable Deepfake Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22412--22423} }
March in Chat: Interactive Prompting for Remote Embodied Referring Expression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qiao_2023_ICCV, author = {Qiao, Yanyuan and Qi, Yuankai and Yu, Zheng and Liu, Jing and Wu, Qi}, title = {March in Chat: Interactive Prompting for Remote Embodied Referring Expression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15758--15767} }
Sample4Geo: Hard Negative Sampling For Cross-View Geo-Localisation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deuser_2023_ICCV, author = {Deuser, Fabian and Habel, Konrad and Oswald, Norbert}, title = {{Sample4Geo}: Hard Negative Sampling For Cross-View Geo-Localisation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16847--16856} }
Novel Scenes & Classes: Towards Adaptive Open-set Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Wuyang and Guo, Xiaoqing and Yuan, Yixuan}, title = {Novel Scenes \& Classes: Towards Adaptive Open-set Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15780--15790} }
LIMITR: Leveraging Local Information for Medical Image-Text Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dawidowicz_2023_ICCV, author = {Dawidowicz, Gefen and Hirsch, Elad and Tal, Ayellet}, title = {{LIMITR}: Leveraging Local Information for Medical Image-Text Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21165--21173} }
Multi-task View Synthesis with Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Shuhong and Bao, Zhipeng and Hebert, Martial and Wang, Yu-Xiong}, title = {Multi-task View Synthesis with Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21538--21549} }
Informative Data Mining for One-Shot Cross-Domain Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yuxi and Liang, Jian and Xiao, Jun and Mei, Shuqi and Yang, Yuran and Zhang, Zhaoxiang}, title = {Informative Data Mining for One-Shot Cross-Domain Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1064--1074} }
Efficient Unified Demosaicing for Bayer and Non-Bayer Patterned Image Sensors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Haechang and Park, Dongwon and Jeong, Wongi and Kim, Kijeong and Je, Hyunwoo and Ryu, Dongil and Chun, Se Young}, title = {Efficient Unified Demosaicing for {Bayer} and Non-{Bayer} Patterned Image Sensors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12750--12759} }
Visual Traffic Knowledge Graph Generation from Scene Images-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Yunfei and Yin, Fei and Li, Xiao-hui and Yan, Xudong and Xue, Tao and Mei, Shuqi and Liu, Cheng-Lin}, title = {Visual Traffic Knowledge Graph Generation from Scene Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21604--21613} }
Householder Projector for Unsupervised Latent Semantics Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Yue and Zhang, Jichao and Sebe, Nicu and Wang, Wei}, title = {Householder Projector for Unsupervised Latent Semantics Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7712--7722} }
Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Long and Dong, Jiangxin and Tang, Jinhui and Pan, Jinshan}, title = {Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13190--13199} }
Unsupervised Image Denoising in Real-World Scenarios via Self-Collaboration Parallel Generative Adversarial Branches-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Xin and Ren, Chao and Liu, Xiao and Huang, Jie and Lei, Yinjie}, title = {Unsupervised Image Denoising in Real-World Scenarios via Self-Collaboration Parallel Generative Adversarial Branches}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12642--12652} }
Bayesian Optimization Meets Self-Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, HyunJae and Song, Heon and Lee, Hyeonsoo and Lee, Gi-hyeon and Park, Suyeong and Yoo, Donggeun}, title = {Bayesian Optimization Meets Self-Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1696--1705} }
No Fear of Classifier Biases: Neural Collapse Inspired Federated Learning with Synthetic and Fixed Classifier-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zexi and Shang, Xinyi and He, Rui and Lin, Tao and Wu, Chao}, title = {No Fear of Classifier Biases: Neural Collapse Inspired Federated Learning with Synthetic and Fixed Classifier}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {5319--5329} }
MemorySeg: Online LiDAR Semantic Segmentation with a Latent Memory-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Enxu and Casas, Sergio and Urtasun, Raquel}, title = {{MemorySeg}: Online {LiDAR} Semantic Segmentation with a Latent Memory}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {745--754} }
Hashing Neural Video Decomposition with Multiplicative Residuals in Space-Time-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chan_2023_ICCV, author = {Chan, Cheng-Hung and Yuan, Cheng-Yang and Sun, Cheng and Chen, Hwann-Tzong}, title = {Hashing Neural Video Decomposition with Multiplicative Residuals in Space-Time}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7743--7753} }
Multimodal Variational Auto-encoder based Audio-Visual Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Mao_2023_ICCV, author = {Mao, Yuxin and Zhang, Jing and Xiang, Mochu and Zhong, Yiran and Dai, Yuchao}, title = {Multimodal Variational Auto-encoder based Audio-Visual Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {954--965} }
DynaMITe: Dynamic Query Bootstrapping for Multi-object Interactive Segmentation Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rana_2023_ICCV, author = {Rana, Amit Kumar and Mahadevan, Sabarinath and Hermans, Alexander and Leibe, Bastian}, title = {{DynaMITe}: Dynamic Query Bootstrapping for Multi-object Interactive Segmentation Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1043--1052} }
FRAug: Tackling Federated Learning with Non-IID Features via Representation Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Haokun and Frikha, Ahmed and Krompass, Denis and Gu, Jindong and Tresp, Volker}, title = {{FRAug}: Tackling Federated Learning with Non-{IID} Features via Representation Augmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4849--4859} }
Homography Guided Temporal Fusion for Road Line and Marking Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Shan and Nguyen, Chuong and Liu, Jiawei and Zhang, Kaihao and Luo, Wenhan and Zhang, Yanhao and Muthu, Sundaram and Maken, Fahira Afzal and Li, Hongdong}, title = {Homography Guided Temporal Fusion for Road Line and Marking Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1075--1085} }
NeuRBF: A Neural Fields Representation with Adaptive Radial Basis Functions-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zhang and Li, Zhong and Song, Liangchen and Chen, Lele and Yu, Jingyi and Yuan, Junsong and Xu, Yi}, title = {{NeuRBF}: A Neural Fields Representation with Adaptive Radial Basis Functions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4182--4194} }
OmnimatteRF: Robust Omnimatte with 3D Background Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Geng and Gao, Chen and Huang, Jia-Bin and Kim, Changil and Wang, Yipeng and Zwicker, Matthias and Saraf, Ayush}, title = {{OmnimatteRF}: Robust Omnimatte with {3D} Background Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {23471--23480} }
Self-supervised Image Denoising with Downsampled Invariance Loss and Conditional Blind-Spot Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jang_2023_ICCV, author = {Jang, Yeong Il and Lee, Keuntek and Park, Gu Yong and Kim, Seyun and Cho, Nam Ik}, title = {Self-supervised Image Denoising with Downsampled Invariance Loss and Conditional Blind-Spot Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12196--12205} }
Multi-granularity Interaction Simulation for Unsupervised Interactive Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Kehan and Zhao, Yian and Wang, Zhennan and Cheng, Zesen and Jin, Peng and Ji, Xiangyang and Yuan, Li and Liu, Chang and Chen, Jie}, title = {Multi-granularity Interaction Simulation for Unsupervised Interactive Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {666--676} }
RecursiveDet: End-to-End Region-Based Recursive Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Jing and Sun, Li and Li, Qingli}, title = {{RecursiveDet}: End-to-End Region-Based Recursive Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6307--6316} }
Bold but Cautious: Unlocking the Potential of Personalized Federated Learning through Cautiously Aggressive Collaboration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Xinghao and Liu, Xuefeng and Niu, Jianwei and Zhu, Guogang and Tang, Shaojie}, title = {Bold but Cautious: Unlocking the Potential of Personalized Federated Learning through Cautiously Aggressive Collaboration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19375--19384} }
ESSAformer: Efficient Transformer for Hyperspectral Image Super-resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Mingjin and Zhang, Chi and Zhang, Qiming and Guo, Jie and Gao, Xinbo and Zhang, Jing}, title = {{ESSAformer}: Efficient Transformer for Hyperspectral Image Super-resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {23073--23084} }
Generative Action Description Prompts for Skeleton-based Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiang_2023_ICCV, author = {Xiang, Wangmeng and Li, Chao and Zhou, Yuxuan and Wang, Biao and Zhang, Lei}, title = {Generative Action Description Prompts for Skeleton-based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {10276--10285} }
Structure Invariant Transformation for better Adversarial Transferability-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xiaosen and Zhang, Zeliang and Zhang, Jianping}, title = {Structure Invariant Transformation for better Adversarial Transferability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4607--4619} }
Thinking Image Color Aesthetics Assessment: Models, Datasets and Benchmarks-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Shuai and Ming, Anlong and Li, Yaqi and Sun, Jinyuan and Zheng, ShunTian and Ma, Huadong}, title = {Thinking Image Color Aesthetics Assessment: Models, Datasets and Benchmarks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21838--21847} }
Multi-body Depth and Camera Pose Estimation from Multiple Views-
[pdf]
[supp]
[bibtex]@InProceedings{Cin_2023_ICCV, author = {Cin, Andrea Porfiri Dal and Boracchi, Giacomo and Magri, Luca}, title = {Multi-body Depth and Camera Pose Estimation from Multiple Views}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17804--17814} }
DISeR: Designing Imaging Systems with Reinforcement Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Klinghoffer_2023_ICCV, author = {Klinghoffer, Tzofi and Tiwary, Kushagra and Behari, Nikhil and Agrawalla, Bhavya and Raskar, Ramesh}, title = {{DISeR}: Designing Imaging Systems with Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {23632--23642} }
The Euclidean Space is Evil: Hyperbolic Attribute Editing for Few-shot Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Lingxiao and Zhang, Yi and Wang, Shuhui}, title = {The {Euclidean} Space is Evil: Hyperbolic Attribute Editing for Few-shot Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22714--22724} }
FULLER: Unified Multi-modality Multi-task 3D Perception via Multi-level Gradient Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zhijian and Lin, Sihao and Liu, Guiyu and Luo, Mukun and Ye, Chaoqiang and Xu, Hang and Chang, Xiaojun and Liang, Xiaodan}, title = {{FULLER}: Unified Multi-modality Multi-task {3D} Perception via Multi-level Gradient Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {3502--3511} }
Transparent Shape from a Single View Polarization Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Mingqi and Xia, Chongkun and Yang, Zhendong and Huang, Junnan and Wang, Xueqian}, title = {Transparent Shape from a Single View Polarization Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9277--9286} }
Invariant Feature Regularization for Fair Face Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Jiali and Yue, Zhongqi and Tomoyuki, Kagaya and Tomoki, Suzuki and Jayashree, Karlekar and Pranata, Sugiri and Zhang, Hanwang}, title = {Invariant Feature Regularization for Fair Face Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20861--20870} }
Cross-Domain Product Representation Learning for Rich-Content E-Commerce-
[pdf]
[supp]
[bibtex]@InProceedings{Bai_2023_ICCV, author = {Bai, Xuehan and Li, Yan and Cheng, Yanhua and Yang, Wenjie and Chen, Quan and Li, Han}, title = {Cross-Domain Product Representation Learning for Rich-Content E-Commerce}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {5697--5706} }
DriveAdapter: Breaking the Coupling Barrier of Perception and Planning in End-to-End Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jia_2023_ICCV, author = {Jia, Xiaosong and Gao, Yulu and Chen, Li and Yan, Junchi and Liu, Patrick Langechuan and Li, Hongyang}, title = {{DriveAdapter}: Breaking the Coupling Barrier of Perception and Planning in End-to-End Autonomous Driving}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {7953--7963} }
General Planar Motion from a Pair of 3D Correspondences-
[pdf]
[supp]
[bibtex]@InProceedings{Dibene_2023_ICCV, author = {Dibene, Juan Carlos and Min, Zhixiang and Dunn, Enrique}, title = {General Planar Motion from a Pair of {3D} Correspondences}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {8060--8070} }
Single Depth-image 3D Reflection Symmetry and Shape Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Zhaoxuan and Dong, Bo and Li, Tong and Heide, Felix and Peers, Pieter and Yin, Baocai and Yang, Xin}, title = {Single Depth-image {3D} Reflection Symmetry and Shape Prediction}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {8896--8906} }
Local Context-Aware Active Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Tao and Lu, Cheng and Ling, Haibin}, title = {Local Context-Aware Active Domain Adaptation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {18634--18643} }
Deep Incubation: Training Large Models by Divide-and-Conquering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ni_2023_ICCV, author = {Ni, Zanlin and Wang, Yulin and Yu, Jiangwei and Jiang, Haojun and Cao, Yue and Huang, Gao}, title = {Deep Incubation: Training Large Models by Divide-and-Conquering}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {17335--17345} }
Downscaled Representation Matters: Improving Image Rescaling with Collaborative Downscaled Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Bingna and Guo, Yong and Jiang, Luoqian and Yu, Mianjie and Chen, Jian}, title = {Downscaled Representation Matters: Improving Image Rescaling with Collaborative Downscaled Images}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {12237--12247} }
Detection Transformer with Stable Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Shilong and Ren, Tianhe and Chen, Jiayu and Zeng, Zhaoyang and Zhang, Hao and Li, Feng and Li, Hongyang and Huang, Jun and Su, Hang and Zhu, Jun and Zhang, Lei}, title = {Detection Transformer with Stable Matching}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {6491--6500} }
Be Everywhere - Hear Everything (BEE): Audio Scene Reconstruction by Sparse Audio-Visual Samples-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Mingfei and Su, Kun and Shlizerman, Eli}, title = {Be Everywhere - Hear Everything ({BEE}): Audio Scene Reconstruction by Sparse Audio-Visual Samples}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {7853--7862} }
iVS-Net: Learning Human View Synthesis from Internet Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Junting and Fang, Qi and Yang, Tianshuo and Shuai, Qing and Qiao, Chengyu and Peng, Sida}, title = {{iVS-Net}: Learning Human View Synthesis from Internet Videos}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {22942--22951} }
Story Visualization by Online Text Augmentation with Context Memory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahn_2023_ICCV, author = {Ahn, Daechul and Kim, Daneul and Song, Gwangmo and Kim, Seung Hwan and Lee, Honglak and Kang, Dongyeop and Choi, Jonghyun}, title = {Story Visualization by Online Text Augmentation with Context Memory}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {3125--3135} }
Attention Discriminant Sampling for Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Cheng-Yao and Chou, Yu-Ying and Liu, Tyng-Luh}, title = {Attention Discriminant Sampling for Point Clouds}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {14429--14440} }
Global Balanced Experts for Federated Long-Tailed Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Zeng_2023_ICCV, author = {Zeng, Yaopei and Liu, Lei and Liu, Li and Shen, Li and Liu, Shaoguo and Wu, Baoyuan}, title = {Global Balanced Experts for Federated Long-Tailed Learning}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {4815--4825} }
All4One: Symbiotic Neighbour Contrastive Learning via Self-Attention and Redundancy Reduction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Estepa_2023_ICCV, author = {Estepa, Imanol G. and Sarasua, Ignacio and Nagarajan, Bhalaji and Radeva, Petia}, title = {{All4One}: Symbiotic Neighbour Contrastive Learning via Self-Attention and Redundancy Reduction}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {16243--16253} }
Contrastive Pseudo Learning for Open-World DeepFake Attribution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Zhimin and Chen, Shen and Yao, Taiping and Yin, Bangjie and Yi, Ran and Ding, Shouhong and Ma, Lizhuang}, title = {Contrastive Pseudo Learning for Open-World {DeepFake} Attribution}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {20882--20892} }
ICL-D3IE: In-Context Learning with Diverse Demonstrations Updating for Document Information Extraction-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Jiabang and Wang, Lei and Hu, Yi and Liu, Ning and Liu, Hui and Xu, Xing and Shen, Heng Tao}, title = {{ICL-D3IE}: In-Context Learning with Diverse Demonstrations Updating for Document Information Extraction}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {19485--19494} }
IHNet: Iterative Hierarchical Network Guided by High-Resolution Estimated Information for Scene Flow Estimation-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yun and Chi, Cheng and Lin, Min and Yang, Xin}, title = {{IHNet}: Iterative Hierarchical Network Guided by High-Resolution Estimated Information for Scene Flow Estimation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {10073--10082} }
SimNP: Learning Self-Similarity Priors Between Neural Points-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wewer_2023_ICCV, author = {Wewer, Christopher and Ilg, Eddy and Schiele, Bernt and Lenssen, Jan Eric}, title = {{SimNP}: Learning Self-Similarity Priors Between Neural Points}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {8841--8852} }
Beyond the Limitation of Monocular 3D Detector via Knowledge Distillation-
[pdf]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yiran and Yin, Dongshuo and Rong, Xuee and Sun, Xian and Diao, Wenhui and Li, Xinming}, title = {Beyond the Limitation of Monocular {3D} Detector via Knowledge Distillation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {9077--9086} }
Cascade-DETR: Delving into High-Quality Universal Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Mingqiao and Ke, Lei and Li, Siyuan and Tai, Yu-Wing and Tang, Chi-Keung and Danelljan, Martin and Yu, Fisher}, title = {{Cascade-DETR}: Delving into High-Quality Universal Object Detection}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {6704--6714} }
ACLS: Adaptive and Conditional Label Smoothing for Network Calibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Hyekang and Noh, Jongyoun and Oh, Youngmin and Baek, Donghyeon and Ham, Bumsub}, title = {{ACLS}: Adaptive and Conditional Label Smoothing for Network Calibration}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {3936--3945} }
EMR-MSF: Self-Supervised Recurrent Monocular Scene Flow Exploiting Ego-Motion Rigidity-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Zijie and Okutomi, Masatoshi}, title = {{EMR-MSF}: Self-Supervised Recurrent Monocular Scene Flow Exploiting Ego-Motion Rigidity}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {69--78} }
Evaluation and Improvement of Interpretability for Self-Explainable Part-Prototype Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Qihan and Xue, Mengqi and Huang, Wenqi and Zhang, Haofei and Song, Jie and Jing, Yongcheng and Song, Mingli}, title = {Evaluation and Improvement of Interpretability for Self-Explainable Part-Prototype Networks}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {2011--2020} }
Temporal-Coded Spiking Neural Networks with Dynamic Firing Threshold: Learning with Event-Driven Backpropagation-
[pdf]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Wenjie and Zhang, Malu and Qu, Hong and Belatreche, Ammar and Zhang, Jian and Chen, Hong}, title = {Temporal-Coded Spiking Neural Networks with Dynamic Firing Threshold: Learning with Event-Driven Backpropagation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {10552--10562} }
Mitigating Adversarial Vulnerability through Causal Parameter Estimation by Adversarial Double Machine Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Byung-Kwan and Kim, Junho and Ro, Yong Man}, title = {Mitigating Adversarial Vulnerability through Causal Parameter Estimation by Adversarial Double Machine Learning}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {4499--4509} }
Dynamic Token Pruning in Plain Vision Transformers for Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Quan and Zhang, Bowen and Liu, Jiajun and Liu, Fagui and Liu, Yifan}, title = {Dynamic Token Pruning in Plain Vision Transformers for Semantic Segmentation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {777--786} }
Shape Anchor Guided Holistic Indoor Scene Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Mingyue and Huan, Linxi and Xiong, Hanjiang and Shen, Shuhan and Zheng, Xianwei}, title = {Shape Anchor Guided Holistic Indoor Scene Understanding}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {21916--21926} }
Knowledge-Aware Federated Active Learning with Non-IID Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Yu-Tong and Shi, Ye and Yu, Baosheng and Wang, Jingya and Tao, Dacheng}, title = {Knowledge-Aware Federated Active Learning with {Non-IID} Data}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {22279--22289} }
PlankAssembly: Robust 3D Reconstruction from Three Orthographic Views with Learnt Shape Programs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Wentao and Zheng, Jia and Zhang, Zixin and Yuan, Xiaojun and Yin, Jian and Zhou, Zihan}, title = {{PlankAssembly}: Robust {3D} Reconstruction from Three Orthographic Views with Learnt Shape Programs}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {18495--18505} }
PODIA-3D: Domain Adaptation of 3D Generative Model Across Large Domain Gap Using Pose-Preserved Text-to-Image Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Gwanghyun and Jang, Ji Ha and Chun, Se Young}, title = {{PODIA-3D}: Domain Adaptation of {3D} Generative Model Across Large Domain Gap Using Pose-Preserved Text-to-Image Diffusion}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {22603--22612} }
Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Nair_2023_ICCV, author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.}, title = {Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {20850--20860} }
DiffFit: Unlocking Transferability of Large Diffusion Models via Simple Parameter-efficient Fine-Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Enze and Yao, Lewei and Shi, Han and Liu, Zhili and Zhou, Daquan and Liu, Zhaoqiang and Li, Jiawei and Li, Zhenguo}, title = {{DiffFit}: Unlocking Transferability of Large Diffusion Models via Simple Parameter-efficient Fine-Tuning}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {4230--4239} }
NeO 360: Neural Fields for Sparse View Synthesis of Outdoor Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Irshad_2023_ICCV, author = {Irshad, Muhammad Zubair and Zakharov, Sergey and Liu, Katherine and Guizilini, Vitor and Kollar, Thomas and Gaidon, Adrien and Kira, Zsolt and Ambrus, Rares}, title = {{NeO 360}: Neural Fields for Sparse View Synthesis of Outdoor Scenes}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {9187--9198} }
UnLoc: A Unified Framework for Video Localization Tasks-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, Shen and Xiong, Xuehan and Nagrani, Arsha and Arnab, Anurag and Wang, Zhonghao and Ge, Weina and Ross, David and Schmid, Cordelia}, title = {{UnLoc}: A Unified Framework for Video Localization Tasks}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {13623--13633} }
QD-BEV : Quantization-aware View-guided Distillation for Multi-view 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yifan and Dong, Zhen and Yang, Huanrui and Lu, Ming and Tseng, Cheng-Ching and Du, Yuan and Keutzer, Kurt and Du, Li and Zhang, Shanghang}, title = {{QD-BEV} : Quantization-aware View-guided Distillation for Multi-view {3D} Object Detection}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {3825--3835} }
Fast Inference and Update of Probabilistic Density Estimation on Trajectory Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Maeda_2023_ICCV, author = {Maeda, Takahiro and Ukita, Norimichi}, title = {Fast Inference and Update of Probabilistic Density Estimation on Trajectory Prediction}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {9795--9805} }
CLIPascene: Scene Sketching with Different Types and Levels of Abstraction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vinker_2023_ICCV, author = {Vinker, Yael and Alaluf, Yuval and Cohen-Or, Daniel and Shamir, Ariel}, title = {{CLIPascene}: Scene Sketching with Different Types and Levels of Abstraction}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {4146--4156} }
Vision Grid Transformer for Document Layout Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Da_2023_ICCV, author = {Da, Cheng and Luo, Chuwei and Zheng, Qi and Yao, Cong}, title = {Vision Grid Transformer for Document Layout Analysis}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {19462--19472} }
Multi-Directional Subspace Editing in Style-Space-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Naveh_2023_ICCV, author = {Naveh, Chen}, title = {Multi-Directional Subspace Editing in Style-Space}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {7138--7148} }
Adaptive Superpixel for Active Learning in Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Hoyoung and Oh, Minhyeon and Hwang, Sehyun and Kwak, Suha and Ok, Jungseul}, title = {Adaptive Superpixel for Active Learning in Semantic Segmentation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {943--953} }
Adaptive Spiral Layers for Efficient 3D Representation Learning on Meshes-
[pdf]
[supp]
[bibtex]@InProceedings{Babiloni_2023_ICCV, author = {Babiloni, Francesca and Maggioni, Matteo and Tanay, Thomas and Deng, Jiankang and Leonardis, Ales and Zafeiriou, Stefanos}, title = {Adaptive Spiral Layers for Efficient {3D} Representation Learning on Meshes}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {14620--14631} }
Parametric Information Maximization for Generalized Category Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chiaroni_2023_ICCV, author = {Chiaroni, Florent and Dolz, Jose and Masud, Ziko Imtiaz and Mitiche, Amar and Ben Ayed, Ismail}, title = {Parametric Information Maximization for Generalized Category Discovery}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {1729--1739} }
Convex Decomposition of Indoor Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vavilala_2023_ICCV, author = {Vavilala, Vaibhav and Forsyth, David}, title = {Convex Decomposition of Indoor Scenes}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {9176--9186} }
Toward Unsupervised Realistic Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yuwei and Ho, Chih-Hui and Vasconcelos, Nuno}, title = {Toward Unsupervised Realistic Visual Question Answering}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {15613--15624} }
A Generalist Framework for Panoptic Segmentation of Images and Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Ting and Li, Lala and Saxena, Saurabh and Hinton, Geoffrey and Fleet, David J.}, title = {A Generalist Framework for Panoptic Segmentation of Images and Videos}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {909--919} }
DALL-Eval: Probing the Reasoning Skills and Social Biases of Text-to-Image Generation Models-
[pdf]
[supp]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Jaemin and Zala, Abhay and Bansal, Mohit}, title = {{DALL-Eval}: Probing the Reasoning Skills and Social Biases of Text-to-Image Generation Models}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {3043--3054} }
Video OWL-ViT: Temporally-consistent Open-world Localization in Video-
[pdf]
[supp]
[bibtex]@InProceedings{Heigold_2023_ICCV, author = {Heigold, Georg and Minderer, Matthias and Gritsenko, Alexey and Bewley, Alex and Keysers, Daniel and Lu{\v{c}}i{\'c}, Mario and Yu, Fisher and Kipf, Thomas}, title = {Video {OWL-ViT}: Temporally-consistent Open-world Localization in Video}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {13802--13811} }
Few Shot Font Generation Via Transferring Similarity Guided Global Style and Quantization Local Style-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV, author = {Pan, Wei and Zhu, Anna and Zhou, Xinyu and Iwana, Brian Kenji and Li, Shilin}, title = {Few Shot Font Generation Via Transferring Similarity Guided Global Style and Quantization Local Style}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {19506--19516} }
Differentiable Transportation Pruning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yunqiang and van Gemert, Jan C. and Hoefler, Torsten and Moons, Bert and Eleftheriou, Evangelos and Verhoef, Bram-Ernst}, title = {Differentiable Transportation Pruning}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {16957--16967} }
Physics-Driven Turbulence Image Restoration with Stochastic Refinement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jaiswal_2023_ICCV, author = {Jaiswal, Ajay and Zhang, Xingguang and Chan, Stanley H. and Wang, Zhangyang}, title = {Physics-Driven Turbulence Image Restoration with Stochastic Refinement}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {12170--12181} }
Enhancing Non-line-of-sight Imaging via Learnable Inverse Kernel and Attention Mechanisms-
[pdf]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Yanhua and Shen, Siyuan and Wang, Zi and Huang, Binbin and Wang, Yuehan and Peng, Xingyue and Xia, Suan and Liu, Ping and Li, Ruiqian and Li, Shiying}, title = {Enhancing Non-line-of-sight Imaging via Learnable Inverse Kernel and Attention Mechanisms}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {10563--10573} }
DECO: Dense Estimation of 3D Human-Scene Contact In The Wild-
[pdf]
[supp]
[bibtex]@InProceedings{Tripathi_2023_ICCV, author = {Tripathi, Shashank and Chatterjee, Agniv and Passy, Jean-Claude and Yi, Hongwei and Tzionas, Dimitrios and Black, Michael J.}, title = {{DECO}: Dense Estimation of {3D} Human-Scene Contact In The Wild}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {8001--8013} }
Scale-Aware Modulation Meet Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Weifeng and Wu, Ziheng and Chen, Jiayu and Huang, Jun and Jin, Lianwen}, title = {Scale-Aware Modulation Meet Transformer}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {6015--6026} }
Large Selective Kernel Network for Remote Sensing Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yuxuan and Hou, Qibin and Zheng, Zhaohui and Cheng, Ming-Ming and Yang, Jian and Li, Xiang}, title = {Large Selective Kernel Network for Remote Sensing Object Detection}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {16794--16805} }
PlaneRecTR: Unified Query Learning for 3D Plane Recovery from a Single View-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Jingjia and Zhi, Shuaifeng and Xu, Kai}, title = {{PlaneRecTR}: Unified Query Learning for {3D} Plane Recovery from a Single View}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {9377--9386} }
EigenTrajectory: Low-Rank Descriptors for Multi-Modal Trajectory Forecasting-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bae_2023_ICCV, author = {Bae, Inhwan and Oh, Jean and Jeon, Hae-Gon}, title = {{EigenTrajectory}: Low-Rank Descriptors for Multi-Modal Trajectory Forecasting}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {10017--10029} }
I-ViT: Integer-only Quantization for Efficient Vision Transformer Inference-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhikai and Gu, Qingyi}, title = {{I-ViT}: Integer-only Quantization for Efficient Vision Transformer Inference}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {17065--17075} }
SUMMIT: Source-Free Adaptation of Uni-Modal Models to Multi-Modal Targets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Simons_2023_ICCV, author = {Simons, Cody and Raychaudhuri, Dripta S. and Ahmed, Sk Miraj and You, Suya and Karydis, Konstantinos and Roy-Chowdhury, Amit K.}, title = {{SUMMIT}: Source-Free Adaptation of Uni-Modal Models to Multi-Modal Targets}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {1239--1249} }
Learning a More Continuous Zero Level Set in Unsigned Distance Fields through Level Set Projection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Junsheng and Ma, Baorui and Li, Shujuan and Liu, Yu-Shen and Han, Zhizhong}, title = {Learning a More Continuous Zero Level Set in Unsigned Distance Fields through Level Set Projection}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {3181--3192} }
Video-FocalNets: Spatio-Temporal Focal Modulation for Video Action Recognition-
[pdf]
[bibtex]@InProceedings{Wasim_2023_ICCV, author = {Wasim, Syed Talal and Khattak, Muhammad Uzair and Naseer, Muzammal and Khan, Salman and Shah, Mubarak and Khan, Fahad Shahbaz}, title = {{Video-FocalNets}: Spatio-Temporal Focal Modulation for Video Action Recognition}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {13778--13789} }
To Adapt or Not to Adapt? Real-Time Adaptation for Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Colomer_2023_ICCV, author = {Colomer, Marc Botet and Dovesi, Pier Luigi and Panagiotakopoulos, Theodoros and Carvalho, Joao Frederico and H{\"a}renstam-Nielsen, Linus and Azizpour, Hossein and Kjellstr{\"o}m, Hedvig and Cremers, Daniel and Poggi, Matteo}, title = {To Adapt or Not to Adapt? Real-Time Adaptation for Semantic Segmentation}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {16548--16559} }
Hidden Biases of End-to-End Driving Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jaeger_2023_ICCV, author = {Jaeger, Bernhard and Chitta, Kashyap and Geiger, Andreas}, title = {Hidden Biases of End-to-End Driving Models}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {8240--8249} }
HairNeRF: Geometry-Aware Image Synthesis for Hairstyle Transfer-
[pdf]
[bibtex]@InProceedings{Chang_2023_ICCV, author = {Chang, Seunggyu and Kim, Gihoon and Kim, Hayeon}, title = {{HairNeRF}: Geometry-Aware Image Synthesis for Hairstyle Transfer}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {2448--2458} }
Strivec: Sparse Tri-Vector Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Quankai and Xu, Qiangeng and Su, Hao and Neumann, Ulrich and Xu, Zexiang}, title = {Strivec: Sparse Tri-Vector Radiance Fields}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {17569--17579} }
Multiscale Representation for Real-Time Anti-Aliasing Neural Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Dongting and Zhang, Zhenkai and Hou, Tingbo and Liu, Tongliang and Fu, Huan and Gong, Mingming}, title = {Multiscale Representation for Real-Time Anti-Aliasing Neural Rendering}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {17772--17783} }
Borrowing Knowledge From Pre-trained Language Model: A New Data-efficient Visual Learning Paradigm-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Wenxuan and Li, Shuang and Zhang, JinMing and Liu, Chi Harold and Kang, Jingxuan and Wang, Yulin and Huang, Gao}, title = {Borrowing Knowledge From Pre-trained Language Model: A New Data-efficient Visual Learning Paradigm}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {18786--18797} }
GETAvatar: Generative Textured Meshes for Animatable Human Avatars-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Xuanmeng and Zhang, Jianfeng and Chacko, Rohan and Xu, Hongyi and Song, Guoxian and Yang, Yi and Feng, Jiashi}, title = {{GETAvatar}: Generative Textured Meshes for Animatable Human Avatars}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {2273--2282} }
Tracking without Label: Unsupervised Multiple Object Tracking via Contrastive Similarity Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meng_2023_ICCV, author = {Meng, Sha and Shao, Dian and Guo, Jiacheng and Gao, Shan}, title = {Tracking without Label: Unsupervised Multiple Object Tracking via Contrastive Similarity Learning}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {16264--16273} }
PIDRo: Parallel Isomeric Attention with Dynamic Routing for Text-Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Guan_2023_ICCV, author = {Guan, Peiyan and Pei, Renjing and Shao, Bin and Liu, Jianzhuang and Li, Weimian and Gu, Jiaxi and Xu, Hang and Xu, Songcen and Yan, Youliang and Lam, Edmund Y.}, title = {{PIDRo}: Parallel Isomeric Attention with Dynamic Routing for Text-Video Retrieval}, booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})}, month = oct, year = {2023}, pages = {11164--11173} }
Re-mine, Learn and Reason: Exploring the Cross-modal Semantic Correlations for Language-guided HOI detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Yichao and Tang, Qingfei and Yang, Feng and Su, Xiu and You, Shan and Lu, Xiaobo and Xu, Chang},
  title     = {Re-mine, Learn and Reason: Exploring the Cross-modal Semantic Correlations for Language-guided {HOI} detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23492--23503},
}
Strata-NeRF: Neural Radiance Fields for Stratified Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhiman_2023_ICCV,
  author    = {Dhiman, Ankit and Srinath, R and Rangwani, Harsh and Parihar, Rishubh and Boregowda, Lokesh R and Sridhar, Srinath and Babu, R Venkatesh},
  title     = {{Strata-NeRF}: Neural Radiance Fields for Stratified Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17603--17614},
}
StylerDALLE: Language-Guided Style Transfer Using a Vector-Quantized Tokenizer of a Large-Scale Generative Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Zipeng and Sangineto, Enver and Sebe, Nicu},
  title     = {{StylerDALLE}: Language-Guided Style Transfer Using a Vector-Quantized Tokenizer of a Large-Scale Generative Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7601--7611},
}
3D-aware Blending with Generative NeRFs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hyunsu and Lee, Gayoung and Choi, Yunjey and Kim, Jin-Hwa and Zhu, Jun-Yan},
  title     = {{3D}-aware Blending with Generative {NeRFs}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22906--22918},
}
Multi-Modal Gated Mixture of Local-to-Global Experts for Dynamic Image Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Bing and Sun, Yiming and Zhu, Pengfei and Hu, Qinghua},
  title     = {Multi-Modal Gated Mixture of Local-to-Global Experts for Dynamic Image Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23555--23564},
}
Deep Image Harmonization with Learnable Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Li and Cao, Junyan and Cong, Wenyan and Zhang, Liqing},
  title     = {Deep Image Harmonization with Learnable Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7482--7491},
}
DELFlow: Dense Efficient Learning of Scene Flow for Large-Scale Point Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Chensheng and Wang, Guangming and Lo, Xian Wan and Wu, Xinrui and Xu, Chenfeng and Tomizuka, Masayoshi and Zhan, Wei and Wang, Hesheng},
  title     = {{DELFlow}: Dense Efficient Learning of Scene Flow for Large-Scale Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16901--16910},
}
RFD-ECNet: Extreme Underwater Image Compression with Reference to Feature Dictionary-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Mengyao and Shen, Liquan and Ye, Peng and Feng, Guorui and Wang, Zheyin},
  title     = {{RFD-ECNet}: Extreme Underwater Image Compression with Reference to Feature Dictionary},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12980--12989},
}
E^2VPT: An Effective and Efficient Approach for Visual Prompt Tuning-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2023_ICCV,
  author    = {Han, Cheng and Wang, Qifan and Cui, Yiming and Cao, Zhiwen and Wang, Wenguan and Qi, Siyuan and Liu, Dongfang},
  title     = {{E$^2$VPT}: An Effective and Efficient Approach for Visual Prompt Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17491--17502},
}
High-Resolution Document Shadow Removal via A Large-Scale Real-World Dataset and A Frequency-Aware Shadow Erasing Net-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Zinuo and Chen, Xuhang and Pun, Chi-Man and Cun, Xiaodong},
  title     = {High-Resolution Document Shadow Removal via A Large-Scale Real-World Dataset and A Frequency-Aware Shadow Erasing Net},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12449--12458},
}
Scalable Diffusion Models with Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peebles_2023_ICCV,
  author    = {Peebles, William and Xie, Saining},
  title     = {Scalable Diffusion Models with Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4195--4205},
}
MMST-ViT: Climate Change-aware Crop Yield Prediction via Multi-Modal Spatial-Temporal Vision Transformer-
[pdf]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Fudong and Crawford, Summer and Guillot, Kaleb and Zhang, Yihe and Chen, Yan and Yuan, Xu and Chen, Li and Williams, Shelby and Minvielle, Robert and Xiao, Xiangming and Gholson, Drew and Ashwell, Nicolas and Setiyono, Tri and Tubana, Brenda and Peng, Lu and Bayoumi, Magdy and Tzeng, Nian-Feng},
  title     = {{MMST-ViT}: Climate Change-aware Crop Yield Prediction via Multi-Modal Spatial-Temporal Vision Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5774--5784},
}
From Knowledge Distillation to Self-Knowledge Distillation: A Unified Approach with Normalized Loss and Customized Soft Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Zhendong and Zeng, Ailing and Li, Zhe and Zhang, Tianke and Yuan, Chun and Li, Yu},
  title     = {From Knowledge Distillation to Self-Knowledge Distillation: A Unified Approach with Normalized Loss and Customized Soft Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17185--17194},
}
SILT: Shadow-Aware Iterative Label Tuning for Learning to Detect Shadows from Noisy Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Han and Wang, Tianyu and Hu, Xiaowei and Fu, Chi-Wing},
  title     = {{SILT}: Shadow-Aware Iterative Label Tuning for Learning to Detect Shadows from Noisy Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12687--12698},
}
Implicit Autoencoder for Point-Cloud Self-Supervised Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Siming and Yang, Zhenpei and Li, Haoxiang and Song, Chen and Guan, Li and Kang, Hao and Hua, Gang and Huang, Qixing},
  title     = {Implicit Autoencoder for Point-Cloud Self-Supervised Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14530--14542},
}
Grounded Image Text Matching with Mismatched Relation Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yu and Wei, Yana and Wang, Haozhe and Liu, Yongfei and Yang, Sibei and He, Xuming},
  title     = {Grounded Image Text Matching with Mismatched Relation Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2976--2987},
}
UniKD: Universal Knowledge Distillation for Mimicking Homogeneous or Heterogeneous Object Detectors-
[pdf]
[supp]
[bibtex]@InProceedings{Lao_2023_ICCV,
  author    = {Lao, Shanshan and Song, Guanglu and Liu, Boxiao and Liu, Yu and Yang, Yujiu},
  title     = {{UniKD}: Universal Knowledge Distillation for Mimicking Homogeneous or Heterogeneous Object Detectors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6362--6372},
}
Speech4Mesh: Speech-Assisted Monocular 3D Facial Reconstruction for Speech-Driven 3D Facial Animation-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_ICCV,
  author    = {He, Shan and He, Haonan and Yang, Shuo and Wu, Xiaoyan and Xia, Pengcheng and Yin, Bing and Liu, Cong and Dai, Lirong and Xu, Chang},
  title     = {{Speech4Mesh}: Speech-Assisted Monocular {3D} Facial Reconstruction for Speech-Driven {3D} Facial Animation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14192--14202},
}
BoxDiff: Text-to-Image Synthesis with Training-Free Box-Constrained Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Jinheng and Li, Yuexiang and Huang, Yawen and Liu, Haozhe and Zhang, Wentian and Zheng, Yefeng and Shou, Mike Zheng},
  title     = {{BoxDiff}: Text-to-Image Synthesis with Training-Free Box-Constrained Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7452--7461},
}
Generalizing Neural Human Fitting to Unseen Poses With Articulated SE(3) Equivariance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Haiwen and Kulits, Peter and Liu, Shichen and Black, Michael J. and Abrevaya, Victoria Fernandez},
  title     = {Generalizing Neural Human Fitting to Unseen Poses With Articulated {SE(3)} Equivariance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7977--7988},
}
Rapid Network Adaptation: Learning to Adapt Neural Networks Using Test-Time Feedback-
[pdf]
[bibtex]@InProceedings{Yeo_2023_ICCV,
  author    = {Yeo, Teresa and Kar, O{\u{g}}uzhan Fatih and Sodagar, Zahra and Zamir, Amir},
  title     = {Rapid Network Adaptation: Learning to Adapt Neural Networks Using Test-Time Feedback},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4674--4687},
}
Theoretical and Numerical Analysis of 3D Reconstruction Using Point and Line Incidences-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rydell_2023_ICCV,
  author    = {Rydell, Felix and Shehu, Elima and Torres, Ang{\'e}lica},
  title     = {Theoretical and Numerical Analysis of {3D} Reconstruction Using Point and Line Incidences},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3748--3757},
}
Explaining Adversarial Robustness of Neural Networks from Clustering Effect Perspective-
[pdf]
[bibtex]@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Yulin and Zhang, Xiaoyu and Lou, Jian and Ma, Xu and Wang, Zilong and Chen, Xiaofeng},
  title     = {Explaining Adversarial Robustness of Neural Networks from Clustering Effect Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4522--4531},
}
Leaping Into Memories: Space-Time Deep Feature Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stergiou_2023_ICCV,
  author    = {Stergiou, Alexandros and Deligiannis, Nikos},
  title     = {Leaping Into Memories: Space-Time Deep Feature Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1966--1976},
}
Improving Generalization in Visual Reinforcement Learning via Conflict-aware Gradient Agreement Augmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Siao and Chen, Zhaoyu and Liu, Yang and Wang, Yuzheng and Yang, Dingkang and Zhao, Zhile and Zhou, Ziqing and Yi, Xie and Li, Wei and Zhang, Wenqiang and Gan, Zhongxue},
  title     = {Improving Generalization in Visual Reinforcement Learning via Conflict-aware Gradient Agreement Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23436--23446},
}
Graph Matching with Bi-level Noisy Correspondence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Yijie and Yang, Mouxing and Yu, Jun and Hu, Peng and Zhang, Changqing and Peng, Xi},
  title     = {Graph Matching with Bi-level Noisy Correspondence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23362--23371},
}
Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Kun and Wang, Le and Zhou, Sanping and Hua, Gang and Tang, Wei},
  title     = {Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action Localization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10160--10169},
}
InfiniCity: Infinite-Scale City Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Chieh Hubert and Lee, Hsin-Ying and Menapace, Willi and Chai, Menglei and Siarohin, Aliaksandr and Yang, Ming-Hsuan and Tulyakov, Sergey},
  title     = {{InfiniCity}: Infinite-Scale City Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22808--22818},
}
OpenOccupancy: A Large Scale Benchmark for Surrounding Semantic Occupancy Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiaofeng and Zhu, Zheng and Xu, Wenbo and Zhang, Yunpeng and Wei, Yi and Chi, Xu and Ye, Yun and Du, Dalong and Lu, Jiwen and Wang, Xingang},
  title     = {{OpenOccupancy}: A Large Scale Benchmark for Surrounding Semantic Occupancy Perception},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17850--17859},
}
Weakly-Supervised Text-Driven Contrastive Learning for Facial Behavior Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xiang and Wang, Taoyue and Li, Xiaotian and Yang, Huiyuan and Yin, Lijun},
  title     = {Weakly-Supervised Text-Driven Contrastive Learning for Facial Behavior Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20751--20762},
}
Box-based Refinement for Weakly Supervised and Unsupervised Localization Tasks-
[pdf]
[supp]
[bibtex]@InProceedings{Gomel_2023_ICCV,
  author    = {Gomel, Eyal and Shaharbany, Tal and Wolf, Lior},
  title     = {Box-based Refinement for Weakly Supervised and Unsupervised Localization Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16044--16054},
}
Activate and Reject: Towards Safe Domain Generalization under Category Shift-
[pdf]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Chaoqi and Tang, Luyao and Tao, Leitian and Zhou, Hong-Yu and Huang, Yue and Han, Xiaoguang and Yu, Yizhou},
  title     = {Activate and Reject: Towards Safe Domain Generalization under Category Shift},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11552--11563},
}
PRIOR: Prototype Representation Joint Learning from Medical Images and Reports-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Pujin and Lin, Li and Lyu, Junyan and Huang, Yijin and Luo, Wenhan and Tang, Xiaoying},
  title     = {{PRIOR}: Prototype Representation Joint Learning from Medical Images and Reports},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21361--21371},
}
Dynamic Mesh Recovery from Partial Point Cloud Sequence-
[pdf]
[supp]
[bibtex]@InProceedings{Jang_2023_ICCV,
  author    = {Jang, Hojun and Kim, Minkwan and Bae, Jinseok and Kim, Young Min},
  title     = {Dynamic Mesh Recovery from Partial Point Cloud Sequence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15074--15084},
}
WDiscOOD: Out-of-Distribution Detection via Whitened Linear Discriminant Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yiye and Lin, Yunzhi and Xu, Ruinian and Vela, Patricio A.},
  title     = {{WDiscOOD}: Out-of-Distribution Detection via Whitened Linear Discriminant Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5298--5307},
}
Boosting Few-shot Action Recognition with Graph-guided Hybrid Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xing_2023_ICCV,
  author    = {Xing, Jiazheng and Wang, Mengmeng and Ruan, Yudi and Chen, Bofan and Guo, Yaowei and Mu, Boyu and Dai, Guang and Wang, Jingdong and Liu, Yong},
  title     = {Boosting Few-shot Action Recognition with Graph-guided Hybrid Matching},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1740--1750},
}
Neural Deformable Models for 3D Bi-Ventricular Heart Shape Reconstruction and Modeling from 2D Sparse Cardiac Magnetic Resonance Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Meng and Yang, Dong and Kanski, Mikael and Axel, Leon and Metaxas, Dimitris},
  title     = {Neural Deformable Models for {3D} Bi-Ventricular Heart Shape Reconstruction and Modeling from {2D} Sparse Cardiac Magnetic Resonance Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14247--14256},
}
Vision HGNN: An Image is More than a Graph of Nodes-
[pdf]
[bibtex]@InProceedings{Han_2023_ICCV,
  author    = {Han, Yan and Wang, Peihao and Kundu, Souvik and Ding, Ying and Wang, Zhangyang},
  title     = {Vision {HGNN}: An Image is More than a Graph of Nodes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19878--19888},
}
Nonrigid Object Contact Estimation With Regional Unwrapping Transformer-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Wei and Zhao, Zimeng and Li, Shiying and Zuo, Binghui and Wang, Yangang},
  title     = {Nonrigid Object Contact Estimation With Regional Unwrapping Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9342--9351},
}
Diffusion in Style-
[pdf]
[supp]
[bibtex]@InProceedings{Everaert_2023_ICCV,
  author    = {Everaert, Martin Nicolas and Bocchio, Marco and Arpa, Sami and S{\"u}sstrunk, Sabine and Achanta, Radhakrishna},
  title     = {Diffusion in Style},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2251--2261},
}
FunnyBirds: A Synthetic Vision Dataset for a Part-Based Analysis of Explainable AI Methods-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hesse_2023_ICCV,
  author    = {Hesse, Robin and Schaub-Meyer, Simone and Roth, Stefan},
  title     = {{FunnyBirds}: A Synthetic Vision Dataset for a Part-Based Analysis of Explainable {AI} Methods},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3981--3991},
}
Deformable Neural Radiance Fields using RGB and Event Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Qi and Paudel, Danda Pani and Chhatkuli, Ajad and Van Gool, Luc},
  title     = {Deformable Neural Radiance Fields using {RGB} and Event Cameras},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3590--3600},
}
BeLFusion: Latent Diffusion for Behavior-Driven Human Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Barquero_2023_ICCV,
  author    = {Barquero, German and Escalera, Sergio and Palmero, Cristina},
  title     = {{BeLFusion}: Latent Diffusion for Behavior-Driven Human Motion Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2317--2327},
}
Semi-supervised Semantics-guided Adversarial Training for Robust Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Jiao_2023_ICCV,
  author    = {Jiao, Ruochen and Liu, Xiangguo and Sato, Takami and Chen, Qi Alfred and Zhu, Qi},
  title     = {Semi-supervised Semantics-guided Adversarial Training for Robust Trajectory Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8207--8217},
}
Linear-Covariance Loss for End-to-End Learning of 6D Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Fulin and Hu, Yinlin and Salzmann, Mathieu},
  title     = {Linear-Covariance Loss for End-to-End Learning of {6D} Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14107--14117},
}
RLSAC: Reinforcement Learning Enhanced Sample Consensus for End-to-End Robust Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nie_2023_ICCV,
  author    = {Nie, Chang and Wang, Guangming and Liu, Zhe and Cavalli, Luca and Pollefeys, Marc and Wang, Hesheng},
  title     = {{RLSAC}: Reinforcement Learning Enhanced Sample Consensus for End-to-End Robust Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9891--9900},
}
CleanCLIP: Mitigating Data Poisoning Attacks in Multimodal Contrastive Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bansal_2023_ICCV,
  author    = {Bansal, Hritik and Singhi, Nishad and Yang, Yu and Yin, Fan and Grover, Aditya and Chang, Kai-Wei},
  title     = {{CleanCLIP}: Mitigating Data Poisoning Attacks in Multimodal Contrastive Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {112--123},
}
Multi-Frequency Representation Enhancement with Privilege Information for Video Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Fei and Zhang, Linfeng and Liu, Zikun and Lei, Juan and Li, Zhenbo},
  title     = {Multi-Frequency Representation Enhancement with Privilege Information for Video Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12814--12825},
}
Self-supervised Pre-training for Mirror Detection-
[pdf]
[bibtex]@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Jiaying and Lau, Rynson W. H.},
  title     = {Self-supervised Pre-training for Mirror Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12227--12236},
}
GlowGAN: Unsupervised Learning of HDR Images from LDR Images in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Chao and Serrano, Ana and Pan, Xingang and Chen, Bin and Myszkowski, Karol and Seidel, Hans-Peter and Theobalt, Christian and Leimk{\"u}hler, Thomas},
  title     = {{GlowGAN}: Unsupervised Learning of {HDR} Images from {LDR} Images in the Wild},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10509--10519},
}
Cumulative Spatial Knowledge Distillation for Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Borui and Song, Renjie and Liang, Jiajun},
  title     = {Cumulative Spatial Knowledge Distillation for Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6146--6155},
}
Dual Pseudo-Labels Interactive Self-Training for Semi-Supervised Visible-Infrared Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Jiangming and Zhang, Yachao and Yin, Xiangbo and Xie, Yuan and Zhang, Zhizhong and Fan, Jianping and Shi, Zhongchao and Qu, Yanyun},
  title     = {Dual Pseudo-Labels Interactive Self-Training for Semi-Supervised Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11218--11228},
}
Less is More: Focus Attention for Efficient DETR-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Dehua and Dong, Wenhui and Hu, Hailin and Chen, Xinghao and Wang, Yunhe},
  title     = {Less is More: Focus Attention for Efficient {DETR}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6674--6683},
}
Efficient Controllable Multi-Task Architectures-
[pdf]
[arXiv]
[bibtex]@InProceedings{Aich_2023_ICCV,
  author    = {Aich, Abhishek and Schulter, Samuel and Roy-Chowdhury, Amit K. and Chandraker, Manmohan and Suh, Yumin},
  title     = {Efficient Controllable Multi-Task Architectures},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5740--5751},
}
HumanSD: A Native Skeleton-Guided Diffusion Model for Human Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ju_2023_ICCV,
  author    = {Ju, Xuan and Zeng, Ailing and Zhao, Chenchen and Wang, Jianan and Zhang, Lei and Xu, Qiang},
  title     = {{HumanSD}: A Native Skeleton-Guided Diffusion Model for Human Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15988--15998},
}
Lens Parameter Estimation for Realistic Depth of Field Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Piche-Meunier_2023_ICCV,
  author    = {Pich{\'e}-Meunier, Dominique and Hold-Geoffroy, Yannick and Zhang, Jianming and Lalonde, Jean-Fran{\c{c}}ois},
  title     = {Lens Parameter Estimation for Realistic Depth of Field Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {499--508},
}
Learned Compressive Representations for Single-Photon 3D Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Gutierrez-Barragan_2023_ICCV,
  author    = {Gutierrez-Barragan, Felipe and Mu, Fangzhou and Ardelean, Andrei and Ingle, Atul and Bruschini, Claudio and Charbon, Edoardo and Li, Yin and Gupta, Mohit and Velten, Andreas},
  title     = {Learned Compressive Representations for Single-Photon {3D} Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10756--10766},
}
Alignment-free HDR Deghosting with Semantics Consistent Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tel_2023_ICCV,
  author    = {Tel, Steven and Wu, Zongwei and Zhang, Yulun and Heyrman, Barth{\'e}l{\'e}my and Demonceaux, C{\'e}dric and Timofte, Radu and Ginhac, Dominique},
  title     = {Alignment-free {HDR} Deghosting with Semantics Consistent Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12836--12845},
}
Semantic-Aware Implicit Template Learning via Part Deformation Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Sihyeon and Joo, Minseok and Lee, Jaewon and Ko, Juyeon and Cha, Juhan and Kim, Hyunwoo J.},
  title     = {Semantic-Aware Implicit Template Learning via Part Deformation Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {593--603},
}
HRS-Bench: Holistic, Reliable and Scalable Benchmark for Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Bakr_2023_ICCV,
  author    = {Bakr, Eslam Mohamed and Sun, Pengzhan and Shen, Xiaoqian and Khan, Faizan Farooq and Li, Li Erran and Elhoseiny, Mohamed},
  title     = {{HRS-Bench}: Holistic, Reliable and Scalable Benchmark for Text-to-Image Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20041--20053},
}
Multi3DRefer: Grounding Text Description to Multiple 3D Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yiming and Gong, ZeMing and Chang, Angel X.},
  title     = {{Multi3DRefer}: Grounding Text Description to Multiple {3D} Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15225--15236},
}
Examining Autoexposure for Challenging Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tedla_2023_ICCV,
  author    = {Tedla, SaiKiran and Yang, Beixuan and Brown, Michael S.},
  title     = {Examining Autoexposure for Challenging Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13076--13085},
}
DiffCloth: Diffusion Based Garment Synthesis and Manipulation via Structural Cross-modal Semantic Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xujie and Yang, Binbin and Kampffmeyer, Michael C. and Zhang, Wenqing and Zhang, Shiyue and Lu, Guansong and Lin, Liang and Xu, Hang and Liang, Xiaodan},
  title     = {{DiffCloth}: Diffusion Based Garment Synthesis and Manipulation via Structural Cross-modal Semantic Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23154--23163},
}
Improved Visual Fine-tuning with Natural Language Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Junyang and Xu, Yuanhong and Hu, Juhua and Yan, Ming and Sang, Jitao and Qian, Qi},
  title     = {Improved Visual Fine-tuning with Natural Language Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11899--11909},
}
Person Re-Identification without Identification via Event anonymization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ahmad_2023_ICCV,
  author    = {Ahmad, Shafiq and Morerio, Pietro and Del Bue, Alessio},
  title     = {Person Re-Identification without Identification via Event anonymization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11132--11141},
}
GRAM-HD: 3D-Consistent Image Generation at High Resolution with Generative Radiance Manifolds-
[pdf]
[supp]
[bibtex]@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Jianfeng and Yang, Jiaolong and Deng, Yu and Tong, Xin},
  title     = {{GRAM-HD}: {3D}-Consistent Image Generation at High Resolution with Generative Radiance Manifolds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2195--2205},
}
Small Object Detection via Coarse-to-fine Proposal Generation and Imitation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Xiang and Cheng, Gong and Yan, Kebing and Zeng, Qinghua and Han, Junwei},
  title     = {Small Object Detection via Coarse-to-fine Proposal Generation and Imitation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6317--6327},
}
Anomaly Detection Under Distribution Shift-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Tri and Zhu, Jiawen and Pang, Guansong}, title = {Anomaly Detection Under Distribution Shift}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6511-6523} }
Class Prior-Free Positive-Unlabeled Learning with Taylor Variational Loss for Hyperspectral Remote Sensing Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Hengwei and Wang, Xinyu and Li, Jingtao and Zhong, Yanfei}, title = {Class Prior-Free Positive-Unlabeled Learning with Taylor Variational Loss for Hyperspectral Remote Sensing Imagery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16827-16836} }
HoloAssist: an Egocentric Human Interaction Dataset for Interactive AI Assistants in the Real World-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xin and Kwon, Taein and Rad, Mahdi and Pan, Bowen and Chakraborty, Ishani and Andrist, Sean and Bohus, Dan and Feniello, Ashley and Tekin, Bugra and Frujeri, Felipe Vieira and Joshi, Neel and Pollefeys, Marc}, title = {HoloAssist: an Egocentric Human Interaction Dataset for Interactive AI Assistants in the Real World}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20270-20281} }
Self-Feedback DETR for Temporal Action Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Jihwan and Lee, Miso and Heo, Jae-Pil}, title = {Self-Feedback DETR for Temporal Action Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10286-10296} }
StableVideo: Text-driven Consistency-aware Diffusion Video Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chai_2023_ICCV, author = {Chai, Wenhao and Guo, Xun and Wang, Gaoang and Lu, Yan}, title = {StableVideo: Text-driven Consistency-aware Diffusion Video Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23040-23050} }
PIRNet: Privacy-Preserving Image Restoration Network via Wavelet Lifting-
[pdf]
[bibtex]@InProceedings{Deng_2023_ICCV, author = {Deng, Xin and Gao, Chao and Xu, Mai}, title = {PIRNet: Privacy-Preserving Image Restoration Network via Wavelet Lifting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22368-22377} }
LAW-Diffusion: Complex Scene Generation by Diffusion with Layouts-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Binbin and Luo, Yi and Chen, Ziliang and Wang, Guangrun and Liang, Xiaodan and Lin, Liang}, title = {LAW-Diffusion: Complex Scene Generation by Diffusion with Layouts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22669-22679} }
Multi-Label Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Penghui and Xie, Ming-Kun and Zong, Chen-Chen and Feng, Lei and Niu, Gang and Sugiyama, Masashi and Huang, Sheng-Jun}, title = {Multi-Label Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17271-17280} }
Towards Geospatial Foundation Models via Continual Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mendieta_2023_ICCV, author = {Mendieta, Mat{\'\i}as and Han, Boran and Shi, Xingjian and Zhu, Yi and Chen, Chen}, title = {Towards Geospatial Foundation Models via Continual Pretraining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16806-16816} }
ConSlide: Asynchronous Hierarchical Interaction Transformer with Breakup-Reorganize Rehearsal for Continual Whole Slide Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Yanyan and Zhao, Weiqin and Wang, Shujun and Fu, Yu and Jiang, Yuming and Yu, Lequan}, title = {ConSlide: Asynchronous Hierarchical Interaction Transformer with Breakup-Reorganize Rehearsal for Continual Whole Slide Image Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21349-21360} }
RepQ-ViT: Scale Reparameterization for Post-Training Quantization of Vision Transformers-
[pdf]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zhikai and Xiao, Junrui and Yang, Lianwei and Gu, Qingyi}, title = {RepQ-ViT: Scale Reparameterization for Post-Training Quantization of Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17227-17236} }
Enhancing Privacy Preservation in Federated Learning via Learning Rate Perturbation-
[pdf]
[supp]
[bibtex]@InProceedings{Wan_2023_ICCV, author = {Wan, Guangnian and Du, Haitao and Yuan, Xuejing and Yang, Jun and Chen, Meiling and Xu, Jie}, title = {Enhancing Privacy Preservation in Federated Learning via Learning Rate Perturbation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4772-4781} }
UMC: A Unified Bandwidth-efficient and Multi-resolution based Collaborative Perception Framework-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Tianhang and Chen, Guang and Chen, Kai and Liu, Zhengfa and Zhang, Bo and Knoll, Alois and Jiang, Changjun}, title = {UMC: A Unified Bandwidth-efficient and Multi-resolution based Collaborative Perception Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8187-8196} }
Viewing Graph Solvability in Practice-
[pdf]
[bibtex]@InProceedings{Arrigoni_2023_ICCV, author = {Arrigoni, Federica and Pajdla, Tomas and Fusiello, Andrea}, title = {Viewing Graph Solvability in Practice}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8147-8155} }
SATR: Zero-Shot Semantic Segmentation of 3D Shapes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Abdelreheem_2023_ICCV, author = {Abdelreheem, Ahmed and Skorokhodov, Ivan and Ovsjanikov, Maks and Wonka, Peter}, title = {SATR: Zero-Shot Semantic Segmentation of 3D Shapes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15166-15179} }
ReactioNet: Learning High-Order Facial Behavior from Universal Stimulus-Reaction by Dyadic Relation Reasoning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiaotian and Wang, Taoyue and Zhao, Geran and Zhang, Xiang and Kang, Xi and Yin, Lijun}, title = {ReactioNet: Learning High-Order Facial Behavior from Universal Stimulus-Reaction by Dyadic Relation Reasoning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20774-20785} }
Pseudo Flow Consistency for Self-Supervised 6D Object Pose Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hai_2023_ICCV, author = {Hai, Yang and Song, Rui and Li, Jiaojiao and Ferstl, David and Hu, Yinlin}, title = {Pseudo Flow Consistency for Self-Supervised 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14075-14085} }
Emotional Listener Portrait: Neural Listener Head Generation with Emotion-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Luchuan and Yin, Guojun and Jin, Zhenchao and Dong, Xiaoyi and Xu, Chenliang}, title = {Emotional Listener Portrait: Neural Listener Head Generation with Emotion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20839-20849} }
Unsupervised Domain Adaptation for Training Event-Based Networks Using Contrastive Learning and Uncorrelated Conditioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jian_2023_ICCV, author = {Jian, Dayuan and Rostami, Mohammad}, title = {Unsupervised Domain Adaptation for Training Event-Based Networks Using Contrastive Learning and Uncorrelated Conditioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18721-18731} }
Probabilistic Human Mesh Recovery in 3D Scenes from Egocentric Views-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Siwei and Ma, Qianli and Zhang, Yan and Aliakbarian, Sadegh and Cosker, Darren and Tang, Siyu}, title = {Probabilistic Human Mesh Recovery in 3D Scenes from Egocentric Views}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7989-8000} }
ImGeoNet: Image-induced Geometry-aware Voxel Representation for Multi-view 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tu_2023_ICCV, author = {Tu, Tao and Chuang, Shun-Po and Liu, Yu-Lun and Sun, Cheng and Zhang, Ke and Roy, Donna and Kuo, Cheng-Hao and Sun, Min}, title = {ImGeoNet: Image-induced Geometry-aware Voxel Representation for Multi-view 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6996-7007} }
DRAW: Defending Camera-shooted RAW Against Image Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Xiaoxiao and Ying, Qichao and Qian, Zhenxing and Li, Sheng and Zhang, Xinpeng}, title = {DRAW: Defending Camera-shooted RAW Against Image Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22434-22444} }
Controllable Person Image Synthesis with Pose-Constrained Latent Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Xiao and Zhu, Xiatian and Deng, Jiankang and Song, Yi-Zhe and Xiang, Tao}, title = {Controllable Person Image Synthesis with Pose-Constrained Latent Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22768-22777} }
Diffusion-based Image Translation with Label Guidance for Domain Adaptive Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peng_2023_ICCV, author = {Peng, Duo and Hu, Ping and Ke, Qiuhong and Liu, Jun}, title = {Diffusion-based Image Translation with Label Guidance for Domain Adaptive Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {808-820} }
TopoSeg: Topology-Aware Nuclear Instance Segmentation-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Hongliang and Wang, Jun and Wei, Pengxu and Xu, Fan and Ji, Xiangyang and Liu, Chang and Chen, Jie}, title = {TopoSeg: Topology-Aware Nuclear Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21307-21316} }
SceneRF: Self-Supervised Monocular 3D Scene Reconstruction with Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Anh-Quan and de Charette, Raoul}, title = {SceneRF: Self-Supervised Monocular 3D Scene Reconstruction with Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9387-9398} }
Isomer: Isomerous Transformer for Zero-shot Video Object Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV, author = {Yuan, Yichen and Wang, Yifan and Wang, Lijun and Zhao, Xiaoqi and Lu, Huchuan and Wang, Yu and Su, Weibo and Zhang, Lei}, title = {Isomer: Isomerous Transformer for Zero-shot Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {966-976} }
CPCM: Contextual Point Cloud Modeling for Weakly-supervised Point Cloud Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Lizhao and Zhuang, Zhuangwei and Huang, Shangxin and Xiao, Xunlong and Xiang, Tianhang and Chen, Cen and Wang, Jingdong and Tan, Mingkui}, title = {CPCM: Contextual Point Cloud Modeling for Weakly-supervised Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18413-18422} }
PATMAT: Person Aware Tuning of Mask-Aware Transformer for Face Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Motamed_2023_ICCV, author = {Motamed, Saman and Xu, Jianjin and Wu, Chen Henry and H\"ane, Christian and Bazin, Jean-Charles and De la Torre, Fernando}, title = {PATMAT: Person Aware Tuning of Mask-Aware Transformer for Face Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22778-22787} }
Adaptive Nonlinear Latent Transformation for Conditional Face Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zhizhong and Ma, Siteng and Zhang, Junping and Shan, Hongming}, title = {Adaptive Nonlinear Latent Transformation for Conditional Face Editing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21022-21031} }
Tiny Updater: Towards Efficient Neural Network-Driven Software Updating-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Linfeng and Ma, Kaisheng}, title = {Tiny Updater: Towards Efficient Neural Network-Driven Software Updating}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23447-23459} }
INT2: Interactive Trajectory Prediction at Intersections-
[pdf]
[bibtex]@InProceedings{Yan_2023_ICCV, author = {Yan, Zhijie and Li, Pengfei and Fu, Zheng and Xu, Shaocong and Shi, Yongliang and Chen, Xiaoxue and Zheng, Yuhang and Li, Yang and Liu, Tianyu and Li, Chuxuan and Luo, Nairui and Gao, Xu and Chen, Yilun and Wang, Zuoxu and Shi, Yifeng and Huang, Pengfei and Han, Zhengxiao and Yuan, Jirui and Gong, Jiangtao and Zhou, Guyue and Zhao, Hang and Zhao, Hao}, title = {INT2: Interactive Trajectory Prediction at Intersections}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8536-8547} }
MapPrior: Bird's-Eye View Map Layout Estimation with Generative Models-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Xiyue and Zyrianov, Vlas and Liu, Zhijian and Wang, Shenlong}, title = {MapPrior: Bird's-Eye View Map Layout Estimation with Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8228-8239} }
CAD-Estate: Large-scale CAD Model Annotation in RGB Videos-
[pdf]
[bibtex]@InProceedings{Maninis_2023_ICCV, author = {Maninis, Kevis-Kokitsi and Popov, Stefan and Nie{\ss}ner, Matthias and Ferrari, Vittorio}, title = {CAD-Estate: Large-scale CAD Model Annotation in RGB Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20189-20199} }
Conditional Cross Attention Network for Multi-Space Embedding without Entanglement in Only a SINGLE Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Chull Hwan and Hwang, Taebaek and Yoon, Jooyoung and Choi, Shunghyun and Gu, Yeong Hyeon}, title = {Conditional Cross Attention Network for Multi-Space Embedding without Entanglement in Only a SINGLE Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11112-11121} }
MB-TaylorFormer: Multi-Branch Efficient Transformer Expanded by Taylor Formula for Image Dehazing-
[pdf]
[supp]
[bibtex]@InProceedings{Qiu_2023_ICCV, author = {Qiu, Yuwei and Zhang, Kaihao and Wang, Chenxi and Luo, Wenhan and Li, Hongdong and Jin, Zhi}, title = {MB-TaylorFormer: Multi-Branch Efficient Transformer Expanded by Taylor Formula for Image Dehazing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12802-12813} }
X-Mesh: Towards Fast and Accurate Text-driven 3D Stylization via Dynamic Textual Guidance-
[pdf]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Yiwei and Zhang, Xiaoqing and Sun, Xiaoshuai and Ji, Jiayi and Wang, Haowei and Jiang, Guannan and Zhuang, Weilin and Ji, Rongrong}, title = {X-Mesh: Towards Fast and Accurate Text-driven 3D Stylization via Dynamic Textual Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2749-2760} }
Muscles in Action-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chiquier_2023_ICCV, author = {Chiquier, Mia and Vondrick, Carl}, title = {Muscles in Action}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22091-22101} }
Large-Scale Person Detection and Localization Using Overhead Fisheye Cameras-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Lu and Li, Liulei and Xin, Xueshi and Sun, Yifan and Song, Qing and Wang, Wenguan}, title = {Large-Scale Person Detection and Localization Using Overhead Fisheye Cameras}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19961-19971} }
ViLTA: Enhancing Vision-Language Pre-training through Textual Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Weihan and Yang, Zhen and Xu, Bin and Li, Juanzi and Sun, Yankui}, title = {ViLTA: Enhancing Vision-Language Pre-training through Textual Augmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3158-3169} }
All-to-Key Attention for Arbitrary Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Mingrui and He, Xiao and Wang, Nannan and Wang, Xiaoyu and Gao, Xinbo}, title = {All-to-Key Attention for Arbitrary Style Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23109-23119} }
Learning to Distill Global Representation for Sparse-View CT-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zilong and Ma, Chenglong and Chen, Jie and Zhang, Junping and Shan, Hongming}, title = {Learning to Distill Global Representation for Sparse-View CT}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21196-21207} }
FocalFormer3D: Focusing on Hard Instance for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Yilun and Yu, Zhiding and Chen, Yukang and Lan, Shiyi and Anandkumar, Anima and Jia, Jiaya and Alvarez, Jose M.}, title = {FocalFormer3D: Focusing on Hard Instance for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8394-8405} }
Not Every Side Is Equal: Localization Uncertainty Estimation for Semi-Supervised 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Chuxin and Yang, Wenfei and Zhang, Tianzhu}, title = {Not Every Side Is Equal: Localization Uncertainty Estimation for Semi-Supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3814-3824} }
Teaching CLIP to Count to Ten-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Paiss_2023_ICCV, author = {Paiss, Roni and Ephrat, Ariel and Tov, Omer and Zada, Shiran and Mosseri, Inbar and Irani, Michal and Dekel, Tali}, title = {Teaching CLIP to Count to Ten}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3170-3180} }
TEMPO: Efficient Multi-View Pose Estimation, Tracking, and Forecasting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choudhury_2023_ICCV, author = {Choudhury, Rohan and Kitani, Kris M. and Jeni, L\'aszl\'o A.}, title = {TEMPO: Efficient Multi-View Pose Estimation, Tracking, and Forecasting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14750-14760} }
SparseMAE: Sparse Training Meets Masked Autoencoders-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Aojun and Li, Yang and Qin, Zipeng and Liu, Jianbo and Pan, Junting and Zhang, Renrui and Zhao, Rui and Gao, Peng and Li, Hongsheng}, title = {SparseMAE: Sparse Training Meets Masked Autoencoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16176-16186} }
DiffPose: SpatioTemporal Diffusion Model for Video-Based Human Pose Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Runyang and Gao, Yixing and Tse, Tze Ho Elden and Ma, Xueqing and Chang, Hyung Jin}, title = {DiffPose: SpatioTemporal Diffusion Model for Video-Based Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14861-14872} }
ELITE: Encoding Visual Concepts into Textual Embeddings for Customized Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Yuxiang and Zhang, Yabo and Ji, Zhilong and Bai, Jinfeng and Zhang, Lei and Zuo, Wangmeng}, title = {ELITE: Encoding Visual Concepts into Textual Embeddings for Customized Text-to-Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15943-15953} }
Text2Performer: Text-Driven Human Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Yuming and Yang, Shuai and Koh, Tong Liang and Wu, Wayne and Loy, Chen Change and Liu, Ziwei}, title = {Text2Performer: Text-Driven Human Video Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22747-22757} }
A Simple Recipe to Meta-Learn Forward and Backward Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Cetin_2023_ICCV, author = {Cetin, Edoardo and Carta, Antonio and Celiktutan, Oya}, title = {A Simple Recipe to Meta-Learn Forward and Backward Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18732-18742} }
4D Myocardium Reconstruction with Decoupled Motion and Shape Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV, author = {Yuan, Xiaohan and Liu, Cong and Wang, Yangang}, title = {4D Myocardium Reconstruction with Decoupled Motion and Shape Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21252-21262} }
IntentQA: Context-aware Video Intent Reasoning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Jiapeng and Wei, Ping and Han, Wenjuan and Fan, Lifeng}, title = {IntentQA: Context-aware Video Intent Reasoning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11963-11974} }
LiDAR-UDA: Self-ensembling Through Time for Unsupervised LiDAR Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Shaban_2023_ICCV, author = {Shaban, Amirreza and Lee, JoonHo and Jung, Sanghun and Meng, Xiangyun and Boots, Byron}, title = {LiDAR-UDA: Self-ensembling Through Time for Unsupervised LiDAR Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19784-19794} }
Robust Monocular Depth Estimation under Challenging Conditions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gasperini_2023_ICCV, author = {Gasperini, Stefano and Morbitzer, Nils and Jung, HyunJun and Navab, Nassir and Tombari, Federico}, title = {Robust Monocular Depth Estimation under Challenging Conditions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8177-8186} }
Parametric Depth Based Feature Representation Learning for Object Detection and Segmentation in Bird's-Eye View-
[pdf]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Jiayu and Xie, Enze and Liu, Miaomiao and Alvarez, Jose M.}, title = {Parametric Depth Based Feature Representation Learning for Object Detection and Segmentation in Bird's-Eye View}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8483-8492} }
MSI: Maximize Support-Set Information for Few-Shot Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Moon_2023_ICCV, author = {Moon, Seonghyeon and Sohn, Samuel S. and Zhou, Honglu and Yoon, Sejong and Pavlovic, Vladimir and Khan, Muhammad Haris and Kapadia, Mubbasir}, title = {MSI: Maximize Support-Set Information for Few-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19266-19276} }
Global Features are All You Need for Image Retrieval and Reranking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shao_2023_ICCV, author = {Shao, Shihao and Chen, Kaifeng and Karpur, Arjun and Cui, Qinghua and Araujo, Andr\'e and Cao, Bingyi}, title = {Global Features are All You Need for Image Retrieval and Reranking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11036-11046} }
DPF-Net: Combining Explicit Shape Priors in Deformable Primitive Field for Unsupervised Structural Reconstruction of 3D Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Shuai_2023_ICCV, author = {Shuai, Qingyao and Zhang, Chi and Yang, Kaizhi and Chen, Xuejin}, title = {DPF-Net: Combining Explicit Shape Priors in Deformable Primitive Field for Unsupervised Structural Reconstruction of 3D Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14321-14329} }
CORE: Co-planarity Regularized Monocular Geometry Estimation with Weak Supervision-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yuguang and Wang, Kai and Li, Hui and Rhee, Seon-Min and Han, Seungju and Kim, Jihye and Yang, Min and Yang, Ran and Zhu, Feng}, title = {CORE: Co-planarity Regularized Monocular Geometry Estimation with Weak Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8796-8805} }
A Sentence Speaks a Thousand Images: Domain Generalization through Distilling CLIP with Language Guidance-
[pdf]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zeyi and Zhou, Andy and Ling, Zijian and Cai, Mu and Wang, Haohan and Lee, Yong Jae}, title = {A Sentence Speaks a Thousand Images: Domain Generalization through Distilling CLIP with Language Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11685-11695} }
H3WB: Human3.6M 3D WholeBody Dataset and Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Yue and Samet, Nermin and Picard, David}, title = {H3WB: Human3.6M 3D WholeBody Dataset and Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20166-20177} }
Yes, we CANN: Constrained Approximate Nearest Neighbors for Local Feature-Based Visual Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aiger_2023_ICCV, author = {Aiger, Dror and Araujo, Andre and Lynen, Simon}, title = {Yes, we CANN: Constrained Approximate Nearest Neighbors for Local Feature-Based Visual Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13339-13349} }
Multi-Object Navigation with Dynamically Learned Neural Implicit Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Marza_2023_ICCV, author = {Marza, Pierre and Matignon, Laetitia and Simonin, Olivier and Wolf, Christian}, title = {Multi-Object Navigation with Dynamically Learned Neural Implicit Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11004-11015} }
NPC: Neural Point Characters from Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Su_2023_ICCV, author = {Su, Shih-Yang and Bagautdinov, Timur and Rhodin, Helge}, title = {NPC: Neural Point Characters from Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14795-14805} }
LDP-Feat: Image Features with Local Differential Privacy-
[pdf]
[supp]
[bibtex]@InProceedings{Pittaluga_2023_ICCV, author = {Pittaluga, Francesco and Zhuang, Bingbing}, title = {LDP-Feat: Image Features with Local Differential Privacy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17580-17590} }
Pre-Training-Free Image Manipulation Localization through Non-Mutually Exclusive Contrastive Learning-
[pdf]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Jizhe and Ma, Xiaochen and Du, Xia and Alhammadi, Ahmed Y. and Feng, Wentao}, title = {Pre-Training-Free Image Manipulation Localization through Non-Mutually Exclusive Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22346-22356} }
MRN: Multiplexed Routing Network for Incremental Multilingual Text Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Tianlun and Chen, Zhineng and Huang, Bingchen and Zhang, Wei and Jiang, Yu-Gang}, title = {MRN: Multiplexed Routing Network for Incremental Multilingual Text Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18644-18653} }
Domain Generalization Guided by Gradient Signal to Noise Ratio of Parameters-
[pdf]
[supp]
[bibtex]@InProceedings{Michalkiewicz_2023_ICCV, author = {Michalkiewicz, Mateusz and Faraki, Masoud and Yu, Xiang and Chandraker, Manmohan and Baktashmotlagh, Mahsa}, title = {Domain Generalization Guided by Gradient Signal to Noise Ratio of Parameters}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6177-6188} }
Counterfactual-based Saliency Map: Towards Visual Contrastive Explanations for Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Xue and Wang, Zhibo and Weng, Haiqin and Guo, Hengchang and Zhang, Zhifei and Jin, Lu and Wei, Tao and Ren, Kui}, title = {Counterfactual-based Saliency Map: Towards Visual Contrastive Explanations for Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2042-2051} }
MST-compression: Compressing and Accelerating Binary Neural Networks with Minimum Spanning Tree-
[pdf]
[supp]
[bibtex]@InProceedings{Vo_2023_ICCV, author = {Vo, Quang Hieu and Tran, Linh-Tam and Bae, Sung-Ho and Kim, Lok-Won and Hong, Choong Seon}, title = {MST-compression: Compressing and Accelerating Binary Neural Networks with Minimum Spanning Tree}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6091-6100} }
MOST: Multiple Object Localization with Self-Supervised Transformers for Object Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rambhatla_2023_ICCV, author = {Rambhatla, Sai Saketh and Misra, Ishan and Chellappa, Rama and Shrivastava, Abhinav}, title = {MOST: Multiple Object Localization with Self-Supervised Transformers for Object Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15823-15834} }
IIEU: Rethinking Neural Feature Activation from Decision-Making-
[pdf]
[supp]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Sudong}, title = {IIEU: Rethinking Neural Feature Activation from Decision-Making}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5796-5806} }
Integrally Migrating Pre-trained Transformer Encoder-decoders for Visual Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Feng and Zhang, Xiaosong and Peng, Zhiliang and Guo, Zonghao and Wan, Fang and Ji, Xiangyang and Ye, Qixiang}, title = {Integrally Migrating Pre-trained Transformer Encoder-decoders for Visual Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6825-6834} }
V-FUSE: Volumetric Depth Map Fusion with Long-Range Constraints-
[pdf]
[supp]
[bibtex]@InProceedings{Burgdorfer_2023_ICCV, author = {Burgdorfer, Nathaniel and Mordohai, Philippos}, title = {V-FUSE: Volumetric Depth Map Fusion with Long-Range Constraints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3449-3458} }
CrossLoc3D: Aerial-Ground Cross-Source 3D Place Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guan_2023_ICCV, author = {Guan, Tianrui and Muthuselvam, Aswath and Hoover, Montana and Wang, Xijun and Liang, Jing and Sathyamoorthy, Adarsh Jagan and Conover, Damon and Manocha, Dinesh}, title = {CrossLoc3D: Aerial-Ground Cross-Source 3D Place Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11335-11344} }
Recursive Video Lane Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2023_ICCV, author = {Jin, Dongkwon and Kim, Dahyun and Kim, Chang-Su}, title = {Recursive Video Lane Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8473-8482} }
GECCO: Geometrically-Conditioned Point Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tyszkiewicz_2023_ICCV, author = {Tyszkiewicz, Micha{\l} J and Fua, Pascal and Trulls, Eduard}, title = {GECCO: Geometrically-Conditioned Point Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2128-2138} }
Unsupervised Self-Driving Attention Prediction via Uncertainty Mining and Knowledge Embedding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Pengfei and Qi, Mengshi and Li, Xia and Li, Weijian and Ma, Huadong}, title = {Unsupervised Self-Driving Attention Prediction via Uncertainty Mining and Knowledge Embedding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8558-8568} }
PETRv2: A Unified Framework for 3D Perception from Multi-Camera Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yingfei and Yan, Junjie and Jia, Fan and Li, Shuailin and Gao, Aqi and Wang, Tiancai and Zhang, Xiangyu}, title = {PETRv2: A Unified Framework for 3D Perception from Multi-Camera Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3262-3272} }
Out-of-Domain GAN Inversion via Invertibility Decomposition for Photo-Realistic Human Face Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xin and XU, Xiaogang and Chen, Yingcong}, title = {Out-of-Domain GAN Inversion via Invertibility Decomposition for Photo-Realistic Human Face Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7492-7501} }
SAFE: Machine Unlearning With Shard Graphs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dukler_2023_ICCV, author = {Dukler, Yonatan and Bowman, Benjamin and Achille, Alessandro and Golatkar, Aditya and Swaminathan, Ashwin and Soatto, Stefano}, title = {SAFE: Machine Unlearning With Shard Graphs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17108-17118} }
Learning Trajectory-Word Alignments for Video-Language Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xu and Li, Zhangzikang and Xu, Haiyang and Zhang, Hanwang and Ye, Qinghao and Li, Chenliang and Yan, Ming and Zhang, Yu and Huang, Fei and Huang, Songfang}, title = {Learning Trajectory-Word Alignments for Video-Language Tasks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2504-2514} }
OrthoPlanes: A Novel Representation for Better 3D-Awareness of GANs-
[pdf]
[supp]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Honglin and Yang, Zhuoqian and Li, Shikai and Dai, Bo and Wu, Wayne}, title = {OrthoPlanes: A Novel Representation for Better 3D-Awareness of GANs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22996-23007} }
Geometry-guided Feature Learning and Fusion for Indoor Scene Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Yin_2023_ICCV, author = {Yin, Ruihong and Karaoglu, Sezer and Gevers, Theo}, title = {Geometry-guided Feature Learning and Fusion for Indoor Scene Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3652-3661} }
Atmospheric Transmission and Thermal Inertia Induced Blind Road Segmentation with a Large-Scale Dataset TBRSD-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Junzhang and Bai, Xiangzhi}, title = {Atmospheric Transmission and Thermal Inertia Induced Blind Road Segmentation with a Large-Scale Dataset TBRSD}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1053-1063} }
NeTO:Neural Reconstruction of Transparent Objects with Self-Occlusion Aware Refraction-Tracing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zongcheng and Long, Xiaoxiao and Wang, Yusen and Cao, Tuo and Wang, Wenping and Luo, Fei and Xiao, Chunxia}, title = {NeTO:Neural Reconstruction of Transparent Objects with Self-Occlusion Aware Refraction-Tracing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18547-18557} }
Boosting 3-DoF Ground-to-Satellite Camera Localization Accuracy via Geometry-Guided Cross-View Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Yujiao and Wu, Fei and Perincherry, Akhil and Vora, Ankit and Li, Hongdong}, title = {Boosting 3-DoF Ground-to-Satellite Camera Localization Accuracy via Geometry-Guided Cross-View Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21516-21526} }
Efficient-VQGAN: Towards High-Resolution Image Generation with Efficient Vision Transformers-
[pdf]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Shiyue and Yin, Yueqin and Huang, Lianghua and Liu, Yu and Zhao, Xin and Zhao, Deli and Huang, Kaigi}, title = {Efficient-VQGAN: Towards High-Resolution Image Generation with Efficient Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7368-7377} }
DLGSANet: Lightweight Dynamic Local and Global Self-Attention Networks for Image Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiang and Dong, Jiangxin and Tang, Jinhui and Pan, Jinshan}, title = {DLGSANet: Lightweight Dynamic Local and Global Self-Attention Networks for Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12792-12801} }
Adaptive Reordering Sampler with Neurally Guided MAGSAC-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Tong and Matas, Jiri and Barath, Daniel}, title = {Adaptive Reordering Sampler with Neurally Guided MAGSAC}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18163-18173} }
Learning Cross-Representation Affinity Consistency for Sparsely Supervised Biomedical Instance Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xiaoyu and Huang, Wei and Xiong, Zhiwei and Zhou, Shenglong and Zhang, Yueyi and Chen, Xuejin and Zha, Zheng-Jun and Wu, Feng}, title = {Learning Cross-Representation Affinity Consistency for Sparsely Supervised Biomedical Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21107-21117} }
Black-Box Unsupervised Domain Adaptation with Bi-Directional Atkinson-Shiffrin Memory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jingyi and Huang, Jiaxing and Jiang, Xueying and Lu, Shijian}, title = {Black-Box Unsupervised Domain Adaptation with Bi-Directional Atkinson-Shiffrin Memory}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11771-11782} }
Towards Fair and Comprehensive Comparisons for Image-Based 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Xinzhu and Wang, Yongtao and Zhang, Yinmin and Xia, Zhiyi and Meng, Yuan and Wang, Zhihui and Li, Haojie and Ouyang, Wanli}, title = {Towards Fair and Comprehensive Comparisons for Image-Based 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6425-6435} }
Disentangling Spatial and Temporal Learning for Efficient Image-to-Video Transfer Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qing_2023_ICCV, author = {Qing, Zhiwu and Zhang, Shiwei and Huang, Ziyuan and Zhang, Yingya and Gao, Changxin and Zhao, Deli and Sang, Nong}, title = {Disentangling Spatial and Temporal Learning for Efficient Image-to-Video Transfer Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13934-13944} }
A Skeletonization Algorithm for Gradient-Based Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Menten_2023_ICCV, author = {Menten, Martin J. and Paetzold, Johannes C. and Zimmer, Veronika A. and Shit, Suprosanna and Ezhov, Ivan and Holland, Robbie and Probst, Monika and Schnabel, Julia A. and Rueckert, Daniel}, title = {A Skeletonization Algorithm for Gradient-Based Optimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21394-21403} }
V3Det: Vast Vocabulary Visual Detection Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jiaqi and Zhang, Pan and Chu, Tao and Cao, Yuhang and Zhou, Yujie and Wu, Tong and Wang, Bin and He, Conghui and Lin, Dahua}, title = {V3Det: Vast Vocabulary Visual Detection Dataset}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19844-19854} }
Coarse-to-Fine: Learning Compact Discriminative Representation for Single-Stage Image Retrieval-
[pdf]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Yunquan and Gao, Xinkai and Ke, Bo and Qiao, Ruizhi and Sun, Xing}, title = {Coarse-to-Fine: Learning Compact Discriminative Representation for Single-Stage Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11260-11269} }
Multi-weather Image Restoration via Domain Translation-
[pdf]
[supp]
[bibtex]@InProceedings{Patil_2023_ICCV, author = {Patil, Prashant W. and Gupta, Sunil and Rana, Santu and Venkatesh, Svetha and Murala, Subrahmanyam}, title = {Multi-weather Image Restoration via Domain Translation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21696-21705} }
Deep Fusion Transformer Network with Weighted Vector-Wise Keypoints Voting for Robust 6D Object Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Jun and Chen, Kai and Xu, Linlin and Dou, Qi and Qin, Jing}, title = {Deep Fusion Transformer Network with Weighted Vector-Wise Keypoints Voting for Robust 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13967-13977} }
BT^2: Backward-compatible Training with Basis Transformation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yifei and Li, Zilu and Shrivastava, Abhinav and Zhao, Hengshuang and Torralba, Antonio and Tian, Taipeng and Lim, Ser-Nam}, title = {BT{\textasciicircum}2: Backward-compatible Training with Basis Transformation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11229-11238} }
ViperGPT: Visual Inference via Python Execution for Reasoning-
[pdf]
[supp]
[bibtex]@InProceedings{Suris_2023_ICCV, author = {Sur{\'\i}s, D{\'\i}dac and Menon, Sachit and Vondrick, Carl}, title = {ViperGPT: Visual Inference via Python Execution for Reasoning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11888-11898} }
Improving Unsupervised Visual Program Inference with Code Rewriting Families-
[pdf]
[supp]
[bibtex]@InProceedings{Ganeshan_2023_ICCV, author = {Ganeshan, Aditya and Jones, R. Kenny and Ritchie, Daniel}, title = {Improving Unsupervised Visual Program Inference with Code Rewriting Families}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15791-15801} }
Essential Matrix Estimation using Convex Relaxations in Orthogonal Space-
[pdf]
[supp]
[bibtex]@InProceedings{Karimian_2023_ICCV, author = {Karimian, Arman and Tron, Roberto}, title = {Essential Matrix Estimation using Convex Relaxations in Orthogonal Space}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17142-17152} }
Concept-wise Fine-tuning Matters in Preventing Negative Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Yunqiao and Huang, Long-Kai and Wei, Ying}, title = {Concept-wise Fine-tuning Matters in Preventing Negative Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18753-18763} }
Learning Human Dynamics in Autonomous Driving Scenarios-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jingbo and Yuan, Ye and Luo, Zhengyi and Xie, Kevin and Lin, Dahua and Iqbal, Umar and Fidler, Sanja and Khamis, Sameh}, title = {Learning Human Dynamics in Autonomous Driving Scenarios}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20796-20806} }
Fine-grained Visible Watermark Removal-
[pdf]
[bibtex]@InProceedings{Niu_2023_ICCV, author = {Niu, Li and Zhao, Xing and Zhang, Bo and Zhang, Liqing}, title = {Fine-grained Visible Watermark Removal}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12770-12779} }
DDP: Diffusion Model for Dense Visual Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Yuanfeng and Chen, Zhe and Xie, Enze and Hong, Lanqing and Liu, Xihui and Liu, Zhaoqiang and Lu, Tong and Li, Zhenguo and Luo, Ping}, title = {DDP: Diffusion Model for Dense Visual Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21741-21752} }
Semantics-Consistent Feature Search for Self-Supervised Visual Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Kaiyou and Zhang, Shan and Luo, Zimeng and Wang, Tong and Xie, Jin}, title = {Semantics-Consistent Feature Search for Self-Supervised Visual Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16099-16108} }
GridMM: Grid Memory Map for Vision-and-Language Navigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zihan and Li, Xiangyang and Yang, Jiahao and Liu, Yeqi and Jiang, Shuqiang}, title = {GridMM: Grid Memory Map for Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15625-15636} }
Probabilistic Modeling of Inter- and Intra-observer Variability in Medical Image Segmentation-
[pdf]
[bibtex]@InProceedings{Schmidt_2023_ICCV, author = {Schmidt, Arne and Morales-\'Alvarez, Pablo and Molina, Rafael}, title = {Probabilistic Modeling of Inter- and Intra-observer Variability in Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21097-21106} }
LAC - Latent Action Composition for Skeleton-based Action Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Di and Wang, Yaohui and Dantcheva, Antitza and Kong, Quan and Garattoni, Lorenzo and Francesca, Gianpiero and Bremond, Francois}, title = {LAC - Latent Action Composition for Skeleton-based Action Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13679-13690} }
Learning Vision-and-Language Navigation from YouTube Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Kunyang and Chen, Peihao and Huang, Diwei and Li, Thomas H. and Tan, Mingkui and Gan, Chuang}, title = {Learning Vision-and-Language Navigation from YouTube Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8317-8326} }
Total-Recon: Deformable Scene Reconstruction for Embodied View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_ICCV, author = {Song, Chonghyuk and Yang, Gengshan and Deng, Kangle and Zhu, Jun-Yan and Ramanan, Deva}, title = {Total-Recon: Deformable Scene Reconstruction for Embodied View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17671-17682} }
AdaNIC: Towards Practical Neural Image Compression via Dynamic Transform Routing-
[pdf]
[bibtex]@InProceedings{Tao_2023_ICCV, author = {Tao, Lvfang and Gao, Wei and Li, Ge and Zhang, Chenhao}, title = {AdaNIC: Towards Practical Neural Image Compression via Dynamic Transform Routing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16879-16888} }
Uncertainty-aware State Space Transformer for Egocentric 3D Hand Trajectory Forecasting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bao_2023_ICCV, author = {Bao, Wentao and Chen, Lele and Zeng, Libing and Li, Zhong and Xu, Yi and Yuan, Junsong and Kong, Yu}, title = {Uncertainty-aware State Space Transformer for Egocentric 3D Hand Trajectory Forecasting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13702-13711} }
Pretrained Language Models as Visual Planners for Human Assistance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Patel_2023_ICCV, author = {Patel, Dhruvesh and Eghbalzadeh, Hamid and Kamra, Nitin and Iuzzolino, Michael Louis and Jain, Unnat and Desai, Ruta}, title = {Pretrained Language Models as Visual Planners for Human Assistance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15302-15314} }
Dynamic Point Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Prokudin_2023_ICCV, author = {Prokudin, Sergey and Ma, Qianli and Raafat, Maxime and Valentin, Julien and Tang, Siyu}, title = {Dynamic Point Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7964-7976} }
Lip2Vec: Efficient and Robust Visual Speech Recognition via Latent-to-Latent Visual to Audio Representation Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Djilali_2023_ICCV, author = {Djilali, Yasser Abdelaziz Dahou and Narayan, Sanath and Boussaid, Haithem and Almazrouei, Ebtessam and Debbah, Merouane}, title = {Lip2Vec: Efficient and Robust Visual Speech Recognition via Latent-to-Latent Visual to Audio Representation Mapping}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13790-13801} }
Privacy Preserving Localization via Coordinate Permutations-
[pdf]
[supp]
[bibtex]@InProceedings{Pan_2023_ICCV, author = {Pan, Linfei and Sch\"onberger, Johannes L. and Larsson, Viktor and Pollefeys, Marc}, title = {Privacy Preserving Localization via Coordinate Permutations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18174-18183} }
Random Boxes Are Open-world Object Detectors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yanghao and Yue, Zhongqi and Hua, Xian-Sheng and Zhang, Hanwang}, title = {Random Boxes Are Open-world Object Detectors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6233-6243} }
DiffDreamer: Towards Consistent Unsupervised Single-view Scene Extrapolation with Conditional Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Shengqu and Chan, Eric Ryan and Peng, Songyou and Shahbazi, Mohamad and Obukhov, Anton and Van Gool, Luc and Wetzstein, Gordon}, title = {DiffDreamer: Towards Consistent Unsupervised Single-view Scene Extrapolation with Conditional Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2139-2150} }
Spectral Graphormer: Spectral Graph-Based Transformer for Egocentric Two-Hand Reconstruction using Multi-View Color Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tse_2023_ICCV, author = {Tse, Tze Ho Elden and Mueller, Franziska and Shen, Zhengyang and Tang, Danhang and Beeler, Thabo and Dou, Mingsong and Zhang, Yinda and Petrovic, Sasa and Chang, Hyung Jin and Taylor, Jonathan and Doosti, Bardia}, title = {Spectral Graphormer: Spectral Graph-Based Transformer for Egocentric Two-Hand Reconstruction using Multi-View Color Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14666-14677} }
SMMix: Self-Motivated Image Mixing for Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Mengzhao and Lin, Mingbao and Lin, Zhihang and Zhang, Yuxin and Chao, Fei and Ji, Rongrong}, title = {SMMix: Self-Motivated Image Mixing for Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17260-17270} }
Enhancing Adversarial Robustness in Low-Label Regime via Adaptively Weighted Regularization and Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Dongyoon and Kong, Insung and Kim, Yongdai}, title = {Enhancing Adversarial Robustness in Low-Label Regime via Adaptively Weighted Regularization and Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4552-4561} }
Recovering a Molecule's 3D Dynamics from Liquid-phase Electron Microscopy Movies-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Enze and Wang, Yuhang and Zhang, Hong and Gao, Yiqin and Wang, Huan and Sun, He}, title = {Recovering a Molecule's 3D Dynamics from Liquid-phase Electron Microscopy Movies}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10767-10777} }
Reconciling Object-Level and Global-Level Objectives for Long-Tail Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Shaoyu and Chen, Chen and Peng, Silong}, title = {Reconciling Object-Level and Global-Level Objectives for Long-Tail Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18982-18992} }
In-Style: Bridging Text and Uncurated Videos with Style Transfer for Text-Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Shvetsova_2023_ICCV, author = {Shvetsova, Nina and Kukleva, Anna and Schiele, Bernt and Kuehne, Hilde}, title = {In-Style: Bridging Text and Uncurated Videos with Style Transfer for Text-Video Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21981-21992} }
MIMO-NeRF: Fast Neural Rendering with Multi-input Multi-output Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Kaneko_2023_ICCV, author = {Kaneko, Takuhiro}, title = {MIMO-NeRF: Fast Neural Rendering with Multi-input Multi-output Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3273-3283} }
Instance Neural Radiance Field-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yichen and Hu, Benran and Huang, Junkai and Tai, Yu-Wing and Tang, Chi-Keung}, title = {Instance Neural Radiance Field}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {787-796} }
One-bit Flip is All You Need: When Bit-flip Attack Meets Model Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Jianshuo and Qiu, Han and Li, Yiming and Zhang, Tianwei and Li, Yuanjie and Lai, Zeqi and Zhang, Chao and Xia, Shu-Tao}, title = {One-bit Flip is All You Need: When Bit-flip Attack Meets Model Training}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4688-4698} }
CLIPTER: Looking at the Bigger Picture in Scene Text Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aberdam_2023_ICCV, author = {Aberdam, Aviad and Bensaid, David and Golts, Alona and Ganz, Roy and Nuriel, Oren and Tichauer, Royee and Mazor, Shai and Litman, Ron}, title = {CLIPTER: Looking at the Bigger Picture in Scene Text Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21706-21717} }
Revisiting Scene Text Recognition: A Data Perspective-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Qing and Wang, Jiapeng and Peng, Dezhi and Liu, Chongyu and Jin, Lianwen}, title = {Revisiting Scene Text Recognition: A Data Perspective}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20543-20554} }
Improving CLIP Fine-tuning Performance-
[pdf]
[supp]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Yixuan and Hu, Han and Xie, Zhenda and Liu, Ze and Zhang, Zheng and Cao, Yue and Bao, Jianmin and Chen, Dong and Guo, Baining}, title = {Improving CLIP Fine-tuning Performance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5439-5449} }
The Power of Sound (TPoS): Audio Reactive Video Generation with Stable Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jeong_2023_ICCV, author = {Jeong, Yujin and Ryoo, Wonjeong and Lee, Seunghyun and Seo, Dabin and Byeon, Wonmin and Kim, Sangpil and Kim, Jinkyu}, title = {The Power of Sound (TPoS): Audio Reactive Video Generation with Stable Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7822-7832} }
SOCS: Semantically-Aware Object Coordinate Space for Category-Level 6D Object Pose Estimation under Large Shape Variations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wan_2023_ICCV, author = {Wan, Boyan and Shi, Yifei and Xu, Kai}, title = {SOCS: Semantically-Aware Object Coordinate Space for Category-Level 6D Object Pose Estimation under Large Shape Variations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14065-14074} }
NeRF-LOAM: Neural Implicit Representation for Large-Scale Incremental LiDAR Odometry and Mapping-
[pdf]
[supp]
[bibtex]@InProceedings{Deng_2023_ICCV, author = {Deng, Junyuan and Wu, Qi and Chen, Xieyuanli and Xia, Songpengcheng and Sun, Zhen and Liu, Guoqing and Yu, Wenxian and Pei, Ling}, title = {NeRF-LOAM: Neural Implicit Representation for Large-Scale Incremental LiDAR Odometry and Mapping}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8218-8227} }
DINAR: Diffusion Inpainting of Neural Textures for One-Shot Human Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Svitov_2023_ICCV, author = {Svitov, David and Gudkov, Dmitrii and Bashirov, Renat and Lempitsky, Victor}, title = {DINAR: Diffusion Inpainting of Neural Textures for One-Shot Human Avatars}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7062-7072} }
DPM-OT: A New Diffusion Probabilistic Model Based on Optimal Transport-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Zezeng and Li, Shenghao and Wang, Zhanpeng and Lei, Na and Luo, Zhongxuan and Gu, David Xianfeng}, title = {DPM-OT: A New Diffusion Probabilistic Model Based on Optimal Transport}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22624-22633} }
ElasticViT: Conflict-aware Supernet Training for Deploying Fast Vision Transformer on Diverse Mobile Devices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Chen and Zhang, Li Lyna and Jiang, Huiqiang and Xu, Jiahang and Cao, Ting and Zhang, Quanlu and Yang, Yuqing and Wang, Zhi and Yang, Mao}, title = {ElasticViT: Conflict-aware Supernet Training for Deploying Fast Vision Transformer on Diverse Mobile Devices}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5829-5840} }
OmniLabel: A Challenging Benchmark for Language-Based Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Schulter_2023_ICCV, author = {Schulter, Samuel and G, Vijay Kumar B and Suh, Yumin and Dafnis, Konstantinos M. and Zhang, Zhixing and Zhao, Shiyu and Metaxas, Dimitris}, title = {OmniLabel: A Challenging Benchmark for Language-Based Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11953-11962} }
Noise-Aware Learning from Web-Crawled Image-Text Data for Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2023_ICCV, author = {Kang, Wooyoung and Mun, Jonghwan and Lee, Sungjun and Roh, Byungseok}, title = {Noise-Aware Learning from Web-Crawled Image-Text Data for Image Captioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2942-2952} }
Divide&Classify: Fine-Grained Classification for City-Wide Visual Geo-Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Trivigno_2023_ICCV, author = {Trivigno, Gabriele and Berton, Gabriele and Aragon, Juan and Caputo, Barbara and Masone, Carlo}, title = {Divide\&Classify: Fine-Grained Classification for City-Wide Visual Geo-Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11142-11152} }
3D Semantic Subspace Traverser: Empowering 3D Generative Model with Shape Editing Capability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ruowei and Liu, Yu and Su, Pei and Zhang, Jianwei and Zhao, Qijun}, title = {3D Semantic Subspace Traverser: Empowering 3D Generative Model with Shape Editing Capability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14406-14417} }
Inherent Redundancy in Spiking Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yao_2023_ICCV, author = {Yao, Man and Hu, Jiakui and Zhao, Guangshe and Wang, Yaoyuan and Zhang, Ziyang and Xu, Bo and Li, Guoqi}, title = {Inherent Redundancy in Spiking Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16924-16934} }
Text2Room: Extracting Textured 3D Meshes from 2D Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Hollein_2023_ICCV, author = {H\"ollein, Lukas and Cao, Ang and Owens, Andrew and Johnson, Justin and Nie{\ss}ner, Matthias}, title = {Text2Room: Extracting Textured 3D Meshes from 2D Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7909-7920} }
On the Robustness of Normalizing Flows for Inverse Problems in Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2023_ICCV, author = {Hong, Seongmin and Park, Inbum and Chun, Se Young}, title = {On the Robustness of Normalizing Flows for Inverse Problems in Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10745-10755} }
FastRecon: Few-shot Industrial Anomaly Detection via Fast Feature Reconstruction-
[pdf]
[bibtex]@InProceedings{Fang_2023_ICCV, author = {Fang, Zheng and Wang, Xiaoyang and Li, Haocheng and Liu, Jiejie and Hu, Qiugui and Xiao, Jimin}, title = {FastRecon: Few-shot Industrial Anomaly Detection via Fast Feature Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17481-17490} }
Local or Global: Selective Knowledge Assimilation for Federated Learning with Limited Labels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2023_ICCV, author = {Cho, Yae Jee and Joshi, Gauri and Dimitriadis, Dimitrios}, title = {Local or Global: Selective Knowledge Assimilation for Federated Learning with Limited Labels}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17087-17096} }
DistillBEV: Boosting Multi-Camera 3D Object Detection with Cross-Modal Knowledge Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Zeyu and Li, Dingwen and Luo, Chenxu and Xie, Cihang and Yang, Xiaodong}, title = {DistillBEV: Boosting Multi-Camera 3D Object Detection with Cross-Modal Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8637-8646} }
PoseFix: Correcting 3D Human Poses with Natural Language-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Delmas_2023_ICCV, author = {Delmas, Ginger and Weinzaepfel, Philippe and Moreno-Noguer, Francesc and Rogez, Gr\'egory}, title = {PoseFix: Correcting 3D Human Poses with Natural Language}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15018-15028} }
TAPIR: Tracking Any Point with Per-Frame Initialization and Temporal Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Doersch_2023_ICCV, author = {Doersch, Carl and Yang, Yi and Vecerik, Mel and Gokay, Dilara and Gupta, Ankush and Aytar, Yusuf and Carreira, Joao and Zisserman, Andrew}, title = {TAPIR: Tracking Any Point with Per-Frame Initialization and Temporal Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10061-10072} }
SwinLSTM: Improving Spatiotemporal Prediction Accuracy using Swin Transformer and LSTM-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Song and Li, Chuang and Zhang, Pu and Tang, RongNian}, title = {SwinLSTM: Improving Spatiotemporal Prediction Accuracy using Swin Transformer and LSTM}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13470-13479} }
Detecting Objects with Context-Likelihood Graphs and Graph Refinement-
[pdf]
[bibtex]@InProceedings{Bhowmik_2023_ICCV, author = {Bhowmik, Aritra and Wang, Yu and Baka, Nora and Oswald, Martin R. and Snoek, Cees G. M.}, title = {Detecting Objects with Context-Likelihood Graphs and Graph Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6524-6533} }
Coarse-to-Fine Amodal Segmentation with Shape Prior-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Jianxiong and Qian, Xuelin and Wang, Yikai and Xiao, Tianjun and He, Tong and Zhang, Zheng and Fu, Yanwei}, title = {Coarse-to-Fine Amodal Segmentation with Shape Prior}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1262-1271} }
DEDRIFT: Robust Similarity Search under Content Drift-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Baranchuk_2023_ICCV, author = {Baranchuk, Dmitry and Douze, Matthijs and Upadhyay, Yash and Yalniz, I. Zeki}, title = {DEDRIFT: Robust Similarity Search under Content Drift}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11026-11035} }
Learning Pseudo-Relations for Cross-domain Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Dong and Wang, Shuang and Zang, Qi and Quan, Dou and Ye, Xiutiao and Yang, Rui and Jiao, Licheng}, title = {Learning Pseudo-Relations for Cross-domain Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19191-19203} }
AdVerb: Visually Guided Audio Dereverberation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chowdhury_2023_ICCV, author = {Chowdhury, Sanjoy and Ghosh, Sreyan and Dasgupta, Subhrajyoti and Ratnarajah, Anton and Tyagi, Utkarsh and Manocha, Dinesh}, title = {AdVerb: Visually Guided Audio Dereverberation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7884-7896} }
Audio-Enhanced Text-to-Video Retrieval using Text-Conditioned Feature Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ibrahimi_2023_ICCV, author = {Ibrahimi, Sarah and Sun, Xiaohang and Wang, Pichao and Garg, Amanmeet and Sanan, Ashutosh and Omar, Mohamed}, title = {Audio-Enhanced Text-to-Video Retrieval using Text-Conditioned Feature Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12054-12064} }
Open-vocabulary Object Segmentation with Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Ziyi and Zhou, Qinye and Zhang, Xiaoyun and Zhang, Ya and Wang, Yanfeng and Xie, Weidi}, title = {Open-vocabulary Object Segmentation with Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7667-7676} }
Human-centric Scene Understanding for 3D Large-scale Scenarios-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Yiteng and Cong, Peishan and Yao, Yichen and Chen, Runnan and Hou, Yuenan and Zhu, Xinge and He, Xuming and Yu, Jingyi and Ma, Yuexin}, title = {Human-centric Scene Understanding for 3D Large-scale Scenarios}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20349-20359} }
With a Little Help from Your Own Past: Prototypical Memory Networks for Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Barraco_2023_ICCV, author = {Barraco, Manuele and Sarto, Sara and Cornia, Marcella and Baraldi, Lorenzo and Cucchiara, Rita}, title = {With a Little Help from Your Own Past: Prototypical Memory Networks for Image Captioning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3021-3031} }
SimMatchV2: Semi-Supervised Learning with Graph Consistency-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Mingkai and You, Shan and Huang, Lang and Luo, Chen and Wang, Fei and Qian, Chen and Xu, Chang}, title = {SimMatchV2: Semi-Supervised Learning with Graph Consistency}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16432-16442} }
Reinforced Disentanglement for Face Swapping without Skip Connection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV, author = {Ren, Xiaohang and Chen, Xingyu and Yao, Pengfei and Shum, Heung-Yeung and Wang, Baoyuan}, title = {Reinforced Disentanglement for Face Swapping without Skip Connection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20665-20675} }
PDiscoNet: Semantically consistent part discovery for fine-grained recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{van_der_Klis_2023_ICCV, author = {van der Klis, Robert and Alaniz, Stephan and Mancini, Massimiliano and Dantas, Cassio F. and Ienco, Dino and Akata, Zeynep and Marcos, Diego}, title = {PDiscoNet: Semantically consistent part discovery for fine-grained recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1866-1876} }
Privacy-Preserving Face Recognition Using Random Frequency Components-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mi_2023_ICCV, author = {Mi, Yuxi and Huang, Yuge and Ji, Jiazhen and Zhao, Minyi and Wu, Jiaxiang and Xu, Xingkun and Ding, Shouhong and Zhou, Shuigeng}, title = {Privacy-Preserving Face Recognition Using Random Frequency Components}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19673-19684} }
Vision Transformer Adapters for Generalizable Multitask Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Bhattacharjee_2023_ICCV, author = {Bhattacharjee, Deblina and S\"usstrunk, Sabine and Salzmann, Mathieu}, title = {Vision Transformer Adapters for Generalizable Multitask Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19015-19026} }
How to Choose your Best Allies for a Transferable Attack?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Maho_2023_ICCV, author = {Maho, Thibault and Moosavi-Dezfooli, Seyed-Mohsen and Furon, Teddy}, title = {How to Choose your Best Allies for a Transferable Attack?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4542-4551} }
CVRecon: Rethinking 3D Geometric Feature Learning For Neural Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV, author = {Feng, Ziyue and Yang, Liang and Guo, Pengsheng and Li, Bing}, title = {CVRecon: Rethinking 3D Geometric Feature Learning For Neural Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17750-17760} }
Self-Supervised Object Detection from Egocentric Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Akiva_2023_ICCV, author = {Akiva, Peri and Huang, Jing and Liang, Kevin J and Kovvuri, Rama and Chen, Xingyu and Feiszli, Matt and Dana, Kristin and Hassner, Tal}, title = {Self-Supervised Object Detection from Egocentric Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5225-5237} }
Prior-guided Source-free Domain Adaptation for Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Raychaudhuri_2023_ICCV, author = {Raychaudhuri, Dripta S. and Ta, Calvin-Khang and Dutta, Arindam and Lal, Rohit and Roy-Chowdhury, Amit K.}, title = {Prior-guided Source-free Domain Adaptation for Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14996-15006} }
ClothesNet: An Information-Rich 3D Garment Model Repository with Simulated Clothes Environment-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Bingyang and Zhou, Haoyu and Liang, Tianhai and Yu, Qiaojun and Zhao, Siheng and Zeng, Yuwei and Lv, Jun and Luo, Siyuan and Wang, Qiancai and Yu, Xinyuan and Chen, Haonan and Lu, Cewu and Shao, Lin}, title = {ClothesNet: An Information-Rich 3D Garment Model Repository with Simulated Clothes Environment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20428-20438} }
Auxiliary Tasks Benefit 3D Skeleton-based Human Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Chenxin and Tan, Robby T. and Tan, Yuhong and Chen, Siheng and Wang, Xinchao and Wang, Yanfeng}, title = {Auxiliary Tasks Benefit 3D Skeleton-based Human Motion Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9509-9520} }
Measuring Asymmetric Gradient Discrepancy in Parallel Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Lyu_2023_ICCV, author = {Lyu, Fan and Sun, Qing and Shang, Fanhua and Wan, Liang and Feng, Wei}, title = {Measuring Asymmetric Gradient Discrepancy in Parallel Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11411-11420} }
StyleLipSync: Style-based Personalized Lip-sync Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ki_2023_ICCV, author = {Ki, Taekyung and Min, Dongchan}, title = {StyleLipSync: Style-based Personalized Lip-sync Video Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22841-22850} }
Cross Contrasting Feature Perturbation for Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Chenming and Zhang, Daoan and Huang, Wenjian and Zhang, Jianguo}, title = {Cross Contrasting Feature Perturbation for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1327-1337} }
DiffusionRet: Generative Text-Video Retrieval with Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2023_ICCV, author = {Jin, Peng and Li, Hao and Cheng, Zesen and Li, Kehan and Ji, Xiangyang and Liu, Chang and Yuan, Li and Chen, Jie}, title = {DiffusionRet: Generative Text-Video Retrieval with Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2470-2481} }
Efficient 3D Semantic Segmentation with Superpoint Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Robert_2023_ICCV, author = {Robert, Damien and Raguet, Hugo and Landrieu, Loic}, title = {Efficient 3D Semantic Segmentation with Superpoint Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17195-17204} }
Adversarial Finetuning with Latent Representation Constraint to Mitigate Accuracy-Robustness Tradeoff-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Suzuki_2023_ICCV, author = {Suzuki, Satoshi and Yamaguchi, Shin'ya and Takeda, Shoichiro and Kanai, Sekitoshi and Makishima, Naoki and Ando, Atsushi and Masumura, Ryo}, title = {Adversarial Finetuning with Latent Representation Constraint to Mitigate Accuracy-Robustness Tradeoff}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4390-4401} }
HyperDiffusion: Generating Implicit Neural Fields with Weight-Space Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Erkoc_2023_ICCV, author = {Erko\c{c}, Ziya and Ma, Fangchang and Shan, Qi and Nie{\ss}ner, Matthias and Dai, Angela}, title = {HyperDiffusion: Generating Implicit Neural Fields with Weight-Space Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14300-14310} }
Retinexformer: One-stage Retinex-based Transformer for Low-light Image Enhancement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Yuanhao and Bian, Hao and Lin, Jing and Wang, Haoqian and Timofte, Radu and Zhang, Yulun}, title = {Retinexformer: One-stage Retinex-based Transformer for Low-light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12504-12513} }
Minimum Latency Deep Online Video Stabilization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Zhuofan and Liu, Zhen and Tan, Ping and Zeng, Bing and Liu, Shuaicheng}, title = {Minimum Latency Deep Online Video Stabilization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23030-23039} }
Speech2Lip: High-fidelity Speech to Lip Generation by Learning from a Short Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Xiuzhe and Hu, Pengfei and Wu, Yang and Lyu, Xiaoyang and Cao, Yan-Pei and Shan, Ying and Yang, Wenming and Sun, Zhongqian and Qi, Xiaojuan}, title = {Speech2Lip: High-fidelity Speech to Lip Generation by Learning from a Short Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22168-22177} }
UHDNeRF: Ultra-High-Definition Neural Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Quewei and Li, Feichao and Guo, Jie and Guo, Yanwen}, title = {UHDNeRF: Ultra-High-Definition Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23097-23108} }
Linear Spaces of Meanings: Compositional Structures in Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Trager_2023_ICCV, author = {Trager, Matthew and Perera, Pramuditha and Zancato, Luca and Achille, Alessandro and Bhatia, Parminder and Soatto, Stefano}, title = {Linear Spaces of Meanings: Compositional Structures in Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15395-15404} }
MULLER: Multilayer Laplacian Resizer for Vision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tu_2023_ICCV, author = {Tu, Zhengzhong and Milanfar, Peyman and Talebi, Hossein}, title = {MULLER: Multilayer Laplacian Resizer for Vision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6877-6887} }
X-VoE: Measuring eXplanatory Violation of Expectation in Physical Events-
[pdf]
[supp]
[bibtex]@InProceedings{Dai_2023_ICCV, author = {Dai, Bo and Wang, Linge and Jia, Baoxiong and Zhang, Zeyu and Zhu, Song-Chun and Zhang, Chi and Zhu, Yixin}, title = {X-VoE: Measuring eXplanatory Violation of Expectation in Physical Events}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3992-4002} }
Tracking by Natural Language Specification with Long Short-term Context Decoupling-
[pdf]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Ding and Wu, Xiangqian}, title = {Tracking by Natural Language Specification with Long Short-term Context Decoupling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14012-14021} }
COOP: Decoupling and Coupling of Whole-Body Grasping Pose Generation-
[pdf]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Yanzhao and Shi, Yunzhou and Cui, Yuhao and Zhao, Zhongzhou and Luo, Zhiling and Zhou, Wei}, title = {COOP: Decoupling and Coupling of Whole-Body Grasping Pose Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2163-2173} }
Pyramid Dual Domain Injection Network for Pan-sharpening-
[pdf]
[bibtex]@InProceedings{He_2023_ICCV, author = {He, Xuanhua and Yan, Keyu and Li, Rui and Xie, Chengjun and Zhang, Jie and Zhou, Man}, title = {Pyramid Dual Domain Injection Network for Pan-sharpening}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12908-12917} }
Why do networks have inhibitory/negative connections?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Qingyang and Powell, Mike A. and Geisa, Ali and Bridgeford, Eric and Priebe, Carey E. and Vogelstein, Joshua T.}, title = {Why do networks have inhibitory/negative connections?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22551-22559} }
Ordinal Label Distribution Learning-
[pdf]
[bibtex]@InProceedings{Wen_2023_ICCV, author = {Wen, Changsong and Zhang, Xin and Yao, Xingxu and Yang, Jufeng}, title = {Ordinal Label Distribution Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23481-23491} }
Model Calibration in Dense Classification with Adaptive Label Perturbation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jiawei and Ye, Changkun and Wang, Shan and Cui, Ruikai and Zhang, Jing and Zhang, Kaihao and Barnes, Nick}, title = {Model Calibration in Dense Classification with Adaptive Label Perturbation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1173-1184} }
Boosting Multi-modal Model Performance with Adaptive Gradient Modulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Hong and Li, Xingyu and Hu, Pengbo and Lei, Yinuo and Li, Chunxiao and Zhou, Yi}, title = {Boosting Multi-modal Model Performance with Adaptive Gradient Modulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22214-22224} }
Semantic Information in Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Quan_2023_ICCV, author = {Quan, Shengjiang and Hirano, Masahiro and Yamakawa, Yuji}, title = {Semantic Information in Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5686-5696} }
Structure and Content-Guided Video Synthesis with Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Esser_2023_ICCV, author = {Esser, Patrick and Chiu, Johnathan and Atighehchian, Parmida and Granskog, Jonathan and Germanidis, Anastasis}, title = {Structure and Content-Guided Video Synthesis with Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7346-7356} }
NeSS-ST: Detecting Good and Stable Keypoints with a Neural Stability Score and the Shi-Tomasi detector-
[pdf]
[supp]
[bibtex]@InProceedings{Pakulev_2023_ICCV, author = {Pakulev, Konstantin and Vakhitov, Alexander and Ferrer, Gonzalo}, title = {NeSS-ST: Detecting Good and Stable Keypoints with a Neural Stability Score and the Shi-Tomasi detector}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9578-9588} }
Beyond Skin Tone: A Multidimensional Measure of Apparent Skin Color-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thong_2023_ICCV, author = {Thong, William and Joniak, Przemyslaw and Xiang, Alice}, title = {Beyond Skin Tone: A Multidimensional Measure of Apparent Skin Color}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4903-4913} }
PODA: Prompt-driven Zero-shot Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fahes_2023_ICCV, author = {Fahes, Mohammad and Vu, Tuan-Hung and Bursuc, Andrei and P\'erez, Patrick and de Charette, Raoul}, title = {PODA: Prompt-driven Zero-shot Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18623-18633} }
Video Action Segmentation via Contextually Refined Temporal Keypoints-
[pdf]
[supp]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Borui and Jin, Yang and Tan, Zhentao and Mu, Yadong}, title = {Video Action Segmentation via Contextually Refined Temporal Keypoints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13836-13845} }
Shatter and Gather: Learning Referring Image Segmentation with Text Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Dongwon and Kim, Namyup and Lan, Cuiling and Kwak, Suha}, title = {Shatter and Gather: Learning Referring Image Segmentation with Text Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15547-15557} }
Two-in-One Depth: Bridging the Gap Between Monocular and Binocular Self-Supervised Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Zhengming and Dong, Qiulei}, title = {Two-in-One Depth: Bridging the Gap Between Monocular and Binocular Self-Supervised Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9411-9421} }
SAFL-Net: Semantic-Agnostic Feature Learning Network with Auxiliary Plugins for Image Manipulation Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Sun_2023_ICCV, author = {Sun, Zhihao and Jiang, Haoran and Wang, Danding and Li, Xirong and Cao, Juan}, title = {SAFL-Net: Semantic-Agnostic Feature Learning Network with Auxiliary Plugins for Image Manipulation Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22424-22433} }
DataDAM: Efficient Dataset Distillation with Attention Matching-
[pdf]
[supp]
[bibtex]@InProceedings{Sajedi_2023_ICCV, author = {Sajedi, Ahmad and Khaki, Samir and Amjadian, Ehsan and Liu, Lucy Z. and Lawryshyn, Yuri A. and Plataniotis, Konstantinos N.}, title = {DataDAM: Efficient Dataset Distillation with Attention Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17097-17107} }
Rethinking Pose Estimation in Crowds: Overcoming the Detection Information Bottleneck and Ambiguity-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Mu and Stoffl, Lucas and Mathis, Mackenzie Weygandt and Mathis, Alexander}, title = {Rethinking Pose Estimation in Crowds: Overcoming the Detection Information Bottleneck and Ambiguity}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14689-14699} }
Social Diffusion: Long-term Multiple Human Motion Anticipation-
[pdf]
[supp]
[bibtex]@InProceedings{Tanke_2023_ICCV, author = {Tanke, Julian and Zhang, Linguang and Zhao, Amy and Tang, Chengcheng and Cai, Yujun and Wang, Lezi and Wu, Po-Chen and Gall, Juergen and Keskin, Cem}, title = {Social Diffusion: Long-term Multiple Human Motion Anticipation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9601-9611} }
Synchronize Feature Extracting and Matching: A Single Branch Framework for 3D Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Teli and Wang, Mengmeng and Xiao, Jimin and Wu, Huifeng and Liu, Yong}, title = {Synchronize Feature Extracting and Matching: A Single Branch Framework for 3D Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9953-9963} }
Leveraging Intrinsic Properties for Non-Rigid Garment Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2023_ICCV, author = {Lin, Siyou and Zhou, Boyao and Zheng, Zerong and Zhang, Hongwen and Liu, Yebin}, title = {Leveraging Intrinsic Properties for Non-Rigid Garment Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14485-14496} }
NeILF++: Inter-Reflectable Light Fields for Geometry and Material Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jingyang and Yao, Yao and Li, Shiwei and Liu, Jingbo and Fang, Tian and McKinnon, David and Tsin, Yanghai and Quan, Long}, title = {NeILF++: Inter-Reflectable Light Fields for Geometry and Material Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3601-3610} }
MAGI: Multi-Annotated Explanation-Guided Learning-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yifei and Gu, Siyi and Gao, Yuyang and Pan, Bo and Yang, Xiaofeng and Zhao, Liang}, title = {MAGI: Multi-Annotated Explanation-Guided Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1977-1987} }
Adaptive Positional Encoding for Bundle-Adjusting Neural Radiance Fields-
[pdf]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Zelin and Dai, Weichen and Zhang, Yu}, title = {Adaptive Positional Encoding for Bundle-Adjusting Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3284-3294} }
Inducing Neural Collapse to a Fixed Hierarchy-Aware Frame for Reducing Mistake Severity-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2023_ICCV, author = {Liang, Tong and Davis, Jim}, title = {Inducing Neural Collapse to a Fixed Hierarchy-Aware Frame for Reducing Mistake Severity}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1443-1452} }
PlanarTrack: A Large-scale Challenging Benchmark for Planar Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Xinran and Liu, Xiaoqiong and Yi, Ziruo and Zhou, Xin and Le, Thanh and Zhang, Libo and Huang, Yan and Yang, Qing and Fan, Heng}, title = {PlanarTrack: A Large-scale Challenging Benchmark for Planar Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20449-20458} }
Factorized Inverse Path Tracing for Efficient and Accurate Material-Lighting Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Liwen and Zhu, Rui and Yaldiz, Mustafa B. and Zhu, Yinhao and Cai, Hong and Matai, Janarbek and Porikli, Fatih and Li, Tzu-Mao and Chandraker, Manmohan and Ramamoorthi, Ravi}, title = {Factorized Inverse Path Tracing for Efficient and Accurate Material-Lighting Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3848-3858} }
P2C: Self-Supervised Point Cloud Completion from Single Partial Clouds-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cui_2023_ICCV, author = {Cui, Ruikai and Qiu, Shi and Anwar, Saeed and Liu, Jiawei and Xing, Chaoyue and Zhang, Jing and Barnes, Nick}, title = {P2C: Self-Supervised Point Cloud Completion from Single Partial Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14351-14360} }
Overwriting Pretrained Bias with Finetuning Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Angelina and Russakovsky, Olga}, title = {Overwriting Pretrained Bias with Finetuning Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3957-3968} }
Anti-DreamBooth: Protecting Users from Personalized Text-to-image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Van_Le_2023_ICCV, author = {Van Le, Thanh and Phung, Hao and Nguyen, Thuan Hoang and Dao, Quan and Tran, Ngoc N. and Tran, Anh}, title = {Anti-DreamBooth: Protecting Users from Personalized Text-to-image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2116-2127} }
Contrastive Continuity on Augmentation Stability Rehearsal for Continual Self-Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Haoyang and Wen, Haitao and Zhang, Xiaoliang and Qiu, Heqian and Wang, Lanxiao and Li, Hongliang}, title = {Contrastive Continuity on Augmentation Stability Rehearsal for Continual Self-Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5707-5717} }
Treating Pseudo-labels Generation as Image Matting for Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Changwei and Xu, Rongtao and Xu, Shibiao and Meng, Weiliang and Zhang, Xiaopeng}, title = {Treating Pseudo-labels Generation as Image Matting for Weakly Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {755-765} }
Structural Alignment for Network Pruning through Partial Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Shangqian and Zhang, Zeyu and Zhang, Yanfu and Huang, Feihu and Huang, Heng}, title = {Structural Alignment for Network Pruning through Partial Regularization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17402-17412} }
Learning Long-Range Information with Dual-Scale Transformers for Indoor Scene Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ziqi and Luo, Fei and Long, Xiaoxiao and Zhang, Wenxiao and Xiao, Chunxia}, title = {Learning Long-Range Information with Dual-Scale Transformers for Indoor Scene Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18569-18579} }
A Game of Bundle Adjustment - Learning Efficient Convergence-
[pdf]
[bibtex]@InProceedings{Belder_2023_ICCV, author = {Belder, Amir and Vivanti, Refael and Tal, Ayellet}, title = {A Game of Bundle Adjustment - Learning Efficient Convergence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8428-8437} }
Learning Correction Filter via Degradation-Adaptive Regression for Blind Single Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2023_ICCV, author = {Zhou, Hongyang and Zhu, Xiaobin and Zhu, Jianqing and Han, Zheng and Zhang, Shi-Xue and Qin, Jingyan and Yin, Xu-Cheng}, title = {Learning Correction Filter via Degradation-Adaptive Regression for Blind Single Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12365-12375} }
UMFuse: Unified Multi View Fusion for Human Editing Applications-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jain_2023_ICCV, author = {Jain, Rishabh and Hemani, Mayur and Ceylan, Duygu and Singh, Krishna Kumar and Lu, Jingwan and Sarkar, Mausoom and Krishnamurthy, Balaji}, title = {UMFuse: Unified Multi View Fusion for Human Editing Applications}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7182-7191} }
CROSSFIRE: Camera Relocalization On Self-Supervised Features from an Implicit Representation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Moreau_2023_ICCV, author = {Moreau, Arthur and Piasco, Nathan and Bennehar, Moussab and Tsishkou, Dzmitry and Stanciulescu, Bogdan and de La Fortelle, Arnaud}, title = {CROSSFIRE: Camera Relocalization On Self-Supervised Features from an Implicit Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {252-262} }
Discriminative Class Tokens for Text-to-Image Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Schwartz_2023_ICCV, author = {Schwartz, Idan and Sn{\ae}bjarnarson, V\'esteinn and Chefer, Hila and Belongie, Serge and Wolf, Lior and Benaim, Sagie}, title = {Discriminative Class Tokens for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22725-22735} }
SINC: Spatial Composition of 3D Human Motions for Simultaneous Action Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Athanasiou_2023_ICCV, author = {Athanasiou, Nikos and Petrovich, Mathis and Black, Michael J. and Varol, G\"ul}, title = {SINC: Spatial Composition of 3D Human Motions for Simultaneous Action Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9984-9995} }
ORC: Network Group-based Knowledge Distillation using Online Role Change-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2023_ICCV, author = {Choi, Junyong and Cho, Hyeon and Cheung, Seokhwa and Hwang, Wonjun}, title = {ORC: Network Group-based Knowledge Distillation using Online Role Change}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17381-17390} }
Audiovisual Masked Autoencoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Georgescu_2023_ICCV, author = {Georgescu, Mariana-Iuliana and Fonseca, Eduardo and Ionescu, Radu Tudor and Lucic, Mario and Schmid, Cordelia and Arnab, Anurag}, title = {Audiovisual Masked Autoencoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16144-16154} }
MV-DeepSDF: Implicit Modeling with Multi-Sweep Point Clouds for 3D Vehicle Reconstruction in Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yibo and Zhu, Kelly and Wu, Guile and Ren, Yuan and Liu, Bingbing and Liu, Yang and Shan, Jinjun}, title = {MV-DeepSDF: Implicit Modeling with Multi-Sweep Point Clouds for 3D Vehicle Reconstruction in Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8306-8316} }
CHORD: Category-level Hand-held Object Reconstruction via Shape Deformation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Kailin and Yang, Lixin and Zhen, Haoyu and Lin, Zenan and Zhan, Xinyu and Zhong, Licheng and Xu, Jian and Wu, Kejian and Lu, Cewu}, title = {CHORD: Category-level Hand-held Object Reconstruction via Shape Deformation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9444-9454} }
Unmasking Anomalies in Road-Scene Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rai_2023_ICCV, author = {Rai, Shyam Nandan and Cermelli, Fabio and Fontanel, Dario and Masone, Carlo and Caputo, Barbara}, title = {Unmasking Anomalies in Road-Scene Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4037-4046} }
DomainDrop: Suppressing Domain-Sensitive Channels for Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Jintao and Qi, Lei and Shi, Yinghuan}, title = {DomainDrop: Suppressing Domain-Sensitive Channels for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19114-19124} }
Towards Universal LiDAR-Based 3D Object Detection by Multi-Domain Knowledge Transfer-
[pdf]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Guile and Cao, Tongtong and Liu, Bingbing and Chen, Xingxin and Ren, Yuan}, title = {Towards Universal LiDAR-Based 3D Object Detection by Multi-Domain Knowledge Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8669-8678} }
StyleInV: A Temporal Style Modulated Inversion Network for Unconditional Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yuhan and Jiang, Liming and Loy, Chen Change}, title = {StyleInV: A Temporal Style Modulated Inversion Network for Unconditional Video Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22851-22861} }
Self-Calibrated Cross Attention Network for Few-Shot Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2023_ICCV, author = {Xu, Qianxiong and Zhao, Wenting and Lin, Guosheng and Long, Cheng}, title = {Self-Calibrated Cross Attention Network for Few-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {655-665} }
Anatomical Invariance Modeling and Semantic Alignment for Self-supervised Learning in 3D Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Yankai and Sun, Mingze and Guo, Heng and Bai, Xiaoyu and Yan, Ke and Lu, Le and Xu, Minfeng}, title = {Anatomical Invariance Modeling and Semantic Alignment for Self-supervised Learning in 3D Medical Image Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15859-15869} }
Towards High-Fidelity Text-Guided 3D Face Generation and Manipulation Using only Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV, author = {Yu, Cuican and Lu, Guansong and Zeng, Yihan and Sun, Jian and Liang, Xiaodan and Li, Huibin and Xu, Zongben and Xu, Songcen and Zhang, Wei and Xu, Hang}, title = {Towards High-Fidelity Text-Guided 3D Face Generation and Manipulation Using only Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15326-15337} }
SSDA: Secure Source-Free Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Ahmed_2023_ICCV, author = {Ahmed, Sabbir and Al Arafat, Abdullah and Rizve, Mamshad Nayeem and Hossain, Rahim and Guo, Zhishan and Rakin, Adnan Siraj}, title = {SSDA: Secure Source-Free Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19180-19190} }
ENTL: Embodied Navigation Trajectory Learner-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kotar_2023_ICCV, author = {Kotar, Klemen and Walsman, Aaron and Mottaghi, Roozbeh}, title = {ENTL: Embodied Navigation Trajectory Learner}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10863-10872} }
AGG-Net: Attention Guided Gated-Convolutional Network for Depth Image Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Dongyue and Huang, Tingxuan and Song, Zhimin and Deng, Shizhuo and Jia, Tong}, title = {AGG-Net: Attention Guided Gated-Convolutional Network for Depth Image Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8853-8862} }
Learning Global-aware Kernel for Image Harmonization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shen_2023_ICCV, author = {Shen, Xintian and Zhang, Jiangning and Chen, Jun and Bai, Shipeng and Han, Yue and Wang, Yabiao and Wang, Chengjie and Liu, Yong}, title = {Learning Global-aware Kernel for Image Harmonization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7535-7544} }
Real-Time Neural Rasterization for Large Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jeffrey Yunfan and Chen, Yun and Yang, Ze and Wang, Jingkang and Manivasagam, Sivabalan and Urtasun, Raquel}, title = {Real-Time Neural Rasterization for Large Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8416-8427} }
ESTextSpotter: Towards Better Scene Text Spotting with Explicit Synergy in Transformer-
[pdf]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Mingxin and Zhang, Jiaxin and Peng, Dezhi and Lu, Hao and Huang, Can and Liu, Yuliang and Bai, Xiang and Jin, Lianwen}, title = {ESTextSpotter: Towards Better Scene Text Spotting with Explicit Synergy in Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19495-19505} }
UGC: Unified GAN Compression for Efficient Image-to-Image Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2023_ICCV, author = {Ren, Yuxi and Wu, Jie and Zhang, Peng and Zhang, Manlin and Xiao, Xuefeng and He, Qian and Wang, Rui and Zheng, Min and Pan, Xin}, title = {UGC: Unified GAN Compression for Efficient Image-to-Image Translation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17281-17291} }
Efficient View Synthesis with Neural Radiance Distribution Field-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Yushuang and Li, Xiao and Wang, Jinglu and Han, Xiaoguang and Cui, Shuguang and Lu, Yan}, title = {Efficient View Synthesis with Neural Radiance Distribution Field}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18506-18515} }
MixSpeech: Cross-Modality Self-Learning with Audio-Visual Stream Mixup for Visual Speech Translation and Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Xize and Jin, Tao and Huang, Rongjie and Li, Linjun and Lin, Wang and Wang, Zehan and Wang, Ye and Liu, Huadai and Yin, Aoxiong and Zhao, Zhou}, title = {MixSpeech: Cross-Modality Self-Learning with Audio-Visual Stream Mixup for Visual Speech Translation and Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15735-15745} }
Chordal Averaging on Flag Manifolds and Its Applications-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mankovich_2023_ICCV, author = {Mankovich, Nathan and Birdal, Tolga}, title = {Chordal Averaging on Flag Manifolds and Its Applications}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3881-3890} }
Towards Building More Robust Models with Frequency Bias-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bu_2023_ICCV, author = {Bu, Qingwen and Huang, Dong and Cui, Heming}, title = {Towards Building More Robust Models with Frequency Bias}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4402-4411} }
SparseBEV: High-Performance Sparse 3D Object Detection from Multi-Camera Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Haisong and Teng, Yao and Lu, Tao and Wang, Haiguang and Wang, Limin}, title = {SparseBEV: High-Performance Sparse 3D Object Detection from Multi-Camera Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18580-18590} }
Boosting Whole Slide Image Classification from the Perspectives of Distribution, Correlation and Magnification-
[pdf]
[bibtex]@InProceedings{Qu_2023_ICCV, author = {Qu, Linhao and Yang, Zhiwei and Duan, Minghong and Ma, Yingfan and Wang, Shuo and Wang, Manning and Song, Zhijian}, title = {Boosting Whole Slide Image Classification from the Perspectives of Distribution, Correlation and Magnification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21463-21473} }
PolicyCleanse: Backdoor Detection and Mitigation for Competitive Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Junfeng and Li, Ang and Wang, Lixu and Liu, Cong}, title = {PolicyCleanse: Backdoor Detection and Mitigation for Competitive Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4699-4708} }
Ref-NeuS: Ambiguity-Reduced Neural Implicit Surface Learning for Multi-View Reconstruction with Reflection-
[pdf]
[supp]
[bibtex]@InProceedings{Ge_2023_ICCV, author = {Ge, Wenhang and Hu, Tao and Zhao, Haoyu and Liu, Shu and Chen, Ying-Cong}, title = {Ref-NeuS: Ambiguity-Reduced Neural Implicit Surface Learning for Multi-View Reconstruction with Reflection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4251-4260} }
Innovating Real Fisheye Image Correction with Dual Diffusion Architecture-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Shangrong and Lin, Chunyu and Liao, Kang and Zhao, Yao}, title = {Innovating Real Fisheye Image Correction with Dual Diffusion Architecture}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12699-12708} }
Global Perception Based Autoregressive Neural Processes-
[pdf]
[bibtex]@InProceedings{Tai_2023_ICCV, author = {Tai, Jinyang}, title = {Global Perception Based Autoregressive Neural Processes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10487-10497} }
Class-incremental Continual Learning for Instance Segmentation with Image-level Weak Supervision-
[pdf]
[supp]
[bibtex]@InProceedings{Hsieh_2023_ICCV, author = {Hsieh, Yu-Hsing and Chen, Guan-Sheng and Cai, Shun-Xian and Wei, Ting-Yun and Yang, Huei-Fang and Chen, Chu-Song}, title = {Class-incremental Continual Learning for Instance Segmentation with Image-level Weak Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1250-1261} }
When Prompt-based Incremental Learning Does Not Meet Strong Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Yu-Ming and Peng, Yi-Xing and Zheng, Wei-Shi}, title = {When Prompt-based Incremental Learning Does Not Meet Strong Pretraining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1706-1716} }
Multimodal High-order Relation Transformer for Scene Boundary Detection-
[pdf]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Xi and Shi, Zhangxiang and Zhang, Tianzhu and Yu, Xiaoyuan and Xiao, Lei}, title = {Multimodal High-order Relation Transformer for Scene Boundary Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22081-22090} }
Tri-MipRF: Tri-Mip Representation for Efficient Anti-Aliasing Neural Radiance Fields-
[pdf]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Wenbo and Wang, Yuling and Ma, Lin and Yang, Bangbang and Gao, Lin and Liu, Xiao and Ma, Yuewen}, title = {Tri-MipRF: Tri-Mip Representation for Efficient Anti-Aliasing Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19774-19783} }
LaRS: A Diverse Panoptic Maritime Obstacle Detection Dataset and Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{Zust_2023_ICCV, author = {\v{Z}ust, Lojze and Per\v{s}, Janez and Kristan, Matej}, title = {LaRS: A Diverse Panoptic Maritime Obstacle Detection Dataset and Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20304-20314} }
Exploring Transformers for Open-world Instance Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Jiannan and Jiang, Yi and Yan, Bin and Lu, Huchuan and Yuan, Zehuan and Luo, Ping}, title = {Exploring Transformers for Open-world Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6611-6621} }
VQA Therapy: Exploring Answer Differences by Visually Grounding Answers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Chongyan and Anjum, Samreen and Gurari, Danna}, title = {VQA Therapy: Exploring Answer Differences by Visually Grounding Answers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15315-15325} }
Energy-based Self-Training and Normalization for Unsupervised Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Herath_2023_ICCV, author = {Herath, Samitha and Fernando, Basura and Abbasnejad, Ehsan and Hayat, Munawar and Khadivi, Shahram and Harandi, Mehrtash and Rezatofighi, Hamid and Haffari, Gholamreza}, title = {Energy-based Self-Training and Normalization for Unsupervised Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11653-11662} }
Self-Evolved Dynamic Expansion Model for Task-Free Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Fei and Bors, Adrian G.}, title = {Self-Evolved Dynamic Expansion Model for Task-Free Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22102-22112} }
Adaptive Template Transformer for Mitochondria Segmentation in Electron Microscopy Images-
[pdf]
[bibtex]@InProceedings{Pan_2023_ICCV, author = {Pan, Yuwen and Luo, Naisong and Sun, Rui and Meng, Meng and Zhang, Tianzhu and Xiong, Zhiwei and Zhang, Yongdong}, title = {Adaptive Template Transformer for Mitochondria Segmentation in Electron Microscopy Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21474-21484} }
Collaborative Tracking Learning for Frame-Rate-Insensitive Multi-Object Tracking-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Yiheng and Wu, Junta and Fu, Yi}, title = {Collaborative Tracking Learning for Frame-Rate-Insensitive Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9964-9973} }
Tangent Model Composition for Ensembling and Continual Fine-tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Tian Yu and Soatto, Stefano}, title = {Tangent Model Composition for Ensembling and Continual Fine-tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18676-18686} }
Knowledge-Spreader: Learning Semi-Supervised Facial Action Dynamics by Consistifying Knowledge Granularity-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiaotian and Zhang, Xiang and Wang, Taoyue and Yin, Lijun}, title = {Knowledge-Spreader: Learning Semi-Supervised Facial Action Dynamics by Consistifying Knowledge Granularity}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20979-20989} }
SSF: Accelerating Training of Spiking Neural Networks with Stabilized Spiking Flow-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jingtao and Song, Zengjie and Wang, Yuxi and Xiao, Jun and Yang, Yuran and Mei, Shuqi and Zhang, Zhaoxiang}, title = {SSF: Accelerating Training of Spiking Neural Networks with Stabilized Spiking Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5982-5991} }
Manipulate by Seeing: Creating Manipulation Controllers from Pre-Trained Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Jianren and Dasari, Sudeep and Srirama, Mohan Kumar and Tulsiani, Shubham and Gupta, Abhinav}, title = {Manipulate by Seeing: Creating Manipulation Controllers from Pre-Trained Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3859-3868} }
Learning Human-Human Interactions in Images from Weak Textual Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alper_2023_ICCV, author = {Alper, Morris and Averbuch-Elor, Hadar}, title = {Learning Human-Human Interactions in Images from Weak Textual Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2887-2899} }
Prompt-aligned Gradient for Prompt Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Beier and Niu, Yulei and Han, Yucheng and Wu, Yue and Zhang, Hanwang}, title = {Prompt-aligned Gradient for Prompt Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15659-15669} }
Aperture Diffraction for Compact Snapshot Spectral Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Lv_2023_ICCV, author = {Lv, Tao and Ye, Hao and Yuan, Quan and Shi, Zhan and Wang, Yibo and Wang, Shuming and Cao, Xun}, title = {Aperture Diffraction for Compact Snapshot Spectral Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10574-10584} }
Diffusion Action Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Daochang and Li, Qiyue and Dinh, Anh-Dung and Jiang, Tingting and Shah, Mubarak and Xu, Chang}, title = {Diffusion Action Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10139-10149} }
Prototype Reminiscence and Augmented Asymmetric Knowledge Aggregation for Non-Exemplar Class-Incremental Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Wuxuan and Ye, Mang}, title = {Prototype Reminiscence and Augmented Asymmetric Knowledge Aggregation for Non-Exemplar Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1772-1781} }
Exemplar-Free Continual Transformer with Convolutions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roy_2023_ICCV, author = {Roy, Anurag and Verma, Vinay K. and Voonna, Sravan and Ghosh, Kripabandhu and Ghosh, Saptarshi and Das, Abir}, title = {Exemplar-Free Continual Transformer with Convolutions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5897-5907} }
Scalable Video Object Segmentation with Simplified Framework-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Qiangqiang and Yang, Tianyu and Wu, Wei and Chan, Antoni B.}, title = {Scalable Video Object Segmentation with Simplified Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13879-13889} }
Rehearsal-Free Domain Continual Face Anti-Spoofing: Generalize More and Forget Less-
[pdf]
[supp]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Rizhao and Cui, Yawen and Li, Zhi and Yu, Zitong and Li, Haoliang and Hu, Yongjian and Kot, Alex}, title = {Rehearsal-Free Domain Continual Face Anti-Spoofing: Generalize More and Forget Less}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8037-8048} }
Efficient Decision-based Black-box Patch Attacks on Video Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Kaixun and Chen, Zhaoyu and Huang, Hao and Wang, Jiafeng and Yang, Dingkang and Li, Bo and Wang, Yan and Zhang, Wenqiang}, title = {Efficient Decision-based Black-box Patch Attacks on Video Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4379-4389} }
Kick Back & Relax: Learning to Reconstruct the World by Watching SlowTV-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Spencer_2023_ICCV, author = {Spencer, Jaime and Russell, Chris and Hadfield, Simon and Bowden, Richard}, title = {Kick Back \& Relax: Learning to Reconstruct the World by Watching SlowTV}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15768-15779} }
MetaGCD: Learning to Continually Learn in Generalized Category Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Yanan and Chi, Zhixiang and Wang, Yang and Feng, Songhe}, title = {MetaGCD: Learning to Continually Learn in Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1655-1665} }
Strip-MLP: Efficient Token Interaction for Vision MLP-
[pdf]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Guiping and Luo, Shengda and Huang, Wenjian and Lan, Xiangyuan and Jiang, Dongmei and Wang, Yaowei and Zhang, Jianguo}, title = {Strip-MLP: Efficient Token Interaction for Vision MLP}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1494-1504} }
SAFARI: Versatile and Efficient Evaluations for Robustness of Interpretability-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Wei and Zhao, Xingyu and Jin, Gaojie and Huang, Xiaowei}, title = {SAFARI: Versatile and Efficient Evaluations for Robustness of Interpretability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1988-1998} }
ChildPlay: A New Benchmark for Understanding Children's Gaze Behaviour-
[pdf]
[supp]
[bibtex]@InProceedings{Tafasca_2023_ICCV, author = {Tafasca, Samy and Gupta, Anshul and Odobez, Jean-Marc}, title = {ChildPlay: A New Benchmark for Understanding Children's Gaze Behaviour}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20935-20946} }
Towards General Low-Light Raw Noise Synthesis and Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Feng and Xu, Bin and Li, Zhiqiang and Liu, Xinran and Lu, Qingbo and Gao, Changxin and Sang, Nong}, title = {Towards General Low-Light Raw Noise Synthesis and Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10820-10830} }
Combating Noisy Labels with Sample Selection by Mining High-Discrepancy Examples-
[pdf]
[supp]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Xiaobo and Han, Bo and Zhan, Yibing and Yu, Jun and Gong, Mingming and Gong, Chen and Liu, Tongliang}, title = {Combating Noisy Labels with Sample Selection by Mining High-Discrepancy Examples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1833-1843} }
Beyond the Pixel: a Photometrically Calibrated HDR Dataset for Luminance and Color Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Bolduc_2023_ICCV, author = {Bolduc, Christophe and Giroux, Justine and H\'ebert, Marc and Demers, Claude and Lalonde, Jean-Fran\c{c}ois}, title = {Beyond the Pixel: a Photometrically Calibrated HDR Dataset for Luminance and Color Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8071-8081} }
What can Discriminator do? Towards Box-free Ownership Verification of Generative Adversarial Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Ziheng and Li, Boheng and Cai, Yan and Wang, Run and Guo, Shangwei and Fang, Liming and Chen, Jing and Wang, Lina}, title = {What can Discriminator do? Towards Box-free Ownership Verification of Generative Adversarial Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5009-5019} }
When Noisy Labels Meet Long Tail Dilemmas: A Representation Calibration Method-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Manyi and Zhao, Xuyang and Yao, Jun and Yuan, Chun and Huang, Weiran}, title = {When Noisy Labels Meet Long Tail Dilemmas: A Representation Calibration Method}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15890-15900} }
Reinforce Data, Multiply Impact: Improved Model Accuracy and Robustness with Dataset Reinforcement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Faghri_2023_ICCV, author = {Faghri, Fartash and Pouransari, Hadi and Mehta, Sachin and Farajtabar, Mehrdad and Farhadi, Ali and Rastegari, Mohammad and Tuzel, Oncel}, title = {Reinforce Data, Multiply Impact: Improved Model Accuracy and Robustness with Dataset Reinforcement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17032-17043} }
An Adaptive Model Ensemble Adversarial Attack for Boosting Adversarial Transferability-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Bin and Yin, Jiali and Chen, Shukai and Chen, Bohao and Liu, Ximeng}, title = {An Adaptive Model Ensemble Adversarial Attack for Boosting Adversarial Transferability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4489-4498} }
Incremental Generalized Category Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Bingchen and Mac Aodha, Oisin}, title = {Incremental Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19137-19147} }
Prototypical Mixing and Retrieval-Based Refinement for Label Noise-Resistant Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Xinlong and Wang, Haixin and Sun, Jinan and Zhang, Shikun and Chen, Chong and Hua, Xian-Sheng and Luo, Xiao}, title = {Prototypical Mixing and Retrieval-Based Refinement for Label Noise-Resistant Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11239-11249} }
AccFlow: Backward Accumulation for Long-Range Optical Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Guangyang and Liu, Xiaohong and Luo, Kunming and Liu, Xi and Zheng, Qingqing and Liu, Shuaicheng and Jiang, Xinyang and Zhai, Guangtao and Wang, Wenyi}, title = {AccFlow: Backward Accumulation for Long-Range Optical Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12119-12128} }
Guiding Local Feature Matching with Surface Curvature-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Shuzhe and Kannala, Juho and Pollefeys, Marc and Barath, Daniel}, title = {Guiding Local Feature Matching with Surface Curvature}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17981-17991} }
3D-VisTA: Pre-trained Transformer for 3D Vision and Text Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Ziyu and Ma, Xiaojian and Chen, Yixin and Deng, Zhidong and Huang, Siyuan and Li, Qing}, title = {3D-VisTA: Pre-trained Transformer for 3D Vision and Text Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2911-2921} }
Constraining Depth Map Geometry for Multi-View Stereo: A Dual-Depth Approach with Saddle-shaped Depth Cells-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV, author = {Ye, Xinyi and Zhao, Weiyue and Liu, Tianqi and Huang, Zihao and Cao, Zhiguo and Li, Xin}, title = {Constraining Depth Map Geometry for Multi-View Stereo: A Dual-Depth Approach with Saddle-shaped Depth Cells}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17661-17670} }
SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Suri_2023_ICCV, author = {Suri, Saksham and Rambhatla, Saketh and Chellappa, Rama and Shrivastava, Abhinav}, title = {SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6770-6781} }
Among Us: Adversarially Robust Collaborative Perception by Consensus-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yiming and Fang, Qi and Bai, Jiamu and Chen, Siheng and Juefei-Xu, Felix and Feng, Chen}, title = {Among Us: Adversarially Robust Collaborative Perception by Consensus}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {186-195} }
BUS: Efficient and Effective Vision-Language Pre-Training with Bottom-Up Patch Summarization.-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV, author = {Jiang, Chaoya and Xu, Haiyang and Ye, Wei and Ye, Qinghao and Li, Chenliang and Yan, Ming and Bi, Bin and Zhang, Shikun and Huang, Fei and Huang, Songfang}, title = {BUS: Efficient and Effective Vision-Language Pre-Training with Bottom-Up Patch Summarization.}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2900-2910} }
DiffusionDet: Diffusion Model for Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Shoufa and Sun, Peize and Song, Yibing and Luo, Ping}, title = {DiffusionDet: Diffusion Model for Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19830-19843} }
Forward Flow for Novel View Synthesis of Dynamic Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Xiang and Sun, Jiadai and Dai, Yuchao and Chen, Guanying and Ye, Xiaoqing and Tan, Xiao and Ding, Errui and Zhang, Yumeng and Wang, Jingdong}, title = {Forward Flow for Novel View Synthesis of Dynamic Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16022-16033} }
CopyRNeRF: Protecting the CopyRight of Neural Radiance Fields-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Ziyuan and Guo, Qing and Cheung, Ka Chun and See, Simon and Wan, Renjie}, title = {CopyRNeRF: Protecting the CopyRight of Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22401-22411} }
Contrastive Model Adaptation for Cross-Condition Robustness in Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Bruggemann_2023_ICCV, author = {Br\"uggemann, David and Sakaridis, Christos and Broedermann, Tim and Van Gool, Luc}, title = {Contrastive Model Adaptation for Cross-Condition Robustness in Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11378-11387} }
SegRCDB: Semantic Segmentation via Formula-Driven Supervised Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Shinoda_2023_ICCV, author = {Shinoda, Risa and Hayamizu, Ryo and Nakashima, Kodai and Inoue, Nakamasa and Yokota, Rio and Kataoka, Hirokatsu}, title = {SegRCDB: Semantic Segmentation via Formula-Driven Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20054-20063} }
Creative Birds: Self-Supervised Single-View 3D Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Renke and Que, Guimin and Chen, Shuo and Li, Xiang and Li, Jun and Yang, Jian}, title = {Creative Birds: Self-Supervised Single-View 3D Style Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8775-8784} }
LoTE-Animal: A Long Time-span Dataset for Endangered Animal Behavior Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Dan and Hou, Jin and Huang, Shaoli and Liu, Jing and He, Yuxin and Zheng, Bochuan and Ning, Jifeng and Zhang, Jingdong}, title = {LoTE-Animal: A Long Time-span Dataset for Endangered Animal Behavior Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20064-20075} }
DQS3D: Densely-matched Quantization-aware Semi-supervised 3D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2023_ICCV, author = {Gao, Huan-ang and Tian, Beiwen and Li, Pengfei and Zhao, Hao and Zhou, Guyue}, title = {DQS3D: Densely-matched Quantization-aware Semi-supervised 3D Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21905-21915} }
Towards Inadequately Pre-trained Models in Transfer Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deng_2023_ICCV, author = {Deng, Andong and Li, Xingjian and Hu, Di and Wang, Tianyang and Xiong, Haoyi and Xu, Cheng-Zhong}, title = {Towards Inadequately Pre-trained Models in Transfer Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19397-19408} }
Boosting Novel Category Discovery Over Domains with Soft Contrastive Learning and All in One Classifier-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zang_2023_ICCV, author = {Zang, Zelin and Shang, Lei and Yang, Senqiao and Wang, Fei and Sun, Baigui and Xie, Xuansong and Li, Stan Z.}, title = {Boosting Novel Category Discovery Over Domains with Soft Contrastive Learning and All in One Classifier}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11858-11867} }
Class-Aware Patch Embedding Adaptation for Few-Shot Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Hao_2023_ICCV, author = {Hao, Fusheng and He, Fengxiang and Liu, Liu and Wu, Fuxiang and Tao, Dacheng and Cheng, Jun}, title = {Class-Aware Patch Embedding Adaptation for Few-Shot Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18905-18915} }
SegPrompt: Boosting Open-World Segmentation via Category-Level Prompt Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2023_ICCV, author = {Zhu, Muzhi and Li, Hengtao and Chen, Hao and Fan, Chengxiang and Mao, Weian and Jing, Chenchen and Liu, Yifan and Shen, Chunhua}, title = {SegPrompt: Boosting Open-World Segmentation via Category-Level Prompt Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {999-1008} }
Search for or Navigate to? Dual Adaptive Thinking for Object Navigation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dang_2023_ICCV, author = {Dang, Ronghao and Wang, Liuyi and He, Zongtao and Su, Shuai and Tang, Jiagui and Liu, Chengju and Chen, Qijun}, title = {Search for or Navigate to? Dual Adaptive Thinking for Object Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8250-8259} }
CL-MVSNet: Unsupervised Multi-View Stereo with Dual-Level Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Xiong_2023_ICCV, author = {Xiong, Kaiqiang and Peng, Rui and Zhang, Zhe and Feng, Tianxing and Jiao, Jianbo and Gao, Feng and Wang, Ronggang}, title = {CL-MVSNet: Unsupervised Multi-View Stereo with Dual-Level Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3769-3780} }
Federated Learning Over Images: Vertical Decompositions and Pre-Trained Backbones Are Difficult to Beat-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Erdong and Tang, Yuxin and Kyrillidis, Anastasios and Jermaine, Chris}, title = {Federated Learning Over Images: Vertical Decompositions and Pre-Trained Backbones Are Difficult to Beat}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19385-19396} }
HOSNeRF: Dynamic Human-Object-Scene Neural Radiance Fields from a Single Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jia-Wei and Cao, Yan-Pei and Yang, Tianyuan and Xu, Zhongcong and Keppo, Jussi and Shan, Ying and Qie, Xiaohu and Shou, Mike Zheng}, title = {HOSNeRF: Dynamic Human-Object-Scene Neural Radiance Fields from a Single Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18483-18494} }
OmniZoomer: Learning to Move and Zoom in on Sphere at High-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2023_ICCV, author = {Cao, Zidong and Ai, Hao and Cao, Yan-Pei and Shan, Ying and Qie, Xiaohu and Wang, Lin}, title = {OmniZoomer: Learning to Move and Zoom in on Sphere at High-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12897-12907} }
Knowing Where to Focus: Event-aware Transformer for Video Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jang_2023_ICCV, author = {Jang, Jinhyun and Park, Jungin and Kim, Jin and Kwon, Hyeongjun and Sohn, Kwanghoon}, title = {Knowing Where to Focus: Event-aware Transformer for Video Grounding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13846-13856} }
TF-ICON: Diffusion-Based Training-Free Cross-Domain Image Composition-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2023_ICCV, author = {Lu, Shilin and Liu, Yanzhu and Kong, Adams Wai-Kin}, title = {TF-ICON: Diffusion-Based Training-Free Cross-Domain Image Composition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2294-2305} }
Landscape Learning for Neural Network Inversion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Ruoshi and Mao, Chengzhi and Tendulkar, Purva and Wang, Hao and Vondrick, Carl}, title = {Landscape Learning for Neural Network Inversion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2239-2250} }
Movement Enhancement toward Multi-Scale Video Feature Representation for Temporal Action Detection-
[pdf]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Zixuan and Wang, Dongqi and Zhao, Xu}, title = {Movement Enhancement toward Multi-Scale Video Feature Representation for Temporal Action Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13555-13564} }
Collaborative Propagation on Multiple Instance Graphs for 3D Instance Segmentation with Single-point Supervision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2023_ICCV, author = {Dong, Shichao and Li, Ruibo and Wei, Jiacheng and Liu, Fayao and Lin, Guosheng}, title = {Collaborative Propagation on Multiple Instance Graphs for 3D Instance Segmentation with Single-point Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16665-16674} }
PPR: Physically Plausible Reconstruction from Monocular Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Gengshan and Yang, Shuo and Zhang, John Z. and Manchester, Zachary and Ramanan, Deva}, title = {PPR: Physically Plausible Reconstruction from Monocular Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3914-3924} }
Single Image Deblurring with Row-dependent Blur Magnitude-
[pdf]
[supp]
[bibtex]@InProceedings{Ji_2023_ICCV, author = {Ji, Xiang and Wang, Zhixiang and Satoh, Shin'ichi and Zheng, Yinqiang}, title = {Single Image Deblurring with Row-dependent Blur Magnitude}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12269-12280} }
Robust Heterogeneous Federated Learning under Data Corruption-
[pdf]
[supp]
[bibtex]@InProceedings{Fang_2023_ICCV, author = {Fang, Xiuwen and Ye, Mang and Yang, Xiyuan}, title = {Robust Heterogeneous Federated Learning under Data Corruption}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5020-5030} }
RMP-Loss: Regularizing Membrane Potential Distribution for Spiking Neural Networks-
[pdf]
[bibtex]@InProceedings{Guo_2023_ICCV, author = {Guo, Yufei and Liu, Xiaode and Chen, Yuanpei and Zhang, Liwen and Peng, Weihang and Zhang, Yuhan and Huang, Xuhui and Ma, Zhe}, title = {RMP-Loss: Regularizing Membrane Potential Distribution for Spiking Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17391-17401} }
Cyclic-Bootstrap Labeling for Weakly Supervised Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yin_2023_ICCV, author = {Yin, Yufei and Deng, Jiajun and Zhou, Wengang and Li, Li and Li, Houqiang}, title = {Cyclic-Bootstrap Labeling for Weakly Supervised Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7008-7018} }
Deep Active Contours for Real-time 6-DoF Object Tracking-
[pdf]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Long and Yan, Shen and Zhen, Jianan and Liu, Yu and Zhang, Maojun and Zhang, Guofeng and Zhou, Xiaowei}, title = {Deep Active Contours for Real-time 6-DoF Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14034-14044} }
Tangent Sampson Error: Fast Approximate Two-view Reprojection Error for Central Camera Models-
[pdf]
[supp]
[bibtex]@InProceedings{Terekhov_2023_ICCV, author = {Terekhov, Mikhail and Larsson, Viktor}, title = {Tangent Sampson Error: Fast Approximate Two-view Reprojection Error for Central Camera Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3370-3378} }
Multi-grained Temporal Prototype Learning for Few-shot Video Object Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Nian and Nan, Kepan and Zhao, Wangbo and Liu, Yuanwei and Yao, Xiwen and Khan, Salman and Cholakkal, Hisham and Anwer, Rao Muhammad and Han, Junwei and Khan, Fahad Shahbaz}, title = {Multi-grained Temporal Prototype Learning for Few-shot Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18862-18871} }
Improving 3D Imaging with Pre-Trained Perpendicular 2D Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Suhyeon and Chung, Hyungjin and Park, Minyoung and Park, Jonghyuk and Ryu, Wi-Sun and Ye, Jong Chul}, title = {Improving 3D Imaging with Pre-Trained Perpendicular 2D Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10710-10720} }
Time Does Tell: Self-Supervised Time-Tuning of Dense Image Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Salehi_2023_ICCV, author = {Salehi, Mohammadreza and Gavves, Efstratios and Snoek, Cees G.M. and Asano, Yuki M.}, title = {Time Does Tell: Self-Supervised Time-Tuning of Dense Image Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16536-16547} }
CroCo v2: Improved Cross-view Completion Pre-training for Stereo Matching and Optical Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Weinzaepfel_2023_ICCV, author = {Weinzaepfel, Philippe and Lucas, Thomas and Leroy, Vincent and Cabon, Yohann and Arora, Vaibhav and Br\'egier, Romain and Csurka, Gabriela and Antsfeld, Leonid and Chidlovskii, Boris and Revaud, Jerome}, title = {CroCo v2: Improved Cross-view Completion Pre-training for Stereo Matching and Optical Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17969-17980} }
ExBluRF: Efficient Radiance Fields for Extreme Motion Blurred Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2023_ICCV, author = {Lee, Dongwoo and Oh, Jeongtaek and Rim, Jaesung and Cho, Sunghyun and Lee, Kyoung Mu}, title = {ExBluRF: Efficient Radiance Fields for Extreme Motion Blurred Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17639-17648} }
MPCViT: Searching for Accurate and Efficient MPC-Friendly Vision Transformer with Heterogeneous Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zeng_2023_ICCV, author = {Zeng, Wenxuan and Li, Meng and Xiong, Wenjie and Tong, Tong and Lu, Wen-jie and Tan, Jin and Wang, Runsheng and Huang, Ru}, title = {MPCViT: Searching for Accurate and Efficient MPC-Friendly Vision Transformer with Heterogeneous Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5052-5063} }
Online Class Incremental Learning on Stochastic Blurry Task Boundary via Mask and Visual Prompt Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Moon_2023_ICCV, author = {Moon, Jun-Yeong and Park, Keon-Hee and Kim, Jung Uk and Park, Gyeong-Moon}, title = {Online Class Incremental Learning on Stochastic Blurry Task Boundary via Mask and Visual Prompt Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11731-11741} }
Text2Video-Zero: Text-to-Image Diffusion Models are Zero-Shot Video Generators-
[pdf]
[supp]
[bibtex]@InProceedings{Khachatryan_2023_ICCV, author = {Khachatryan, Levon and Movsisyan, Andranik and Tadevosyan, Vahram and Henschel, Roberto and Wang, Zhangyang and Navasardyan, Shant and Shi, Humphrey}, title = {Text2Video-Zero: Text-to-Image Diffusion Models are Zero-Shot Video Generators}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15954-15964} }
Masked Spiking Transformer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ziqing and Fang, Yuetong and Cao, Jiahang and Zhang, Qiang and Wang, Zhongrui and Xu, Renjing}, title = {Masked Spiking Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1761-1771} }
Exploring Video Quality Assessment on User Generated Contents from Aesthetic and Technical Perspectives-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Haoning and Zhang, Erli and Liao, Liang and Chen, Chaofeng and Hou, Jingwen and Wang, Annan and Sun, Wenxiu and Yan, Qiong and Lin, Weisi}, title = {Exploring Video Quality Assessment on User Generated Contents from Aesthetic and Technical Perspectives}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20144-20154} }
Distributed Bundle Adjustment with Block-Based Sparse Matrix Compression for Super Large Scale Datasets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Maoteng and Chen, Nengcheng and Zhu, Junfeng and Zeng, Xiaoru and Qiu, Huanbin and Jiang, Yuyao and Lu, Xingyue and Qu, Hao}, title = {Distributed Bundle Adjustment with Block-Based Sparse Matrix Compression for Super Large Scale Datasets}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18152-18162} }
SCANet: Scene Complexity Aware Network for Weakly-Supervised Video Moment Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2023_ICCV, author = {Yoon, Sunjae and Koo, Gwanhyeong and Kim, Dahyun and Yoo, Chang D.}, title = {SCANet: Scene Complexity Aware Network for Weakly-Supervised Video Moment Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13576-13586} }
Neural Interactive Keypoint Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Jie and Zeng, Ailing and Li, Feng and Liu, Shilong and Zhang, Ruimao and Zhang, Lei}, title = {Neural Interactive Keypoint Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15122-15132} }
Joint Implicit Neural Representation for High-fidelity and Compact Vector Fonts-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Chia-Hao and Liu, Ying-Tian and Zhang, Zhifei and Guo, Yuan-Chen and Zhang, Song-Hai}, title = {Joint Implicit Neural Representation for High-fidelity and Compact Vector Fonts}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5538-5548} }
Spurious Features Everywhere - Large-Scale Detection of Harmful Spurious Features in ImageNet-
[pdf]
[supp]
[bibtex]@InProceedings{Neuhaus_2023_ICCV, author = {Neuhaus, Yannic and Augustin, Maximilian and Boreiko, Valentyn and Hein, Matthias}, title = {Spurious Features Everywhere - Large-Scale Detection of Harmful Spurious Features in ImageNet}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20235-20246} }
Knowledge-Aware Prompt Tuning for Generalizable Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kan_2023_ICCV, author = {Kan, Baoshuo and Wang, Teng and Lu, Wenpeng and Zhen, Xiantong and Guan, Weili and Zheng, Feng}, title = {Knowledge-Aware Prompt Tuning for Generalizable Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15670-15680} }
Delicate Textured Mesh Recovery from NeRF via Adaptive Surface Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Jiaxiang and Zhou, Hang and Chen, Xiaokang and Hu, Tianshu and Ding, Errui and Wang, Jingdong and Zeng, Gang}, title = {Delicate Textured Mesh Recovery from NeRF via Adaptive Surface Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17739-17749} }
Leveraging Inpainting for Single-Image Shadow Removal-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xiaoguang and Guo, Qing and Abdelfattah, Rabab and Lin, Di and Feng, Wei and Tsang, Ivor and Wang, Song}, title = {Leveraging Inpainting for Single-Image Shadow Removal}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13055-13064} }
Neural Characteristic Function Learning for Conditional Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Shengxi and Zhang, Jialu and Li, Yifei and Xu, Mai and Deng, Xin and Li, Li}, title = {Neural Characteristic Function Learning for Conditional Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7204-7214} }
Accurate 3D Face Reconstruction with Facial Component Tokens-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Tianke and Chu, Xuangeng and Liu, Yunfei and Lin, Lijian and Yang, Zhendong and Xu, Zhengzhuo and Cao, Chengkun and Yu, Fei and Zhou, Changyin and Yuan, Chun and Li, Yu}, title = {Accurate 3D Face Reconstruction with Facial Component Tokens}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9033-9042} }
Holistic Label Correction for Noisy Multi-Label Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Xiaobo and Deng, Jiankang and Bao, Wei and Du, Yuxuan and Han, Bo and Shan, Shiguang and Liu, Tongliang}, title = {Holistic Label Correction for Noisy Multi-Label Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1483-1493} }
Probabilistic Precision and Recall Towards Reliable Evaluation of Generative Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV, author = {Park, Dogyun and Kim, Suhyun}, title = {Probabilistic Precision and Recall Towards Reliable Evaluation of Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20099-20109} }
Deep Multitask Learning with Progressive Parameter Sharing-
[pdf]
[supp]
[bibtex]@InProceedings{Shi_2023_ICCV, author = {Shi, Haosen and Ren, Shen and Zhang, Tianwei and Pan, Sinno Jialin}, title = {Deep Multitask Learning with Progressive Parameter Sharing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19924-19935} }
Personalized Semantics Excitation for Federated Image Classification-
[pdf]
[bibtex]@InProceedings{Xia_2023_ICCV, author = {Xia, Haifeng and Li, Kai and Ding, Zhengming}, title = {Personalized Semantics Excitation for Federated Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19301-19310} }
Unified Data-Free Compression: Pruning and Quantization without Fine-Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2023_ICCV, author = {Bai, Shipeng and Chen, Jun and Shen, Xintian and Qian, Yixuan and Liu, Yong}, title = {Unified Data-Free Compression: Pruning and Quantization without Fine-Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5876-5885} }
SurroundOcc: Multi-camera 3D Occupancy Prediction for Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wei_2023_ICCV, author = {Wei, Yi and Zhao, Linqing and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen}, title = {SurroundOcc: Multi-camera 3D Occupancy Prediction for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21729-21740} }
Temporal Enhanced Training of Multi-view 3D Object Detector via Historical Object Prediction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zong_2023_ICCV, author = {Zong, Zhuofan and Jiang, Dongzhi and Song, Guanglu and Xue, Zeyue and Su, Jingyong and Li, Hongsheng and Liu, Yu}, title = {Temporal Enhanced Training of Multi-view 3D Object Detector via Historical Object Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3781-3790} }
PARIS: Part-level Reconstruction and Motion Analysis for Articulated Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2023_ICCV, author = {Liu, Jiayi and Mahdavi-Amiri, Ali and Savva, Manolis}, title = {PARIS: Part-level Reconstruction and Motion Analysis for Articulated Objects}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {352-363} }
OnlineRefer: A Simple Online Baseline for Referring Video Object Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Dongming and Wang, Tiancai and Zhang, Yuang and Zhang, Xiangyu and Shen, Jianbing}, title = {OnlineRefer: A Simple Online Baseline for Referring Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2761-2770} }
Implicit Neural Representation for Cooperative Low-light Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2023_ICCV, author = {Yang, Shuzhou and Ding, Moxuan and Wu, Yanmin and Li, Zihan and Zhang, Jian}, title = {Implicit Neural Representation for Cooperative Low-light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12918-12927} }
Environment Agnostic Representation for Visual Reinforcement Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2023_ICCV, author = {Choi, Hyesong and Lee, Hunsang and Jeong, Seongwon and Min, Dongbo}, title = {Environment Agnostic Representation for Visual Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {263-273} }
Deep Multiview Clustering by Contrasting Cluster Assignments-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Jie and Mao, Hua and Woo, Wai Lok and Peng, Xi}, title = {Deep Multiview Clustering by Contrasting Cluster Assignments}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16752-16761} }
Mimic3D: Thriving 3D-Aware GANs via 3D-to-2D Imitation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Xingyu and Deng, Yu and Wang, Baoyuan}, title = {Mimic3D: Thriving 3D-Aware GANs via 3D-to-2D Imitation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2338-2348} }
Look at the Neighbor: Distortion-aware Unsupervised Domain Adaptation for Panoramic Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Xu and Pan, Tianbo and Luo, Yunhao and Wang, Lin}, title = {Look at the Neighbor: Distortion-aware Unsupervised Domain Adaptation for Panoramic Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18687-18698} }
Rethinking Safe Semi-supervised Learning: Transferring the Open-set Problem to A Close-set One-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Qiankun and Gao, Jiyao and Zhan, Bo and Guo, Yunpeng and Zhou, Jiliu and Wang, Yan}, title = {Rethinking Safe Semi-supervised Learning: Transferring the Open-set Problem to A Close-set One}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16370-16379} }
Does Physical Adversarial Example Really Matter to Autonomous Driving? Towards System-Level Effect of Adversarial Object Evasion Attack-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Ningfei and Luo, Yunpeng and Sato, Takami and Xu, Kaidi and Chen, Qi Alfred}, title = {Does Physical Adversarial Example Really Matter to Autonomous Driving? Towards System-Level Effect of Adversarial Object Evasion Attack}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4412-4423} }
ReLeaPS : Reinforcement Learning-based Illumination Planning for Generalized Photometric Stereo-
[pdf]
[supp]
[bibtex]@InProceedings{Chan_2023_ICCV, author = {Chan, Jun Hoong and Yu, Bohan and Guo, Heng and Ren, Jieji and Lu, Zongqing and Shi, Boxin}, title = {ReLeaPS : Reinforcement Learning-based Illumination Planning for Generalized Photometric Stereo}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9167-9175} }
Learning Foresightful Dense Visual Affordance for Deformable Object Manipulation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Ruihai and Ning, Chuanruo and Dong, Hao}, title = {Learning Foresightful Dense Visual Affordance for Deformable Object Manipulation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10947-10956} }
Generalizable Neural Fields as Partially Observed Neural Processes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gu_2023_ICCV, author = {Gu, Jeffrey and Wang, Kuan-Chieh and Yeung, Serena}, title = {Generalizable Neural Fields as Partially Observed Neural Processes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5330-5339} }
CiteTracker: Correlating Image and Text for Visual Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Xin and Huang, Yuqing and He, Zhenyu and Wang, Yaowei and Lu, Huchuan and Yang, Ming-Hsuan}, title = {CiteTracker: Correlating Image and Text for Visual Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9974-9983} }
Adding Conditional Control to Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Lvmin and Rao, Anyi and Agrawala, Maneesh}, title = {Adding Conditional Control to Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3836-3847} }
3D Instance Segmentation via Enhanced Spatial and Semantic Supervision-
[pdf]
[bibtex]@InProceedings{Al_Khatib_2023_ICCV, author = {Al Khatib, Salwa and El Amine Boudjoghra, Mohamed and Lahoud, Jean and Khan, Fahad Shahbaz}, title = {3D Instance Segmentation via Enhanced Spatial and Semantic Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {541-550} }
Unleashing Text-to-Image Diffusion Models for Visual Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Wenliang and Rao, Yongming and Liu, Zuyan and Liu, Benlin and Zhou, Jie and Lu, Jiwen}, title = {Unleashing Text-to-Image Diffusion Models for Visual Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5729-5739} }
Iterative Superquadric Recomposition of 3D Objects from Multiple Views-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Alaniz_2023_ICCV, author = {Alaniz, Stephan and Mancini, Massimiliano and Akata, Zeynep}, title = {Iterative Superquadric Recomposition of 3D Objects from Multiple Views}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18013-18023} }
PHRIT: Parametric Hand Representation with Implicit Template-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2023_ICCV, author = {Huang, Zhisheng and Chen, Yujin and Kang, Di and Zhang, Jinlu and Tu, Zhigang}, title = {PHRIT: Parametric Hand Representation with Implicit Template}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14974-14984} }
BEVPlace: Learning LiDAR-based Place Recognition using Bird's Eye View Images-
[pdf]
[supp]
[bibtex]@InProceedings{Luo_2023_ICCV, author = {Luo, Lun and Zheng, Shuhang and Li, Yixuan and Fan, Yongzhi and Yu, Beinan and Cao, Si-Yuan and Li, Junwei and Shen, Hui-Liang}, title = {BEVPlace: Learning LiDAR-based Place Recognition using Bird's Eye View Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8700-8709} }
Transferable Adversarial Attack for Both Vision Transformers and Convolutional Networks via Momentum Integrated Gradients-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2023_ICCV, author = {Ma, Wenshuo and Li, Yidong and Jia, Xiaofeng and Xu, Wei}, title = {Transferable Adversarial Attack for Both Vision Transformers and Convolutional Networks via Momentum Integrated Gradients}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4630-4639} }
TrajPAC: Towards Robustness Verification of Pedestrian Trajectory Prediction Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Liang and Xu, Nathaniel and Yang, Pengfei and Jin, Gaojie and Huang, Cheng-Chao and Zhang, Lijun}, title = {TrajPAC: Towards Robustness Verification of Pedestrian Trajectory Prediction Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8327-8339} }
Adaptive Image Anonymization in the Context of Image Classification with Neural Networks-
[pdf]
[bibtex]@InProceedings{Shvai_2023_ICCV, author = {Shvai, Nadiya and Carmona, Arcadi Llanza and Nakib, Amir}, title = {Adaptive Image Anonymization in the Context of Image Classification with Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5074-5083} }
SiLK: Simple Learned Keypoints-
[pdf]
[supp]
[bibtex]@InProceedings{Gleize_2023_ICCV, author = {Gleize, Pierre and Wang, Weiyao and Feiszli, Matt}, title = {SiLK: Simple Learned Keypoints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22499-22508} }
EfficientViT: Lightweight Multi-Scale Attention for High-Resolution Dense Prediction-
[pdf]
[bibtex]@InProceedings{Cai_2023_ICCV, author = {Cai, Han and Li, Junyan and Hu, Muyan and Gan, Chuang and Han, Song}, title = {EfficientViT: Lightweight Multi-Scale Attention for High-Resolution Dense Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17302-17313} }
Efficient Neural Supersampling on a Novel Gaming Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mercier_2023_ICCV, author = {Mercier, Antoine and Erasmus, Ruan and Savani, Yashesh and Dhingra, Manik and Porikli, Fatih and Berger, Guillaume}, title = {Efficient Neural Supersampling on a Novel Gaming Dataset}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {296-306} }
Rapid Adaptation in Online Continual Learning: Are We Evaluating It Right?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Al_Kader_Hammoud_2023_ICCV, author = {Al Kader Hammoud, Hasan Abed and Prabhu, Ameya and Lim, Ser-Nam and Torr, Philip H.S. and Bibi, Adel and Ghanem, Bernard}, title = {Rapid Adaptation in Online Continual Learning: Are We Evaluating It Right?}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18852-18861} }
Label-Efficient Online Continual Object Detection in Streaming Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2023_ICCV, author = {Wu, Jay Zhangjie and Zhang, David Junhao and Hsu, Wynne and Zhang, Mengmi and Shou, Mike Zheng}, title = {Label-Efficient Online Continual Object Detection in Streaming Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19246-19255} }
Learning Point Cloud Completion without Complete Point Clouds: A Pose-Aware Approach-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2023_ICCV, author = {Kim, Jihun and Kweon, Hyeokjun and Yang, Yunseo and Yoon, Kuk-Jin}, title = {Learning Point Cloud Completion without Complete Point Clouds: A Pose-Aware Approach}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14203-14213} }
Frequency Guidance Matters in Few-Shot Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Cheng_2023_ICCV, author = {Cheng, Hao and Yang, Siyuan and Zhou, Joey Tianyi and Guo, Lanqing and Wen, Bihan}, title = {Frequency Guidance Matters in Few-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11814-11824} }
Walking Your LiDOG: A Journey Through Multiple Domains for LiDAR Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Saltori_2023_ICCV, author = {Saltori, Cristiano and Osep, Aljosa and Ricci, Elisa and Leal-Taix{\'e}, Laura}, title = {Walking Your LiDOG: A Journey Through Multiple Domains for LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {196-206} }
Diverse Cotraining Makes Strong Semi-Supervised Segmentor-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Yijiang and Wang, Xinjiang and Yang, Lihe and Feng, Litong and Zhang, Wayne and Gao, Ying}, title = {Diverse Cotraining Makes Strong Semi-Supervised Segmentor}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16055-16067} }
Spherical Space Feature Decomposition for Guided Depth Map Super-Resolution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Zixiang and Zhang, Jiangshe and Gu, Xiang and Tan, Chengli and Xu, Shuang and Zhang, Yulun and Timofte, Radu and Van Gool, Luc}, title = {Spherical Space Feature Decomposition for Guided Depth Map Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12547-12558} }
Tiled Multiplane Images for Practical 3D Photography-
[pdf]
[arXiv]
[bibtex]@InProceedings{Khan_2023_ICCV, author = {Khan, Numair and Xiao, Lei and Lanman, Douglas}, title = {Tiled Multiplane Images for Practical 3D Photography}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10454-10464} }
VQA-GNN: Reasoning with Multimodal Knowledge via Graph Neural Networks for Visual Question Answering-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2023_ICCV, author = {Wang, Yanan and Yasunaga, Michihiro and Ren, Hongyu and Wada, Shinya and Leskovec, Jure}, title = {VQA-GNN: Reasoning with Multimodal Knowledge via Graph Neural Networks for Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21582-21592} }
Unmasked Teacher: Towards Training-Efficient Video Foundation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Kunchang and Wang, Yali and Li, Yizhuo and Wang, Yi and He, Yinan and Wang, Limin and Qiao, Yu}, title = {Unmasked Teacher: Towards Training-Efficient Video Foundation Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19948-19960} }
Explore and Tell: Embodied Visual Captioning in 3D Environments-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Anwen and Chen, Shizhe and Zhang, Liang and Jin, Qin}, title = {Explore and Tell: Embodied Visual Captioning in 3D Environments}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2482-2491} }
FastViT: A Fast Hybrid Vision Transformer Using Structural Reparameterization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vasu_2023_ICCV, author = {Vasu, Pavan Kumar Anasosalu and Gabriel, James and Zhu, Jeff and Tuzel, Oncel and Ranjan, Anurag}, title = {FastViT: A Fast Hybrid Vision Transformer Using Structural Reparameterization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5785-5795} }
OFVL-MS: Once for Visual Localization across Multiple Indoor Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Tao and Dai, Kun and Lu, Siyi and Wang, Ke and Jiang, Zhiqiang and Gao, Jinghan and Liu, Dedong and Xu, Jie and Zhao, Lijun and Li, Ruifeng}, title = {OFVL-MS: Once for Visual Localization across Multiple Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5516-5526} }
HTML: Hybrid Temporal-scale Multimodal Learning Framework for Referring Video Object Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2023_ICCV, author = {Han, Mingfei and Wang, Yali and Li, Zhihui and Yao, Lina and Chang, Xiaojun and Qiao, Yu}, title = {HTML: Hybrid Temporal-scale Multimodal Learning Framework for Referring Video Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13414-13423} }
SQAD: Automatic Smartphone Camera Quality Assessment and Benchmarking-
[pdf]
[supp]
[bibtex]@InProceedings{Fang_2023_ICCV, author = {Fang, Zilin and Ignatov, Andrey and Zamfir, Eduard and Timofte, Radu}, title = {SQAD: Automatic Smartphone Camera Quality Assessment and Benchmarking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20532-20542} }
PointDC: Unsupervised Semantic Segmentation of 3D Point Clouds via Cross-Modal Distillation and Super-Voxel Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Zisheng and Xu, Hongbin and Chen, Weitao and Zhou, Zhipeng and Xiao, Haihong and Sun, Baigui and Xie, Xuansong and Kang, Wenxiong}, title = {PointDC: Unsupervised Semantic Segmentation of 3D Point Clouds via Cross-Modal Distillation and Super-Voxel Clustering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14290-14299} }
MV-Map: Offboard HD-Map Generation with Multi-view Consistency-
[pdf]
[supp]
[bibtex]@InProceedings{Xie_2023_ICCV, author = {Xie, Ziyang and Pang, Ziqi and Wang, Yu-Xiong}, title = {MV-Map: Offboard HD-Map Generation with Multi-view Consistency}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8658-8668} }
Multi-view Self-supervised Disentanglement for General Image Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV, author = {Chen, Hao and Qu, Chenyuan and Zhang, Yu and Chen, Chen and Jiao, Jianbo}, title = {Multi-view Self-supervised Disentanglement for General Image Denoising}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12281-12291} }
Inter-Realization Channels: Unsupervised Anomaly Detection Beyond One-Class Classification-
[pdf]
[supp]
[bibtex]@InProceedings{McIntosh_2023_ICCV, author = {McIntosh, Declan and Albu, Alexandra Branzan}, title = {Inter-Realization Channels: Unsupervised Anomaly Detection Beyond One-Class Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6285-6295} }
Multi-Event Video-Text Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Gengyuan and Ren, Jisen and Gu, Jindong and Tresp, Volker}, title = {Multi-Event Video-Text Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22113-22123} }
SHERF: Generalizable Human NeRF from a Single Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2023_ICCV, author = {Hu, Shoukang and Hong, Fangzhou and Pan, Liang and Mei, Haiyi and Yang, Lei and Liu, Ziwei}, title = {SHERF: Generalizable Human NeRF from a Single Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9352-9364} }
MVPSNet: Fast Generalizable Multi-view Photometric Stereo-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Dongxu and Lichy, Daniel and Perrin, Pierre-Nicolas and Frahm, Jan-Michael and Sengupta, Soumyadip}, title = {MVPSNet: Fast Generalizable Multi-view Photometric Stereo}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12525-12536} }
High Quality Entity Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qi_2023_ICCV, author = {Qi, Lu and Kuen, Jason and Shen, Tiancheng and Gu, Jiuxiang and Li, Wenbo and Guo, Weidong and Jia, Jiaya and Lin, Zhe and Yang, Ming-Hsuan}, title = {High Quality Entity Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4047-4056} }
CoTDet: Affordance Knowledge Prompting for Task Driven Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tang_2023_ICCV, author = {Tang, Jiajin and Zheng, Ge and Yu, Jingyi and Yang, Sibei}, title = {CoTDet: Affordance Knowledge Prompting for Task Driven Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3068-3078} }
You Never Get a Second Chance To Make a Good First Impression: Seeding Active Learning for 3D Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Samet_2023_ICCV, author = {Samet, Nermin and Sim{\'e}oni, Oriane and Puy, Gilles and Ponimatkin, Georgy and Marlet, Renaud and Lepetit, Vincent}, title = {You Never Get a Second Chance To Make a Good First Impression: Seeding Active Learning for 3D Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18445-18457} }
Scalable Multi-Temporal Remote Sensing Change Data Generation via Simulating Stochastic Change Process-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2023_ICCV, author = {Zheng, Zhuo and Tian, Shiqi and Ma, Ailong and Zhang, Liangpei and Zhong, Yanfei}, title = {Scalable Multi-Temporal Remote Sensing Change Data Generation via Simulating Stochastic Change Process}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21818-21827} }
Human from Blur: Human Pose Tracking from Blurry Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2023_ICCV, author = {Zhao, Yiming and Rozumnyi, Denys and Song, Jie and Hilliges, Otmar and Pollefeys, Marc and Oswald, Martin R.}, title = {Human from Blur: Human Pose Tracking from Blurry Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14905-14915} }
NerfAcc: Efficient Sampling Accelerates NeRFs-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV, author = {Li, Ruilong and Gao, Hang and Tancik, Matthew and Kanazawa, Angjoo}, title = {NerfAcc: Efficient Sampling Accelerates NeRFs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18537-18546} }
A2Q: Accumulator-Aware Quantization with Guaranteed Overflow Avoidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Colbert_2023_ICCV, author = {Colbert, Ian and Pappalardo, Alessandro and Petri-Koenig, Jakoba}, title = {A2Q: Accumulator-Aware Quantization with Guaranteed Overflow Avoidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16989-16998} }
Uni-3D: A Universal Model for Panoptic 3D Scene Reconstruction-
[pdf]
[bibtex]@InProceedings{Zhang_2023_ICCV, author = {Zhang, Xiang and Chen, Zeyuan and Wei, Fangyin and Tu, Zhuowen}, title = {Uni-3D: A Universal Model for Panoptic 3D Scene Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9256-9266} }
ARNOLD: A Benchmark for Language-Grounded Task Learning with Continuous States in Realistic 3D Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gong_2023_ICCV, author = {Gong, Ran and Huang, Jiangyong and Zhao, Yizhou and Geng, Haoran and Gao, Xiaofeng and Wu, Qingyang and Ai, Wensi and Zhou, Ziheng and Terzopoulos, Demetri and Zhu, Song-Chun and Jia, Baoxiong and Huang, Siyuan}, title = {ARNOLD: A Benchmark for Language-Grounded Task Learning with Continuous States in Realistic 3D Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20483-20495} }
Full-Body Articulated Human-Object Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Nan and Liu, Tengyu and Cao, Zhexuan and Cui, Jieming and Zhang, Zhiyuan and Chen, Yixin and Wang, He and Zhu, Yixin and Huang, Siyuan},
  title     = {Full-Body Articulated Human-Object Interaction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9365--9376},
}
FeatureNeRF: Learning Generalizable NeRFs by Distilling Foundation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Jianglong and Wang, Naiyan and Wang, Xiaolong},
  title     = {{FeatureNeRF}: Learning Generalizable {NeRFs} by Distilling Foundation Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8962--8973},
}
SRFormer: Permuted Self-Attention for Single Image Super-Resolution-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yupeng and Li, Zhen and Guo, Chun-Le and Bai, Song and Cheng, Ming-Ming and Hou, Qibin},
  title     = {{SRFormer}: Permuted Self-Attention for Single Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12780--12791},
}
Deep Homography Mixture for Single Image Rolling Shutter Correction-
[pdf]
[bibtex]@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Weilong and Tan, Robby T. and Zeng, Bing and Liu, Shuaicheng},
  title     = {Deep Homography Mixture for Single Image Rolling Shutter Correction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9868--9877},
}
Audio-Visual Glance Network for Efficient Video Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nugroho_2023_ICCV,
  author    = {Nugroho, Muhammad Adi and Woo, Sangmin and Lee, Sumin and Kim, Changick},
  title     = {Audio-Visual Glance Network for Efficient Video Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10150--10159},
}
CLNeRF: Continual Learning Meets NeRF-
[pdf]
[supp]
[bibtex]@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Zhipeng and M{\"u}ller, Matthias},
  title     = {{CLNeRF}: Continual Learning Meets {NeRF}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23185--23194},
}
Rendering Humans from Object-Occluded Monocular Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Tiange and Sun, Adam and Wu, Jiajun and Adeli, Ehsan and Fei-Fei, Li},
  title     = {Rendering Humans from Object-Occluded Monocular Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3239--3250},
}
CrossMatch: Source-Free Domain Adaptive Semantic Segmentation via Cross-Modal Consistency Training-
[pdf]
[bibtex]@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Yifang and Hu, Wenmiao and Liu, Zhenguang and Wang, Guanfeng and Xiang, Shili and Zimmermann, Roger},
  title     = {{CrossMatch}: Source-Free Domain Adaptive Semantic Segmentation via Cross-Modal Consistency Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21786--21796},
}
Out-of-Distribution Detection for Monocular Depth Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hornauer_2023_ICCV,
  author    = {Hornauer, Julia and Holzbock, Adrian and Belagiannis, Vasileios},
  title     = {Out-of-Distribution Detection for Monocular Depth Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1911--1921},
}
STEPs: Self-Supervised Key Step Extraction and Localization from Unlabeled Procedural Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shah_2023_ICCV,
  author    = {Shah, Anshul and Lundell, Benjamin and Sawhney, Harpreet and Chellappa, Rama},
  title     = {{STEPs}: Self-Supervised Key Step Extraction and Localization from Unlabeled Procedural Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10375--10387},
}
Improving Equivariance in State-of-the-Art Supervised Depth and Normal Predictors-
[pdf]
[supp]
[bibtex]@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Yuanyi and Bhattad, Anand and Wang, Yu-Xiong and Forsyth, David},
  title     = {Improving Equivariance in State-of-the-Art Supervised Depth and Normal Predictors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21775--21785},
}
Towards Robust and Smooth 3D Multi-Person Pose Estimation from Monocular Videos in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2023_ICCV,
  author    = {Park, Sungchan and You, Eunyi and Lee, Inhoe and Lee, Joonseok},
  title     = {Towards Robust and Smooth {3D} Multi-Person Pose Estimation from Monocular Videos in the Wild},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14772--14782},
}
Reducing Training Time in Cross-Silo Federated Learning Using Multigraph Topology-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Do_2023_ICCV,
  author    = {Do, Tuong and Nguyen, Binh X. and Pham, Vuong and Tran, Toan and Tjiputra, Erman and Tran, Quang D. and Nguyen, Anh},
  title     = {Reducing Training Time in Cross-Silo Federated Learning Using Multigraph Topology},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19409--19419},
}
Counting Crowds in Bad Weather-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhi-Kai and Chen, Wei-Ting and Chiang, Yuan-Chun and Kuo, Sy-Yen and Yang, Ming-Hsuan},
  title     = {Counting Crowds in Bad Weather},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23308--23319},
}
FreeDoM: Training-Free Energy-Guided Conditional Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Jiwen and Wang, Yinhuai and Zhao, Chen and Ghanem, Bernard and Zhang, Jian},
  title     = {{FreeDoM}: Training-Free Energy-Guided Conditional Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23174--23184},
}
UniT3D: A Unified Transformer for 3D Dense Captioning and Visual Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhenyu and Hu, Ronghang and Chen, Xinlei and Nie{\ss}ner, Matthias and Chang, Angel X.},
  title     = {{UniT3D}: A Unified Transformer for {3D} Dense Captioning and Visual Grounding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18109--18119},
}
SKiT: a Fast Key Information Video Transformer for Online Surgical Phase Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yang and Huo, Jiayu and Peng, Jingjing and Sparks, Rachel and Dasgupta, Prokar and Granados, Alejandro and Ourselin, Sebastien},
  title     = {{SKiT}: a Fast Key Information Video Transformer for Online Surgical Phase Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21074--21084},
}
Clustering based Point Cloud Representation Learning for 3D Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Tuo and Wang, Wenguan and Wang, Xiaohan and Yang, Yi and Zheng, Qinghua},
  title     = {Clustering based Point Cloud Representation Learning for {3D} Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8283--8294},
}
Automatic Network Pruning via Hilbert-Schmidt Independence Criterion Lasso under Information Bottleneck Principle-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Song and Zhang, Lei and Zheng, Xiawu and Wang, Yan and Li, Yuchao and Chao, Fei and Wu, Chenglin and Zhang, Shengchuan and Ji, Rongrong},
  title     = {Automatic Network Pruning via {Hilbert-Schmidt} Independence Criterion Lasso under Information Bottleneck Principle},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17458--17469},
}
Forecast-MAE: Self-supervised Pre-training for Motion Forecasting with Masked Autoencoders-
[pdf]
[supp]
[bibtex]@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Jie and Mei, Xiaodong and Liu, Ming},
  title     = {{Forecast-MAE}: Self-supervised Pre-training for Motion Forecasting with Masked Autoencoders},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8679--8689},
}
Efficient Transformer-based 3D Object Detection with Dynamic Token Halting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Mao and Meyer, Gregory P. and Chai, Yuning and Liu, Qiang},
  title     = {Efficient Transformer-based {3D} Object Detection with Dynamic Token Halting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8438--8450},
}
Neglected Free Lunch - Learning Image Classifiers Using Annotation Byproducts-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2023_ICCV,
  author    = {Han, Dongyoon and Choe, Junsuk and Chun, Seonghyeok and Chung, John Joon Young and Chang, Minsuk and Yun, Sangdoo and Song, Jean Y. and Oh, Seong Joon},
  title     = {Neglected Free Lunch -- Learning Image Classifiers Using Annotation Byproducts},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20200--20212},
}
Rethinking the Role of Pre-Trained Networks in Source-Free Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Wenyu and Shen, Li and Foo, Chuan-Sheng},
  title     = {Rethinking the Role of Pre-Trained Networks in Source-Free Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18841--18851},
}
RLIPv2: Fast Scaling of Relational Language-Image Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Hangjie and Zhang, Shiwei and Wang, Xiang and Albanie, Samuel and Pan, Yining and Feng, Tao and Jiang, Jianwen and Ni, Dong and Zhang, Yingya and Zhao, Deli},
  title     = {{RLIPv2}: Fast Scaling of Relational Language-Image Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21649--21661},
}
TransFace: Calibrating Transformer Training for Face Recognition from a Data-Centric Perspective-
[pdf]
[arXiv]
[bibtex]@InProceedings{Dan_2023_ICCV,
  author    = {Dan, Jun and Liu, Yang and Xie, Haoyu and Deng, Jiankang and Xie, Haoran and Xie, Xuansong and Sun, Baigui},
  title     = {{TransFace}: Calibrating Transformer Training for Face Recognition from a Data-Centric Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20642--20653},
}
LLM-Planner: Few-Shot Grounded Planning for Embodied Agents with Large Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Song_2023_ICCV,
  author    = {Song, Chan Hee and Wu, Jiaman and Washington, Clayton and Sadler, Brian M. and Chao, Wei-Lun and Su, Yu},
  title     = {{LLM-Planner}: Few-Shot Grounded Planning for Embodied Agents with Large Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2998--3009},
}
Exploring Model Transferability through the Lens of Potential Energy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiaotong and Hu, Zixuan and Ge, Yixiao and Shan, Ying and Duan, Ling-Yu},
  title     = {Exploring Model Transferability through the Lens of Potential Energy},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5429--5438},
}
Video Task Decathlon: Unifying Image and Video Tasks in Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Thomas E. and Liu, Yifan and Van Gool, Luc and Yu, Fisher},
  title     = {Video Task Decathlon: Unifying Image and Video Tasks in Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8647--8657},
}
Aria Digital Twin: A New Benchmark Dataset for Egocentric 3D Machine Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Xiaqing and Charron, Nicholas and Yang, Yongqian and Peters, Scott and Whelan, Thomas and Kong, Chen and Parkhi, Omkar and Newcombe, Richard and Ren, Yuheng (Carl)},
  title     = {{Aria Digital Twin}: A New Benchmark Dataset for Egocentric {3D} Machine Perception},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20133--20143},
}
PreSTU: Pre-Training for Scene-Text Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kil_2023_ICCV,
  author    = {Kil, Jihyung and Changpinyo, Soravit and Chen, Xi and Hu, Hexiang and Goodman, Sebastian and Chao, Wei-Lun and Soricut, Radu},
  title     = {{PreSTU}: Pre-Training for Scene-Text Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15270--15280},
}
Back