ICCV 2023 Open Access Repository

Papers

Back
Towards Attack-tolerant Federated Learning via Critical Parameter Analysis: Sungwon Han,

Sungwon Park,

Fangzhao Wu,

Sundong Kim,

Bin Zhu,

Xing Xie,

Meeyoung Cha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Sungwon and Park, Sungwon and Wu, Fangzhao and Kim, Sundong and Zhu, Bin and Xie, Xing and Cha, Meeyoung},
  title     = {Towards Attack-tolerant Federated Learning via Critical Parameter Analysis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4999--5008}
}
Stochastic Segmentation with Conditional Categorical Diffusion Models: Lukas Zbinden,

Lars Doorenbos,

Theodoros Pissas,

Adrian Thomas Huber,

Raphael Sznitman,

Pablo Márquez-Neila; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zbinden_2023_ICCV,
  author    = {Zbinden, Lukas and Doorenbos, Lars and Pissas, Theodoros and Huber, Adrian Thomas and Sznitman, Raphael and M{\'a}rquez-Neila, Pablo},
  title     = {Stochastic Segmentation with Conditional Categorical Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1119--1129}
}
Diff-Retinex: Rethinking Low-light Image Enhancement with A Generative Diffusion Model: Xunpeng Yi,

Han Xu,

Hao Zhang,

Linfeng Tang,

Jiayi Ma; [pdf]
[bibtex]
@InProceedings{Yi_2023_ICCV,
  author    = {Yi, Xunpeng and Xu, Han and Zhang, Hao and Tang, Linfeng and Ma, Jiayi},
  title     = {{Diff-Retinex}: Rethinking Low-light Image Enhancement with A Generative Diffusion Model},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12302--12311}
}
Bird's-Eye-View Scene Graph for Vision-Language Navigation: Rui Liu,

Xiaohan Wang,

Wenguan Wang,

Yi Yang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Rui and Wang, Xiaohan and Wang, Wenguan and Yang, Yi},
  title     = {Bird's-Eye-View Scene Graph for Vision-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10968--10980}
}
PVT++: A Simple End-to-End Latency-Aware Visual Tracking Framework: Bowen Li,

Ziyuan Huang,

Junjie Ye,

Yiming Li,

Sebastian Scherer,

Hang Zhao,

Changhong Fu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Bowen and Huang, Ziyuan and Ye, Junjie and Li, Yiming and Scherer, Sebastian and Zhao, Hang and Fu, Changhong},
  title     = {{PVT++}: A Simple End-to-End Latency-Aware Visual Tracking Framework},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10006--10016}
}
A Dynamic Dual-Processing Object Detection Framework Inspired by the Brain's Recognition Mechanism: Minying Zhang,

Tianpeng Bu,

Lulu Hu; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Minying and Bu, Tianpeng and Hu, Lulu},
  title     = {A Dynamic Dual-Processing Object Detection Framework Inspired by the Brain's Recognition Mechanism},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6264--6274}
}
Hard No-Box Adversarial Attack on Skeleton-Based Human Action Recognition with Skeleton-Motion-Informed Gradient: Zhengzhi Lu,

He Wang,

Ziyi Chang,

Guoan Yang,

Hubert P. H. Shum; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Zhengzhi and Wang, He and Chang, Ziyi and Yang, Guoan and Shum, Hubert P. H.},
  title     = {Hard No-Box Adversarial Attack on Skeleton-Based Human Action Recognition with Skeleton-Motion-Informed Gradient},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4597--4606}
}
GameFormer: Game-theoretic Modeling and Learning of Transformer-based Interactive Prediction and Planning for Autonomous Driving: Zhiyu Huang,

Haochen Liu,

Chen Lv; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhiyu and Liu, Haochen and Lv, Chen},
  title     = {{GameFormer}: Game-theoretic Modeling and Learning of Transformer-based Interactive Prediction and Planning for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3903--3913}
}
Towards Better Robustness against Common Corruptions for Unsupervised Domain Adaptation: Zhiqiang Gao,

Kaizhu Huang,

Rui Zhang,

Dawei Liu,

Jieming Ma; [pdf] [supp]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Zhiqiang and Huang, Kaizhu and Zhang, Rui and Liu, Dawei and Ma, Jieming},
  title     = {Towards Better Robustness against Common Corruptions for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18882--18893}
}
Learning in Imperfect Environment: Multi-Label Classification with Long-Tailed Distribution and Partial Labels: Wenqiao Zhang,

Changshuo Liu,

Lingze Zeng,

Bengchin Ooi,

Siliang Tang,

Yueting Zhuang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Wenqiao and Liu, Changshuo and Zeng, Lingze and Ooi, Bengchin and Tang, Siliang and Zhuang, Yueting},
  title     = {Learning in Imperfect Environment: Multi-Label Classification with Long-Tailed Distribution and Partial Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1423--1432}
}
Flexible Visual Recognition by Evidential Modeling of Confusion and Ignorance: Lei Fan,

Bo Liu,

Haoxiang Li,

Ying Wu,

Gang Hua; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Lei and Liu, Bo and Li, Haoxiang and Wu, Ying and Hua, Gang},
  title     = {Flexible Visual Recognition by Evidential Modeling of Confusion and Ignorance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1338--1347}
}
Texture Generation on 3D Meshes with Point-UV Diffusion: Xin Yu,

Peng Dai,

Wenbo Li,

Lan Ma,

Zhengzhe Liu,

Xiaojuan Qi; [pdf] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Xin and Dai, Peng and Li, Wenbo and Ma, Lan and Liu, Zhengzhe and Qi, Xiaojuan},
  title     = {Texture Generation on {3D} Meshes with {Point-UV} Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4206--4216}
}
Supervised Homography Learning with Realistic Dataset Generation: Hai Jiang,

Haipeng Li,

Songchen Han,

Haoqiang Fan,

Bing Zeng,

Shuaicheng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Hai and Li, Haipeng and Han, Songchen and Fan, Haoqiang and Zeng, Bing and Liu, Shuaicheng},
  title     = {Supervised Homography Learning with Realistic Dataset Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9806--9815}
}
E2E-LOAD: End-to-End Long-form Online Action Detection: Shuqiang Cao,

Weixin Luo,

Bairui Wang,

Wei Zhang,

Lin Ma; [pdf] [supp]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Shuqiang and Luo, Weixin and Wang, Bairui and Zhang, Wei and Ma, Lin},
  title     = {{E2E-LOAD}: End-to-End Long-form Online Action Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10422--10432}
}
TALL: Thumbnail Layout for Deepfake Video Detection: Yuting Xu,

Jian Liang,

Gengyun Jia,

Ziming Yang,

Yanhao Zhang,

Ran He; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yuting and Liang, Jian and Jia, Gengyun and Yang, Ziming and Zhang, Yanhao and He, Ran},
  title     = {{TALL}: Thumbnail Layout for Deepfake Video Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22658--22668}
}
Enhanced Soft Label for Semi-Supervised Semantic Segmentation: Jie Ma,

Chuan Wang,

Yang Liu,

Liang Lin,

Guanbin Li; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Jie and Wang, Chuan and Liu, Yang and Lin, Liang and Li, Guanbin},
  title     = {Enhanced Soft Label for Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1185--1195}
}
Self-supervised Monocular Depth Estimation: Let's Talk About The Weather: Kieran Saunders,

George Vogiatzis,

Luis J. Manso; [pdf] [supp]
[bibtex]
@InProceedings{Saunders_2023_ICCV,
  author    = {Saunders, Kieran and Vogiatzis, George and Manso, Luis J.},
  title     = {Self-supervised Monocular Depth Estimation: Let's Talk About The Weather},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8907--8917}
}
Bidirectional Alignment for Domain Adaptive Detection with Transformers: Liqiang He,

Wei Wang,

Albert Chen,

Min Sun,

Cheng-Hao Kuo,

Sinisa Todorovic; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Liqiang and Wang, Wei and Chen, Albert and Sun, Min and Kuo, Cheng-Hao and Todorovic, Sinisa},
  title     = {Bidirectional Alignment for Domain Adaptive Detection with Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18775--18785}
}
Fast Neural Scene Flow: Xueqian Li,

Jianqiao Zheng,

Francesco Ferroni,

Jhony Kaesemodel Pontes,

Simon Lucey; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xueqian and Zheng, Jianqiao and Ferroni, Francesco and Pontes, Jhony Kaesemodel and Lucey, Simon},
  title     = {Fast Neural Scene Flow},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9878--9890}
}
CAME: Contrastive Automated Model Evaluation: Ru Peng,

Qiuyang Duan,

Haobo Wang,

Jiachen Ma,

Yanbo Jiang,

Yongjun Tu,

Xiu Jiang,

Junbo Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Ru and Duan, Qiuyang and Wang, Haobo and Ma, Jiachen and Jiang, Yanbo and Tu, Yongjun and Jiang, Xiu and Zhao, Junbo},
  title     = {{CAME}: Contrastive Automated Model Evaluation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20121--20132}
}
ExposureDiffusion: Learning to Expose for Low-light Image Enhancement: Yufei Wang,

Yi Yu,

Wenhan Yang,

Lanqing Guo,

Lap-Pui Chau,

Alex C. Kot,

Bihan Wen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yufei and Yu, Yi and Yang, Wenhan and Guo, Lanqing and Chau, Lap-Pui and Kot, Alex C. and Wen, Bihan},
  title     = {{ExposureDiffusion}: Learning to Expose for Low-light Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12438--12448}
}
HM-ViT: Hetero-Modal Vehicle-to-Vehicle Cooperative Perception with Vision Transformer: Hao Xiang,

Runsheng Xu,

Jiaqi Ma; [pdf] [supp]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Hao and Xu, Runsheng and Ma, Jiaqi},
  title     = {{HM-ViT}: Hetero-Modal Vehicle-to-Vehicle Cooperative Perception with Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {284--295}
}
HyperReenact: One-Shot Reenactment via Jointly Learning to Refine and Retarget Faces: Stella Bounareli,

Christos Tzelepis,

Vasileios Argyriou,

Ioannis Patras,

Georgios Tzimiropoulos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bounareli_2023_ICCV,
  author    = {Bounareli, Stella and Tzelepis, Christos and Argyriou, Vasileios and Patras, Ioannis and Tzimiropoulos, Georgios},
  title     = {{HyperReenact}: One-Shot Reenactment via Jointly Learning to Refine and Retarget Faces},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7149--7159}
}
Order-preserving Consistency Regularization for Domain Adaptation and Generalization: Mengmeng Jing,

Xiantong Zhen,

Jingjing Li,

Cees G. M. Snoek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jing_2023_ICCV,
  author    = {Jing, Mengmeng and Zhen, Xiantong and Li, Jingjing and Snoek, Cees G. M.},
  title     = {Order-preserving Consistency Regularization for Domain Adaptation and Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18916--18927}
}
RefEgo: Referring Expression Comprehension Dataset from First-Person Perception of Ego4D: Shuhei Kurita,

Naoki Katsura,

Eri Onami; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kurita_2023_ICCV,
  author    = {Kurita, Shuhei and Katsura, Naoki and Onami, Eri},
  title     = {{RefEgo}: Referring Expression Comprehension Dataset from First-Person Perception of {Ego4D}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15214--15224}
}
Exploring Temporal Frequency Spectrum in Deep Video Deblurring: Qi Zhu,

Man Zhou,

Naishan Zheng,

Chongyi Li,

Jie Huang,

Feng Zhao; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Qi and Zhou, Man and Zheng, Naishan and Li, Chongyi and Huang, Jie and Zhao, Feng},
  title     = {Exploring Temporal Frequency Spectrum in Deep Video Deblurring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12428--12437}
}
Unified Visual Relationship Detection with Vision and Language Models: Long Zhao,

Liangzhe Yuan,

Boqing Gong,

Yin Cui,

Florian Schroff,

Ming-Hsuan Yang,

Hartwig Adam,

Ting Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Long and Yuan, Liangzhe and Gong, Boqing and Cui, Yin and Schroff, Florian and Yang, Ming-Hsuan and Adam, Hartwig and Liu, Ting},
  title     = {Unified Visual Relationship Detection with Vision and Language Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6962--6973}
}
Occ^2Net: Robust Image Matching Based on 3D Occupancy Estimation for Occluded Regions: Miao Fan,

Mingrui Chen,

Chen Hu,

Shuchang Zhou; [pdf]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Miao and Chen, Mingrui and Hu, Chen and Zhou, Shuchang},
  title     = {{Occ$^2$Net}: Robust Image Matching Based on {3D} Occupancy Estimation for Occluded Regions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9652--9662}
}
Make-An-Animation: Large-Scale Text-conditional 3D Human Motion Generation: Samaneh Azadi,

Akbar Shah,

Thomas Hayes,

Devi Parikh,

Sonal Gupta; [pdf]
[bibtex]
@InProceedings{Azadi_2023_ICCV,
  author    = {Azadi, Samaneh and Shah, Akbar and Hayes, Thomas and Parikh, Devi and Gupta, Sonal},
  title     = {{Make-An-Animation}: Large-Scale Text-conditional {3D} Human Motion Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15039--15048}
}
Rickrolling the Artist: Injecting Backdoors into Text Encoders for Text-to-Image Synthesis: Lukas Struppek,

Dominik Hintersdorf,

Kristian Kersting; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Struppek_2023_ICCV,
  author    = {Struppek, Lukas and Hintersdorf, Dominik and Kersting, Kristian},
  title     = {Rickrolling the Artist: Injecting Backdoors into Text Encoders for Text-to-Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4584--4596}
}
LD-ZNet: A Latent Diffusion Approach for Text-Based Image Segmentation: Koutilya PNVR,

Bharat Singh,

Pallabi Ghosh,

Behjat Siddiquie,

David Jacobs; [pdf] [supp]
[bibtex]
@InProceedings{PNVR_2023_ICCV,
  author    = {PNVR, Koutilya and Singh, Bharat and Ghosh, Pallabi and Siddiquie, Behjat and Jacobs, David},
  title     = {{LD-ZNet}: A Latent Diffusion Approach for Text-Based Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4157--4168}
}
Workie-Talkie: Accelerating Federated Learning by Overlapping Computing and Communications via Contrastive Regularization: Rui Chen,

Qiyu Wan,

Pavana Prakash,

Lan Zhang,

Xu Yuan,

Yanmin Gong,

Xin Fu,

Miao Pan; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Rui and Wan, Qiyu and Prakash, Pavana and Zhang, Lan and Yuan, Xu and Gong, Yanmin and Fu, Xin and Pan, Miao},
  title     = {{Workie-Talkie}: Accelerating Federated Learning by Overlapping Computing and Communications via Contrastive Regularization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16999--17009}
}
Downstream-agnostic Adversarial Examples: Ziqi Zhou,

Shengshan Hu,

Ruizhi Zhao,

Qian Wang,

Leo Yu Zhang,

Junhui Hou,

Hai Jin; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Ziqi and Hu, Shengshan and Zhao, Ruizhi and Wang, Qian and Zhang, Leo Yu and Hou, Junhui and Jin, Hai},
  title     = {Downstream-agnostic Adversarial Examples},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4345--4355}
}
Late Stopping: Avoiding Confidently Learning from Mislabeled Examples: Suqin Yuan,

Lei Feng,

Tongliang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Suqin and Feng, Lei and Liu, Tongliang},
  title     = {Late Stopping: Avoiding Confidently Learning from Mislabeled Examples},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16079--16088}
}
AerialVLN: Vision-and-Language Navigation for UAVs: Shubo Liu,

Hongsheng Zhang,

Yuankai Qi,

Peng Wang,

Yanning Zhang,

Qi Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Shubo and Zhang, Hongsheng and Qi, Yuankai and Wang, Peng and Zhang, Yanning and Wu, Qi},
  title     = {{AerialVLN}: Vision-and-Language Navigation for {UAVs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15384--15394}
}
On the Robustness of Open-World Test-Time Training: Self-Training with Dynamic Prototype Expansion: Yushu Li,

Xun Xu,

Yongyi Su,

Kui Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yushu and Xu, Xun and Su, Yongyi and Jia, Kui},
  title     = {On the Robustness of Open-World Test-Time Training: Self-Training with Dynamic Prototype Expansion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11836--11846}
}
Studying How to Efficiently and Effectively Guide Models with Explanations: Sukrut Rao,

Moritz Böhle,

Amin Parchami-Araghi,

Bernt Schiele; [pdf] [supp]
[bibtex]
@InProceedings{Rao_2023_ICCV,
  author    = {Rao, Sukrut and B{\"o}hle, Moritz and Parchami-Araghi, Amin and Schiele, Bernt},
  title     = {Studying How to Efficiently and Effectively Guide Models with Explanations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1922--1933}
}
Most Important Person-Guided Dual-Branch Cross-Patch Attention for Group Affect Recognition: Hongxia Xie,

Ming-Xian Lee,

Tzu-Jui Chen,

Hung-Jen Chen,

Hou-I Liu,

Hong-Han Shuai,

Wen-Huang Cheng; [pdf]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Hongxia and Lee, Ming-Xian and Chen, Tzu-Jui and Chen, Hung-Jen and Liu, Hou-I and Shuai, Hong-Han and Cheng, Wen-Huang},
  title     = {Most Important Person-Guided Dual-Branch Cross-Patch Attention for Group Affect Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20598--20608}
}
SkeletonMAE: Graph-based Masked Autoencoder for Skeleton Sequence Pre-training: Hong Yan,

Yang Liu,

Yushen Wei,

Zhen Li,

Guanbin Li,

Liang Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Hong and Liu, Yang and Wei, Yushen and Li, Zhen and Li, Guanbin and Lin, Liang},
  title     = {{SkeletonMAE}: Graph-based Masked Autoencoder for Skeleton Sequence Pre-training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5606--5618}
}
Achievement-Based Training Progress Balancing for Multi-Task Learning: Hayoung Yun,

Hanjoo Cho; [pdf] [supp]
[bibtex]
@InProceedings{Yun_2023_ICCV,
  author    = {Yun, Hayoung and Cho, Hanjoo},
  title     = {Achievement-Based Training Progress Balancing for Multi-Task Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16935--16944}
}
Pose-Free Neural Radiance Fields via Implicit Pose Regularization: Jiahui Zhang,

Fangneng Zhan,

Yingchen Yu,

Kunhao Liu,

Rongliang Wu,

Xiaoqin Zhang,

Ling Shao,

Shijian Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jiahui and Zhan, Fangneng and Yu, Yingchen and Liu, Kunhao and Wu, Rongliang and Zhang, Xiaoqin and Shao, Ling and Lu, Shijian},
  title     = {Pose-Free Neural Radiance Fields via Implicit Pose Regularization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3534--3543}
}
Self-supervised Learning to Bring Dual Reversed Rolling Shutter Images Alive: Wei Shang,

Dongwei Ren,

Chaoyu Feng,

Xiaotao Wang,

Lei Lei,

Wangmeng Zuo; [pdf] [arXiv]
[bibtex]
@InProceedings{Shang_2023_ICCV,
  author    = {Shang, Wei and Ren, Dongwei and Feng, Chaoyu and Wang, Xiaotao and Lei, Lei and Zuo, Wangmeng},
  title     = {Self-supervised Learning to Bring Dual Reversed Rolling Shutter Images Alive},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13086--13094}
}
Logic-induced Diagnostic Reasoning for Semi-supervised Semantic Segmentation: Chen Liang,

Wenguan Wang,

Jiaxu Miao,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Chen and Wang, Wenguan and Miao, Jiaxu and Yang, Yi},
  title     = {Logic-induced Diagnostic Reasoning for Semi-supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16197--16208}
}
Self-Supervised Monocular Depth Estimation by Direction-aware Cumulative Convolution Network: Wencheng Han,

Junbo Yin,

Jianbing Shen; [pdf] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Wencheng and Yin, Junbo and Shen, Jianbing},
  title     = {Self-Supervised Monocular Depth Estimation by Direction-aware Cumulative Convolution Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8613--8623}
}
Encyclopedic VQA: Visual Questions About Detailed Properties of Fine-Grained Categories: Thomas Mensink,

Jasper Uijlings,

Lluis Castrejon,

Arushi Goel,

Felipe Cadar,

Howard Zhou,

Fei Sha,

André Araujo,

Vittorio Ferrari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mensink_2023_ICCV,
  author    = {Mensink, Thomas and Uijlings, Jasper and Castrejon, Lluis and Goel, Arushi and Cadar, Felipe and Zhou, Howard and Sha, Fei and Araujo, Andr{\'e} and Ferrari, Vittorio},
  title     = {Encyclopedic {VQA}: Visual Questions About Detailed Properties of Fine-Grained Categories},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3113--3124}
}
Towards Understanding the Generalization of Deepfake Detectors from a Game-Theoretical View: Kelu Yao,

Jin Wang,

Boyu Diao,

Chao Li; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Kelu and Wang, Jin and Diao, Boyu and Li, Chao},
  title     = {Towards Understanding the Generalization of Deepfake Detectors from a Game-Theoretical View},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2031--2041}
}
Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics: Juntae Lee,

Mihir Jain,

Sungrack Yun; [pdf]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Juntae and Jain, Mihir and Yun, Sungrack},
  title     = {Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10214--10223}
}
Physically-Plausible Illumination Distribution Estimation: Egor Ershov,

Vasily Tesalin,

Ivan Ermakov,

Michael S. Brown; [pdf]
[bibtex]
@InProceedings{Ershov_2023_ICCV,
  author    = {Ershov, Egor and Tesalin, Vasily and Ermakov, Ivan and Brown, Michael S.},
  title     = {Physically-Plausible Illumination Distribution Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12928--12936}
}
3DPPE: 3D Point Positional Encoding for Transformer-based Multi-Camera 3D Object Detection: Changyong Shu,

Jiajun Deng,

Fisher Yu,

Yifan Liu; [pdf] [supp]
[bibtex]
@InProceedings{Shu_2023_ICCV,
  author    = {Shu, Changyong and Deng, Jiajun and Yu, Fisher and Liu, Yifan},
  title     = {{3DPPE}: {3D} Point Positional Encoding for Transformer-based Multi-Camera {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3580--3589}
}
Revisiting Foreground and Background Separation in Weakly-supervised Temporal Action Localization: A Clustering-based Approach: Qinying Liu,

Zilei Wang,

Shenghai Rong,

Junjie Li,

Yixin Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Qinying and Wang, Zilei and Rong, Shenghai and Li, Junjie and Zhang, Yixin},
  title     = {Revisiting Foreground and Background Separation in Weakly-supervised Temporal Action Localization: A Clustering-based Approach},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10433--10443}
}
VertexSerum: Poisoning Graph Neural Networks for Link Inference: Ruyi Ding,

Shijin Duan,

Xiaolin Xu,

Yunsi Fei; [pdf] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Ruyi and Duan, Shijin and Xu, Xiaolin and Fei, Yunsi},
  title     = {{VertexSerum}: Poisoning Graph Neural Networks for Link Inference},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4532--4541}
}
NeRF-Det: Learning Geometry-Aware Volumetric Representation for Multi-View 3D Object Detection: Chenfeng Xu,

Bichen Wu,

Ji Hou,

Sam Tsai,

Ruilong Li,

Jialiang Wang,

Wei Zhan,

Zijian He,

Peter Vajda,

Kurt Keutzer,

Masayoshi Tomizuka; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Chenfeng and Wu, Bichen and Hou, Ji and Tsai, Sam and Li, Ruilong and Wang, Jialiang and Zhan, Wei and He, Zijian and Vajda, Peter and Keutzer, Kurt and Tomizuka, Masayoshi},
  title     = {{NeRF-Det}: Learning Geometry-Aware Volumetric Representation for Multi-View {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23320--23330}
}
Spatio-Temporal Domain Awareness for Multi-Agent Collaborative Perception: Kun Yang,

Dingkang Yang,

Jingyu Zhang,

Mingcheng Li,

Yang Liu,

Jing Liu,

Hanqi Wang,

Peng Sun,

Liang Song; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Kun and Yang, Dingkang and Zhang, Jingyu and Li, Mingcheng and Liu, Yang and Liu, Jing and Wang, Hanqi and Sun, Peng and Song, Liang},
  title     = {Spatio-Temporal Domain Awareness for Multi-Agent Collaborative Perception},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23383--23392}
}
LPFF: A Portrait Dataset for Face Generators Across Large Poses: Yiqian Wu,

Jing Zhang,

Hongbo Fu,

Xiaogang Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yiqian and Zhang, Jing and Fu, Hongbo and Jin, Xiaogang},
  title     = {{LPFF}: A Portrait Dataset for Face Generators Across Large Poses},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20327--20337}
}
Pseudo-label Alignment for Semi-supervised Instance Segmentation: Jie Hu,

Chen Chen,

Liujuan Cao,

Shengchuan Zhang,

Annan Shu,

Guannan Jiang,

Rongrong Ji; [pdf] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Jie and Chen, Chen and Cao, Liujuan and Zhang, Shengchuan and Shu, Annan and Jiang, Guannan and Ji, Rongrong},
  title     = {Pseudo-label Alignment for Semi-supervised Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16337--16347}
}
Deep Geometrized Cartoon Line Inbetweening: Li Siyao,

Tianpei Gu,

Weiye Xiao,

Henghui Ding,

Ziwei Liu,

Chen Change Loy; [pdf] [supp]
[bibtex]
@InProceedings{Siyao_2023_ICCV,
  author    = {Siyao, Li and Gu, Tianpei and Xiao, Weiye and Ding, Henghui and Liu, Ziwei and Loy, Chen Change},
  title     = {Deep Geometrized Cartoon Line Inbetweening},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7291--7300}
}
MixBag: Bag-Level Data Augmentation for Learning from Label Proportions: Takanori Asanomi,

Shinnosuke Matsuo,

Daiki Suehiro,

Ryoma Bise; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Asanomi_2023_ICCV,
  author    = {Asanomi, Takanori and Matsuo, Shinnosuke and Suehiro, Daiki and Bise, Ryoma},
  title     = {{MixBag}: Bag-Level Data Augmentation for Learning from Label Proportions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16570--16579}
}
Effective Real Image Editing with Accelerated Iterative Diffusion Inversion: Zhihong Pan,

Riccardo Gherardi,

Xiufeng Xie,

Stephen Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Zhihong and Gherardi, Riccardo and Xie, Xiufeng and Huang, Stephen},
  title     = {Effective Real Image Editing with Accelerated Iterative Diffusion Inversion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15912--15921}
}
3D-Aware Neural Body Fitting for Occlusion Robust 3D Human Pose Estimation: Yi Zhang,

Pengliang Ji,

Angtian Wang,

Jieru Mei,

Adam Kortylewski,

Alan Yuille; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Yi and Ji, Pengliang and Wang, Angtian and Mei, Jieru and Kortylewski, Adam and Yuille, Alan},
    title     = {{3D}-Aware Neural Body Fitting for Occlusion Robust {3D} Human Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9399--9410}
}
Chinese Text Recognition with A Pre-Trained CLIP-Like Model Through Image-IDS Aligning: Haiyang Yu,

Xiaocong Wang,

Bin Li,

Xiangyang Xue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
    author    = {Yu, Haiyang and Wang, Xiaocong and Li, Bin and Xue, Xiangyang},
    title     = {{Chinese} Text Recognition with A Pre-Trained {CLIP}-Like Model Through Image-{IDS} Aligning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11943--11952}
}
MatrixCity: A Large-scale City Dataset for City-scale Neural Rendering and Beyond: Yixuan Li,

Lihan Jiang,

Linning Xu,

Yuanbo Xiangli,

Zhenzhi Wang,

Dahua Lin,

Bo Dai; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Yixuan and Jiang, Lihan and Xu, Linning and Xiangli, Yuanbo and Wang, Zhenzhi and Lin, Dahua and Dai, Bo},
    title     = {{MatrixCity}: A Large-scale City Dataset for City-scale Neural Rendering and Beyond},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3205--3215}
}
LinkGAN: Linking GAN Latents to Pixels for Controllable Image Synthesis: Jiapeng Zhu,

Ceyuan Yang,

Yujun Shen,

Zifan Shi,

Bo Dai,

Deli Zhao,

Qifeng Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
    author    = {Zhu, Jiapeng and Yang, Ceyuan and Shen, Yujun and Shi, Zifan and Dai, Bo and Zhao, Deli and Chen, Qifeng},
    title     = {{LinkGAN}: Linking {GAN} Latents to Pixels for Controllable Image Synthesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7656--7666}
}
Exploiting Proximity-Aware Tasks for Embodied Social Navigation: Enrico Cancelli,

Tommaso Campari,

Luciano Serafini,

Angel X. Chang,

Lamberto Ballan; [pdf] [arXiv]
[bibtex]
@InProceedings{Cancelli_2023_ICCV,
    author    = {Cancelli, Enrico and Campari, Tommaso and Serafini, Luciano and Chang, Angel X. and Ballan, Lamberto},
    title     = {Exploiting Proximity-Aware Tasks for Embodied Social Navigation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10957--10967}
}
SVDiff: Compact Parameter Space for Diffusion Fine-Tuning: Ligong Han,

Yinxiao Li,

Han Zhang,

Peyman Milanfar,

Dimitris Metaxas,

Feng Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
    author    = {Han, Ligong and Li, Yinxiao and Zhang, Han and Milanfar, Peyman and Metaxas, Dimitris and Yang, Feng},
    title     = {{SVDiff}: Compact Parameter Space for Diffusion Fine-Tuning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7323--7334}
}
UniFace: Unified Cross-Entropy Loss for Deep Face Recognition: Jiancan Zhou,

Xi Jia,

Qiufu Li,

Linlin Shen,

Jinming Duan; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Jiancan and Jia, Xi and Li, Qiufu and Shen, Linlin and Duan, Jinming},
    title     = {{UniFace}: Unified Cross-Entropy Loss for Deep Face Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20730--20739}
}
Jumping through Local Minima: Quantization in the Loss Landscape of Vision Transformers: Natalia Frumkin,

Dibakar Gope,

Diana Marculescu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Frumkin_2023_ICCV,
    author    = {Frumkin, Natalia and Gope, Dibakar and Marculescu, Diana},
    title     = {Jumping through Local Minima: Quantization in the Loss Landscape of Vision Transformers},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16978--16988}
}
Hierarchical Contrastive Learning for Pattern-Generalizable Image Corruption Detection: Xin Feng,

Yifeng Xu,

Guangming Lu,

Wenjie Pei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Xin and Xu, Yifeng and Lu, Guangming and Pei, Wenjie},
    title     = {Hierarchical Contrastive Learning for Pattern-Generalizable Image Corruption Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12076--12085}
}
Learning Optical Flow from Event Camera with Rendered Dataset: Xinglong Luo,

Kunming Luo,

Ao Luo,

Zhengning Wang,

Ping Tan,

Shuaicheng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
    author    = {Luo, Xinglong and Luo, Kunming and Luo, Ao and Wang, Zhengning and Tan, Ping and Liu, Shuaicheng},
    title     = {Learning Optical Flow from Event Camera with Rendered Dataset},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9847--9857}
}
EPiC: Ensemble of Partial Point Clouds for Robust Classification: Meir Yossef Levi,

Guy Gilboa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Levi_2023_ICCV,
    author    = {Levi, Meir Yossef and Gilboa, Guy},
    title     = {{EPiC}: Ensemble of Partial Point Clouds for Robust Classification},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14475--14484}
}
Distilling Large Vision-Language Model with Out-of-Distribution Generalizability: Xuanlin Li,

Yunhao Fang,

Minghua Liu,

Zhan Ling,

Zhuowen Tu,

Hao Su; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Xuanlin and Fang, Yunhao and Liu, Minghua and Ling, Zhan and Tu, Zhuowen and Su, Hao},
    title     = {Distilling Large Vision-Language Model with Out-of-Distribution Generalizability},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2492--2503}
}
Cross-Modal Learning with 3D Deformable Attention for Action Recognition: Sangwon Kim,

Dasom Ahn,

Byoung Chul Ko; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
    author    = {Kim, Sangwon and Ahn, Dasom and Ko, Byoung Chul},
    title     = {Cross-Modal Learning with {3D} Deformable Attention for Action Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10265--10275}
}
What do neural networks learn in image classification? A frequency shortcut perspective: Shunxin Wang,

Raymond Veldhuis,

Christoph Brune,

Nicola Strisciuglio; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Shunxin and Veldhuis, Raymond and Brune, Christoph and Strisciuglio, Nicola},
    title     = {What do neural networks learn in image classification? A frequency shortcut perspective},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1433--1442}
}
Tracking by 3D Model Estimation of Unknown Objects in Videos: Denys Rozumnyi,

Jiří Matas,

Marc Pollefeys,

Vittorio Ferrari,

Martin R. Oswald; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rozumnyi_2023_ICCV,
    author    = {Rozumnyi, Denys and Matas, Ji{\v{r}}{\'\i} and Pollefeys, Marc and Ferrari, Vittorio and Oswald, Martin R.},
    title     = {Tracking by {3D} Model Estimation of Unknown Objects in Videos},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14086--14096}
}
ScatterNeRF: Seeing Through Fog with Physically-Based Inverse Neural Rendering: Andrea Ramazzina,

Mario Bijelic,

Stefanie Walz,

Alessandro Sanvito,

Dominik Scheuble,

Felix Heide; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ramazzina_2023_ICCV,
    author    = {Ramazzina, Andrea and Bijelic, Mario and Walz, Stefanie and Sanvito, Alessandro and Scheuble, Dominik and Heide, Felix},
    title     = {{ScatterNeRF}: Seeing Through Fog with Physically-Based Inverse Neural Rendering},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17957--17968}
}
Sigmoid Loss for Language Image Pre-Training: Xiaohua Zhai,

Basil Mustafa,

Alexander Kolesnikov,

Lucas Beyer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV,
    author    = {Zhai, Xiaohua and Mustafa, Basil and Kolesnikov, Alexander and Beyer, Lucas},
    title     = {Sigmoid Loss for Language Image Pre-Training},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11975--11986}
}
PromptCap: Prompt-Guided Image Captioning for VQA with GPT-3: Yushi Hu,

Hang Hua,

Zhengyuan Yang,

Weijia Shi,

Noah A. Smith,

Jiebo Luo; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_ICCV,
    author    = {Hu, Yushi and Hua, Hang and Yang, Zhengyuan and Shi, Weijia and Smith, Noah A. and Luo, Jiebo},
    title     = {{PromptCap}: Prompt-Guided Image Captioning for {VQA} with {GPT-3}},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2963--2975}
}
Neural Video Depth Stabilizer: Yiran Wang,

Min Shi,

Jiaqi Li,

Zihao Huang,

Zhiguo Cao,

Jianming Zhang,

Ke Xian,

Guosheng Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Yiran and Shi, Min and Li, Jiaqi and Huang, Zihao and Cao, Zhiguo and Zhang, Jianming and Xian, Ke and Lin, Guosheng},
    title     = {Neural Video Depth Stabilizer},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9466--9476}
}
Learning Symmetry-Aware Geometry Correspondences for 6D Object Pose Estimation: Heng Zhao,

Shenxing Wei,

Dahu Shi,

Wenming Tan,

Zheyang Li,

Ye Ren,

Xing Wei,

Yi Yang,

Shiliang Pu; [pdf]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Heng and Wei, Shenxing and Shi, Dahu and Tan, Wenming and Li, Zheyang and Ren, Ye and Wei, Xing and Yang, Yi and Pu, Shiliang},
    title     = {Learning Symmetry-Aware Geometry Correspondences for {6D} Object Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14045--14054}
}
TrackFlow: Multi-Object tracking with Normalizing Flows: Gianluca Mancusi,

Aniello Panariello,

Angelo Porrello,

Matteo Fabbri,

Simone Calderara,

Rita Cucchiara; [pdf] [arXiv]
[bibtex]
@InProceedings{Mancusi_2023_ICCV,
    author    = {Mancusi, Gianluca and Panariello, Aniello and Porrello, Angelo and Fabbri, Matteo and Calderara, Simone and Cucchiara, Rita},
    title     = {{TrackFlow}: Multi-Object tracking with Normalizing Flows},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9531--9543}
}
Towards Generic Image Manipulation Detection with Weakly-Supervised Self-Consistency Learning: Yuanhao Zhai,

Tianyu Luan,

David Doermann,

Junsong Yuan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV,
    author    = {Zhai, Yuanhao and Luan, Tianyu and Doermann, David and Yuan, Junsong},
    title     = {Towards Generic Image Manipulation Detection with Weakly-Supervised Self-Consistency Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22390--22400}
}
PARF: Primitive-Aware Radiance Fusion for Indoor Scene Novel View Synthesis: Haiyang Ying,

Baowei Jiang,

Jinzhi Zhang,

Di Xu,

Tao Yu,

Qionghai Dai,

Lu Fang; [pdf] [supp]
[bibtex]
@InProceedings{Ying_2023_ICCV,
    author    = {Ying, Haiyang and Jiang, Baowei and Zhang, Jinzhi and Xu, Di and Yu, Tao and Dai, Qionghai and Fang, Lu},
    title     = {{PARF}: Primitive-Aware Radiance Fusion for Indoor Scene Novel View Synthesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17706--17716}
}
DeePoint: Visual Pointing Recognition and Direction Estimation: Shu Nakamura,

Yasutomo Kawanishi,

Shohei Nobuhara,

Ko Nishino; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nakamura_2023_ICCV,
    author    = {Nakamura, Shu and Kawanishi, Yasutomo and Nobuhara, Shohei and Nishino, Ko},
    title     = {{DeePoint}: Visual Pointing Recognition and Direction Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20577--20587}
}
Periodically Exchange Teacher-Student for Source-Free Object Detection: Qipeng Liu,

Luojun Lin,

Zhifeng Shen,

Zhifeng Yang; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Qipeng and Lin, Luojun and Shen, Zhifeng and Yang, Zhifeng},
    title     = {Periodically Exchange Teacher-Student for Source-Free Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6414--6424}
}
Generating Instance-level Prompts for Rehearsal-free Continual Learning: Dahuin Jung,

Dongyoon Han,

Jihwan Bang,

Hwanjun Song; [pdf] [supp]
[bibtex]
@InProceedings{Jung_2023_ICCV,
    author    = {Jung, Dahuin and Han, Dongyoon and Bang, Jihwan and Song, Hwanjun},
    title     = {Generating Instance-level Prompts for Rehearsal-free Continual Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11847--11857}
}
Deformer: Dynamic Fusion Transformer for Robust Hand Pose Estimation: Qichen Fu,

Xingyu Liu,

Ran Xu,

Juan Carlos Niebles,

Kris M. Kitani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_ICCV,
    author    = {Fu, Qichen and Liu, Xingyu and Xu, Ran and Niebles, Juan Carlos and Kitani, Kris M.},
    title     = {Deformer: Dynamic Fusion Transformer for Robust Hand Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23600--23611}
}
HSE: Hybrid Species Embedding for Deep Metric Learning: Bailin Yang,

Haoqiang Sun,

Frederick W. B. Li,

Zheng Chen,

Jianlu Cai,

Chao Song; [pdf]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Bailin and Sun, Haoqiang and Li, Frederick W. B. and Chen, Zheng and Cai, Jianlu and Song, Chao},
    title     = {{HSE}: Hybrid Species Embedding for Deep Metric Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11047--11057}
}
Online Continual Learning on Hierarchical Label Expansion: Byung Hyun Lee,

Okchul Jung,

Jonghyun Choi,

Se Young Chun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
    author    = {Lee, Byung Hyun and Jung, Okchul and Choi, Jonghyun and Chun, Se Young},
    title     = {Online Continual Learning on Hierarchical Label Expansion},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11761--11770}
}
iDAG: Invariant DAG Searching for Domain Generalization: Zenan Huang,

Haobo Wang,

Junbo Zhao,

Nenggan Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Zenan and Wang, Haobo and Zhao, Junbo and Zheng, Nenggan},
    title     = {{iDAG}: Invariant {DAG} Searching for Domain Generalization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19169--19179}
}
Spacetime Surface Regularization for Neural Dynamic Scene Reconstruction: Jaesung Choe,

Christopher Choy,

Jaesik Park,

In So Kweon,

Anima Anandkumar; [pdf] [supp]
[bibtex]
@InProceedings{Choe_2023_ICCV,
    author    = {Choe, Jaesung and Choy, Christopher and Park, Jaesik and Kweon, In So and Anandkumar, Anima},
    title     = {Spacetime Surface Regularization for Neural Dynamic Scene Reconstruction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17871--17881}
}
GasMono: Geometry-Aided Self-Supervised Monocular Depth Estimation for Indoor Scenes: Chaoqiang Zhao,

Matteo Poggi,

Fabio Tosi,

Lei Zhou,

Qiyu Sun,

Yang Tang,

Stefano Mattoccia; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Chaoqiang and Poggi, Matteo and Tosi, Fabio and Zhou, Lei and Sun, Qiyu and Tang, Yang and Mattoccia, Stefano},
    title     = {{GasMono}: Geometry-Aided Self-Supervised Monocular Depth Estimation for Indoor Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16209--16220}
}
3D Motion Magnification: Visualizing Subtle Motions from Time-Varying Radiance Fields: Brandon Y. Feng,

Hadi Alzayer,

Michael Rubinstein,

William T. Freeman,

Jia-bin Huang; [pdf]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Brandon Y. and Alzayer, Hadi and Rubinstein, Michael and Freeman, William T. and Huang, Jia-bin},
    title     = {{3D} Motion Magnification: Visualizing Subtle Motions from Time-Varying Radiance Fields},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9837--9846}
}
Learning to Transform for Generalizable Instance-wise Invariance: Utkarsh Singhal,

Carlos Esteves,

Ameesh Makadia,

Stella X. Yu; [pdf]
[bibtex]
@InProceedings{Singhal_2023_ICCV,
    author    = {Singhal, Utkarsh and Esteves, Carlos and Makadia, Ameesh and Yu, Stella X.},
    title     = {Learning to Transform for Generalizable Instance-wise Invariance},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6211--6221}
}
Audio-Visual Deception Detection: DOLOS Dataset and Parameter-Efficient Crossmodal Learning: Xiaobao Guo,

Nithish Muthuchamy Selvaraj,

Zitong Yu,

Adams Wai-Kin Kong,

Bingquan Shen,

Alex Kot; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
    author    = {Guo, Xiaobao and Selvaraj, Nithish Muthuchamy and Yu, Zitong and Kong, Adams Wai-Kin and Shen, Bingquan and Kot, Alex},
    title     = {Audio-Visual Deception Detection: {DOLOS} Dataset and Parameter-Efficient Crossmodal Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22135--22145}
}
Multiple Instance Learning Framework with Masked Hard Instance Mining for Whole Slide Image Classification: Wenhao Tang,

Sheng Huang,

Xiaoxian Zhang,

Fengtao Zhou,

Yi Zhang,

Bo Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
    author    = {Tang, Wenhao and Huang, Sheng and Zhang, Xiaoxian and Zhou, Fengtao and Zhang, Yi and Liu, Bo},
    title     = {Multiple Instance Learning Framework with Masked Hard Instance Mining for Whole Slide Image Classification},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4078--4087}
}
Unsupervised Compositional Concepts Discovery with Text-to-Image Generative Models: Nan Liu,

Yilun Du,

Shuang Li,

Joshua B. Tenenbaum,

Antonio Torralba; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Nan and Du, Yilun and Li, Shuang and Tenenbaum, Joshua B. and Torralba, Antonio},
    title     = {Unsupervised Compositional Concepts Discovery with Text-to-Image Generative Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2085--2095}
}
Partition-And-Debias: Agnostic Biases Mitigation via a Mixture of Biases-Specific Experts: Jiaxuan Li,

Duc Minh Vo,

Hideki Nakayama; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Jiaxuan and Vo, Duc Minh and Nakayama, Hideki},
    title     = {Partition-And-Debias: Agnostic Biases Mitigation via a Mixture of Biases-Specific Experts},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4924--4934}
}
Spatial Self-Distillation for Object Detection with Inaccurate Bounding Boxes: Di Wu,

Pengfei Chen,

Xuehui Yu,

Guorong Li,

Zhenjun Han,

Jianbin Jiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Di and Chen, Pengfei and Yu, Xuehui and Li, Guorong and Han, Zhenjun and Jiao, Jianbin},
    title     = {Spatial Self-Distillation for Object Detection with Inaccurate Bounding Boxes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6855--6865}
}
CC3D: Layout-Conditioned Generation of Compositional 3D Scenes: Sherwin Bahmani,

Jeong Joon Park,

Despoina Paschalidou,

Xingguang Yan,

Gordon Wetzstein,

Leonidas Guibas,

Andrea Tagliasacchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bahmani_2023_ICCV,
    author    = {Bahmani, Sherwin and Park, Jeong Joon and Paschalidou, Despoina and Yan, Xingguang and Wetzstein, Gordon and Guibas, Leonidas and Tagliasacchi, Andrea},
    title     = {{CC3D}: Layout-Conditioned Generation of Compositional {3D} Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7171--7181}
}
Alleviating Catastrophic Forgetting of Incremental Object Detection via Within-Class and Between-Class Knowledge Distillation: Mengxue Kang,

Jinpeng Zhang,

Jinming Zhang,

Xiashuang Wang,

Yang Chen,

Zhe Ma,

Xuhui Huang; [pdf] [supp]
[bibtex]
@InProceedings{Kang_2023_ICCV,
    author    = {Kang, Mengxue and Zhang, Jinpeng and Zhang, Jinming and Wang, Xiashuang and Chen, Yang and Ma, Zhe and Huang, Xuhui},
    title     = {Alleviating Catastrophic Forgetting of Incremental Object Detection via Within-Class and Between-Class Knowledge Distillation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18894--18904}
}
TextPSG: Panoptic Scene Graph Generation from Textual Descriptions: Chengyang Zhao,

Yikang Shen,

Zhenfang Chen,

Mingyu Ding,

Chuang Gan; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Chengyang and Shen, Yikang and Chen, Zhenfang and Ding, Mingyu and Gan, Chuang},
    title     = {{TextPSG}: Panoptic Scene Graph Generation from Textual Descriptions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2839--2850}
}
Revisiting the Parameter Efficiency of Adapters from the Perspective of Precision Redundancy: Shibo Jie,

Haoqing Wang,

Zhi-Hong Deng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jie_2023_ICCV,
    author    = {Jie, Shibo and Wang, Haoqing and Deng, Zhi-Hong},
    title     = {Revisiting the Parameter Efficiency of Adapters from the Perspective of Precision Redundancy},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17217--17226}
}
EMQ: Evolving Training-free Proxies for Automated Mixed Precision Quantization: Peijie Dong,

Lujun Li,

Zimian Wei,

Xin Niu,

Zhiliang Tian,

Hengyue Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
    author    = {Dong, Peijie and Li, Lujun and Wei, Zimian and Niu, Xin and Tian, Zhiliang and Pan, Hengyue},
    title     = {{EMQ}: Evolving Training-free Proxies for Automated Mixed Precision Quantization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17076--17086}
}
Face Clustering via Graph Convolutional Networks with Confidence Edges: Yang Wu,

Zhiwei Ge,

Yuhao Luo,

Lin Liu,

Sulong Xu; [pdf]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Yang and Ge, Zhiwei and Luo, Yuhao and Liu, Lin and Xu, Sulong},
    title     = {Face Clustering via Graph Convolutional Networks with Confidence Edges},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20990--20999}
}
Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval: Zhongyan Zhang,

Lei Wang,

Luping Zhou,

Piotr Koniusz; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Zhongyan and Wang, Lei and Zhou, Luping and Koniusz, Piotr},
    title     = {Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11250--11259}
}
Cross-modal Latent Space Alignment for Image to Avatar Translation: Manuel Ladron de Guevara,

Jose Echevarria,

Yijun Li,

Yannick Hold-Geoffroy,

Cameron Smith,

Daichi Ito; [pdf] [supp]
[bibtex]
@InProceedings{de_Guevara_2023_ICCV,
    author    = {{Ladron de Guevara}, Manuel and Echevarria, Jose and Li, Yijun and Hold-Geoffroy, Yannick and Smith, Cameron and Ito, Daichi},
    title     = {Cross-modal Latent Space Alignment for Image to Avatar Translation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {520--529}
}
Inspecting the Geographical Representativeness of Images from Text-to-Image Models: Abhipsa Basu,

R. Venkatesh Babu,

Danish Pruthi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Basu_2023_ICCV,
    author    = {Basu, Abhipsa and Babu, R. Venkatesh and Pruthi, Danish},
    title     = {Inspecting the Geographical Representativeness of Images from Text-to-Image Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5136--5147}
}
Space-time Prompting for Video Class-incremental Learning: Yixuan Pei,

Zhiwu Qing,

Shiwei Zhang,

Xiang Wang,

Yingya Zhang,

Deli Zhao,

Xueming Qian; [pdf] [supp]
[bibtex]
@InProceedings{Pei_2023_ICCV,
    author    = {Pei, Yixuan and Qing, Zhiwu and Zhang, Shiwei and Wang, Xiang and Zhang, Yingya and Zhao, Deli and Qian, Xueming},
    title     = {Space-time Prompting for Video Class-incremental Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11932--11942}
}
Multimodal Garment Designer: Human-Centric Latent Diffusion Models for Fashion Image Editing: Alberto Baldrati,

Davide Morelli,

Giuseppe Cartella,

Marcella Cornia,

Marco Bertini,

Rita Cucchiara; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Baldrati_2023_ICCV,
    author    = {Baldrati, Alberto and Morelli, Davide and Cartella, Giuseppe and Cornia, Marcella and Bertini, Marco and Cucchiara, Rita},
    title     = {Multimodal Garment Designer: Human-Centric Latent Diffusion Models for Fashion Image Editing},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23393--23402}
}
Time-to-Contact Map by Joint Estimation of Up-to-Scale Inverse Depth and Global Motion using a Single Event Camera: Urbano Miguel Nunes,

Laurent Udo Perrinet,

Sio-Hoi Ieng; [pdf] [supp]
[bibtex]
@InProceedings{Nunes_2023_ICCV,
    author    = {Nunes, Urbano Miguel and Perrinet, Laurent Udo and Ieng, Sio-Hoi},
    title     = {Time-to-Contact Map by Joint Estimation of Up-to-Scale Inverse Depth and Global Motion using a Single Event Camera},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23653--23663}
}
Sparse Sampling Transformer with Uncertainty-Driven Ranking for Unified Removal of Raindrops and Rain Streaks: Sixiang Chen,

Tian Ye,

Jinbin Bai,

Erkang Chen,

Jun Shi,

Lei Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Sixiang and Ye, Tian and Bai, Jinbin and Chen, Erkang and Shi, Jun and Zhu, Lei},
    title     = {Sparse Sampling Transformer with Uncertainty-Driven Ranking for Unified Removal of Raindrops and Rain Streaks},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13106--13117}
}
A Benchmark for Chinese-English Scene Text Image Super-Resolution: Jianqi Ma,

Zhetong Liang,

Wangmeng Xiang,

Xi Yang,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_ICCV,
    author    = {Ma, Jianqi and Liang, Zhetong and Xiang, Wangmeng and Yang, Xi and Zhang, Lei},
    title     = {A Benchmark for {Chinese-English} Scene Text Image Super-Resolution},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19452--19461}
}
HSR-Diff: Hyperspectral Image Super-Resolution via Conditional Diffusion Models: Chanyue Wu,

Dong Wang,

Yunpeng Bai,

Hanyu Mao,

Ying Li,

Qiang Shen; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Chanyue and Wang, Dong and Bai, Yunpeng and Mao, Hanyu and Li, Ying and Shen, Qiang},
    title     = {{HSR-Diff}: Hyperspectral Image Super-Resolution via Conditional Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7083--7093}
}
Replay: Multi-modal Multi-view Acted Videos for Casual Holography: Roman Shapovalov,

Yanir Kleiman,

Ignacio Rocco,

David Novotny,

Andrea Vedaldi,

Changan Chen,

Filippos Kokkinos,

Ben Graham,

Natalia Neverova; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shapovalov_2023_ICCV,
    author    = {Shapovalov, Roman and Kleiman, Yanir and Rocco, Ignacio and Novotny, David and Vedaldi, Andrea and Chen, Changan and Kokkinos, Filippos and Graham, Ben and Neverova, Natalia},
    title     = {Replay: Multi-modal Multi-view Acted Videos for Casual Holography},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20338--20348}
}
Advancing Example Exploitation Can Alleviate Critical Challenges in Adversarial Training: Yao Ge,

Yun Li,

Keji Han,

Junyi Zhu,

Xianzhong Long; [pdf] [supp]
[bibtex]
@InProceedings{Ge_2023_ICCV,
    author    = {Ge, Yao and Li, Yun and Han, Keji and Zhu, Junyi and Long, Xianzhong},
    title     = {Advancing Example Exploitation Can Alleviate Critical Challenges in Adversarial Training},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {145--154}
}
Affine-Consistent Transformer for Multi-Class Cell Nuclei Detection: Junjia Huang,

Haofeng Li,

Xiang Wan,

Guanbin Li; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Junjia and Li, Haofeng and Wan, Xiang and Li, Guanbin},
    title     = {Affine-Consistent Transformer for Multi-Class Cell Nuclei Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21384--21393}
}
Removing Anomalies as Noises for Industrial Defect Localization: Fanbin Lu,

Xufeng Yao,

Chi-Wing Fu,

Jiaya Jia; [pdf]
[bibtex]
@InProceedings{Lu_2023_ICCV,
    author    = {Lu, Fanbin and Yao, Xufeng and Fu, Chi-Wing and Jia, Jiaya},
    title     = {Removing Anomalies as Noises for Industrial Defect Localization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16166--16175}
}
GPGait: Generalized Pose-based Gait Recognition: Yang Fu,

Shibei Meng,

Saihui Hou,

Xuecai Hu,

Yongzhen Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_ICCV,
    author    = {Fu, Yang and Meng, Shibei and Hou, Saihui and Hu, Xuecai and Huang, Yongzhen},
    title     = {{GPGait}: Generalized Pose-based Gait Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19595--19604}
}
Stable and Causal Inference for Discriminative Self-supervised Deep Visual Representations: Yuewei Yang,

Hai Li,

Yiran Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Yuewei and Li, Hai and Chen, Yiran},
    title     = {Stable and Causal Inference for Discriminative Self-supervised Deep Visual Representations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16109--16120}
}
ShiftNAS: Improving One-shot NAS via Probability Shift: Mingyang Zhang,

Xinyi Yu,

Haodong Zhao,

Linlin Ou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Mingyang and Yu, Xinyi and Zhao, Haodong and Ou, Linlin},
    title     = {{ShiftNAS}: Improving One-shot {NAS} via Probability Shift},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5919--5928}
}
Semantic Attention Flow Fields for Monocular Dynamic Scene Decomposition: Yiqing Liang,

Eliot Laidlaw,

Alexander Meyerowitz,

Srinath Sridhar,

James Tompkin; [pdf] [supp]
[bibtex]
@InProceedings{Liang_2023_ICCV,
    author    = {Liang, Yiqing and Laidlaw, Eliot and Meyerowitz, Alexander and Sridhar, Srinath and Tompkin, James},
    title     = {Semantic Attention Flow Fields for Monocular Dynamic Scene Decomposition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21797--21806}
}
LexLIP: Lexicon-Bottlenecked Language-Image Pre-Training for Large-Scale Image-Text Sparse Retrieval: Ziyang Luo,

Pu Zhao,

Can Xu,

Xiubo Geng,

Tao Shen,

Chongyang Tao,

Jing Ma,

Qingwei Lin,

Daxin Jiang; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV,
    author    = {Luo, Ziyang and Zhao, Pu and Xu, Can and Geng, Xiubo and Shen, Tao and Tao, Chongyang and Ma, Jing and Lin, Qingwei and Jiang, Daxin},
    title     = {{LexLIP}: Lexicon-Bottlenecked Language-Image Pre-Training for Large-Scale Image-Text Sparse Retrieval},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11206--11217}
}
A Fast Unified System for 3D Object Detection and Tracking: Thomas Heitzinger,

Martin Kampel; [pdf] [supp]
[bibtex]
@InProceedings{Heitzinger_2023_ICCV,
    author    = {Heitzinger, Thomas and Kampel, Martin},
    title     = {A Fast Unified System for {3D} Object Detection and Tracking},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17044--17054}
}
Adaptive Testing of Computer Vision Models: Irena Gao,

Gabriel Ilharco,

Scott Lundberg,

Marco Tulio Ribeiro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
    author    = {Gao, Irena and Ilharco, Gabriel and Lundberg, Scott and Ribeiro, Marco Tulio},
    title     = {Adaptive Testing of Computer Vision Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4003--4014}
}
LFS-GAN: Lifelong Few-Shot Image Generation: Juwon Seo,

Ji-Su Kang,

Gyeong-Moon Park; [pdf] [supp]
[bibtex]
@InProceedings{Seo_2023_ICCV,
    author    = {Seo, Juwon and Kang, Ji-Su and Park, Gyeong-Moon},
    title     = {{LFS-GAN}: Lifelong Few-Shot Image Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11356--11366}
}
AIDE: A Vision-Driven Multi-View, Multi-Modal, Multi-Tasking Dataset for Assistive Driving Perception: Dingkang Yang,

Shuai Huang,

Zhi Xu,

Zhenpeng Li,

Shunli Wang,

Mingcheng Li,

Yuzheng Wang,

Yang Liu,

Kun Yang,

Zhaoyu Chen,

Yan Wang,

Jing Liu,

Peixuan Zhang,

Peng Zhai,

Lihua Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Dingkang and Huang, Shuai and Xu, Zhi and Li, Zhenpeng and Wang, Shunli and Li, Mingcheng and Wang, Yuzheng and Liu, Yang and Yang, Kun and Chen, Zhaoyu and Wang, Yan and Liu, Jing and Zhang, Peixuan and Zhai, Peng and Zhang, Lihua},
    title     = {{AIDE}: A Vision-Driven Multi-View, Multi-Modal, Multi-Tasking Dataset for Assistive Driving Perception},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20459--20470}
}
Feature Proliferation -- the "Cancer" in StyleGAN and its Treatments: Shuang Song,

Yuanbang Liang,

Jing Wu,

Yu-Kun Lai,

Yipeng Qin; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
    author    = {Song, Shuang and Liang, Yuanbang and Wu, Jing and Lai, Yu-Kun and Qin, Yipeng},
    title     = {Feature Proliferation -- the {``Cancer''} in {StyleGAN} and its Treatments},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2360--2370}
}
Self-Supervised Character-to-Character Distillation for Text Recognition: Tongkun Guan,

Wei Shen,

Xue Yang,

Qi Feng,

Zekun Jiang,

Xiaokang Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Guan_2023_ICCV,
    author    = {Guan, Tongkun and Shen, Wei and Yang, Xue and Feng, Qi and Jiang, Zekun and Yang, Xiaokang},
    title     = {Self-Supervised Character-to-Character Distillation for Text Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19473--19484}
}
MixCycle: Mixup Assisted Semi-Supervised 3D Single Object Tracking with Cycle Consistency: Qiao Wu,

Jiaqi Yang,

Kun Sun,

Chu'ai Zhang,

Yanning Zhang,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Qiao and Yang, Jiaqi and Sun, Kun and Zhang, Chu'ai and Zhang, Yanning and Salzmann, Mathieu},
    title     = {{MixCycle}: Mixup Assisted Semi-Supervised {3D} Single Object Tracking with Cycle Consistency},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13956--13966}
}
Multi-Label Self-Supervised Learning with Scene Images: Ke Zhu,

Minghao Fu,

Jianxin Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
    author    = {Zhu, Ke and Fu, Minghao and Wu, Jianxin},
    title     = {Multi-Label Self-Supervised Learning with Scene Images},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6694--6703}
}
Domain Adaptive Few-Shot Open-Set Learning: Debabrata Pal,

Deeptej More,

Sai Bhargav,

Dipesh Tamboli,

Vaneet Aggarwal,

Biplab Banerjee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pal_2023_ICCV,
    author    = {Pal, Debabrata and More, Deeptej and Bhargav, Sai and Tamboli, Dipesh and Aggarwal, Vaneet and Banerjee, Biplab},
    title     = {Domain Adaptive Few-Shot Open-Set Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18831--18840}
}
DiffFacto: Controllable Part-Based 3D Point Cloud Generation with Cross Diffusion: George Kiyohiro Nakayama,

Mikaela Angelina Uy,

Jiahui Huang,

Shi-Min Hu,

Ke Li,

Leonidas Guibas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nakayama_2023_ICCV,
    author    = {Nakayama, George Kiyohiro and Uy, Mikaela Angelina and Huang, Jiahui and Hu, Shi-Min and Li, Ke and Guibas, Leonidas},
    title     = {{DiffFacto}: Controllable Part-Based {3D} Point Cloud Generation with Cross Diffusion},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14257--14267}
}
Interactive Class-Agnostic Object Counting: Yifeng Huang,

Viresh Ranjan,

Minh Hoai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Yifeng and Ranjan, Viresh and Hoai, Minh},
    title     = {Interactive Class-Agnostic Object Counting},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22312--22322}
}
Spatio-temporal Prompting Network for Robust Video Feature Extraction: Guanxiong Sun,

Chi Wang,

Zhaoyu Zhang,

Jiankang Deng,

Stefanos Zafeiriou,

Yang Hua; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
    author    = {Sun, Guanxiong and Wang, Chi and Zhang, Zhaoyu and Deng, Jiankang and Zafeiriou, Stefanos and Hua, Yang},
    title     = {Spatio-temporal Prompting Network for Robust Video Feature Extraction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13587--13597}
}
Enhancing Fine-Tuning Based Backdoor Defense with Sharpness-Aware Minimization: Mingli Zhu,

Shaokui Wei,

Li Shen,

Yanbo Fan,

Baoyuan Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
    author    = {Zhu, Mingli and Wei, Shaokui and Shen, Li and Fan, Yanbo and Wu, Baoyuan},
    title     = {Enhancing Fine-Tuning Based Backdoor Defense with Sharpness-Aware Minimization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4466--4477}
}
Deep Geometry-Aware Camera Self-Calibration from Video: Annika Hagemann,

Moritz Knorr,

Christoph Stiller; [pdf] [supp]
[bibtex]
@InProceedings{Hagemann_2023_ICCV,
    author    = {Hagemann, Annika and Knorr, Moritz and Stiller, Christoph},
    title     = {Deep Geometry-Aware Camera Self-Calibration from Video},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3438--3448}
}
A Simple Vision Transformer for Weakly Semi-supervised 3D Object Detection: Dingyuan Zhang,

Dingkang Liang,

Zhikang Zou,

Jingyu Li,

Xiaoqing Ye,

Zhe Liu,

Xiao Tan,

Xiang Bai; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Dingyuan and Liang, Dingkang and Zou, Zhikang and Li, Jingyu and Ye, Xiaoqing and Liu, Zhe and Tan, Xiao and Bai, Xiang},
    title     = {A Simple Vision Transformer for Weakly Semi-supervised {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8373--8383}
}
Estimator Meets Equilibrium Perspective: A Rectified Straight Through Estimator for Binary Neural Networks Training: Xiao-Ming Wu,

Dian Zheng,

Zuhao Liu,

Wei-Shi Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Xiao-Ming and Zheng, Dian and Liu, Zuhao and Zheng, Wei-Shi},
    title     = {Estimator Meets Equilibrium Perspective: A Rectified Straight Through Estimator for Binary Neural Networks Training},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17055--17064}
}
Exploring Object-Centric Temporal Modeling for Efficient Multi-View 3D Object Detection: Shihao Wang,

Yingfei Liu,

Tiancai Wang,

Ying Li,

Xiangyu Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Shihao and Liu, Yingfei and Wang, Tiancai and Li, Ying and Zhang, Xiangyu},
    title     = {Exploring Object-Centric Temporal Modeling for Efficient Multi-View {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3621--3631}
}
Open-domain Visual Entity Recognition: Towards Recognizing Millions of Wikipedia Entities: Hexiang Hu,

Yi Luan,

Yang Chen,

Urvashi Khandelwal,

Mandar Joshi,

Kenton Lee,

Kristina Toutanova,

Ming-Wei Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
    author    = {Hu, Hexiang and Luan, Yi and Chen, Yang and Khandelwal, Urvashi and Joshi, Mandar and Lee, Kenton and Toutanova, Kristina and Chang, Ming-Wei},
    title     = {Open-domain Visual Entity Recognition: Towards Recognizing Millions of {Wikipedia} Entities},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12065--12075}
}
MedKLIP: Medical Knowledge Enhanced Language-Image Pre-Training for X-ray Diagnosis: Chaoyi Wu,

Xiaoman Zhang,

Ya Zhang,

Yanfeng Wang,

Weidi Xie; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Chaoyi and Zhang, Xiaoman and Zhang, Ya and Wang, Yanfeng and Xie, Weidi},
    title     = {{MedKLIP}: Medical Knowledge Enhanced Language-Image Pre-Training for {X-ray} Diagnosis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21372--21383}
}
Automated Knowledge Distillation via Monte Carlo Tree Search: Lujun Li,

Peijie Dong,

Zimian Wei,

Ya Yang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Lujun and Dong, Peijie and Wei, Zimian and Yang, Ya},
    title     = {Automated Knowledge Distillation via {Monte Carlo} Tree Search},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17413--17424}
}
EmoTalk: Speech-Driven Emotional Disentanglement for 3D Face Animation: Ziqiao Peng,

Haoyu Wu,

Zhenbo Song,

Hao Xu,

Xiangyu Zhu,

Jun He,

Hongyan Liu,

Zhaoxin Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
    author    = {Peng, Ziqiao and Wu, Haoyu and Song, Zhenbo and Xu, Hao and Zhu, Xiangyu and He, Jun and Liu, Hongyan and Fan, Zhaoxin},
    title     = {{EmoTalk}: Speech-Driven Emotional Disentanglement for {3D} Face Animation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20687--20697}
}
A Soft Nearest-Neighbor Framework for Continual Semi-Supervised Learning: Zhiqi Kang,

Enrico Fini,

Moin Nabi,

Elisa Ricci,

Karteek Alahari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2023_ICCV,
    author    = {Kang, Zhiqi and Fini, Enrico and Nabi, Moin and Ricci, Elisa and Alahari, Karteek},
    title     = {A Soft Nearest-Neighbor Framework for Continual Semi-Supervised Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11868--11877}
}
Text-Conditioned Sampling Framework for Text-to-Image Generation with Masked Generative Models: Jaewoong Lee,

Sangwon Jang,

Jaehyeong Jo,

Jaehong Yoon,

Yunji Kim,

Jin-Hwa Kim,

Jung-Woo Ha,

Sung Ju Hwang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
    author    = {Lee, Jaewoong and Jang, Sangwon and Jo, Jaehyeong and Yoon, Jaehong and Kim, Yunji and Kim, Jin-Hwa and Ha, Jung-Woo and Hwang, Sung Ju},
    title     = {Text-Conditioned Sampling Framework for Text-to-Image Generation with Masked Generative Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23252--23262}
}
ScanNet++: A High-Fidelity Dataset of 3D Indoor Scenes: Chandan Yeshwanth,

Yueh-Cheng Liu,

Matthias Nießner,

Angela Dai; [pdf] [supp]
[bibtex]
@InProceedings{Yeshwanth_2023_ICCV,
    author    = {Yeshwanth, Chandan and Liu, Yueh-Cheng and Nie{\ss}ner, Matthias and Dai, Angela},
    title     = {{ScanNet++}: A High-Fidelity Dataset of {3D} Indoor Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12--22}
}
Minimal Solutions to Uncalibrated Two-view Geometry with Known Epipoles: Gaku Nakano; [pdf]
[bibtex]
@InProceedings{Nakano_2023_ICCV,
    author    = {Nakano, Gaku},
    title     = {Minimal Solutions to Uncalibrated Two-view Geometry with Known Epipoles},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13361--13370}
}
Improving Diversity in Zero-Shot GAN Adaptation with Semantic Variations: Seogkyu Jeon,

Bei Liu,

Pilhyeon Lee,

Kibeom Hong,

Jianlong Fu,

Hyeran Byun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jeon_2023_ICCV,
    author    = {Jeon, Seogkyu and Liu, Bei and Lee, Pilhyeon and Hong, Kibeom and Fu, Jianlong and Byun, Hyeran},
    title     = {Improving Diversity in Zero-Shot {GAN} Adaptation with Semantic Variations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7258--7267}
}
Context-Aware Planning and Environment-Aware Memory for Instruction Following Embodied Agents: Byeonghwi Kim,

Jinyeon Kim,

Yuyeong Kim,

Cheolhong Min,

Jonghyun Choi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
    author    = {Kim, Byeonghwi and Kim, Jinyeon and Kim, Yuyeong and Min, Cheolhong and Choi, Jonghyun},
    title     = {Context-Aware Planning and Environment-Aware Memory for Instruction Following Embodied Agents},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10936--10946}
}
Vox-E: Text-Guided Voxel Editing of 3D Objects: Etai Sella,

Gal Fiebelman,

Peter Hedman,

Hadar Averbuch-Elor; [pdf] [supp]
[bibtex]
@InProceedings{Sella_2023_ICCV,
    author    = {Sella, Etai and Fiebelman, Gal and Hedman, Peter and Averbuch-Elor, Hadar},
    title     = {{Vox-E}: Text-Guided Voxel Editing of {3D} Objects},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {430--440}
}
Inverse Problem Regularization with Hierarchical Variational Autoencoders: Jean Prost,

Antoine Houdard,

Andrés Almansa,

Nicolas Papadakis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Prost_2023_ICCV,
    author    = {Prost, Jean and Houdard, Antoine and Almansa, Andr{\'e}s and Papadakis, Nicolas},
    title     = {Inverse Problem Regularization with Hierarchical Variational Autoencoders},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22894--22905}
}
Unpaired Multi-domain Attribute Translation of 3D Facial Shapes with a Square and Symmetric Geometric Map: Zhenfeng Fan,

Zhiheng Zhang,

Shuang Yang,

Chongyang Zhong,

Min Cao,

Shihong Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
    author    = {Fan, Zhenfeng and Zhang, Zhiheng and Yang, Shuang and Zhong, Chongyang and Cao, Min and Xia, Shihong},
    title     = {Unpaired Multi-domain Attribute Translation of {3D} Facial Shapes with a Square and Symmetric Geometric Map},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20828--20838}
}
Passive Ultra-Wideband Single-Photon Imaging: Mian Wei,

Sotiris Nousias,

Rahul Gulve,

David B. Lindell,

Kiriakos N. Kutulakos; [pdf] [supp]
[bibtex]
@InProceedings{Wei_2023_ICCV,
    author    = {Wei, Mian and Nousias, Sotiris and Gulve, Rahul and Lindell, David B. and Kutulakos, Kiriakos N.},
    title     = {Passive Ultra-Wideband Single-Photon Imaging},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8135--8146}
}
Template Inversion Attack against Face Recognition Systems using 3D Face Reconstruction: Hatef Otroshi Shahreza,

Sébastien Marcel; [pdf] [supp]
[bibtex]
@InProceedings{Shahreza_2023_ICCV,
    author    = {Shahreza, Hatef Otroshi and Marcel, S{\'e}bastien},
    title     = {Template Inversion Attack against Face Recognition Systems using {3D} Face Reconstruction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19662--19672}
}
ETran: Energy-Based Transferability Estimation: Mohsen Gholami,

Mohammad Akbari,

Xinglu Wang,

Behnam Kamranian,

Yong Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gholami_2023_ICCV,
    author    = {Gholami, Mohsen and Akbari, Mohammad and Wang, Xinglu and Kamranian, Behnam and Zhang, Yong},
    title     = {{ETran}: Energy-Based Transferability Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18613--18622}
}
Predict to Detect: Prediction-guided 3D Object Detection using Sequential Images: Sanmin Kim,

Youngseok Kim,

In-Jae Lee,

Dongsuk Kum; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
    author    = {Kim, Sanmin and Kim, Youngseok and Lee, In-Jae and Kum, Dongsuk},
    title     = {Predict to Detect: Prediction-guided {3D} Object Detection using Sequential Images},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18057--18066}
}
Unilaterally Aggregated Contrastive Learning with Hierarchical Augmentation for Anomaly Detection: Guodong Wang,

Yunhong Wang,

Jie Qin,

Dongming Zhang,

Xiuguo Bao,

Di Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Guodong and Wang, Yunhong and Qin, Jie and Zhang, Dongming and Bao, Xiuguo and Huang, Di},
    title     = {Unilaterally Aggregated Contrastive Learning with Hierarchical Augmentation for Anomaly Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6888--6897}
}
Learning Image-Adaptive Codebooks for Class-Agnostic Image Restoration: Kechun Liu,

Yitong Jiang,

Inchang Choi,

Jinwei Gu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Kechun and Jiang, Yitong and Choi, Inchang and Gu, Jinwei},
    title     = {Learning Image-Adaptive Codebooks for Class-Agnostic Image Restoration},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5373--5383}
}
3D Segmentation of Humans in Point Clouds with Synthetic Data: Ayça Takmaz,

Jonas Schult,

Irem Kaftan,

Mertcan Akçay,

Bastian Leibe,

Robert Sumner,

Francis Engelmann,

Siyu Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Takmaz_2023_ICCV,
    author    = {Takmaz, Ay{\c{c}}a and Schult, Jonas and Kaftan, Irem and Ak{\c{c}}ay, Mertcan and Leibe, Bastian and Sumner, Robert and Engelmann, Francis and Tang, Siyu},
    title     = {{3D} Segmentation of Humans in Point Clouds with Synthetic Data},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1292--1304}
}
Mastering Spatial Graph Prediction of Road Networks: Sotiris Anagnostidis,

Aurelien Lucchi,

Thomas Hofmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sotiris_2023_ICCV,
    author    = {Anagnostidis, Sotiris and Lucchi, Aurelien and Hofmann, Thomas},
    title     = {Mastering Spatial Graph Prediction of Road Networks},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5408--5418}
}
IDiff-Face: Synthetic-based Face Recognition through Fizzy Identity-Conditioned Diffusion Model: Fadi Boutros,

Jonas Henry Grebe,

Arjan Kuijper,

Naser Damer; [pdf]
[bibtex]
@InProceedings{Boutros_2023_ICCV,
    author    = {Boutros, Fadi and Grebe, Jonas Henry and Kuijper, Arjan and Damer, Naser},
    title     = {{IDiff-Face}: Synthetic-based Face Recognition through Fizzy Identity-Conditioned Diffusion Model},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19650--19661}
}
Deep Video Demoireing via Compact Invertible Dyadic Decomposition: Yuhui Quan,

Haoran Huang,

Shengfeng He,

Ruotao Xu; [pdf] [supp]
[bibtex]
@InProceedings{Quan_2023_ICCV,
    author    = {Quan, Yuhui and Huang, Haoran and He, Shengfeng and Xu, Ruotao},
    title     = {Deep Video Demoireing via Compact Invertible Dyadic Decomposition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12677--12686}
}
Rethinking Multi-Contrast MRI Super-Resolution: Rectangle-Window Cross-Attention Transformer and Arbitrary-Scale Upsampling: Guangyuan Li,

Lei Zhao,

Jiakai Sun,

Zehua Lan,

Zhanjie Zhang,

Jiafu Chen,

Zhijie Lin,

Huaizhong Lin,

Wei Xing; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Guangyuan and Zhao, Lei and Sun, Jiakai and Lan, Zehua and Zhang, Zhanjie and Chen, Jiafu and Lin, Zhijie and Lin, Huaizhong and Xing, Wei},
    title     = {Rethinking Multi-Contrast {MRI} Super-Resolution: Rectangle-Window Cross-Attention Transformer and Arbitrary-Scale Upsampling},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21230--21240}
}
Domain Generalization via Rationale Invariance: Liang Chen,

Yong Zhang,

Yibing Song,

Anton van den Hengel,

Lingqiao Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Liang and Zhang, Yong and Song, Yibing and van den Hengel, Anton and Liu, Lingqiao},
    title     = {Domain Generalization via Rationale Invariance},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1751--1760}
}
ProbVLM: Probabilistic Adapter for Frozen Vision-Language Models: Uddeshya Upadhyay,

Shyamgopal Karthik,

Massimiliano Mancini,

Zeynep Akata; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Upadhyay_2023_ICCV,
    author    = {Upadhyay, Uddeshya and Karthik, Shyamgopal and Mancini, Massimiliano and Akata, Zeynep},
    title     = {{ProbVLM}: Probabilistic Adapter for Frozen Vision-Language Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1899--1910}
}
Towards Open-Set Test-Time Adaptation Utilizing the Wisdom of Crowds in Entropy Minimization: Jungsoo Lee,

Debasmit Das,

Jaegul Choo,

Sungha Choi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
    author    = {Lee, Jungsoo and Das, Debasmit and Choo, Jaegul and Choi, Sungha},
    title     = {Towards Open-Set Test-Time Adaptation Utilizing the Wisdom of Crowds in Entropy Minimization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16380--16389}
}
Scene Graph Contrastive Learning for Embodied Navigation: Kunal Pratap Singh,

Jordi Salvador,

Luca Weihs,

Aniruddha Kembhavi; [pdf] [supp]
[bibtex]
@InProceedings{Singh_2023_ICCV,
    author    = {Singh, Kunal Pratap and Salvador, Jordi and Weihs, Luca and Kembhavi, Aniruddha},
    title     = {Scene Graph Contrastive Learning for Embodied Navigation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10884--10894}
}
Long-Range Grouping Transformer for Multi-View 3D Reconstruction: Liying Yang,

Zhenwei Zhu,

Xuxin Lin,

Jian Nong,

Yanyan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Liying and Zhu, Zhenwei and Lin, Xuxin and Nong, Jian and Liang, Yanyan},
    title     = {Long-Range Grouping Transformer for Multi-View {3D} Reconstruction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18257--18267}
}
Latent-OFER: Detect, Mask, and Reconstruct with Latent Vectors for Occluded Facial Expression Recognition: Isack Lee,

Eungi Lee,

Seok Bong Yoo; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
    author    = {Lee, Isack and Lee, Eungi and Yoo, Seok Bong},
    title     = {{Latent-OFER}: Detect, Mask, and Reconstruct with Latent Vectors for Occluded Facial Expression Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1536--1546}
}
DenseShift: Towards Accurate and Efficient Low-Bit Power-of-Two Quantization: Xinlin Li,

Bang Liu,

Rui Heng Yang,

Vanessa Courville,

Chao Xing,

Vahid Partovi Nia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Xinlin and Liu, Bang and Yang, Rui Heng and Courville, Vanessa and Xing, Chao and Nia, Vahid Partovi},
    title     = {{DenseShift}: Towards Accurate and Efficient Low-Bit Power-of-Two Quantization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17010--17020}
}
Preparing the Future for Continual Semantic Segmentation: Zihan Lin,

Zilei Wang,

Yixin Zhang; [pdf]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Zihan and Wang, Zilei and Zhang, Yixin},
    title     = {Preparing the Future for Continual Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11910--11920}
}
Efficient Computation Sharing for Multi-Task Visual Scene Understanding: Sara Shoouri,

Mingyu Yang,

Zichen Fan,

Hun-Seok Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shoouri_2023_ICCV,
    author    = {Shoouri, Sara and Yang, Mingyu and Fan, Zichen and Kim, Hun-Seok},
    title     = {Efficient Computation Sharing for Multi-Task Visual Scene Understanding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17130--17141}
}
Self-supervised Cross-view Representation Reconstruction for Change Captioning: Yunbin Tu,

Liang Li,

Li Su,

Zheng-Jun Zha,

Chenggang Yan,

Qingming Huang; [pdf] [supp]
[bibtex]
@InProceedings{Tu_2023_ICCV,
    author    = {Tu, Yunbin and Li, Liang and Su, Li and Zha, Zheng-Jun and Yan, Chenggang and Huang, Qingming},
    title     = {Self-supervised Cross-view Representation Reconstruction for Change Captioning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2805--2815}
}
Unify, Align and Refine: Multi-Level Semantic Alignment for Radiology Report Generation: Yaowei Li,

Bang Yang,

Xuxin Cheng,

Zhihong Zhu,

Hongxiang Li,

Yuexian Zou; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Yaowei and Yang, Bang and Cheng, Xuxin and Zhu, Zhihong and Li, Hongxiang and Zou, Yuexian},
    title     = {Unify, Align and Refine: Multi-Level Semantic Alignment for Radiology Report Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2863--2874}
}
Synthesizing Diverse Human Motions in 3D Indoor Scenes: Kaifeng Zhao,

Yan Zhang,

Shaofei Wang,

Thabo Beeler,

Siyu Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Kaifeng and Zhang, Yan and Wang, Shaofei and Beeler, Thabo and Tang, Siyu},
    title     = {Synthesizing Diverse Human Motions in {3D} Indoor Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14738--14749}
}
Deep Optics for Video Snapshot Compressive Imaging: Ping Wang,

Lishun Wang,

Xin Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Ping and Wang, Lishun and Yuan, Xin},
    title     = {Deep Optics for Video Snapshot Compressive Imaging},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10646--10656}
}
DDIT: Semantic Scene Completion via Deformable Deep Implicit Templates: Haoang Li,

Jinhu Dong,

Binghui Wen,

Ming Gao,

Tianyu Huang,

Yun-Hui Liu,

Daniel Cremers; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Haoang and Dong, Jinhu and Wen, Binghui and Gao, Ming and Huang, Tianyu and Liu, Yun-Hui and Cremers, Daniel},
  title     = {{DDIT}: Semantic Scene Completion via Deformable Deep Implicit Templates},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21894--21904},
}
Joint Demosaicing and Deghosting of Time-Varying Exposures for Single-Shot HDR Imaging: Jungwoo Kim,

Min H. Kim; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Jungwoo and Kim, Min H.},
  title     = {Joint Demosaicing and Deghosting of Time-Varying Exposures for Single-Shot {HDR} Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12292--12301},
}
Scene-Aware Feature Matching: Xiaoyong Lu,

Yaping Yan,

Tong Wei,

Songlin Du; [pdf] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Xiaoyong and Yan, Yaping and Wei, Tong and Du, Songlin},
  title     = {Scene-Aware Feature Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3704--3713},
}
FDViT: Improve the Hierarchical Architecture of Vision Transformer: Yixing Xu,

Chao Li,

Dong Li,

Xiao Sheng,

Fan Jiang,

Lu Tian,

Ashish Sirasao; [pdf]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yixing and Li, Chao and Li, Dong and Sheng, Xiao and Jiang, Fan and Tian, Lu and Sirasao, Ashish},
  title     = {{FDViT}: Improve the Hierarchical Architecture of Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5950--5960},
}
Tuning Pre-trained Model via Moment Probing: Mingze Gao,

Qilong Wang,

Zhenyi Lin,

Pengfei Zhu,

Qinghua Hu,

Jingbo Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Mingze and Wang, Qilong and Lin, Zhenyi and Zhu, Pengfei and Hu, Qinghua and Zhou, Jingbo},
  title     = {Tuning Pre-trained Model via Moment Probing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11803--11813},
}
Attention Where It Matters: Rethinking Visual Document Understanding with Selective Region Concentration: Haoyu Cao,

Changcun Bao,

Chaohu Liu,

Huang Chen,

Kun Yin,

Hao Liu,

Yinsong Liu,

Deqiang Jiang,

Xing Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Haoyu and Bao, Changcun and Liu, Chaohu and Chen, Huang and Yin, Kun and Liu, Hao and Liu, Yinsong and Jiang, Deqiang and Sun, Xing},
  title     = {Attention Where It Matters: Rethinking Visual Document Understanding with Selective Region Concentration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19517--19527},
}
Task Agnostic Restoration of Natural Video Dynamics: Muhammad Kashif Ali,

Dongjin Kim,

Tae Hyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ali_2023_ICCV,
  author    = {Ali, Muhammad Kashif and Kim, Dongjin and Kim, Tae Hyun},
  title     = {Task Agnostic Restoration of Natural Video Dynamics},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13534--13544},
}
TMR: Text-to-Motion Retrieval Using Contrastive 3D Human Motion Synthesis: Mathis Petrovich,

Michael J. Black,

Gül Varol; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Petrovich_2023_ICCV,
  author    = {Petrovich, Mathis and Black, Michael J. and Varol, G{\"u}l},
  title     = {{TMR}: Text-to-Motion Retrieval Using Contrastive {3D} Human Motion Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9488--9497},
}
3D Neural Embedding Likelihood: Probabilistic Inverse Graphics for Robust 6D Pose Estimation: Guangyao Zhou,

Nishad Gothoskar,

Lirui Wang,

Joshua B. Tenenbaum,

Dan Gutfreund,

Miguel Lázaro-Gredilla,

Dileep George,

Vikash K. Mansinghka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Guangyao and Gothoskar, Nishad and Wang, Lirui and Tenenbaum, Joshua B. and Gutfreund, Dan and L{\'a}zaro-Gredilla, Miguel and George, Dileep and Mansinghka, Vikash K.},
  title     = {{3D} Neural Embedding Likelihood: Probabilistic Inverse Graphics for Robust {6D} Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21625--21636},
}
Towards Robust Model Watermark via Reducing Parametric Vulnerability: Guanhao Gan,

Yiming Li,

Dongxian Wu,

Shu-Tao Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gan_2023_ICCV,
  author    = {Gan, Guanhao and Li, Yiming and Wu, Dongxian and Xia, Shu-Tao},
  title     = {Towards Robust Model Watermark via Reducing Parametric Vulnerability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4751--4761},
}
SupFusion: Supervised LiDAR-Camera Fusion for 3D Object Detection: Yiran Qin,

Chaoqun Wang,

Zijian Kang,

Ningning Ma,

Zhen Li,

Ruimao Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qin_2023_ICCV,
  author    = {Qin, Yiran and Wang, Chaoqun and Kang, Zijian and Ma, Ningning and Li, Zhen and Zhang, Ruimao},
  title     = {{SupFusion}: Supervised {LiDAR}-Camera Fusion for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22014--22024},
}
EMMN: Emotional Motion Memory Network for Audio-driven Emotional Talking Face Generation: Shuai Tan,

Bin Ji,

Ye Pan; [pdf] [supp]
[bibtex]
@InProceedings{Tan_2023_ICCV,
  author    = {Tan, Shuai and Ji, Bin and Pan, Ye},
  title     = {{EMMN}: Emotional Motion Memory Network for Audio-driven Emotional Talking Face Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22146--22156},
}
Rethinking Vision Transformers for MobileNet Size and Speed: Yanyu Li,

Ju Hu,

Yang Wen,

Georgios Evangelidis,

Kamyar Salahi,

Yanzhi Wang,

Sergey Tulyakov,

Jian Ren; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yanyu and Hu, Ju and Wen, Yang and Evangelidis, Georgios and Salahi, Kamyar and Wang, Yanzhi and Tulyakov, Sergey and Ren, Jian},
  title     = {Rethinking Vision Transformers for {MobileNet} Size and Speed},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16889--16900},
}
Implicit Identity Representation Conditioned Memory Compensation Network for Talking Head video Generation: Fa-Ting Hong,

Dan Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Fa-Ting and Xu, Dan},
  title     = {Implicit Identity Representation Conditioned Memory Compensation Network for Talking Head video Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23062--23072},
}
SINC: Self-Supervised In-Context Learning for Vision-Language Tasks: Yi-Syuan Chen,

Yun-Zhu Song,

Cheng Yu Yeo,

Bei Liu,

Jianlong Fu,

Hong-Han Shuai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yi-Syuan and Song, Yun-Zhu and Yeo, Cheng Yu and Liu, Bei and Fu, Jianlong and Shuai, Hong-Han},
  title     = {{SINC}: Self-Supervised In-Context Learning for Vision-Language Tasks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15430--15442},
}
LEA2: A Lightweight Ensemble Adversarial Attack via Non-overlapping Vulnerable Frequency Regions: Yaguan Qian,

Shuke He,

Chenyu Zhao,

Jiaqiang Sha,

Wei Wang,

Bin Wang; [pdf] [supp]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Yaguan and He, Shuke and Zhao, Chenyu and Sha, Jiaqiang and Wang, Wei and Wang, Bin},
  title     = {{LEA2}: A Lightweight Ensemble Adversarial Attack via Non-overlapping Vulnerable Frequency Regions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4510--4521},
}
Chupa: Carving 3D Clothed Humans from Skinned Shape Priors using 2D Diffusion Probabilistic Models: Byungjun Kim,

Patrick Kwon,

Kwangho Lee,

Myunggi Lee,

Sookwan Han,

Daesik Kim,

Hanbyul Joo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Byungjun and Kwon, Patrick and Lee, Kwangho and Lee, Myunggi and Han, Sookwan and Kim, Daesik and Joo, Hanbyul},
  title     = {Chupa: Carving {3D} Clothed Humans from Skinned Shape Priors using {2D} Diffusion Probabilistic Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15965--15976},
}
Unsupervised Domain Adaptive Detection with Network Stability Analysis: Wenzhang Zhou,

Heng Fan,

Tiejian Luo,

Libo Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Wenzhang and Fan, Heng and Luo, Tiejian and Zhang, Libo},
  title     = {Unsupervised Domain Adaptive Detection with Network Stability Analysis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6986--6995},
}
Learning a Room with the Occ-SDF Hybrid: Signed Distance Function Mingled with Occupancy Aids Scene Representation: Xiaoyang Lyu,

Peng Dai,

Zizhang Li,

Dongyu Yan,

Yi Lin,

Yifan Peng,

Xiaojuan Qi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lyu_2023_ICCV,
  author    = {Lyu, Xiaoyang and Dai, Peng and Li, Zizhang and Yan, Dongyu and Lin, Yi and Peng, Yifan and Qi, Xiaojuan},
  title     = {Learning a Room with the {Occ-SDF} Hybrid: Signed Distance Function Mingled with Occupancy Aids Scene Representation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8940--8950},
}
Cloth2Body: Generating 3D Human Body Mesh from 2D Clothing: Lu Dai,

Liqian Ma,

Shenhan Qian,

Hao Liu,

Ziwei Liu,

Hui Xiong; [pdf]
[bibtex]
@InProceedings{Dai_2023_ICCV,
  author    = {Dai, Lu and Ma, Liqian and Qian, Shenhan and Liu, Hao and Liu, Ziwei and Xiong, Hui},
  title     = {{Cloth2Body}: Generating {3D} Human Body Mesh from {2D} Clothing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15007--15017},
}
Spatially and Spectrally Consistent Deep Functional Maps: Mingze Sun,

Shiwei Mao,

Puhua Jiang,

Maks Ovsjanikov,

Ruqi Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Mingze and Mao, Shiwei and Jiang, Puhua and Ovsjanikov, Maks and Huang, Ruqi},
  title     = {Spatially and Spectrally Consistent Deep Functional Maps},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14497--14507},
}
Sparse Point Guided 3D Lane Detection: Chengtang Yao,

Lidong Yu,

Yuwei Wu,

Yunde Jia; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Chengtang and Yu, Lidong and Wu, Yuwei and Jia, Yunde},
  title     = {Sparse Point Guided {3D} Lane Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8363--8372},
}
Event-based Temporally Dense Optical Flow Estimation with Sequential Learning: Wachirawit Ponghiran,

Chamika Mihiranga Liyanagedera,

Kaushik Roy; [pdf] [supp]
[bibtex]
@InProceedings{Ponghiran_2023_ICCV,
  author    = {Ponghiran, Wachirawit and Liyanagedera, Chamika Mihiranga and Roy, Kaushik},
  title     = {Event-based Temporally Dense Optical Flow Estimation with Sequential Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9827--9836},
}
Going Beyond Nouns With Vision & Language Models Using Synthetic Data: Paola Cascante-Bonilla,

Khaled Shehada,

James Seale Smith,

Sivan Doveh,

Donghyun Kim,

Rameswar Panda,

Gul Varol,

Aude Oliva,

Vicente Ordonez,

Rogerio Feris,

Leonid Karlinsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cascante-Bonilla_2023_ICCV,
  author    = {Cascante-Bonilla, Paola and Shehada, Khaled and Smith, James Seale and Doveh, Sivan and Kim, Donghyun and Panda, Rameswar and Varol, Gul and Oliva, Aude and Ordonez, Vicente and Feris, Rogerio and Karlinsky, Leonid},
  title     = {Going Beyond Nouns With Vision \& Language Models Using Synthetic Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20155--20165},
}
Continual Zero-Shot Learning through Semantically Guided Generative Random Walks: Wenxuan Zhang,

Paul Janson,

Kai Yi,

Ivan Skorokhodov,

Mohamed Elhoseiny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Wenxuan and Janson, Paul and Yi, Kai and Skorokhodov, Ivan and Elhoseiny, Mohamed},
  title     = {Continual Zero-Shot Learning through Semantically Guided Generative Random Walks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11574--11585},
}
Foreground-Background Distribution Modeling Transformer for Visual Object Tracking: Dawei Yang,

Jianfeng He,

Yinchao Ma,

Qianjin Yu,

Tianzhu Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Dawei and He, Jianfeng and Ma, Yinchao and Yu, Qianjin and Zhang, Tianzhu},
  title     = {Foreground-Background Distribution Modeling Transformer for Visual Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10117--10127},
}
MeViS: A Large-scale Benchmark for Video Segmentation with Motion Expressions: Henghui Ding,

Chang Liu,

Shuting He,

Xudong Jiang,

Chen Change Loy; [pdf] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Henghui and Liu, Chang and He, Shuting and Jiang, Xudong and Loy, Chen Change},
  title     = {{MeViS}: A Large-scale Benchmark for Video Segmentation with Motion Expressions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2694--2703},
}
OPERA: Omni-Supervised Representation Learning with Hierarchical Supervisions: Chengkun Wang,

Wenzhao Zheng,

Zheng Zhu,

Jie Zhou,

Jiwen Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Chengkun and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen},
  title     = {{OPERA}: Omni-Supervised Representation Learning with Hierarchical Supervisions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5559--5570},
}
GPFL: Simultaneously Learning Global and Personalized Feature Information for Personalized Federated Learning: Jianqing Zhang,

Yang Hua,

Hao Wang,

Tao Song,

Zhengui Xue,

Ruhui Ma,

Jian Cao,

Haibing Guan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jianqing and Hua, Yang and Wang, Hao and Song, Tao and Xue, Zhengui and Ma, Ruhui and Cao, Jian and Guan, Haibing},
  title     = {{GPFL}: Simultaneously Learning Global and Personalized Feature Information for Personalized Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5041--5051},
}
Zero-Shot Contrastive Loss for Text-Guided Diffusion Image Style Transfer: Serin Yang,

Hyunmin Hwang,

Jong Chul Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Serin and Hwang, Hyunmin and Ye, Jong Chul},
  title     = {Zero-Shot Contrastive Loss for Text-Guided Diffusion Image Style Transfer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22873--22882},
}
Efficient Region-Aware Neural Radiance Fields for High-Fidelity Talking Portrait Synthesis: Jiahe Li,

Jiawei Zhang,

Xiao Bai,

Jun Zhou,

Lin Gu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Jiahe and Zhang, Jiawei and Bai, Xiao and Zhou, Jun and Gu, Lin},
  title     = {Efficient Region-Aware Neural Radiance Fields for High-Fidelity Talking Portrait Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7568--7578},
}
End2End Multi-View Feature Matching with Differentiable Pose Optimization: Barbara Roessle,

Matthias Nießner; [pdf] [supp]
[bibtex]
@InProceedings{Roessle_2023_ICCV,
  author    = {Roessle, Barbara and Nie{\ss}ner, Matthias},
  title     = {{End2End} Multi-View Feature Matching with Differentiable Pose Optimization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {477--487},
}
Low-Light Image Enhancement with Illumination-Aware Gamma Correction and Complete Image Modelling Network: Yinglong Wang,

Zhen Liu,

Jianzhuang Liu,

Songcen Xu,

Shuaicheng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yinglong and Liu, Zhen and Liu, Jianzhuang and Xu, Songcen and Liu, Shuaicheng},
  title     = {Low-Light Image Enhancement with Illumination-Aware Gamma Correction and Complete Image Modelling Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13128--13137},
}
Both Diverse and Realism Matter: Physical Attribute and Style Alignment for Rainy Image Generation: Changfeng Yu,

Shiming Chen,

Yi Chang,

Yibing Song,

Luxin Yan; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Changfeng and Chen, Shiming and Chang, Yi and Song, Yibing and Yan, Luxin},
  title     = {Both Diverse and Realism Matter: Physical Attribute and Style Alignment for Rainy Image Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12387--12397},
}
Exploring the Benefits of Visual Prompting in Differential Privacy: Yizhe Li,

Yu-Lin Tsai,

Chia-Mu Yu,

Pin-Yu Chen,

Xuebin Ren; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yizhe and Tsai, Yu-Lin and Yu, Chia-Mu and Chen, Pin-Yu and Ren, Xuebin},
  title     = {Exploring the Benefits of Visual Prompting in Differential Privacy},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5158--5167},
}
Single Image Reflection Separation via Component Synergy: Qiming Hu,

Xiaojie Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Qiming and Guo, Xiaojie},
  title     = {Single Image Reflection Separation via Component Synergy},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13138--13147},
}
Mining bias-target Alignment from Voronoi Cells: Rémi Nahon,

Van-Tam Nguyen,

Enzo Tartaglione; [pdf] [arXiv]
[bibtex]
@InProceedings{Nahon_2023_ICCV,
  author    = {Nahon, R{\'e}mi and Nguyen, Van-Tam and Tartaglione, Enzo},
  title     = {Mining bias-target Alignment from {Voronoi} Cells},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4946--4955},
}
The Victim and The Beneficiary: Exploiting a Poisoned Model to Train a Clean Model on Poisoned Data: Zixuan Zhu,

Rui Wang,

Cong Zou,

Lihua Jing; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zixuan and Wang, Rui and Zou, Cong and Jing, Lihua},
  title     = {The Victim and The Beneficiary: Exploiting a Poisoned Model to Train a Clean Model on Poisoned Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {155--164},
}
DIFFGUARD: Semantic Mismatch-Guided Out-of-Distribution Detection Using Pre-Trained Diffusion Models: Ruiyuan Gao,

Chenchen Zhao,

Lanqing Hong,

Qiang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Ruiyuan and Zhao, Chenchen and Hong, Lanqing and Xu, Qiang},
  title     = {{DIFFGUARD}: Semantic Mismatch-Guided Out-of-Distribution Detection Using Pre-Trained Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1579--1589},
}
Identity-Seeking Self-Supervised Representation Learning for Generalizable Person Re-Identification: Zhaopeng Dou,

Zhongdao Wang,

Yali Li,

Shengjin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dou_2023_ICCV,
  author    = {Dou, Zhaopeng and Wang, Zhongdao and Li, Yali and Wang, Shengjin},
  title     = {Identity-Seeking Self-Supervised Representation Learning for Generalizable Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15847--15858},
}
3D-Aware Generative Model for Improved Side-View Image Synthesis: Kyungmin Jo,

Wonjoon Jin,

Jaegul Choo,

Hyunjoon Lee,

Sunghyun Cho; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jo_2023_ICCV,
  author    = {Jo, Kyungmin and Jin, Wonjoon and Choo, Jaegul and Lee, Hyunjoon and Cho, Sunghyun},
  title     = {{3D}-Aware Generative Model for Improved Side-View Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22862--22872},
}
Tracking Anything with Decoupled Video Segmentation: Ho Kei Cheng,

Seoung Wug Oh,

Brian Price,

Alexander Schwing,

Joon-Young Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Ho Kei and Oh, Seoung Wug and Price, Brian and Schwing, Alexander and Lee, Joon-Young},
  title     = {Tracking Anything with Decoupled Video Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1316--1326},
}
Generative Gradient Inversion via Over-Parameterized Networks in Federated Learning: Chi Zhang,

Zhang Xiaoman,

Ekanut Sotthiwat,

Yanyu Xu,

Ping Liu,

Liangli Zhen,

Yong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Chi and Xiaoman, Zhang and Sotthiwat, Ekanut and Xu, Yanyu and Liu, Ping and Zhen, Liangli and Liu, Yong},
  title     = {Generative Gradient Inversion via Over-Parameterized Networks in Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5126--5135},
}
EQ-Net: Elastic Quantization Neural Networks: Ke Xu,

Lei Han,

Ye Tian,

Shangshang Yang,

Xingyi Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Ke and Han, Lei and Tian, Ye and Yang, Shangshang and Zhang, Xingyi},
  title     = {{EQ-Net}: Elastic Quantization Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1505--1514},
}
OxfordTVG-HIC: Can Machine Make Humorous Captions from Images?: Runjia Li,

Shuyang Sun,

Mohamed Elhoseiny,

Philip Torr; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Runjia and Sun, Shuyang and Elhoseiny, Mohamed and Torr, Philip},
  title     = {{OxfordTVG-HIC}: Can Machine Make Humorous Captions from Images?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20293--20303},
}
Exploring Open-Vocabulary Semantic Segmentation from CLIP Vision Encoder Distillation Only: Jun Chen,

Deyao Zhu,

Guocheng Qian,

Bernard Ghanem,

Zhicheng Yan,

Chenchen Zhu,

Fanyi Xiao,

Sean Chang Culatana,

Mohamed Elhoseiny; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Jun and Zhu, Deyao and Qian, Guocheng and Ghanem, Bernard and Yan, Zhicheng and Zhu, Chenchen and Xiao, Fanyi and Culatana, Sean Chang and Elhoseiny, Mohamed},
  title     = {Exploring Open-Vocabulary Semantic Segmentation from {CLIP} Vision Encoder Distillation Only},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {699--710},
}
EDAPS: Enhanced Domain-Adaptive Panoptic Segmentation: Suman Saha,

Lukas Hoyer,

Anton Obukhov,

Dengxin Dai,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saha_2023_ICCV,
  author    = {Saha, Suman and Hoyer, Lukas and Obukhov, Anton and Dai, Dengxin and Van Gool, Luc},
  title     = {{EDAPS}: Enhanced Domain-Adaptive Panoptic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19234--19245},
}
Parallax-Tolerant Unsupervised Deep Image Stitching: Lang Nie,

Chunyu Lin,

Kang Liao,

Shuaicheng Liu,

Yao Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nie_2023_ICCV,
  author    = {Nie, Lang and Lin, Chunyu and Liao, Kang and Liu, Shuaicheng and Zhao, Yao},
  title     = {Parallax-Tolerant Unsupervised Deep Image Stitching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7399--7408},
}
Scratch Each Other's Back: Incomplete Multi-Modal Brain Tumor Segmentation via Category Aware Group Self-Support Learning: Yansheng Qiu,

Delin Chen,

Hongdou Yao,

Yongchao Xu,

Zheng Wang; [pdf]
[bibtex]
@InProceedings{Qiu_2023_ICCV,
  author    = {Qiu, Yansheng and Chen, Delin and Yao, Hongdou and Xu, Yongchao and Wang, Zheng},
  title     = {Scratch Each Other's Back: Incomplete Multi-Modal Brain Tumor Segmentation via Category Aware Group Self-Support Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21317--21326},
}
SFHarmony: Source Free Domain Adaptation for Distributed Neuroimaging Analysis: Nicola K Dinsdale,

Mark Jenkinson,

Ana IL Namburete; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dinsdale_2023_ICCV,
  author    = {Dinsdale, Nicola K and Jenkinson, Mark and Namburete, Ana IL},
  title     = {{SFHarmony}: Source Free Domain Adaptation for Distributed Neuroimaging Analysis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11494--11505},
}
M2T: Masking Transformers Twice for Faster Decoding: Fabian Mentzer,

Eirikur Agustson,

Michael Tschannen; [pdf] [supp]
[bibtex]
@InProceedings{Mentzer_2023_ICCV,
  author    = {Mentzer, Fabian and Agustson, Eirikur and Tschannen, Michael},
  title     = {{M2T}: Masking Transformers Twice for Faster Decoding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5340--5349},
}
CoIn: Contrastive Instance Feature Mining for Outdoor 3D Object Detection with Very Limited Annotations: Qiming Xia,

Jinhao Deng,

Chenglu Wen,

Hai Wu,

Shaoshuai Shi,

Xin Li,

Cheng Wang; [pdf] [supp]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Qiming and Deng, Jinhao and Wen, Chenglu and Wu, Hai and Shi, Shaoshuai and Li, Xin and Wang, Cheng},
  title     = {{CoIn}: Contrastive Instance Feature Mining for Outdoor {3D} Object Detection with Very Limited Annotations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6254--6263},
}
3D Human Mesh Recovery with Sequentially Global Rotation Estimation: Dongkai Wang,

Shiliang Zhang; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Dongkai and Zhang, Shiliang},
  title     = {{3D} Human Mesh Recovery with Sequentially Global Rotation Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14953--14962},
}
DREAMWALKER: Mental Planning for Continuous Vision-Language Navigation: Hanqing Wang,

Wei Liang,

Luc Van Gool,

Wenguan Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Hanqing and Liang, Wei and Van Gool, Luc and Wang, Wenguan},
  title     = {{DREAMWALKER}: Mental Planning for Continuous Vision-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10873--10883},
}
Computation and Data Efficient Backdoor Attacks: Yutong Wu,

Xingshuo Han,

Han Qiu,

Tianwei Zhang; [pdf]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yutong and Han, Xingshuo and Qiu, Han and Zhang, Tianwei},
  title     = {Computation and Data Efficient Backdoor Attacks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4805--4814},
}
Agglomerative Transformer for Human-Object Interaction Detection: Danyang Tu,

Wei Sun,

Guangtao Zhai,

Wei Shen; [pdf] [arXiv]
[bibtex]
@InProceedings{Tu_2023_ICCV,
  author    = {Tu, Danyang and Sun, Wei and Zhai, Guangtao and Shen, Wei},
  title     = {Agglomerative Transformer for Human-Object Interaction Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21614--21624},
}
Decouple Before Interact: Multi-Modal Prompt Learning for Continual Visual Question Answering: Zi Qian,

Xin Wang,

Xuguang Duan,

Pengda Qin,

Yuhong Li,

Wenwu Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Zi and Wang, Xin and Duan, Xuguang and Qin, Pengda and Li, Yuhong and Zhu, Wenwu},
  title     = {Decouple Before Interact: Multi-Modal Prompt Learning for Continual Visual Question Answering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2953--2962},
}
Rethinking Fast Fourier Convolution in Image Inpainting: Tianyi Chu,

Jiafu Chen,

Jiakai Sun,

Shuobin Lian,

Zhizhong Wang,

Zhiwen Zuo,

Lei Zhao,

Wei Xing,

Dongming Lu; [pdf] [supp]
[bibtex]
@InProceedings{Chu_2023_ICCV,
  author    = {Chu, Tianyi and Chen, Jiafu and Sun, Jiakai and Lian, Shuobin and Wang, Zhizhong and Zuo, Zhiwen and Zhao, Lei and Xing, Wei and Lu, Dongming},
  title     = {Rethinking Fast {Fourier} Convolution in Image Inpainting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23195--23205},
}
Learning Robust Representations with Information Bottleneck and Memory Network for RGB-D-based Gesture Recognition: Yunan Li,

Huizhou Chen,

Guanwen Feng,

Qiguang Miao; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yunan and Chen, Huizhou and Feng, Guanwen and Miao, Qiguang},
  title     = {Learning Robust Representations with Information Bottleneck and Memory Network for {RGB-D}-based Gesture Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20968--20978},
}
P1AC: Revisiting Absolute Pose From a Single Affine Correspondence: Jonathan Ventura,

Zuzana Kukelova,

Torsten Sattler,

Dániel Baráth; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ventura_2023_ICCV,
  author    = {Ventura, Jonathan and Kukelova, Zuzana and Sattler, Torsten and Bar{\'a}th, D{\'a}niel},
  title     = {{P1AC}: Revisiting Absolute Pose From a Single Affine Correspondence},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19751--19761}
}
LAN-HDR: Luminance-based Alignment Network for High Dynamic Range Video Reconstruction: Haesoo Chung,

Nam Ik Cho; [pdf]
[bibtex]
@InProceedings{Chung_2023_ICCV,
  author    = {Chung, Haesoo and Cho, Nam Ik},
  title     = {{LAN-HDR}: Luminance-based Alignment Network for High Dynamic Range Video Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12760--12769}
}
Dancing in the Dark: A Benchmark towards General Low-light Video Enhancement: Huiyuan Fu,

Wenkai Zheng,

Xicong Wang,

Jiaxuan Wang,

Heng Zhang,

Huadong Ma; [pdf]
[bibtex]
@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Huiyuan and Zheng, Wenkai and Wang, Xicong and Wang, Jiaxuan and Zhang, Heng and Ma, Huadong},
  title     = {Dancing in the Dark: A Benchmark towards General Low-light Video Enhancement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12877--12886}
}
RED-PSM: Regularization by Denoising of Partially Separable Models for Dynamic Imaging: Berk Iskender,

Marc L. Klasky,

Yoram Bresler; [pdf] [supp]
[bibtex]
@InProceedings{Iskender_2023_ICCV,
  author    = {Iskender, Berk and Klasky, Marc L. and Bresler, Yoram},
  title     = {{RED-PSM}: Regularization by Denoising of Partially Separable Models for Dynamic Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10595--10604}
}
Unsupervised Manifold Linearizing and Clustering: Tianjiao Ding,

Shengbang Tong,

Kwan Ho Ryan Chan,

Xili Dai,

Yi Ma,

Benjamin D. Haeffele; [pdf] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Tianjiao and Tong, Shengbang and Chan, Kwan Ho Ryan and Dai, Xili and Ma, Yi and Haeffele, Benjamin D.},
  title     = {Unsupervised Manifold Linearizing and Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5450--5461}
}
Lossy and Lossless (L2) Post-training Model Size Compression: Yumeng Shi,

Shihao Bai,

Xiuying Wei,

Ruihao Gong,

Jianlei Yang; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Yumeng and Bai, Shihao and Wei, Xiuying and Gong, Ruihao and Yang, Jianlei},
  title     = {Lossy and Lossless {(L2)} Post-training Model Size Compression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17546--17556}
}
C2ST: Cross-Modal Contextualized Sequence Transduction for Continuous Sign Language Recognition: Huaiwen Zhang,

Zihang Guo,

Yang Yang,

Xin Liu,

De Hu; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Huaiwen and Guo, Zihang and Yang, Yang and Liu, Xin and Hu, De},
  title     = {{C2ST}: Cross-Modal Contextualized Sequence Transduction for Continuous Sign Language Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21053--21062}
}
ObjectFusion: Multi-modal 3D Object Detection with Object-Centric Fusion: Qi Cai,

Yingwei Pan,

Ting Yao,

Chong-Wah Ngo,

Tao Mei; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Qi and Pan, Yingwei and Yao, Ting and Ngo, Chong-Wah and Mei, Tao},
  title     = {{ObjectFusion}: Multi-modal {3D} Object Detection with Object-Centric Fusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18067--18076}
}
D-IF: Uncertainty-aware Human Digitization via Implicit Distribution Field: Xueting Yang,

Yihao Luo,

Yuliang Xiu,

Wei Wang,

Hao Xu,

Zhaoxin Fan; [pdf]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Xueting and Luo, Yihao and Xiu, Yuliang and Wang, Wei and Xu, Hao and Fan, Zhaoxin},
  title     = {{D-IF}: Uncertainty-aware Human Digitization via Implicit Distribution Field},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9122--9132}
}
MMVP: Motion-Matrix-Based Video Prediction: Yiqi Zhong,

Luming Liang,

Ilya Zharkov,

Ulrich Neumann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Yiqi and Liang, Luming and Zharkov, Ilya and Neumann, Ulrich},
  title     = {{MMVP}: Motion-Matrix-Based Video Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4273--4283}
}
Human Preference Score: Better Aligning Text-to-Image Models with Human Preference: Xiaoshi Wu,

Keqiang Sun,

Feng Zhu,

Rui Zhao,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Xiaoshi and Sun, Keqiang and Zhu, Feng and Zhao, Rui and Li, Hongsheng},
  title     = {Human Preference Score: Better Aligning Text-to-Image Models with Human Preference},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2096--2105}
}
Guided Motion Diffusion for Controllable Human Motion Synthesis: Korrawe Karunratanakul,

Konpat Preechakul,

Supasorn Suwajanakorn,

Siyu Tang; [pdf] [supp]
[bibtex]
@InProceedings{Karunratanakul_2023_ICCV,
  author    = {Karunratanakul, Korrawe and Preechakul, Konpat and Suwajanakorn, Supasorn and Tang, Siyu},
  title     = {Guided Motion Diffusion for Controllable Human Motion Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2151--2162}
}
AffordPose: A Large-Scale Dataset of Hand-Object Interactions with Affordance-Driven Hand Pose: Juntao Jian,

Xiuping Liu,

Manyi Li,

Ruizhen Hu,

Jian Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jian_2023_ICCV,
  author    = {Jian, Juntao and Liu, Xiuping and Li, Manyi and Hu, Ruizhen and Liu, Jian},
  title     = {{AffordPose}: A Large-Scale Dataset of Hand-Object Interactions with Affordance-Driven Hand Pose},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14713--14724}
}
Locomotion-Action-Manipulation: Synthesizing Human-Scene Interactions in Complex 3D Environments: Jiye Lee,

Hanbyul Joo; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jiye and Joo, Hanbyul},
  title     = {Locomotion-Action-Manipulation: Synthesizing Human-Scene Interactions in Complex {3D} Environments},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9663--9674}
}
NDDepth: Normal-Distance Assisted Monocular Depth Estimation: Shuwei Shao,

Zhongcai Pei,

Weihai Chen,

Xingming Wu,

Zhengguo Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Shuwei and Pei, Zhongcai and Chen, Weihai and Wu, Xingming and Li, Zhengguo},
  title     = {{NDDepth}: Normal-Distance Assisted Monocular Depth Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7931--7940}
}
Sequential Texts Driven Cohesive Motions Synthesis with Natural Transitions: Shuai Li,

Sisi Zhuang,

Wenfeng Song,

Xinyu Zhang,

Hejia Chen,

Aimin Hao; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Shuai and Zhuang, Sisi and Song, Wenfeng and Zhang, Xinyu and Chen, Hejia and Hao, Aimin},
  title     = {Sequential Texts Driven Cohesive Motions Synthesis with Natural Transitions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9498--9508}
}
Efficient Converted Spiking Neural Network for 3D and 2D Classification: Yuxiang Lan,

Yachao Zhang,

Xu Ma,

Yanyun Qu,

Yun Fu; [pdf]
[bibtex]
@InProceedings{Lan_2023_ICCV,
  author    = {Lan, Yuxiang and Zhang, Yachao and Ma, Xu and Qu, Yanyun and Fu, Yun},
  title     = {Efficient Converted Spiking Neural Network for {3D} and {2D} Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9211--9220}
}
Eulerian Single-Photon Vision: Shantanu Gupta,

Mohit Gupta; [pdf] [supp]
[bibtex]
@InProceedings{Gupta_2023_ICCV,
  author    = {Gupta, Shantanu and Gupta, Mohit},
  title     = {Eulerian Single-Photon Vision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10465--10476}
}
Adaptive Calibrator Ensemble: Navigating Test Set Difficulty in Out-of-Distribution Scenarios: Yuli Zou,

Weijian Deng,

Liang Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Zou_2023_ICCV,
  author    = {Zou, Yuli and Deng, Weijian and Zheng, Liang},
  title     = {Adaptive Calibrator Ensemble: Navigating Test Set Difficulty in Out-of-Distribution Scenarios},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19333--19342}
}
Contrastive Learning Relies More on Spatial Inductive Bias Than Supervised Learning: An Empirical Study: Yuanyi Zhong,

Haoran Tang,

Jun-Kun Chen,

Yu-Xiong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Yuanyi and Tang, Haoran and Chen, Jun-Kun and Wang, Yu-Xiong},
  title     = {Contrastive Learning Relies More on Spatial Inductive Bias Than Supervised Learning: An Empirical Study},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16327--16336}
}
DiffuMask: Synthesizing Images with Pixel-level Annotations for Semantic Segmentation Using Diffusion Models: Weijia Wu,

Yuzhong Zhao,

Mike Zheng Shou,

Hong Zhou,

Chunhua Shen; [pdf] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Weijia and Zhao, Yuzhong and Shou, Mike Zheng and Zhou, Hong and Shen, Chunhua},
  title     = {{DiffuMask}: Synthesizing Images with Pixel-level Annotations for Semantic Segmentation Using Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1206--1217}
}
NSF: Neural Surface Fields for Human Modeling from Monocular Depth: Yuxuan Xue,

Bharat Lal Bhatnagar,

Riccardo Marin,

Nikolaos Sarafianos,

Yuanlu Xu,

Gerard Pons-Moll,

Tony Tung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xue_2023_ICCV,
  author    = {Xue, Yuxuan and Bhatnagar, Bharat Lal and Marin, Riccardo and Sarafianos, Nikolaos and Xu, Yuanlu and Pons-Moll, Gerard and Tung, Tony},
  title     = {{NSF}: Neural Surface Fields for Human Modeling from Monocular Depth},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15049--15060}
}
Unaligned 2D to 3D Translation with Conditional Vector-Quantized Code Diffusion using Transformers: Abril Corona-Figueroa,

Sam Bond-Taylor,

Neelanjan Bhowmik,

Yona Falinie A. Gaus,

Toby P. Breckon,

Hubert P. H. Shum,

Chris G. Willcocks; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Corona-Figueroa_2023_ICCV,
  author    = {Corona-Figueroa, Abril and Bond-Taylor, Sam and Bhowmik, Neelanjan and Gaus, Yona Falinie A. and Breckon, Toby P. and Shum, Hubert P. H. and Willcocks, Chris G.},
  title     = {Unaligned {2D} to {3D} Translation with Conditional Vector-Quantized Code Diffusion using Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14585--14594}
}
DMNet: Delaunay Meshing Network for 3D Shape Representation: Chen Zhang,

Ganzhangqin Yuan,

Wenbing Tao; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Chen and Yuan, Ganzhangqin and Tao, Wenbing},
  title     = {{DMNet}: {Delaunay} Meshing Network for {3D} Shape Representation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14418--14428}
}
StyleDomain: Efficient and Lightweight Parameterizations of StyleGAN for One-shot and Few-shot Domain Adaptation: Aibek Alanov,

Vadim Titov,

Maksim Nakhodnov,

Dmitry Vetrov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alanov_2023_ICCV,
  author    = {Alanov, Aibek and Titov, Vadim and Nakhodnov, Maksim and Vetrov, Dmitry},
  title     = {{StyleDomain}: Efficient and Lightweight Parameterizations of {StyleGAN} for One-shot and Few-shot Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2184--2194}
}
RankMixup: Ranking-Based Mixup Training for Network Calibration: Jongyoun Noh,

Hyekang Park,

Junghyup Lee,

Bumsub Ham; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Noh_2023_ICCV,
  author    = {Noh, Jongyoun and Park, Hyekang and Lee, Junghyup and Ham, Bumsub},
  title     = {{RankMixup}: Ranking-Based Mixup Training for Network Calibration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1358--1368}
}
Body Knowledge and Uncertainty Modeling for Monocular 3D Human Body Reconstruction: Yufei Zhang,

Hanjing Wang,

Jeffrey O. Kephart,

Qiang Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yufei and Wang, Hanjing and Kephart, Jeffrey O. and Ji, Qiang},
  title     = {Body Knowledge and Uncertainty Modeling for Monocular {3D} Human Body Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9020--9032}
}
Randomized Quantization: A Generic Augmentation for Data Agnostic Self-supervised Learning: Huimin Wu,

Chenyang Lei,

Xiao Sun,

Peng-Shuai Wang,

Qifeng Chen,

Kwang-Ting Cheng,

Stephen Lin,

Zhirong Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Huimin and Lei, Chenyang and Sun, Xiao and Wang, Peng-Shuai and Chen, Qifeng and Cheng, Kwang-Ting and Lin, Stephen and Wu, Zhirong},
  title     = {Randomized Quantization: A Generic Augmentation for Data Agnostic Self-supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16305--16316}
}
Learning to Generate Semantic Layouts for Higher Text-Image Correspondence in Text-to-Image Synthesis: Minho Park,

Jooyeol Yun,

Seunghwan Choi,

Jaegul Choo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Minho and Yun, Jooyeol and Choi, Seunghwan and Choo, Jaegul},
  title     = {Learning to Generate Semantic Layouts for Higher Text-Image Correspondence in Text-to-Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7591--7600}
}
Neural Radiance Field with LiDAR maps: MingFang Chang,

Akash Sharma,

Michael Kaess,

Simon Lucey; [pdf] [supp]
[bibtex]
@InProceedings{Chang_2023_ICCV,
  author    = {Chang, MingFang and Sharma, Akash and Kaess, Michael and Lucey, Simon},
  title     = {Neural Radiance Field with {LiDAR} maps},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17914--17923}
}
AREA: Adaptive Reweighting via Effective Area for Long-Tailed Classification: Xiaohua Chen,

Yucan Zhou,

Dayan Wu,

Chule Yang,

Bo Li,

Qinghua Hu,

Weiping Wang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xiaohua and Zhou, Yucan and Wu, Dayan and Yang, Chule and Li, Bo and Hu, Qinghua and Wang, Weiping},
  title     = {{AREA}: Adaptive Reweighting via Effective Area for Long-Tailed Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19277--19287}
}
Erasing Concepts from Diffusion Models: Rohit Gandikota,

Joanna Materzynska,

Jaden Fiotto-Kaufman,

David Bau; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gandikota_2023_ICCV,
  author    = {Gandikota, Rohit and Materzynska, Joanna and Fiotto-Kaufman, Jaden and Bau, David},
  title     = {Erasing Concepts from Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2426--2436}
}
Fully Attentional Networks with Self-emerging Token Labeling: Bingyin Zhao,

Zhiding Yu,

Shiyi Lan,

Yutao Cheng,

Anima Anandkumar,

Yingjie Lao,

Jose M. Alvarez; [pdf]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Bingyin and Yu, Zhiding and Lan, Shiyi and Cheng, Yutao and Anandkumar, Anima and Lao, Yingjie and Alvarez, Jose M.},
  title     = {Fully Attentional Networks with Self-emerging Token Labeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5585--5595}
}
ACTIVE: Towards Highly Transferable 3D Physical Camouflage for Universal and Robust Vehicle Evasion: Naufal Suryanto,

Yongsu Kim,

Harashta Tatimma Larasati,

Hyoeun Kang,

Thi-Thu-Huong Le,

Yoonyoung Hong,

Hunmin Yang,

Se-Yoon Oh,

Howon Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Suryanto_2023_ICCV,
  author    = {Suryanto, Naufal and Kim, Yongsu and Larasati, Harashta Tatimma and Kang, Hyoeun and Le, Thi-Thu-Huong and Hong, Yoonyoung and Yang, Hunmin and Oh, Se-Yoon and Kim, Howon},
  title     = {{ACTIVE}: Towards Highly Transferable {3D} Physical Camouflage for Universal and Robust Vehicle Evasion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4305--4314}
}
Learning Adaptive Neighborhoods for Graph Neural Networks: Avishkar Saha,

Oscar Mendez,

Chris Russell,

Richard Bowden; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saha_2023_ICCV,
  author    = {Saha, Avishkar and Mendez, Oscar and Russell, Chris and Bowden, Richard},
  title     = {Learning Adaptive Neighborhoods for Graph Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22541--22550}
}
Equivariant Similarity for Vision-Language Foundation Models: Tan Wang,

Kevin Lin,

Linjie Li,

Chung-Ching Lin,

Zhengyuan Yang,

Hanwang Zhang,

Zicheng Liu,

Lijuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Tan and Lin, Kevin and Li, Linjie and Lin, Chung-Ching and Yang, Zhengyuan and Zhang, Hanwang and Liu, Zicheng and Wang, Lijuan},
  title     = {Equivariant Similarity for Vision-Language Foundation Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11998--12008}
}
ReST: A Reconfigurable Spatial-Temporal Graph Model for Multi-Camera Multi-Object Tracking: Cheng-Che Cheng,

Min-Xuan Qiu,

Chen-Kuo Chiang,

Shang-Hong Lai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Cheng-Che and Qiu, Min-Xuan and Chiang, Chen-Kuo and Lai, Shang-Hong},
  title     = {{ReST}: A Reconfigurable Spatial-Temporal Graph Model for Multi-Camera Multi-Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10051--10060}
}
Too Large; Data Reduction for Vision-Language Pre-Training: Alex Jinpeng Wang,

Kevin Qinghong Lin,

David Junhao Zhang,

Stan Weixian Lei,

Mike Zheng Shou; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Alex Jinpeng and Lin, Kevin Qinghong and Zhang, David Junhao and Lei, Stan Weixian and Shou, Mike Zheng},
  title     = {Too Large; Data Reduction for Vision-Language Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3147--3157}
}
Make-It-3D: High-fidelity 3D Creation from A Single Image with Diffusion Prior: Junshu Tang,

Tengfei Wang,

Bo Zhang,

Ting Zhang,

Ran Yi,

Lizhuang Ma,

Dong Chen; [pdf] [supp]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Junshu and Wang, Tengfei and Zhang, Bo and Zhang, Ting and Yi, Ran and Ma, Lizhuang and Chen, Dong},
  title     = {{Make-It-3D}: High-fidelity {3D} Creation from A Single Image with Diffusion Prior},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22819--22829}
}
Towards Deeply Unified Depth-aware Panoptic Segmentation with Bi-directional Guidance Learning: Junwen He,

Yifan Wang,

Lijun Wang,

Huchuan Lu,

Bin Luo,

Jun-Yan He,

Jin-Peng Lan,

Yifeng Geng,

Xuansong Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Junwen and Wang, Yifan and Wang, Lijun and Lu, Huchuan and Luo, Bin and He, Jun-Yan and Lan, Jin-Peng and Geng, Yifeng and Xie, Xuansong},
  title     = {Towards Deeply Unified Depth-aware Panoptic Segmentation with Bi-directional Guidance Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4111--4121}
}
Taxonomy Adaptive Cross-Domain Adaptation in Medical Imaging via Optimization Trajectory Distillation: Jianan Fan,

Dongnan Liu,

Hang Chang,

Heng Huang,

Mei Chen,

Weidong Cai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Jianan and Liu, Dongnan and Chang, Hang and Huang, Heng and Chen, Mei and Cai, Weidong},
  title     = {Taxonomy Adaptive Cross-Domain Adaptation in Medical Imaging via Optimization Trajectory Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21174--21184}
}
DiffTAD: Temporal Action Detection with Proposal Denoising Diffusion: Sauradip Nag,

Xiatian Zhu,

Jiankang Deng,

Yi-Zhe Song,

Tao Xiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nag_2023_ICCV,
  author    = {Nag, Sauradip and Zhu, Xiatian and Deng, Jiankang and Song, Yi-Zhe and Xiang, Tao},
  title     = {{DiffTAD}: Temporal Action Detection with Proposal Denoising Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10362--10374}
}
Ray Conditioning: Trading Photo-consistency for Photo-realism in Multi-view Image Generation: Eric Ming Chen,

Sidhanth Holalkere,

Ruyu Yan,

Kai Zhang,

Abe Davis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Eric Ming and Holalkere, Sidhanth and Yan, Ruyu and Zhang, Kai and Davis, Abe},
  title     = {Ray Conditioning: Trading Photo-consistency for Photo-realism in Multi-view Image Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23242--23251}
}
SCOB: Universal Text Understanding via Character-wise Supervised Contrastive Learning with Online Text Rendering for Bridging Domain Gap: Daehee Kim,

Yoonsik Kim,

DongHyun Kim,

Yumin Lim,

Geewook Kim,

Taeho Kil; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Daehee and Kim, Yoonsik and Kim, DongHyun and Lim, Yumin and Kim, Geewook and Kil, Taeho},
  title     = {{SCOB}: Universal Text Understanding via Character-wise Supervised Contrastive Learning with Online Text Rendering for Bridging Domain Gap},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19562--19573}
}
Point-Query Quadtree for Crowd Counting, Localization, and More: Chengxin Liu,

Hao Lu,

Zhiguo Cao,

Tongliang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Chengxin and Lu, Hao and Cao, Zhiguo and Liu, Tongliang},
  title     = {Point-Query Quadtree for Crowd Counting, Localization, and More},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1676--1685}
}
Heterogeneous Diversity Driven Active Learning for Multi-Object Tracking: Rui Li,

Baopeng Zhang,

Jun Liu,

Wei Liu,

Jian Zhao,

Zhu Teng; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Rui and Zhang, Baopeng and Liu, Jun and Liu, Wei and Zhao, Jian and Teng, Zhu},
  title     = {Heterogeneous Diversity Driven Active Learning for Multi-Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9932--9941}
}
Domain Generalization of 3D Semantic Segmentation in Autonomous Driving: Jules Sanchez,

Jean-Emmanuel Deschaud,

François Goulette; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sanchez_2023_ICCV,
  author    = {Sanchez, Jules and Deschaud, Jean-Emmanuel and Goulette, Fran{\c{c}}ois},
  title     = {Domain Generalization of {3D} Semantic Segmentation in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18077--18087}
}
HaMuCo: Hand Pose Estimation via Multiview Collaborative Self-Supervised Learning: Xiaozheng Zheng,

Chao Wen,

Zhou Xue,

Pengfei Ren,

Jingyu Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Xiaozheng and Wen, Chao and Xue, Zhou and Ren, Pengfei and Wang, Jingyu},
  title     = {{HaMuCo}: Hand Pose Estimation via Multiview Collaborative Self-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20763--20773}
}
Efficient Model Personalization in Federated Learning via Client-Specific Prompt Generation: Fu-En Yang,

Chien-Yi Wang,

Yu-Chiang Frank Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Fu-En and Wang, Chien-Yi and Wang, Yu-Chiang Frank},
  title     = {Efficient Model Personalization in Federated Learning via Client-Specific Prompt Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19159--19168}
}
Dual Aggregation Transformer for Image Super-Resolution: Zheng Chen,

Yulun Zhang,

Jinjin Gu,

Linghe Kong,

Xiaokang Yang,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zheng and Zhang, Yulun and Gu, Jinjin and Kong, Linghe and Yang, Xiaokang and Yu, Fisher},
  title     = {Dual Aggregation Transformer for Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12312--12321}
}
Zero-Shot Spatial Layout Conditioning for Text-to-Image Diffusion Models: Guillaume Couairon,

Marlène Careil,

Matthieu Cord,

Stéphane Lathuilière,

Jakob Verbeek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Couairon_2023_ICCV,
  author    = {Couairon, Guillaume and Careil, Marl{\`e}ne and Cord, Matthieu and Lathuili{\`e}re, St{\'e}phane and Verbeek, Jakob},
  title     = {Zero-Shot Spatial Layout Conditioning for Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2174--2183}
}
SegGPT: Towards Segmenting Everything in Context: Xinlong Wang,

Xiaosong Zhang,

Yue Cao,

Wen Wang,

Chunhua Shen,

Tiejun Huang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xinlong and Zhang, Xiaosong and Cao, Yue and Wang, Wen and Shen, Chunhua and Huang, Tiejun},
  title     = {{SegGPT}: Towards Segmenting Everything in Context},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1130--1140}
}
Semantify: Simplifying the Control of 3D Morphable Models Using CLIP: Omer Gralnik,

Guy Gafni,

Ariel Shamir; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gralnik_2023_ICCV,
  author    = {Gralnik, Omer and Gafni, Guy and Shamir, Ariel},
  title     = {Semantify: Simplifying the Control of {3D} Morphable Models Using {CLIP}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14554--14564}
}
From Sky to the Ground: A Large-scale Benchmark and Simple Baseline Towards Real Rain Removal: Yun Guo,

Xueyao Xiao,

Yi Chang,

Shumin Deng,

Luxin Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yun and Xiao, Xueyao and Chang, Yi and Deng, Shumin and Yan, Luxin},
  title     = {From Sky to the Ground: A Large-scale Benchmark and Simple Baseline Towards Real Rain Removal},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12097--12107}
}
Knowledge Restore and Transfer for Multi-Label Class-Incremental Learning: Songlin Dong,

Haoyu Luo,

Yuhang He,

Xing Wei,

Jie Cheng,

Yihong Gong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Songlin and Luo, Haoyu and He, Yuhang and Wei, Xing and Cheng, Jie and Gong, Yihong},
  title     = {Knowledge Restore and Transfer for Multi-Label Class-Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18711--18720}
}
DDColor: Towards Photo-Realistic Image Colorization via Dual Decoders: Xiaoyang Kang,

Tao Yang,

Wenqi Ouyang,

Peiran Ren,

Lingzhi Li,

Xuansong Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2023_ICCV,
  author    = {Kang, Xiaoyang and Yang, Tao and Ouyang, Wenqi and Ren, Peiran and Li, Lingzhi and Xie, Xuansong},
  title     = {{DDColor}: Towards Photo-Realistic Image Colorization via Dual Decoders},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {328--338}
}
Visual Explanations via Iterated Integrated Attributions: Oren Barkan,

Yehonatan Elisha,

Yuval Asher,

Amit Eshel,

Noam Koenigstein; [pdf] [supp]
[bibtex]
@InProceedings{Barkan_2023_ICCV,
  author    = {Barkan, Oren and Elisha, Yehonatan and Asher, Yuval and Eshel, Amit and Koenigstein, Noam},
  title     = {Visual Explanations via Iterated Integrated Attributions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2073--2084}
}
PanFlowNet: A Flow-Based Deep Network for Pan-Sharpening: Gang Yang,

Xiangyong Cao,

Wenzhe Xiao,

Man Zhou,

Aiping Liu,

Xun Chen,

Deyu Meng; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Gang and Cao, Xiangyong and Xiao, Wenzhe and Zhou, Man and Liu, Aiping and Chen, Xun and Meng, Deyu},
  title     = {{PanFlowNet}: A Flow-Based Deep Network for Pan-Sharpening},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16857--16867}
}
Domain Generalization via Balancing Training Difficulty and Model Capability: Xueying Jiang,

Jiaxing Huang,

Sheng Jin,

Shijian Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Xueying and Huang, Jiaxing and Jin, Sheng and Lu, Shijian},
  title     = {Domain Generalization via Balancing Training Difficulty and Model Capability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18993--19003}
}
Pairwise Similarity Learning is SimPLE: Yandong Wen,

Weiyang Liu,

Yao Feng,

Bhiksha Raj,

Rita Singh,

Adrian Weller,

Michael J. Black,

Bernhard Schölkopf; [pdf] [supp]
[bibtex]
@InProceedings{Wen_2023_ICCV, author = {Wen, Yandong and Liu, Weiyang and Feng, Yao and Raj, Bhiksha and Singh, Rita and Weller, Adrian and Black, Michael J. and Sch\"olkopf, Bernhard}, title = {Pairwise Similarity Learning is SimPLE}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5308-5318} }
GO-SLAM: Global Optimization for Consistent 3D Instant Reconstruction: Youmin Zhang,

Fabio Tosi,

Stefano Mattoccia,

Matteo Poggi; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Youmin and Tosi, Fabio and Mattoccia, Stefano and Poggi, Matteo}, title = {GO-SLAM: Global Optimization for Consistent 3D Instant Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3727-3737} }
JOTR: 3D Joint Contrastive Learning with Transformers for Occluded Human Mesh Recovery: Jiahao Li,

Zongxin Yang,

Xiaohan Wang,

Jianxin Ma,

Chang Zhou,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Jiahao and Yang, Zongxin and Wang, Xiaohan and Ma, Jianxin and Zhou, Chang and Yang, Yi}, title = {JOTR: 3D Joint Contrastive Learning with Transformers for Occluded Human Mesh Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9110-9121} }
CLIP-Driven Universal Model for Organ Segmentation and Tumor Detection: Jie Liu,

Yixiao Zhang,

Jie-Neng Chen,

Junfei Xiao,

Yongyi Lu,

Bennett A Landman,

Yixuan Yuan,

Alan Yuille,

Yucheng Tang,

Zongwei Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Jie and Zhang, Yixiao and Chen, Jie-Neng and Xiao, Junfei and Lu, Yongyi and Landman, Bennett A and Yuan, Yixuan and Yuille, Alan and Tang, Yucheng and Zhou, Zongwei}, title = {CLIP-Driven Universal Model for Organ Segmentation and Tumor Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21152-21164} }
NIR-assisted Video Enhancement via Unpaired 24-hour Data: Muyao Niu,

Zhihang Zhong,

Yinqiang Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Niu_2023_ICCV, author = {Niu, Muyao and Zhong, Zhihang and Zheng, Yinqiang}, title = {NIR-assisted Video Enhancement via Unpaired 24-hour Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10778-10788} }
FACTS: First Amplify Correlations and Then Slice to Discover Bias: Sriram Yenamandra,

Pratik Ramesh,

Viraj Prabhu,

Judy Hoffman; [pdf] [supp]
[bibtex]
@InProceedings{Yenamandra_2023_ICCV, author = {Yenamandra, Sriram and Ramesh, Pratik and Prabhu, Viraj and Hoffman, Judy}, title = {FACTS: First Amplify Correlations and Then Slice to Discover Bias}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4794-4804} }
Anchor Structure Regularization Induced Multi-view Subspace Clustering via Enhanced Tensor Rank Minimization: Jintian Ji,

Songhe Feng; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2023_ICCV, author = {Ji, Jintian and Feng, Songhe}, title = {Anchor Structure Regularization Induced Multi-view Subspace Clustering via Enhanced Tensor Rank Minimization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19343-19352} }
VeRi3D: Generative Vertex-based Radiance Fields for 3D Controllable Human Image Synthesis: Xinya Chen,

Jiaxin Huang,

Yanrui Bin,

Lu Yu,

Yiyi Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Xinya and Huang, Jiaxin and Bin, Yanrui and Yu, Lu and Liao, Yiyi}, title = {VeRi3D: Generative Vertex-based Radiance Fields for 3D Controllable Human Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8986-8997} }
MOSE: A New Dataset for Video Object Segmentation in Complex Scenes: Henghui Ding,

Chang Liu,

Shuting He,

Xudong Jiang,

Philip H.S. Torr,

Song Bai; [pdf] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV, author = {Ding, Henghui and Liu, Chang and He, Shuting and Jiang, Xudong and Torr, Philip H. S. and Bai, Song}, title = {MOSE: A New Dataset for Video Object Segmentation in Complex Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20224-20234} }
BoMD: Bag of Multi-label Descriptors for Noisy Chest X-ray Classification: Yuanhong Chen,

Fengbei Liu,

Hu Wang,

Chong Wang,

Yuyuan Liu,

Yu Tian,

Gustavo Carneiro; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Yuanhong and Liu, Fengbei and Wang, Hu and Wang, Chong and Liu, Yuyuan and Tian, Yu and Carneiro, Gustavo}, title = {BoMD: Bag of Multi-label Descriptors for Noisy Chest X-ray Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21284-21295} }
Mask-Attention-Free Transformer for 3D Instance Segmentation: Xin Lai,

Yuhui Yuan,

Ruihang Chu,

Yukang Chen,

Han Hu,

Jiaya Jia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lai_2023_ICCV, author = {Lai, Xin and Yuan, Yuhui and Chu, Ruihang and Chen, Yukang and Hu, Han and Jia, Jiaya}, title = {Mask-Attention-Free Transformer for 3D Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3693-3703} }
SHIFT3D: Synthesizing Hard Inputs For Tricking 3D Detectors: Hongge Chen,

Zhao Chen,

Gregory P. Meyer,

Dennis Park,

Carl Vondrick,

Ashish Shrivastava,

Yuning Chai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Hongge and Chen, Zhao and Meyer, Gregory P. and Park, Dennis and Vondrick, Carl and Shrivastava, Ashish and Chai, Yuning}, title = {SHIFT3D: Synthesizing Hard Inputs For Tricking 3D Detectors}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8493-8503} }
EgoLoc: Revisiting 3D Object Localization from Egocentric Videos with Visual Queries: Jinjie Mai,

Abdullah Hamdi,

Silvio Giancola,

Chen Zhao,

Bernard Ghanem; [pdf] [arXiv]
[bibtex]
@InProceedings{Mai_2023_ICCV, author = {Mai, Jinjie and Hamdi, Abdullah and Giancola, Silvio and Zhao, Chen and Ghanem, Bernard}, title = {EgoLoc: Revisiting 3D Object Localization from Egocentric Videos with Visual Queries}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {45-57} }
Coordinate Transformer: Achieving Single-stage Multi-person Mesh Recovery from Videos: Haoyuan Li,

Haoye Dong,

Hanchao Jia,

Dong Huang,

Michael C. Kampffmeyer,

Liang Lin,

Xiaodan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Haoyuan and Dong, Haoye and Jia, Hanchao and Huang, Dong and Kampffmeyer, Michael C. and Lin, Liang and Liang, Xiaodan}, title = {Coordinate Transformer: Achieving Single-stage Multi-person Mesh Recovery from Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8744-8753} }
FLatten Transformer: Vision Transformer using Focused Linear Attention: Dongchen Han,

Xuran Pan,

Yizeng Han,

Shiji Song,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV, author = {Han, Dongchen and Pan, Xuran and Han, Yizeng and Song, Shiji and Huang, Gao}, title = {FLatten Transformer: Vision Transformer using Focused Linear Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5961-5971} }
Q-Diffusion: Quantizing Diffusion Models: Xiuyu Li,

Yijiang Liu,

Long Lian,

Huanrui Yang,

Zhen Dong,

Daniel Kang,

Shanghang Zhang,

Kurt Keutzer; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Xiuyu and Liu, Yijiang and Lian, Long and Yang, Huanrui and Dong, Zhen and Kang, Daniel and Zhang, Shanghang and Keutzer, Kurt}, title = {Q-Diffusion: Quantizing Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17535-17545} }
Robustifying Token Attention for Vision Transformers: Yong Guo,

David Stutz,

Bernt Schiele; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV, author = {Guo, Yong and Stutz, David and Schiele, Bernt}, title = {Robustifying Token Attention for Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17557-17568} }
Boosting Positive Segments for Weakly-Supervised Audio-Visual Video Parsing: Kranthi Kumar Rachavarapu,

Rajagopalan A. N.; [pdf] [supp]
[bibtex]
@InProceedings{Rachavarapu_2023_ICCV, author = {Rachavarapu, Kranthi Kumar and Rajagopalan, A. N.}, title = {Boosting Positive Segments for Weakly-Supervised Audio-Visual Video Parsing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10192-10202} }
ADNet: Lane Shape Prediction via Anchor Decomposition: Lingyu Xiao,

Xiang Li,

Sen Yang,

Wankou Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiao_2023_ICCV, author = {Xiao, Lingyu and Li, Xiang and Yang, Sen and Yang, Wankou}, title = {ADNet: Lane Shape Prediction via Anchor Decomposition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6404-6413} }
UniSeg: A Unified Multi-Modal LiDAR Segmentation Network and the OpenPCSeg Codebase: Youquan Liu,

Runnan Chen,

Xin Li,

Lingdong Kong,

Yuchen Yang,

Zhaoyang Xia,

Yeqi Bai,

Xinge Zhu,

Yuexin Ma,

Yikang Li,

Yu Qiao,

Yuenan Hou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Youquan and Chen, Runnan and Li, Xin and Kong, Lingdong and Yang, Yuchen and Xia, Zhaoyang and Bai, Yeqi and Zhu, Xinge and Ma, Yuexin and Li, Yikang and Qiao, Yu and Hou, Yuenan}, title = {UniSeg: A Unified Multi-Modal LiDAR Segmentation Network and the OpenPCSeg Codebase}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21662-21673} }
Sign Language Translation with Iterative Prototype: Huijie Yao,

Wengang Zhou,

Hao Feng,

Hezhen Hu,

Hao Zhou,

Houqiang Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Yao_2023_ICCV, author = {Yao, Huijie and Zhou, Wengang and Feng, Hao and Hu, Hezhen and Zhou, Hao and Li, Houqiang}, title = {Sign Language Translation with Iterative Prototype}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15592-15601} }
Pixel-Wise Contrastive Distillation: Junqiang Huang,

Zichao Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Junqiang and Guo, Zichao}, title = {Pixel-Wise Contrastive Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16359-16369} }
Efficient Deep Space Filling Curve: Wanli Chen,

Xufeng Yao,

Xinyun Zhang,

Bei Yu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Wanli and Yao, Xufeng and Zhang, Xinyun and Yu, Bei}, title = {Efficient Deep Space Filling Curve}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17525-17534} }
GlueGen: Plug and Play Multi-modal Encoders for X-to-image Generation: Can Qin,

Ning Yu,

Chen Xing,

Shu Zhang,

Zeyuan Chen,

Stefano Ermon,

Yun Fu,

Caiming Xiong,

Ran Xu; [pdf] [supp]
[bibtex]
@InProceedings{Qin_2023_ICCV, author = {Qin, Can and Yu, Ning and Xing, Chen and Zhang, Shu and Chen, Zeyuan and Ermon, Stefano and Fu, Yun and Xiong, Caiming and Xu, Ran}, title = {GlueGen: Plug and Play Multi-modal Encoders for X-to-image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23085-23096} }
Humans in 4D: Reconstructing and Tracking Humans with Transformers: Shubham Goel,

Georgios Pavlakos,

Jathushan Rajasegaran,

Angjoo Kanazawa,

Jitendra Malik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Goel_2023_ICCV, author = {Goel, Shubham and Pavlakos, Georgios and Rajasegaran, Jathushan and Kanazawa, Angjoo and Malik, Jitendra}, title = {Humans in 4D: Reconstructing and Tracking Humans with Transformers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14783-14794} }
Ponder: Point Cloud Pre-training via Neural Rendering: Di Huang,

Sida Peng,

Tong He,

Honghui Yang,

Xiaowei Zhou,

Wanli Ouyang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Di and Peng, Sida and He, Tong and Yang, Honghui and Zhou, Xiaowei and Ouyang, Wanli}, title = {Ponder: Point Cloud Pre-training via Neural Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16089-16098} }
Perpetual Humanoid Control for Real-time Simulated Avatars: Zhengyi Luo,

Jinkun Cao,

Alexander Winkler,

Kris Kitani,

Weipeng Xu; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV, author = {Luo, Zhengyi and Cao, Jinkun and Winkler, Alexander and Kitani, Kris and Xu, Weipeng}, title = {Perpetual Humanoid Control for Real-time Simulated Avatars}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10895-10904} }
HollowNeRF: Pruning Hashgrid-Based NeRFs with Trainable Collision Mitigation: Xiufeng Xie,

Riccardo Gherardi,

Zhihong Pan,

Stephen Huang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV, author = {Xie, Xiufeng and Gherardi, Riccardo and Pan, Zhihong and Huang, Stephen}, title = {HollowNeRF: Pruning Hashgrid-Based NeRFs with Trainable Collision Mitigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3480-3490} }
A Complete Recipe for Diffusion Generative Models: Kushagra Pandey,

Stephan Mandt; [pdf] [supp]
[bibtex]
@InProceedings{Pandey_2023_ICCV, author = {Pandey, Kushagra and Mandt, Stephan}, title = {A Complete Recipe for Diffusion Generative Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4261-4272} }
The Devil is in the Crack Orientation: A New Perspective for Crack Detection: Zhuangzhuang Chen,

Jin Zhang,

Zhuonan Lai,

Guanming Zhu,

Zun Liu,

Jie Chen,

Jianqiang Li; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Zhuangzhuang and Zhang, Jin and Lai, Zhuonan and Zhu, Guanming and Liu, Zun and Chen, Jie and Li, Jianqiang}, title = {The Devil is in the Crack Orientation: A New Perspective for Crack Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6653-6663} }
FedPD: Federated Open Set Recognition with Parameter Disentanglement: Chen Yang,

Meilu Zhu,

Yifan Liu,

Yixuan Yuan; [pdf]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Chen and Zhu, Meilu and Liu, Yifan and Yuan, Yixuan}, title = {FedPD: Federated Open Set Recognition with Parameter Disentanglement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4882-4891} }
WaterMask: Instance Segmentation for Underwater Imagery: Shijie Lian,

Hua Li,

Runmin Cong,

Suqi Li,

Wei Zhang,

Sam Kwong; [pdf]
[bibtex]
@InProceedings{Lian_2023_ICCV, author = {Lian, Shijie and Li, Hua and Cong, Runmin and Li, Suqi and Zhang, Wei and Kwong, Sam}, title = {WaterMask: Instance Segmentation for Underwater Imagery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1305-1315} }
Score Priors Guided Deep Variational Inference for Unsupervised Real-World Single Image Denoising: Jun Cheng,

Tao Liu,

Shan Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV, author = {Cheng, Jun and Liu, Tao and Tan, Shan}, title = {Score Priors Guided Deep Variational Inference for Unsupervised Real-World Single Image Denoising}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12937-12948} }
L-DAWA: Layer-wise Divergence Aware Weight Aggregation in Federated Self-Supervised Visual Representation Learning: Yasar Abbas Ur Rehman,

Yan Gao,

Pedro Porto Buarque de Gusmao,

Mina Alibeigi,

Jiajun Shen,

Nicholas D. Lane; [pdf] [supp]
[bibtex]
@InProceedings{Rehman_2023_ICCV, author = {Rehman, Yasar Abbas Ur and Gao, Yan and de Gusmao, Pedro Porto Buarque and Alibeigi, Mina and Shen, Jiajun and Lane, Nicholas D.}, title = {L-DAWA: Layer-wise Divergence Aware Weight Aggregation in Federated Self-Supervised Visual Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16464-16473} }
Improving Transformer-based Image Matching by Cascaded Capturing Spatially Informative Keypoints: Chenjie Cao,

Yanwei Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV, author = {Cao, Chenjie and Fu, Yanwei}, title = {Improving Transformer-based Image Matching by Cascaded Capturing Spatially Informative Keypoints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12129-12139} }
Controllable Guide-Space for Generalizable Face Forgery Detection: Ying Guo,

Cheng Zhen,

Pengfei Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV, author = {Guo, Ying and Zhen, Cheng and Yan, Pengfei}, title = {Controllable Guide-Space for Generalizable Face Forgery Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20818-20827} }
Calibrating Uncertainty for Semi-Supervised Crowd Counting: Chen Li,

Xiaoling Hu,

Shahira Abousamra,

Chao Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{LI_2023_ICCV, author = {Li, Chen and Hu, Xiaoling and Abousamra, Shahira and Chen, Chao}, title = {Calibrating Uncertainty for Semi-Supervised Crowd Counting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16731-16741} }
MosaiQ: Quantum Generative Adversarial Networks for Image Generation on NISQ Computers: Daniel Silver,

Tirthak Patel,

William Cutler,

Aditya Ranjan,

Harshitta Gandhi,

Devesh Tiwari; [pdf] [arXiv]
[bibtex]
@InProceedings{Silver_2023_ICCV, author = {Silver, Daniel and Patel, Tirthak and Cutler, William and Ranjan, Aditya and Gandhi, Harshitta and Tiwari, Devesh}, title = {MosaiQ: Quantum Generative Adversarial Networks for Image Generation on NISQ Computers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7030-7039} }
DVIS: Decoupled Video Instance Segmentation Framework: Tao Zhang,

Xingye Tian,

Yu Wu,

Shunping Ji,

Xuebo Wang,

Yuan Zhang,

Pengfei Wan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Tao and Tian, Xingye and Wu, Yu and Ji, Shunping and Wang, Xuebo and Zhang, Yuan and Wan, Pengfei}, title = {DVIS: Decoupled Video Instance Segmentation Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1282-1291} }
Segmentation of Tubular Structures Using Iterative Training with Tailored Samples: Wei Liao; [pdf] [arXiv]
[bibtex]
@InProceedings{Liao_2023_ICCV, author = {Liao, Wei}, title = {Segmentation of Tubular Structures Using Iterative Training with Tailored Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23643-23652} }
Boundary-Aware Divide and Conquer: A Diffusion-Based Solution for Unsupervised Shadow Removal: Lanqing Guo,

Chong Wang,

Wenhan Yang,

Yufei Wang,

Bihan Wen; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV, author = {Guo, Lanqing and Wang, Chong and Yang, Wenhan and Wang, Yufei and Wen, Bihan}, title = {Boundary-Aware Divide and Conquer: A Diffusion-Based Solution for Unsupervised Shadow Removal}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13045-13054} }
Towards Nonlinear-Motion-Aware and Occlusion-Robust Rolling Shutter Correction: Delin Qu,

Yizhen Lao,

Zhigang Wang,

Dong Wang,

Bin Zhao,

Xuelong Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qu_2023_ICCV, author = {Qu, Delin and Lao, Yizhen and Wang, Zhigang and Wang, Dong and Zhao, Bin and Li, Xuelong}, title = {Towards Nonlinear-Motion-Aware and Occlusion-Robust Rolling Shutter Correction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10680-10688} }
Surface Extraction from Neural Unsigned Distance Fields: Congyi Zhang,

Guying Lin,

Lei Yang,

Xin Li,

Taku Komura,

Scott Schaefer,

John Keyser,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Congyi and Lin, Guying and Yang, Lei and Li, Xin and Komura, Taku and Schaefer, Scott and Keyser, John and Wang, Wenping}, title = {Surface Extraction from Neural Unsigned Distance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22531-22540} }
CBA: Improving Online Continual Learning via Continual Bias Adaptor: Quanziang Wang,

Renzhen Wang,

Yichen Wu,

Xixi Jia,

Deyu Meng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Quanziang and Wang, Renzhen and Wu, Yichen and Jia, Xixi and Meng, Deyu}, title = {CBA: Improving Online Continual Learning via Continual Bias Adaptor}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19082-19092} }
GraphEcho: Graph-Driven Unsupervised Domain Adaptation for Echocardiogram Video Segmentation: Jiewen Yang,

Xinpeng Ding,

Ziyang Zheng,

Xiaowei Xu,

Xiaomeng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Jiewen and Ding, Xinpeng and Zheng, Ziyang and Xu, Xiaowei and Li, Xiaomeng}, title = {GraphEcho: Graph-Driven Unsupervised Domain Adaptation for Echocardiogram Video Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11878-11887} }
Multi-view Spectral Polarization Propagation for Video Glass Segmentation: Yu Qiao,

Bo Dong,

Ao Jin,

Yu Fu,

Seung-Hwan Baek,

Felix Heide,

Pieter Peers,

Xiaopeng Wei,

Xin Yang; [pdf] [supp]
[bibtex]
@InProceedings{Qiao_2023_ICCV, author = {Qiao, Yu and Dong, Bo and Jin, Ao and Fu, Yu and Baek, Seung-Hwan and Heide, Felix and Peers, Pieter and Wei, Xiaopeng and Yang, Xin}, title = {Multi-view Spectral Polarization Propagation for Video Glass Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23218-23228} }
Rethinking Amodal Video Segmentation from Learning Supervised Signals with Object-centric Representation: Ke Fan,

Jingshi Lei,

Xuelin Qian,

Miaopeng Yu,

Tianjun Xiao,

Tong He,

Zheng Zhang,

Yanwei Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV, author = {Fan, Ke and Lei, Jingshi and Qian, Xuelin and Yu, Miaopeng and Xiao, Tianjun and He, Tong and Zhang, Zheng and Fu, Yanwei}, title = {Rethinking Amodal Video Segmentation from Learning Supervised Signals with Object-centric Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1272-1281} }
Augmented Box Replay: Overcoming Foreground Shift for Incremental Object Detection: Yuyang Liu,

Yang Cong,

Dipam Goswami,

Xialei Liu,

Joost van de Weijer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Yuyang and Cong, Yang and Goswami, Dipam and Liu, Xialei and van de Weijer, Joost}, title = {Augmented Box Replay: Overcoming Foreground Shift for Incremental Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {11367-11377} }
Distilled Reverse Attention Network for Open-world Compositional Zero-Shot Learning: Yun Li,

Zhe Liu,

Saurav Jha,

Lina Yao; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Yun and Liu, Zhe and Jha, Saurav and Yao, Lina}, title = {Distilled Reverse Attention Network for Open-world Compositional Zero-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1782-1791} }
DandelionNet: Domain Composition with Instance Adaptive Classification for Domain Generalization: Lanqing Hu,

Meina Kan,

Shiguang Shan,

Xilin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_ICCV, author = {Hu, Lanqing and Kan, Meina and Shan, Shiguang and Chen, Xilin}, title = {DandelionNet: Domain Composition with Instance Adaptive Classification for Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19050-19059} }
TexFusion: Synthesizing 3D Textures with Text-Guided Image Diffusion Models: Tianshi Cao,

Karsten Kreis,

Sanja Fidler,

Nicholas Sharp,

Kangxue Yin; [pdf] [supp]
[bibtex]
@InProceedings{Cao_2023_ICCV, author = {Cao, Tianshi and Kreis, Karsten and Fidler, Sanja and Sharp, Nicholas and Yin, Kangxue}, title = {TexFusion: Synthesizing 3D Textures with Text-Guided Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4169-4181} }
Shift from Texture-bias to Shape-bias: Edge Deformation-based Augmentation for Robust Object Recognition: Xilin He,

Qinliang Lin,

Cheng Luo,

Weicheng Xie,

Siyang Song,

Feng Liu,

Linlin Shen; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_ICCV, author = {He, Xilin and Lin, Qinliang and Luo, Cheng and Xie, Weicheng and Song, Siyang and Liu, Feng and Shen, Linlin}, title = {Shift from Texture-bias to Shape-bias: Edge Deformation-based Augmentation for Robust Object Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1526-1535} }
Lighting Every Darkness in Two Pairs: A Calibration-Free Pipeline for RAW Denoising: Xin Jin,

Jia-Wen Xiao,

Ling-Hao Han,

Chunle Guo,

Ruixun Zhang,

Xialei Liu,

Chongyi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2023_ICCV, author = {Jin, Xin and Xiao, Jia-Wen and Han, Ling-Hao and Guo, Chunle and Zhang, Ruixun and Liu, Xialei and Li, Chongyi}, title = {Lighting Every Darkness in Two Pairs: A Calibration-Free Pipeline for RAW Denoising}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13275-13284} }
Data-free Knowledge Distillation for Fine-grained Visual Categorization: Renrong Shao,

Wei Zhang,

Jianhua Yin,

Jun Wang; [pdf] [supp]
[bibtex]
@InProceedings{Shao_2023_ICCV, author = {Shao, Renrong and Zhang, Wei and Yin, Jianhua and Wang, Jun}, title = {Data-free Knowledge Distillation for Fine-grained Visual Categorization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1515-1525} }
MotionBERT: A Unified Perspective on Learning Human Motion Representations: Wentao Zhu,

Xiaoxuan Ma,

Zhaoyang Liu,

Libin Liu,

Wayne Wu,

Yizhou Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Wentao and Ma, Xiaoxuan and Liu, Zhaoyang and Liu, Libin and Wu, Wayne and Wang, Yizhou}, title = {MotionBERT: A Unified Perspective on Learning Human Motion Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15085-15099} }
PASTA: Proportional Amplitude Spectrum Training Augmentation for Syn-to-Real Domain Generalization: Prithvijit Chattopadhyay,

Kartik Sarangmath,

Vivek Vijaykumar,

Judy Hoffman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chattopadhyay_2023_ICCV, author = {Chattopadhyay, Prithvijit and Sarangmath, Kartik and Vijaykumar, Vivek and Hoffman, Judy}, title = {PASTA: Proportional Amplitude Spectrum Training Augmentation for Syn-to-Real Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19288-19300} }
EgoPCA: A New Framework for Egocentric Hand-Object Interaction Understanding: Yue Xu,

Yong-Lu Li,

Zhemin Huang,

Michael Xu Liu,

Cewu Lu,

Yu-Wing Tai,

Chi-Keung Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Yue and Li, Yong-Lu and Huang, Zhemin and Liu, Michael Xu and Lu, Cewu and Tai, Yu-Wing and Tang, Chi-Keung}, title = {EgoPCA: A New Framework for Egocentric Hand-Object Interaction Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5273-5284} }
Metric3D: Towards Zero-shot Metric 3D Prediction from A Single Image: Wei Yin,

Chi Zhang,

Hao Chen,

Zhipeng Cai,

Gang Yu,

Kaixuan Wang,

Xiaozhi Chen,

Chunhua Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yin_2023_ICCV, author = {Yin, Wei and Zhang, Chi and Chen, Hao and Cai, Zhipeng and Yu, Gang and Wang, Kaixuan and Chen, Xiaozhi and Shen, Chunhua}, title = {Metric3D: Towards Zero-shot Metric 3D Prediction from A Single Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9043-9053} }
I Can't Believe There's No Images! Learning Visual Tasks Using only Language Supervision: Sophia Gu,

Christopher Clark,

Aniruddha Kembhavi; [pdf] [supp]
[bibtex]
@InProceedings{Gu_2023_ICCV, author = {Gu, Sophia and Clark, Christopher and Kembhavi, Aniruddha}, title = {I Can't Believe There's No Images! Learning Visual Tasks Using only Language Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2672-2683} }
Lightweight Image Super-Resolution with Superpixel Token Interaction: Aiping Zhang,

Wenqi Ren,

Yi Liu,

Xiaochun Cao; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Aiping and Ren, Wenqi and Liu, Yi and Cao, Xiaochun},
    title     = {Lightweight Image Super-Resolution with Superpixel Token Interaction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12728--12737}
}
Feature Prediction Diffusion Model for Video Anomaly Detection: Cheng Yan,

Shiyu Zhang,

Yang Liu,

Guansong Pang,

Wenjun Wang; [pdf]
[bibtex]
@InProceedings{Yan_2023_ICCV,
    author    = {Yan, Cheng and Zhang, Shiyu and Liu, Yang and Pang, Guansong and Wang, Wenjun},
    title     = {Feature Prediction Diffusion Model for Video Anomaly Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5527--5537}
}
RANA: Relightable Articulated Neural Avatars: Umar Iqbal,

Akin Caliskan,

Koki Nagano,

Sameh Khamis,

Pavlo Molchanov,

Jan Kautz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Iqbal_2023_ICCV,
    author    = {Iqbal, Umar and Caliskan, Akin and Nagano, Koki and Khamis, Sameh and Molchanov, Pavlo and Kautz, Jan},
    title     = {{RANA}: Relightable Articulated Neural Avatars},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23142--23153}
}
Iterative Denoiser and Noise Estimator for Self-Supervised Image Denoising: Yunhao Zou,

Chenggang Yan,

Ying Fu; [pdf]
[bibtex]
@InProceedings{Zou_2023_ICCV,
    author    = {Zou, Yunhao and Yan, Chenggang and Fu, Ying},
    title     = {Iterative Denoiser and Noise Estimator for Self-Supervised Image Denoising},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13265--13274}
}
MasQCLIP for Open-Vocabulary Universal Image Segmentation: Xin Xu,

Tianyi Xiong,

Zheng Ding,

Zhuowen Tu; [pdf]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Xin and Xiong, Tianyi and Ding, Zheng and Tu, Zhuowen},
    title     = {{MasQCLIP} for Open-Vocabulary Universal Image Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {887--898}
}
Memory-and-Anticipation Transformer for Online Action Understanding: Jiahao Wang,

Guo Chen,

Yifei Huang,

Limin Wang,

Tong Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jiahao and Chen, Guo and Huang, Yifei and Wang, Limin and Lu, Tong},
    title     = {Memory-and-Anticipation Transformer for Online Action Understanding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13824--13835}
}
Self-similarity Driven Scale-invariant Learning for Weakly Supervised Person Search: Benzhi Wang,

Yang Yang,

Jinlin Wu,

Guo-jun Qi,

Zhen Lei; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Benzhi and Yang, Yang and Wu, Jinlin and Qi, Guo-jun and Lei, Zhen},
    title     = {Self-similarity Driven Scale-invariant Learning for Weakly Supervised Person Search},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1813--1822}
}
MODA: Mapping-Once Audio-driven Portrait Animation with Dual Attentions: Yunfei Liu,

Lijian Lin,

Fei Yu,

Changyin Zhou,

Yu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Yunfei and Lin, Lijian and Yu, Fei and Zhou, Changyin and Li, Yu},
    title     = {{MODA}: Mapping-Once Audio-driven Portrait Animation with Dual Attentions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23020--23029}
}
Realistic Full-Body Tracking from Sparse Observations via Joint-Level Modeling: Xiaozheng Zheng,

Zhuo Su,

Chao Wen,

Zhou Xue,

Xiaojie Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Xiaozheng and Su, Zhuo and Wen, Chao and Xue, Zhou and Jin, Xiaojie},
    title     = {Realistic Full-Body Tracking from Sparse Observations via Joint-Level Modeling},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14678--14688}
}
MetaF2N: Blind Image Super-Resolution by Learning Efficient Model Adaptation from Faces: Zhicun Yin,

Ming Liu,

Xiaoming Li,

Hui Yang,

Longan Xiao,

Wangmeng Zuo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yin_2023_ICCV,
    author    = {Yin, Zhicun and Liu, Ming and Li, Xiaoming and Yang, Hui and Xiao, Longan and Zuo, Wangmeng},
    title     = {{MetaF2N}: Blind Image Super-Resolution by Learning Efficient Model Adaptation from Faces},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13033--13044}
}
Lighting up NeRF via Unsupervised Decomposition and Enhancement: Haoyuan Wang,

Xiaogang Xu,

Ke Xu,

Rynson W.H. Lau; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Haoyuan and Xu, Xiaogang and Xu, Ke and Lau, Rynson W. H.},
    title     = {Lighting up {NeRF} via Unsupervised Decomposition and Enhancement},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12632--12641}
}
ViM: Vision Middleware for Unified Downstream Transferring: Yutong Feng,

Biao Gong,

Jianwen Jiang,

Yiliang Lv,

Yujun Shen,

Deli Zhao,

Jingren Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Yutong and Gong, Biao and Jiang, Jianwen and Lv, Yiliang and Shen, Yujun and Zhao, Deli and Zhou, Jingren},
    title     = {{ViM}: Vision Middleware for Unified Downstream Transferring},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11696--11707}
}
DIRE for Diffusion-Generated Image Detection: Zhendong Wang,

Jianmin Bao,

Wengang Zhou,

Weilun Wang,

Hezhen Hu,

Hong Chen,

Houqiang Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Zhendong and Bao, Jianmin and Zhou, Wengang and Wang, Weilun and Hu, Hezhen and Chen, Hong and Li, Houqiang},
    title     = {{DIRE} for Diffusion-Generated Image Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22445--22455}
}
Ord2Seq: Regarding Ordinal Regression as Label Sequence Prediction: Jinhong Wang,

Yi Cheng,

Jintai Chen,

TingTing Chen,

Danny Chen,

Jian Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jinhong and Cheng, Yi and Chen, Jintai and Chen, TingTing and Chen, Danny and Wu, Jian},
    title     = {{Ord2Seq}: Regarding Ordinal Regression as Label Sequence Prediction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5865--5875}
}
Bring Clipart to Life: Nanxuan Zhao,

Shengqi Dang,

Hexun Lin,

Yang Shi,

Nan Cao; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Nanxuan and Dang, Shengqi and Lin, Hexun and Shi, Yang and Cao, Nan},
    title     = {Bring Clipart to Life},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23341--23350}
}
Co-Evolution of Pose and Mesh for 3D Human Body Estimation from Video: Yingxuan You,

Hong Liu,

Ti Wang,

Wenhao Li,

Runwei Ding,

Xia Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{You_2023_ICCV,
    author    = {You, Yingxuan and Liu, Hong and Wang, Ti and Li, Wenhao and Ding, Runwei and Li, Xia},
    title     = {Co-Evolution of Pose and Mesh for {3D} Human Body Estimation from Video},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14963--14973}
}
Noise2Info: Noisy Image to Information of Noise for Self-Supervised Image Denoising: Jiachuan Wang,

Shimin Di,

Lei Chen,

Charles Wang Wai Ng; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jiachuan and Di, Shimin and Chen, Lei and Ng, Charles Wang Wai},
    title     = {{Noise2Info}: Noisy Image to Information of Noise for Self-Supervised Image Denoising},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16034--16043}
}
Controllable Visual-Tactile Synthesis: Ruihan Gao,

Wenzhen Yuan,

Jun-Yan Zhu; [pdf] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
    author    = {Gao, Ruihan and Yuan, Wenzhen and Zhu, Jun-Yan},
    title     = {Controllable Visual-Tactile Synthesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7040--7052}
}
Keep It SimPool: Who Said Supervised Transformers Suffer from Attention Deficit?: Bill Psomas,

Ioannis Kakogeorgiou,

Konstantinos Karantzalos,

Yannis Avrithis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Psomas_2023_ICCV,
    author    = {Psomas, Bill and Kakogeorgiou, Ioannis and Karantzalos, Konstantinos and Avrithis, Yannis},
    title     = {Keep It {SimPool}: Who Said Supervised Transformers Suffer from Attention Deficit?},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5350--5360}
}
SynBody: Synthetic Dataset with Layered Human Models for 3D Human Perception and Modeling: Zhitao Yang,

Zhongang Cai,

Haiyi Mei,

Shuai Liu,

Zhaoxi Chen,

Weiye Xiao,

Yukun Wei,

Zhongfei Qing,

Chen Wei,

Bo Dai,

Wayne Wu,

Chen Qian,

Dahua Lin,

Ziwei Liu,

Lei Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Zhitao and Cai, Zhongang and Mei, Haiyi and Liu, Shuai and Chen, Zhaoxi and Xiao, Weiye and Wei, Yukun and Qing, Zhongfei and Wei, Chen and Dai, Bo and Wu, Wayne and Qian, Chen and Lin, Dahua and Liu, Ziwei and Yang, Lei},
    title     = {{SynBody}: Synthetic Dataset with Layered Human Models for {3D} Human Perception and Modeling},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20282--20292}
}
Viewset Diffusion: (0-)Image-Conditioned 3D Generative Models from 2D Data: Stanislaw Szymanowicz,

Christian Rupprecht,

Andrea Vedaldi; [pdf] [supp]
[bibtex]
@InProceedings{Szymanowicz_2023_ICCV,
    author    = {Szymanowicz, Stanislaw and Rupprecht, Christian and Vedaldi, Andrea},
    title     = {Viewset Diffusion: (0-)Image-Conditioned {3D} Generative Models from {2D} Data},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8863--8873}
}
LoGoPrompt: Synthetic Text Images Can Be Good Visual Prompts for Vision-Language Models: Cheng Shi,

Sibei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Shi_2023_ICCV,
    author    = {Shi, Cheng and Yang, Sibei},
    title     = {{LoGoPrompt}: Synthetic Text Images Can Be Good Visual Prompts for Vision-Language Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2932--2941}
}
EP2P-Loc: End-to-End 3D Point to 2D Pixel Localization for Large-Scale Visual Localization: Minjung Kim,

Junseo Koo,

Gunhee Kim; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_ICCV,
    author    = {Kim, Minjung and Koo, Junseo and Kim, Gunhee},
    title     = {{EP2P-Loc}: End-to-End {3D} Point to {2D} Pixel Localization for Large-Scale Visual Localization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21527--21537}
}
SIRA-PCR: Sim-to-Real Adaptation for 3D Point Cloud Registration: Suyi Chen,

Hao Xu,

Ru Li,

Guanghui Liu,

Chi-Wing Fu,

Shuaicheng Liu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Suyi and Xu, Hao and Li, Ru and Liu, Guanghui and Fu, Chi-Wing and Liu, Shuaicheng},
    title     = {{SIRA-PCR}: Sim-to-Real Adaptation for {3D} Point Cloud Registration},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14394--14405}
}
FeatEnHancer: Enhancing Hierarchical Features for Object Detection and Beyond Under Low-Light Vision: Khurram Azeem Hashmi,

Goutham Kallempudi,

Didier Stricker,

Muhammad Zeshan Afzal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hashmi_2023_ICCV,
    author    = {Hashmi, Khurram Azeem and Kallempudi, Goutham and Stricker, Didier and Afzal, Muhammad Zeshan},
    title     = {{FeatEnHancer}: Enhancing Hierarchical Features for Object Detection and Beyond Under Low-Light Vision},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6725--6735}
}
SOAR: Scene-debiasing Open-set Action Recognition: Yuanhao Zhai,

Ziyi Liu,

Zhenyu Wu,

Yi Wu,

Chunluan Zhou,

David Doermann,

Junsong Yuan,

Gang Hua; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV,
    author    = {Zhai, Yuanhao and Liu, Ziyi and Wu, Zhenyu and Wu, Yi and Zhou, Chunluan and Doermann, David and Yuan, Junsong and Hua, Gang},
    title     = {{SOAR}: Scene-debiasing Open-set Action Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10244--10254}
}
Physics-Augmented Autoencoder for 3D Skeleton-Based Gait Recognition: Hongji Guo,

Qiang Ji; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV,
    author    = {Guo, Hongji and Ji, Qiang},
    title     = {Physics-Augmented Autoencoder for {3D} Skeleton-Based Gait Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19627--19638}
}
Regularized Primitive Graph Learning for Unified Vector Mapping: Lei Wang,

Min Dai,

Jianan He,

Jingwei Huang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Lei and Dai, Min and He, Jianan and Huang, Jingwei},
    title     = {Regularized Primitive Graph Learning for Unified Vector Mapping},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16817--16826}
}
Saliency Regularization for Self-Training with Partial Annotations: Shouwen Wang,

Qian Wan,

Xiang Xiang,

Zhigang Zeng; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Shouwen and Wan, Qian and Xiang, Xiang and Zeng, Zhigang},
    title     = {Saliency Regularization for Self-Training with Partial Annotations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1611--1620}
}
Stabilizing Visual Reinforcement Learning via Asymmetric Interactive Cooperation: Yunpeng Zhai,

Peixi Peng,

Yifan Zhao,

Yangru Huang,

Yonghong Tian; [pdf]
[bibtex]
@InProceedings{Zhai_2023_ICCV,
    author    = {Zhai, Yunpeng and Peng, Peixi and Zhao, Yifan and Huang, Yangru and Tian, Yonghong},
    title     = {Stabilizing Visual Reinforcement Learning via Asymmetric Interactive Cooperation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {207--216}
}
FlipNeRF: Flipped Reflection Rays for Few-shot Novel View Synthesis: Seunghyeon Seo,

Yeonjin Chang,

Nojun Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Seo_2023_ICCV,
    author    = {Seo, Seunghyeon and Chang, Yeonjin and Kwak, Nojun},
    title     = {{FlipNeRF}: Flipped Reflection Rays for Few-shot Novel View Synthesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22883--22893}
}
Discovering Spatio-Temporal Rationales for Video Question Answering: Yicong Li,

Junbin Xiao,

Chun Feng,

Xiang Wang,

Tat-Seng Chua; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Yicong and Xiao, Junbin and Feng, Chun and Wang, Xiang and Chua, Tat-Seng},
    title     = {Discovering Spatio-Temporal Rationales for Video Question Answering},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13869--13878}
}
Iterative Soft Shrinkage Learning for Efficient Image Super-Resolution: Jiamian Wang,

Huan Wang,

Yulun Zhang,

Yun Fu,

Zhiqiang Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jiamian and Wang, Huan and Zhang, Yulun and Fu, Yun and Tao, Zhiqiang},
    title     = {Iterative Soft Shrinkage Learning for Efficient Image Super-Resolution},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12590--12599}
}
Learning Hierarchical Features with Joint Latent Space Energy-Based Prior: Jiali Cui,

Ying Nian Wu,

Tian Han; [pdf] [supp]
[bibtex]
@InProceedings{Cui_2023_ICCV,
    author    = {Cui, Jiali and Wu, Ying Nian and Han, Tian},
    title     = {Learning Hierarchical Features with Joint Latent Space Energy-Based Prior},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2218--2227}
}
UniFormerV2: Unlocking the Potential of Image ViTs for Video Understanding: Kunchang Li,

Yali Wang,

Yinan He,

Yizhuo Li,

Yi Wang,

Limin Wang,

Yu Qiao; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Kunchang and Wang, Yali and He, Yinan and Li, Yizhuo and Wang, Yi and Wang, Limin and Qiao, Yu},
    title     = {{UniFormerV2}: Unlocking the Potential of Image {ViTs} for Video Understanding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1632--1643}
}
G2L: Semantically Aligned and Uniform Video Grounding via Geodesic and Game Theory: Hongxiang Li,

Meng Cao,

Xuxin Cheng,

Yaowei Li,

Zhihong Zhu,

Yuexian Zou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Hongxiang and Cao, Meng and Cheng, Xuxin and Li, Yaowei and Zhu, Zhihong and Zou, Yuexian},
    title     = {{G2L}: Semantically Aligned and Uniform Video Grounding via Geodesic and Game Theory},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12032--12042}
}
TARGET: Federated Class-Continual Learning via Exemplar-Free Distillation: Jie Zhang,

Chen Chen,

Weiming Zhuang,

Lingjuan Lyu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Jie and Chen, Chen and Zhuang, Weiming and Lyu, Lingjuan},
    title     = {{TARGET}: Federated Class-Continual Learning via Exemplar-Free Distillation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4782--4793}
}
FashionNTM: Multi-turn Fashion Image Retrieval via Cascaded Memory: Anwesan Pal,

Sahil Wadhwa,

Ayush Jaiswal,

Xu Zhang,

Yue Wu,

Rakesh Chada,

Pradeep Natarajan,

Henrik I. Christensen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pal_2023_ICCV,
    author    = {Pal, Anwesan and Wadhwa, Sahil and Jaiswal, Ayush and Zhang, Xu and Wu, Yue and Chada, Rakesh and Natarajan, Pradeep and Christensen, Henrik I.},
    title     = {{FashionNTM}: Multi-turn Fashion Image Retrieval via Cascaded Memory},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11323--11334}
}
MolGrapher: Graph-based Visual Recognition of Chemical Structures: Lucas Morin,

Martin Danelljan,

Maria Isabel Agea,

Ahmed Nassar,

Valery Weber,

Ingmar Meijer,

Peter Staar,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Morin_2023_ICCV,
    author    = {Morin, Lucas and Danelljan, Martin and Agea, Maria Isabel and Nassar, Ahmed and Weber, Valery and Meijer, Ingmar and Staar, Peter and Yu, Fisher},
    title     = {{MolGrapher}: Graph-based Visual Recognition of Chemical Structures},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19552--19561}
}
SAMPLING: Scene-adaptive Hierarchical Multiplane Images Representation for Novel View Synthesis from a Single Image: Xiaoyu Zhou,

Zhiwei Lin,

Xiaojun Shan,

Yongtao Wang,

Deqing Sun,

Ming-Hsuan Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Xiaoyu and Lin, Zhiwei and Shan, Xiaojun and Wang, Yongtao and Sun, Deqing and Yang, Ming-Hsuan},
    title     = {{SAMPLING}: Scene-adaptive Hierarchical Multiplane Images Representation for Novel View Synthesis from a Single Image},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22830--22840}
}
DiffV2S: Diffusion-Based Video-to-Speech Synthesis with Vision-Guided Speaker Embedding: Jeongsoo Choi,

Joanna Hong,

Yong Man Ro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Choi_2023_ICCV,
    author    = {Choi, Jeongsoo and Hong, Joanna and Ro, Yong Man},
    title     = {{DiffV2S}: Diffusion-Based Video-to-Speech Synthesis with Vision-Guided Speaker Embedding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7812--7821}
}
PointOdyssey: A Large-Scale Synthetic Dataset for Long-Term Point Tracking: Yang Zheng,

Adam W. Harley,

Bokui Shen,

Gordon Wetzstein,

Leonidas J. Guibas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Yang and Harley, Adam W. and Shen, Bokui and Wetzstein, Gordon and Guibas, Leonidas J.},
    title     = {{PointOdyssey}: A Large-Scale Synthetic Dataset for Long-Term Point Tracking},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19855--19865}
}
The Effectiveness of MAE Pre-Pretraining for Billion-Scale Pretraining: Mannat Singh,

Quentin Duval,

Kalyan Vasudev Alwala,

Haoqi Fan,

Vaibhav Aggarwal,

Aaron Adcock,

Armand Joulin,

Piotr Dollar,

Christoph Feichtenhofer,

Ross Girshick,

Rohit Girdhar,

Ishan Misra; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Singh_2023_ICCV,
    author    = {Singh, Mannat and Duval, Quentin and Alwala, Kalyan Vasudev and Fan, Haoqi and Aggarwal, Vaibhav and Adcock, Aaron and Joulin, Armand and Dollar, Piotr and Feichtenhofer, Christoph and Girshick, Ross and Girdhar, Rohit and Misra, Ishan},
    title     = {The Effectiveness of {MAE} Pre-Pretraining for Billion-Scale Pretraining},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5484--5494}
}
Towards Zero Domain Gap: A Comprehensive Study of Realistic LiDAR Simulation for Autonomy Testing: Sivabalan Manivasagam,

Ioan Andrei Bârsan,

Jingkang Wang,

Ze Yang,

Raquel Urtasun; [pdf] [supp]
[bibtex]
@InProceedings{Manivasagam_2023_ICCV,
    author    = {Manivasagam, Sivabalan and B{\^a}rsan, Ioan Andrei and Wang, Jingkang and Yang, Ze and Urtasun, Raquel},
    title     = {Towards Zero Domain Gap: A Comprehensive Study of Realistic {LiDAR} Simulation for Autonomy Testing},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8272--8282}
}
GPA-3D: Geometry-aware Prototype Alignment for Unsupervised Domain Adaptive 3D Object Detection from Point Clouds: Ziyu Li,

Jingming Guo,

Tongtong Cao,

Liu Bingbing,

Wankou Yang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Ziyu and Guo, Jingming and Cao, Tongtong and Bingbing, Liu and Yang, Wankou},
    title     = {{GPA-3D}: Geometry-aware Prototype Alignment for Unsupervised Domain Adaptive {3D} Object Detection from Point Clouds},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6394--6403}
}
TransHuman: A Transformer-based Human Representation for Generalizable Neural Human Rendering: Xiao Pan,

Zongxin Yang,

Jianxin Ma,

Chang Zhou,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
    author    = {Pan, Xiao and Yang, Zongxin and Ma, Jianxin and Zhou, Chang and Yang, Yi},
    title     = {{TransHuman}: A Transformer-based Human Representation for Generalizable Neural Human Rendering},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3544--3555}
}
LNPL-MIL: Learning from Noisy Pseudo Labels for Promoting Multiple Instance Learning in Whole Slide Image: Zhuchen Shao,

Yifeng Wang,

Yang Chen,

Hao Bian,

Shaohui Liu,

Haoqian Wang,

Yongbing Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Shao_2023_ICCV,
    author    = {Shao, Zhuchen and Wang, Yifeng and Chen, Yang and Bian, Hao and Liu, Shaohui and Wang, Haoqian and Zhang, Yongbing},
    title     = {{LNPL-MIL}: Learning from Noisy Pseudo Labels for Promoting Multiple Instance Learning in Whole Slide Image},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21495--21505}
}
Few-Shot Dataset Distillation via Translative Pre-Training: Songhua Liu,

Xinchao Wang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Songhua and Wang, Xinchao},
    title     = {Few-Shot Dataset Distillation via Translative Pre-Training},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18654--18664}
}
Random Sub-Samples Generation for Self-Supervised Real Image Denoising: Yizhong Pan,

Xiao Liu,

Xiangyu Liao,

Yuanzhouhan Cao,

Chao Ren; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
    author    = {Pan, Yizhong and Liu, Xiao and Liao, Xiangyu and Cao, Yuanzhouhan and Ren, Chao},
    title     = {Random Sub-Samples Generation for Self-Supervised Real Image Denoising},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12150--12159}
}
Waffling Around for Performance: Visual Classification with Random Words and Broad Concepts: Karsten Roth,

Jae Myung Kim,

A. Sophia Koepke,

Oriol Vinyals,

Cordelia Schmid,

Zeynep Akata; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Roth_2023_ICCV,
    author    = {Roth, Karsten and Kim, Jae Myung and Koepke, A. Sophia and Vinyals, Oriol and Schmid, Cordelia and Akata, Zeynep},
    title     = {Waffling Around for Performance: Visual Classification with Random Words and Broad Concepts},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15746--15757}
}
Unsupervised Surface Anomaly Detection with Diffusion Probabilistic Model: Xinyi Zhang,

Naiqi Li,

Jiawei Li,

Tao Dai,

Yong Jiang,

Shu-Tao Xia; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Xinyi and Li, Naiqi and Li, Jiawei and Dai, Tao and Jiang, Yong and Xia, Shu-Tao},
    title     = {Unsupervised Surface Anomaly Detection with Diffusion Probabilistic Model},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6782--6791}
}
AutoAD II: The Sequel - Who, When, and What in Movie Audio Description: Tengda Han,

Max Bain,

Arsha Nagrani,

Gul Varol,

Weidi Xie,

Andrew Zisserman; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_ICCV,
    author    = {Han, Tengda and Bain, Max and Nagrani, Arsha and Varol, Gul and Xie, Weidi and Zisserman, Andrew},
    title     = {{AutoAD} {II}: The Sequel - Who, When, and What in Movie Audio Description},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13645--13655}
}
TinyCLIP: CLIP Distillation via Affinity Mimicking and Weight Inheritance: Kan Wu,

Houwen Peng,

Zhenghong Zhou,

Bin Xiao,

Mengchen Liu,

Lu Yuan,

Hong Xuan,

Michael Valenzuela,

Xi (Stephen) Chen,

Xinggang Wang,

Hongyang Chao,

Han Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Kan and Peng, Houwen and Zhou, Zhenghong and Xiao, Bin and Liu, Mengchen and Yuan, Lu and Xuan, Hong and Valenzuela, Michael and Chen, Xi (Stephen) and Wang, Xinggang and Chao, Hongyang and Hu, Han},
    title     = {{TinyCLIP}: {CLIP} Distillation via Affinity Mimicking and Weight Inheritance},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21970--21980}
}
Hyperbolic Chamfer Distance for Point Cloud Completion: Fangzhou Lin,

Yun Yue,

Songlin Hou,

Xuechu Yu,

Yajun Xu,

Kazunori D Yamada,

Ziming Zhang; [pdf]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Fangzhou and Yue, Yun and Hou, Songlin and Yu, Xuechu and Xu, Yajun and Yamada, Kazunori D and Zhang, Ziming},
    title     = {Hyperbolic Chamfer Distance for Point Cloud Completion},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14595--14606}
}
Democratising 2D Sketch to 3D Shape Retrieval Through Pivoting: Pinaki Nath Chowdhury,

Ayan Kumar Bhunia,

Aneeshan Sain,

Subhadeep Koley,

Tao Xiang,

Yi-Zhe Song; [pdf] [supp]
[bibtex]
@InProceedings{Chowdhury_2023_ICCV,
    author    = {Chowdhury, Pinaki Nath and Bhunia, Ayan Kumar and Sain, Aneeshan and Koley, Subhadeep and Xiang, Tao and Song, Yi-Zhe},
    title     = {Democratising {2D} Sketch to {3D} Shape Retrieval Through Pivoting},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23275--23286}
}
Simoun: Synergizing Interactive Motion-appearance Understanding for Vision-based Reinforcement Learning: Yangru Huang,

Peixi Peng,

Yifan Zhao,

Yunpeng Zhai,

Haoran Xu,

Yonghong Tian; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Yangru and Peng, Peixi and Zhao, Yifan and Zhai, Yunpeng and Xu, Haoran and Tian, Yonghong},
    title     = {{Simoun}: Synergizing Interactive Motion-appearance Understanding for Vision-based Reinforcement Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {176--185}
}
AG3D: Learning to Generate 3D Avatars from 2D Image Collections: Zijian Dong,

Xu Chen,

Jinlong Yang,

Michael J. Black,

Otmar Hilliges,

Andreas Geiger; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
    author    = {Dong, Zijian and Chen, Xu and Yang, Jinlong and Black, Michael J. and Hilliges, Otmar and Geiger, Andreas},
    title     = {{AG3D}: Learning to Generate {3D} Avatars from {2D} Image Collections},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14916--14927}
}
KECOR: Kernel Coding Rate Maximization for Active 3D Object Detection: Yadan Luo,

Zhuoxiao Chen,

Zhen Fang,

Zheng Zhang,

Mahsa Baktashmotlagh,

Zi Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
    author    = {Luo, Yadan and Chen, Zhuoxiao and Fang, Zhen and Zhang, Zheng and Baktashmotlagh, Mahsa and Huang, Zi},
    title     = {{KECOR}: Kernel Coding Rate Maximization for Active {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18279--18290}
}
Learned Image Reasoning Prior Penetrates Deep Unfolding Network for Panchromatic and Multi-spectral Image Fusion: Man Zhou,

Jie Huang,

Naishan Zheng,

Chongyi Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Man and Huang, Jie and Zheng, Naishan and Li, Chongyi},
  title     = {Learned Image Reasoning Prior Penetrates Deep Unfolding Network for Panchromatic and Multi-spectral Image Fusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12398--12407},
}
Representation Disparity-aware Distillation for 3D Object Detection: Yanjing Li,

Sheng Xu,

Mingbao Lin,

Jihao Yin,

Baochang Zhang,

Xianbin Cao; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yanjing and Xu, Sheng and Lin, Mingbao and Yin, Jihao and Zhang, Baochang and Cao, Xianbin},
  title     = {Representation Disparity-aware Distillation for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6715--6724},
}
NCHO: Unsupervised Learning for Neural 3D Composition of Humans and Objects: Taeksoo Kim,

Shunsuke Saito,

Hanbyul Joo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Taeksoo and Saito, Shunsuke and Joo, Hanbyul},
  title     = {{NCHO}: Unsupervised Learning for Neural {3D} Composition of Humans and Objects},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14817--14828},
}
Breaking The Limits of Text-conditioned 3D Motion Synthesis with Elaborative Descriptions: Yijun Qian,

Jack Urbanek,

Alexander G. Hauptmann,

Jungdam Won; [pdf]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Yijun and Urbanek, Jack and Hauptmann, Alexander G. and Won, Jungdam},
  title     = {Breaking The Limits of Text-conditioned {3D} Motion Synthesis with Elaborative Descriptions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2306--2316},
}
VL-PET: Vision-and-Language Parameter-Efficient Tuning via Granularity Control: Zi-Yuan Hu,

Yanyang Li,

Michael R. Lyu,

Liwei Wang; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Zi-Yuan and Li, Yanyang and Lyu, Michael R. and Wang, Liwei},
  title     = {{VL-PET}: Vision-and-Language Parameter-Efficient Tuning via Granularity Control},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3010--3020},
}
ROME: Robustifying Memory-Efficient NAS via Topology Disentanglement and Gradient Accumulation: Xiaoxing Wang,

Xiangxiang Chu,

Yuda Fan,

Zhexi Zhang,

Bo Zhang,

Xiaokang Yang,

Junchi Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiaoxing and Chu, Xiangxiang and Fan, Yuda and Zhang, Zhexi and Zhang, Bo and Yang, Xiaokang and Yan, Junchi},
  title     = {{ROME}: Robustifying Memory-Efficient {NAS} via Topology Disentanglement and Gradient Accumulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5939--5949},
}
Toward Multi-Granularity Decision-Making: Explicit Visual Reasoning with Hierarchical Knowledge: Yifeng Zhang,

Shi Chen,

Qi Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yifeng and Chen, Shi and Zhao, Qi},
  title     = {Toward Multi-Granularity Decision-Making: Explicit Visual Reasoning with Hierarchical Knowledge},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2573--2583},
}
3D-aware Image Generation using 2D Diffusion Models: Jianfeng Xiang,

Jiaolong Yang,

Binbin Huang,

Xin Tong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Jianfeng and Yang, Jiaolong and Huang, Binbin and Tong, Xin},
  title     = {{3D}-aware Image Generation using {2D} Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2383--2393},
}
Locating Noise is Halfway Denoising for Semi-Supervised Segmentation: Yan Fang,

Feng Zhu,

Bowen Cheng,

Luoqi Liu,

Yao Zhao,

Yunchao Wei; [pdf] [supp]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Yan and Zhu, Feng and Cheng, Bowen and Liu, Luoqi and Zhao, Yao and Wei, Yunchao},
  title     = {Locating Noise is Halfway Denoising for Semi-Supervised Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16612--16622},
}
Learning Non-Local Spatial-Angular Correlation for Light Field Image Super-Resolution: Zhengyu Liang,

Yingqian Wang,

Longguang Wang,

Jungang Yang,

Shilin Zhou,

Yulan Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Zhengyu and Wang, Yingqian and Wang, Longguang and Yang, Jungang and Zhou, Shilin and Guo, Yulan},
  title     = {Learning Non-Local Spatial-Angular Correlation for Light Field Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12376--12386},
}
ICE-NeRF: Interactive Color Editing of NeRFs via Decomposition-Aware Weight Optimization: Jae-Hyeok Lee,

Dae-Shik Kim; [pdf]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jae-Hyeok and Kim, Dae-Shik},
  title     = {{ICE-NeRF}: Interactive Color Editing of {NeRFs} via Decomposition-Aware Weight Optimization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3491--3501},
}
SPANet: Frequency-balancing Token Mixer using Spectral Pooling Aggregation Modulation: Guhnoo Yun,

Juhan Yoo,

Kijung Kim,

Jeongho Lee,

Dong Hwan Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yun_2023_ICCV,
  author    = {Yun, Guhnoo and Yoo, Juhan and Kim, Kijung and Lee, Jeongho and Kim, Dong Hwan},
  title     = {{SPANet}: Frequency-balancing Token Mixer using Spectral Pooling Aggregation Modulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6113--6124},
}
ASAG: Building Strong One-Decoder-Layer Sparse Detectors via Adaptive Sparse Anchor Generation: Shenghao Fu,

Junkai Yan,

Yipeng Gao,

Xiaohua Xie,

Wei-Shi Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Shenghao and Yan, Junkai and Gao, Yipeng and Xie, Xiaohua and Zheng, Wei-Shi},
  title     = {{ASAG}: Building Strong One-Decoder-Layer Sparse Detectors via Adaptive Sparse Anchor Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6328--6338},
}
MGMAE: Motion Guided Masking for Video Masked Autoencoding: Bingkun Huang,

Zhiyu Zhao,

Guozhen Zhang,

Yu Qiao,

Limin Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Bingkun and Zhao, Zhiyu and Zhang, Guozhen and Qiao, Yu and Wang, Limin},
  title     = {{MGMAE}: Motion Guided Masking for Video Masked Autoencoding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13493--13504},
}
The Perils of Learning From Unlabeled Data: Backdoor Attacks on Semi-supervised Learning: Virat Shejwalkar,

Lingjuan Lyu,

Amir Houmansadr; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shejwalkar_2023_ICCV,
  author    = {Shejwalkar, Virat and Lyu, Lingjuan and Houmansadr, Amir},
  title     = {The Perils of Learning From Unlabeled Data: Backdoor Attacks on Semi-supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4730--4740},
}
SSB: Simple but Strong Baseline for Boosting Performance of Open-Set Semi-Supervised Learning: Yue Fan,

Anna Kukleva,

Dengxin Dai,

Bernt Schiele; [pdf] [supp]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Yue and Kukleva, Anna and Dai, Dengxin and Schiele, Bernt},
  title     = {{SSB}: Simple but Strong Baseline for Boosting Performance of Open-Set Semi-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16068--16078},
}
StyleDiffusion: Controllable Disentangled Style Transfer via Diffusion Models: Zhizhong Wang,

Lei Zhao,

Wei Xing; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zhizhong and Zhao, Lei and Xing, Wei},
  title     = {{StyleDiffusion}: Controllable Disentangled Style Transfer via Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7677--7689},
}
AdvDiffuser: Natural Adversarial Example Synthesis with Diffusion Models: Xinquan Chen,

Xitong Gao,

Juanjuan Zhao,

Kejiang Ye,

Cheng-Zhong Xu; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xinquan and Gao, Xitong and Zhao, Juanjuan and Ye, Kejiang and Xu, Cheng-Zhong},
  title     = {{AdvDiffuser}: Natural Adversarial Example Synthesis with Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4562--4572},
}
ViewRefer: Grasp the Multi-view Knowledge for 3D Visual Grounding: Zoey Guo,

Yiwen Tang,

Ray Zhang,

Dong Wang,

Zhigang Wang,

Bin Zhao,

Xuelong Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Zoey and Tang, Yiwen and Zhang, Ray and Wang, Dong and Wang, Zhigang and Zhao, Bin and Li, Xuelong},
  title     = {{ViewRefer}: Grasp the Multi-view Knowledge for {3D} Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15372--15383},
}
CaPhy: Capturing Physical Properties for Animatable Human Avatars: Zhaoqi Su,

Liangxiao Hu,

Siyou Lin,

Hongwen Zhang,

Shengping Zhang,

Justus Thies,

Yebin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Zhaoqi and Hu, Liangxiao and Lin, Siyou and Zhang, Hongwen and Zhang, Shengping and Thies, Justus and Liu, Yebin},
  title     = {{CaPhy}: Capturing Physical Properties for Animatable Human Avatars},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14150--14160},
}
DarSwin: Distortion Aware Radial Swin Transformer: Akshaya Athwale,

Arman Afrasiyabi,

Justin Lagüe,

Ichrak Shili,

Ola Ahmad,

Jean-François Lalonde; [pdf]
[bibtex]
@InProceedings{Athwale_2023_ICCV,
  author    = {Athwale, Akshaya and Afrasiyabi, Arman and Lag{\"u}e, Justin and Shili, Ichrak and Ahmad, Ola and Lalonde, Jean-Fran{\c{c}}ois},
  title     = {{DarSwin}: Distortion Aware Radial {Swin} Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5929--5938},
}
Fine-grained Unsupervised Domain Adaptation for Gait Recognition: Kang Ma,

Ying Fu,

Dezhi Zheng,

Yunjie Peng,

Chunshui Cao,

Yongzhen Huang; [pdf]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Kang and Fu, Ying and Zheng, Dezhi and Peng, Yunjie and Cao, Chunshui and Huang, Yongzhen},
  title     = {Fine-grained Unsupervised Domain Adaptation for Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11313--11322},
}
Cross-Modal Orthogonal High-Rank Augmentation for RGB-Event Transformer-Trackers: Zhiyu Zhu,

Junhui Hou,

Dapeng Oliver Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zhiyu and Hou, Junhui and Wu, Dapeng Oliver},
  title     = {Cross-Modal Orthogonal High-Rank Augmentation for {RGB}-Event Transformer-Trackers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22045--22055},
}
Take-A-Photo: 3D-to-2D Generative Pre-training of Point Cloud Models: Ziyi Wang,

Xumin Yu,

Yongming Rao,

Jie Zhou,

Jiwen Lu; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ziyi and Yu, Xumin and Rao, Yongming and Zhou, Jie and Lu, Jiwen},
  title     = {{Take-A-Photo}: {3D}-to-{2D} Generative Pre-training of Point Cloud Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5640--5650},
}
Open-vocabulary Panoptic Segmentation with Embedding Modulation: Xi Chen,

Shuang Li,

Ser-Nam Lim,

Antonio Torralba,

Hengshuang Zhao; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xi and Li, Shuang and Lim, Ser-Nam and Torralba, Antonio and Zhao, Hengshuang},
  title     = {Open-vocabulary Panoptic Segmentation with Embedding Modulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1141--1150},
}
Beyond Single Path Integrated Gradients for Reliable Input Attribution via Randomized Path Sampling: Giyoung Jeon,

Haedong Jeong,

Jaesik Choi; [pdf] [supp]
[bibtex]
@InProceedings{Jeon_2023_ICCV,
  author    = {Jeon, Giyoung and Jeong, Haedong and Choi, Jaesik},
  title     = {Beyond Single Path Integrated Gradients for Reliable Input Attribution via Randomized Path Sampling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2052--2061},
}
Instance-aware Dynamic Prompt Tuning for Pre-trained Point Cloud Models: Yaohua Zha,

Jinpeng Wang,

Tao Dai,

Bin Chen,

Zhi Wang,

Shu-Tao Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zha_2023_ICCV,
  author    = {Zha, Yaohua and Wang, Jinpeng and Dai, Tao and Chen, Bin and Wang, Zhi and Xia, Shu-Tao},
  title     = {Instance-aware Dynamic Prompt Tuning for Pre-trained Point Cloud Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14161--14170},
}
How to Boost Face Recognition with StyleGAN?: Artem Sevastopolskiy,

Yury Malkov,

Nikita Durasov,

Luisa Verdoliva,

Matthias Nießner; [pdf] [supp]
[bibtex]
@InProceedings{Sevastopolskiy_2023_ICCV,
  author    = {Sevastopolskiy, Artem and Malkov, Yury and Durasov, Nikita and Verdoliva, Luisa and Nie{\ss}ner, Matthias},
  title     = {How to Boost Face Recognition with {StyleGAN}?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20924--20934},
}
Text2Tex: Text-driven Texture Synthesis via Diffusion Models: Dave Zhenyu Chen,

Yawar Siddiqui,

Hsin-Ying Lee,

Sergey Tulyakov,

Matthias Nießner; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Dave Zhenyu and Siddiqui, Yawar and Lee, Hsin-Ying and Tulyakov, Sergey and Nie{\ss}ner, Matthias},
  title     = {{Text2Tex}: Text-driven Texture Synthesis via Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18558--18568},
}
MUVA: A New Large-Scale Benchmark for Multi-View Amodal Instance Segmentation in the Shopping Scenario: Zhixuan Li,

Weining Ye,

Juan Terven,

Zachary Bennett,

Ying Zheng,

Tingting Jiang,

Tiejun Huang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zhixuan and Ye, Weining and Terven, Juan and Bennett, Zachary and Zheng, Ying and Jiang, Tingting and Huang, Tiejun},
  title     = {{MUVA}: A New Large-Scale Benchmark for Multi-View Amodal Instance Segmentation in the Shopping Scenario},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23504--23513},
}
Foreground-Background Separation through Concept Distillation from Generative Image Foundation Models: Mischa Dombrowski,

Hadrien Reynaud,

Matthew Baugh,

Bernhard Kainz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dombrowski_2023_ICCV,
  author    = {Dombrowski, Mischa and Reynaud, Hadrien and Baugh, Matthew and Kainz, Bernhard},
  title     = {Foreground-Background Separation through Concept Distillation from Generative Image Foundation Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {988--998},
}
ENVIDR: Implicit Differentiable Renderer with Neural Environment Lighting: Ruofan Liang,

Huiting Chen,

Chunlin Li,

Fan Chen,

Selvakumar Panneer,

Nandita Vijaykumar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Ruofan and Chen, Huiting and Li, Chunlin and Chen, Fan and Panneer, Selvakumar and Vijaykumar, Nandita},
  title     = {{ENVIDR}: Implicit Differentiable Renderer with Neural Environment Lighting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {79--89},
}
Not All Steps are Created Equal: Selective Diffusion Distillation for Image Manipulation: Luozhou Wang,

Shuai Yang,

Shu Liu,

Ying-cong Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Luozhou and Yang, Shuai and Liu, Shu and Chen, Ying-cong},
  title     = {Not All Steps are Created Equal: Selective Diffusion Distillation for Image Manipulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7472--7481},
}
SeiT: Storage-Efficient Vision Training with Tokens Using 1% of Pixel Storage: Song Park,

Sanghyuk Chun,

Byeongho Heo,

Wonjae Kim,

Sangdoo Yun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Song and Chun, Sanghyuk and Heo, Byeongho and Kim, Wonjae and Yun, Sangdoo},
  title     = {{SeiT}: Storage-Efficient Vision Training with Tokens Using 1\% of Pixel Storage},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17248--17259},
}
ALIP: Adaptive Language-Image Pre-Training with Synthetic Caption: Kaicheng Yang,

Jiankang Deng,

Xiang An,

Jiawei Li,

Ziyong Feng,

Jia Guo,

Jing Yang,

Tongliang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Kaicheng and Deng, Jiankang and An, Xiang and Li, Jiawei and Feng, Ziyong and Guo, Jia and Yang, Jing and Liu, Tongliang},
  title     = {{ALIP}: Adaptive Language-Image Pre-Training with Synthetic Caption},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2922--2931},
}
GeoUDF: Surface Reconstruction from 3D Point Clouds via Geometry-guided Distance Representation: Siyu Ren,

Junhui Hou,

Xiaodong Chen,

Ying He,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Siyu and Hou, Junhui and Chen, Xiaodong and He, Ying and Wang, Wenping},
  title     = {{GeoUDF}: Surface Reconstruction from {3D} Point Clouds via Geometry-guided Distance Representation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14214--14224},
}
LaPE: Layer-adaptive Position Embedding for Vision Transformers with Independent Layer Normalization: Runyi Yu,

Zhennan Wang,

Yinhuai Wang,

Kehan Li,

Chang Liu,

Haoyi Duan,

Xiangyang Ji,

Jie Chen; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Runyi and Wang, Zhennan and Wang, Yinhuai and Li, Kehan and Liu, Chang and Duan, Haoyi and Ji, Xiangyang and Chen, Jie},
  title     = {{LaPE}: Layer-adaptive Position Embedding for Vision Transformers with Independent Layer Normalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5886--5896},
}
CLIP2Point: Transfer CLIP to Point Cloud Classification with Image-Depth Pre-Training: Tianyu Huang,

Bowen Dong,

Yunhan Yang,

Xiaoshui Huang,

Rynson W.H. Lau,

Wanli Ouyang,

Wangmeng Zuo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Tianyu and Dong, Bowen and Yang, Yunhan and Huang, Xiaoshui and Lau, Rynson W. H. and Ouyang, Wanli and Zuo, Wangmeng},
  title     = {{CLIP2Point}: Transfer {CLIP} to Point Cloud Classification with Image-Depth Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22157--22167},
}
Parametric Classification for Generalized Category Discovery: A Baseline Study: Xin Wen,

Bingchen Zhao,

Xiaojuan Qi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wen_2023_ICCV,
  author    = {Wen, Xin and Zhao, Bingchen and Qi, Xiaojuan},
  title     = {Parametric Classification for Generalized Category Discovery: A Baseline Study},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16590--16600},
}
MeMOTR: Long-Term Memory-Augmented Transformer for Multi-Object Tracking: Ruopeng Gao,

Limin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Ruopeng and Wang, Limin},
  title     = {{MeMOTR}: Long-Term Memory-Augmented Transformer for Multi-Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9901--9910},
}
RawHDR: High Dynamic Range Image Reconstruction from a Single Raw Image: Yunhao Zou,

Chenggang Yan,

Ying Fu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zou_2023_ICCV,
  author    = {Zou, Yunhao and Yan, Chenggang and Fu, Ying},
  title     = {{RawHDR}: High Dynamic Range Image Reconstruction from a Single Raw Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12334--12344},
}
Denoising Diffusion Autoencoders are Unified Self-supervised Learners: Weilai Xiang,

Hongyu Yang,

Di Huang,

Yunhong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Weilai and Yang, Hongyu and Huang, Di and Wang, Yunhong},
  title     = {Denoising Diffusion Autoencoders are Unified Self-supervised Learners},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15802--15812},
}
Robust Object Modeling for Visual Tracking: Yidong Cai,

Jie Liu,

Jie Tang,

Gangshan Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Yidong and Liu, Jie and Tang, Jie and Wu, Gangshan},
  title     = {Robust Object Modeling for Visual Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9589--9600},
}
FSI: Frequency and Spatial Interactive Learning for Image Restoration in Under-Display Cameras: Chengxu Liu,

Xuan Wang,

Shuai Li,

Yuzhi Wang,

Xueming Qian; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Chengxu and Wang, Xuan and Li, Shuai and Wang, Yuzhi and Qian, Xueming},
  title     = {{FSI}: Frequency and Spatial Interactive Learning for Image Restoration in Under-Display Cameras},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12537--12546},
}
Cross-view Topology Based Consistent and Complementary Information for Deep Multi-view Clustering: Zhibin Dong,

Siwei Wang,

Jiaqi Jin,

Xinwang Liu,

En Zhu; [pdf]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Zhibin and Wang, Siwei and Jin, Jiaqi and Liu, Xinwang and Zhu, En},
  title     = {Cross-view Topology Based Consistent and Complementary Information for Deep Multi-view Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19440--19451},
}
Distribution-Consistent Modal Recovering for Incomplete Multimodal Learning: Yuanzhi Wang,

Zhen Cui,

Yong Li; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yuanzhi and Cui, Zhen and Li, Yong},
  title     = {Distribution-Consistent Modal Recovering for Incomplete Multimodal Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22025--22034},
}
ContactGen: Generative Contact Modeling for Grasp Generation: Shaowei Liu,

Yang Zhou,

Jimei Yang,

Saurabh Gupta,

Shenlong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Shaowei and Zhou, Yang and Yang, Jimei and Gupta, Saurabh and Wang, Shenlong},
  title     = {{ContactGen}: Generative Contact Modeling for Grasp Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20609--20620},
}
Temporal Collection and Distribution for Referring Video Object Segmentation: Jiajin Tang,

Ge Zheng,

Sibei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Jiajin and Zheng, Ge and Yang, Sibei},
  title     = {Temporal Collection and Distribution for Referring Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15466--15476},
}
SA-BEV: Generating Semantic-Aware Bird's-Eye-View Feature for Multi-view 3D Object Detection: Jinqing Zhang,

Yanan Zhang,

Qingjie Liu,

Yunhong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jinqing and Zhang, Yanan and Liu, Qingjie and Wang, Yunhong},
  title     = {{SA-BEV}: Generating Semantic-Aware Bird's-Eye-View Feature for Multi-view {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3348--3357},
}
Variational Degeneration to Structural Refinement: A Unified Framework for Superimposed Image Decomposition: Wenyu Li,

Yan Xu,

Yang Yang,

Haoran Ji,

Yue Lang; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Wenyu and Xu, Yan and Yang, Yang and Ji, Haoran and Lang, Yue},
  title     = {Variational Degeneration to Structural Refinement: A Unified Framework for Superimposed Image Decomposition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12206--12216},
}
Global Knowledge Calibration for Fast Open-Vocabulary Segmentation: Kunyang Han,

Yong Liu,

Jun Hao Liew,

Henghui Ding,

Jiajun Liu,

Yitong Wang,

Yansong Tang,

Yujiu Yang,

Jiashi Feng,

Yao Zhao,

Yunchao Wei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Kunyang and Liu, Yong and Liew, Jun Hao and Ding, Henghui and Liu, Jiajun and Wang, Yitong and Tang, Yansong and Yang, Yujiu and Feng, Jiashi and Zhao, Yao and Wei, Yunchao},
  title     = {Global Knowledge Calibration for Fast Open-Vocabulary Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {797--807},
}
Ego-Humans: An Ego-Centric 3D Multi-Human Benchmark: Rawal Khirodkar,

Aayush Bansal,

Lingni Ma,

Richard Newcombe,

Minh Vo,

Kris Kitani; [pdf] [supp]
[bibtex]
@InProceedings{Khirodkar_2023_ICCV,
  author    = {Khirodkar, Rawal and Bansal, Aayush and Ma, Lingni and Newcombe, Richard and Vo, Minh and Kitani, Kris},
  title     = {{Ego-Humans}: An Ego-Centric {3D} Multi-Human Benchmark},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19807--19819},
}
Focal Network for Image Restoration: Yuning Cui,

Wenqi Ren,

Xiaochun Cao,

Alois Knoll; [pdf] [supp]
[bibtex]
@InProceedings{Cui_2023_ICCV,
  author    = {Cui, Yuning and Ren, Wenqi and Cao, Xiaochun and Knoll, Alois},
  title     = {Focal Network for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13001--13011},
}
Indoor Depth Recovery Based on Deep Unfolding with Non-Local Prior: Yuhui Dai,

Junkang Zhang,

Faming Fang,

Guixu Zhang; [pdf]
[bibtex]
@InProceedings{Dai_2023_ICCV,
  author    = {Dai, Yuhui and Zhang, Junkang and Fang, Faming and Zhang, Guixu},
  title     = {Indoor Depth Recovery Based on Deep Unfolding with Non-Local Prior},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12355--12364},
}
Compatibility of Fundamental Matrices for Complete Viewing Graphs: Martin Bråtelund,

Felix Rydell; [pdf] [supp]
[bibtex]
@InProceedings{Bratelund_2023_ICCV,
  author    = {Br{\r{a}}telund, Martin and Rydell, Felix},
  title     = {Compatibility of Fundamental Matrices for Complete Viewing Graphs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3328--3336},
}
GAFlow: Incorporating Gaussian Attention into Optical Flow: Ao Luo,

Fan Yang,

Xin Li,

Lang Nie,

Chunyu Lin,

Haoqiang Fan,

Shuaicheng Liu; [pdf]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Ao and Yang, Fan and Li, Xin and Nie, Lang and Lin, Chunyu and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {{GAFlow}: Incorporating {Gaussian} Attention into Optical Flow},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9642--9651},
}
MAtch, eXpand and Improve: Unsupervised Finetuning for Zero-Shot Action Recognition with Language Knowledge: Wei Lin,

Leonid Karlinsky,

Nina Shvetsova,

Horst Possegger,

Mateusz Kozinski,

Rameswar Panda,

Rogerio Feris,

Hilde Kuehne,

Horst Bischof; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Wei and Karlinsky, Leonid and Shvetsova, Nina and Possegger, Horst and Kozinski, Mateusz and Panda, Rameswar and Feris, Rogerio and Kuehne, Hilde and Bischof, Horst},
  title     = {{MAtch}, {eXpand} and {Improve}: Unsupervised Finetuning for Zero-Shot Action Recognition with Language Knowledge},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2851--2862},
}
Space Engage: Collaborative Space Supervision for Contrastive-Based Semi-Supervised Semantic Segmentation: Changqi Wang,

Haoyu Xie,

Yuhui Yuan,

Chong Fu,

Xiangyu Yue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Changqi and Xie, Haoyu and Yuan, Yuhui and Fu, Chong and Yue, Xiangyu},
  title     = {Space Engage: Collaborative Space Supervision for Contrastive-Based Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {931--942},
}
Delving into Motion-Aware Matching for Monocular 3D Object Tracking: Kuan-Chih Huang,

Ming-Hsuan Yang,

Yi-Hsuan Tsai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Kuan-Chih and Yang, Ming-Hsuan and Tsai, Yi-Hsuan},
  title     = {Delving into Motion-Aware Matching for Monocular {3D} Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6909--6918},
}
SoDaCam: Software-defined Cameras via Single-Photon Imaging: Varun Sundar,

Andrei Ardelean,

Tristan Swedish,

Claudio Bruschini,

Edoardo Charbon,

Mohit Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sundar_2023_ICCV, author = {Sundar, Varun and Ardelean, Andrei and Swedish, Tristan and Bruschini, Claudio and Charbon, Edoardo and Gupta, Mohit}, title = {SoDaCam: Software-defined Cameras via Single-Photon Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8165-8176} }
Reference-guided Controllable Inpainting of Neural Radiance Fields: Ashkan Mirzaei,

Tristan Aumentado-Armstrong,

Marcus A. Brubaker,

Jonathan Kelly,

Alex Levinshtein,

Konstantinos G. Derpanis,

Igor Gilitschenski; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mirzaei_2023_ICCV, author = {Mirzaei, Ashkan and Aumentado-Armstrong, Tristan and Brubaker, Marcus A. and Kelly, Jonathan and Levinshtein, Alex and Derpanis, Konstantinos G. and Gilitschenski, Igor}, title = {Reference-guided Controllable Inpainting of Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17815-17825} }
Diffusion-Guided Reconstruction of Everyday Hand-Object Interaction Clips: Yufei Ye,

Poorvi Hebbar,

Abhinav Gupta,

Shubham Tulsiani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV, author = {Ye, Yufei and Hebbar, Poorvi and Gupta, Abhinav and Tulsiani, Shubham}, title = {Diffusion-Guided Reconstruction of Everyday Hand-Object Interaction Clips}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19717-19728} }
Decoupled Iterative Refinement Framework for Interacting Hands Reconstruction from a Single RGB Image: Pengfei Ren,

Chao Wen,

Xiaozheng Zheng,

Zhou Xue,

Haifeng Sun,

Qi Qi,

Jingyu Wang,

Jianxin Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV, author = {Ren, Pengfei and Wen, Chao and Zheng, Xiaozheng and Xue, Zhou and Sun, Haifeng and Qi, Qi and Wang, Jingyu and Liao, Jianxin}, title = {Decoupled Iterative Refinement Framework for Interacting Hands Reconstruction from a Single RGB Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8014-8025} }
Fast Adversarial Training with Smooth Convergence: Mengnan Zhao,

Lihe Zhang,

Yuqiu Kong,

Baocai Yin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV, author = {Zhao, Mengnan and Zhang, Lihe and Kong, Yuqiu and Yin, Baocai}, title = {Fast Adversarial Training with Smooth Convergence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4720-4729} }
Who Are You Referring To? Coreference Resolution In Image Narrations: Arushi Goel,

Basura Fernando,

Frank Keller,

Hakan Bilen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Goel_2023_ICCV, author = {Goel, Arushi and Fernando, Basura and Keller, Frank and Bilen, Hakan}, title = {Who Are You Referring To? Coreference Resolution In Image Narrations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15247-15258} }
DVGaze: Dual-View Gaze Estimation: Yihua Cheng,

Feng Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV, author = {Cheng, Yihua and Lu, Feng}, title = {DVGaze: Dual-View Gaze Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20632-20641} }
Dynamic Hyperbolic Attention Network for Fine Hand-object Reconstruction: Zhiying Leng,

Shun-Cheng Wu,

Mahdi Saleh,

Antonio Montanaro,

Hao Yu,

Yin Wang,

Nassir Navab,

Xiaohui Liang,

Federico Tombari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Leng_2023_ICCV, author = {Leng, Zhiying and Wu, Shun-Cheng and Saleh, Mahdi and Montanaro, Antonio and Yu, Hao and Wang, Yin and Navab, Nassir and Liang, Xiaohui and Tombari, Federico}, title = {Dynamic Hyperbolic Attention Network for Fine Hand-object Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14894-14904} }
A-STAR: Test-time Attention Segregation and Retention for Text-to-image Synthesis: Aishwarya Agarwal,

Srikrishna Karanam,

K J Joseph,

Apoorv Saxena,

Koustava Goswami,

Balaji Vasan Srinivasan; [pdf] [supp]
[bibtex]
@InProceedings{Agarwal_2023_ICCV, author = {Agarwal, Aishwarya and Karanam, Srikrishna and Joseph, K J and Saxena, Apoorv and Goswami, Koustava and Srinivasan, Balaji Vasan}, title = {A-STAR: Test-time Attention Segregation and Retention for Text-to-image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2283-2293} }
LivePose: Online 3D Reconstruction from Monocular Video with Dynamic Camera Poses: Noah Stier,

Baptiste Angles,

Liang Yang,

Yajie Yan,

Alex Colburn,

Ming Chuang; [pdf] [arXiv]
[bibtex]
@InProceedings{Stier_2023_ICCV, author = {Stier, Noah and Angles, Baptiste and Yang, Liang and Yan, Yajie and Colburn, Alex and Chuang, Ming}, title = {LivePose: Online 3D Reconstruction from Monocular Video with Dynamic Camera Poses}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7921-7930} }
Efficient Joint Optimization of Layer-Adaptive Weight Pruning in Deep Neural Networks: Kaixin Xu,

Zhe Wang,

Xue Geng,

Min Wu,

Xiaoli Li,

Weisi Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Kaixin and Wang, Zhe and Geng, Xue and Wu, Min and Li, Xiaoli and Lin, Weisi}, title = {Efficient Joint Optimization of Layer-Adaptive Weight Pruning in Deep Neural Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17447-17457} }
Feature Modulation Transformer: Cross-Refinement of Global Representation via High-Frequency Prior for Image Super-Resolution: Ao Li,

Le Zhang,

Yun Liu,

Ce Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Ao and Zhang, Le and Liu, Yun and Zhu, Ce}, title = {Feature Modulation Transformer: Cross-Refinement of Global Representation via High-Frequency Prior for Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12514-12524} }
Exploring the Sim2Real Gap Using Digital Twins: Sruthi Sudhakar,

Jon Hanzelka,

Josh Bobillot,

Tanmay Randhavane,

Neel Joshi,

Vibhav Vineet; [pdf] [supp]
[bibtex]
@InProceedings{Sudhakar_2023_ICCV, author = {Sudhakar, Sruthi and Hanzelka, Jon and Bobillot, Josh and Randhavane, Tanmay and Joshi, Neel and Vineet, Vibhav}, title = {Exploring the Sim2Real Gap Using Digital Twins}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20418-20427} }
MPI-Flow: Learning Realistic Optical Flow with Multiplane Images: Yingping Liang,

Jiaming Liu,

Debing Zhang,

Ying Fu; [pdf]
[bibtex]
@InProceedings{Liang_2023_ICCV, author = {Liang, Yingping and Liu, Jiaming and Zhang, Debing and Fu, Ying}, title = {MPI-Flow: Learning Realistic Optical Flow with Multiplane Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13857-13868} }
Re:PolyWorld - A Graph Neural Network for Polygonal Scene Parsing: Stefano Zorzi,

Friedrich Fraundorfer; [pdf] [supp]
[bibtex]
@InProceedings{Zorzi_2023_ICCV, author = {Zorzi, Stefano and Fraundorfer, Friedrich}, title = {Re:PolyWorld - A Graph Neural Network for Polygonal Scene Parsing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16762-16771} }
FaceCLIPNeRF: Text-driven 3D Face Manipulation using Deformable Neural Radiance Fields: Sungwon Hwang,

Junha Hyung,

Daejin Kim,

Min-Jung Kim,

Jaegul Choo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hwang_2023_ICCV, author = {Hwang, Sungwon and Hyung, Junha and Kim, Daejin and Kim, Min-Jung and Choo, Jaegul}, title = {FaceCLIPNeRF: Text-driven 3D Face Manipulation using Deformable Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3469-3479} }
Video State-Changing Object Segmentation: Jiangwei Yu,

Xiang Li,

Xinran Zhao,

Hongming Zhang,

Yu-Xiong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_ICCV, author = {Yu, Jiangwei and Li, Xiang and Zhao, Xinran and Zhang, Hongming and Wang, Yu-Xiong}, title = {Video State-Changing Object Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20439-20448} }
Learning Shape Primitives via Implicit Convexity Regularization: Xiaoyang Huang,

Yi Zhang,

Kai Chen,

Teng Li,

Wenjun Zhang,

Bingbing Ni; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Xiaoyang and Zhang, Yi and Chen, Kai and Li, Teng and Zhang, Wenjun and Ni, Bingbing}, title = {Learning Shape Primitives via Implicit Convexity Regularization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3642-3651} }
MonoNeRF: Learning a Generalizable Dynamic Radiance Field from Monocular Videos: Fengrui Tian,

Shaoyi Du,

Yueqi Duan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tian_2023_ICCV, author = {Tian, Fengrui and Du, Shaoyi and Duan, Yueqi}, title = {MonoNeRF: Learning a Generalizable Dynamic Radiance Field from Monocular Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17903-17913} }
PG-RCNN: Semantic Surface Point Generation for 3D Object Detection: Inyong Koo,

Inyoung Lee,

Se-Ho Kim,

Hee-Seon Kim,

Woo-jin Jeon,

Changick Kim; [pdf] [supp]
[bibtex]
@InProceedings{Koo_2023_ICCV, author = {Koo, Inyong and Lee, Inyoung and Kim, Se-Ho and Kim, Hee-Seon and Jeon, Woo-jin and Kim, Changick}, title = {PG-RCNN: Semantic Surface Point Generation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18142-18151} }
ITI-GEN: Inclusive Text-to-Image Generation: Cheng Zhang,

Xuanbai Chen,

Siqi Chai,

Chen Henry Wu,

Dmitry Lagun,

Thabo Beeler,

Fernando De la Torre; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Cheng and Chen, Xuanbai and Chai, Siqi and Wu, Chen Henry and Lagun, Dmitry and Beeler, Thabo and De la Torre, Fernando}, title = {ITI-GEN: Inclusive Text-to-Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3969-3980} }
Learning Depth Estimation for Transparent and Mirror Surfaces: Alex Costanzino,

Pierluigi Zama Ramirez,

Matteo Poggi,

Fabio Tosi,

Stefano Mattoccia,

Luigi Di Stefano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Costanzino_2023_ICCV, author = {Costanzino, Alex and Ramirez, Pierluigi Zama and Poggi, Matteo and Tosi, Fabio and Mattoccia, Stefano and Di Stefano, Luigi}, title = {Learning Depth Estimation for Transparent and Mirror Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9244-9255} }
Learning Neural Eigenfunctions for Unsupervised Semantic Segmentation: Zhijie Deng,

Yucen Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV, author = {Deng, Zhijie and Luo, Yucen}, title = {Learning Neural Eigenfunctions for Unsupervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {551-561} }
Shape Analysis of Euclidean Curves under Frenet-Serret Framework: Perrine Chassat,

Juhyun Park,

Nicolas Brunel; [pdf] [supp]
[bibtex]
@InProceedings{Chassat_2023_ICCV, author = {Chassat, Perrine and Park, Juhyun and Brunel, Nicolas}, title = {Shape Analysis of Euclidean Curves under Frenet-Serret Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4027-4036} }
Representation Uncertainty in Self-Supervised Learning as Variational Inference: Hiroki Nakamura,

Masashi Okada,

Tadahiro Taniguchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nakamura_2023_ICCV, author = {Nakamura, Hiroki and Okada, Masashi and Taniguchi, Tadahiro}, title = {Representation Uncertainty in Self-Supervised Learning as Variational Inference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16484-16493} }
Efficient Diffusion Training via Min-SNR Weighting Strategy: Tiankai Hang,

Shuyang Gu,

Chen Li,

Jianmin Bao,

Dong Chen,

Han Hu,

Xin Geng,

Baining Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hang_2023_ICCV, author = {Hang, Tiankai and Gu, Shuyang and Li, Chen and Bao, Jianmin and Chen, Dong and Hu, Han and Geng, Xin and Guo, Baining}, title = {Efficient Diffusion Training via Min-SNR Weighting Strategy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7441-7451} }
Bridging Vision and Language Encoders: Parameter-Efficient Tuning for Referring Image Segmentation: Zunnan Xu,

Zhihong Chen,

Yong Zhang,

Yibing Song,

Xiang Wan,

Guanbin Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Zunnan and Chen, Zhihong and Zhang, Yong and Song, Yibing and Wan, Xiang and Li, Guanbin}, title = {Bridging Vision and Language Encoders: Parameter-Efficient Tuning for Referring Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17503-17512} }
Towards Zero-Shot Scale-Aware Monocular Depth Estimation: Vitor Guizilini,

Igor Vasiljevic,

Dian Chen,

Rareș Ambruș,

Adrien Gaidon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guizilini_2023_ICCV, author = {Guizilini, Vitor and Vasiljevic, Igor and Chen, Dian and Ambru{\textcommabelow{s}}, Rare{\textcommabelow{s}} and Gaidon, Adrien}, title = {Towards Zero-Shot Scale-Aware Monocular Depth Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9233-9243} }
ATT3D: Amortized Text-to-3D Object Synthesis: Jonathan Lorraine,

Kevin Xie,

Xiaohui Zeng,

Chen-Hsuan Lin,

Towaki Takikawa,

Nicholas Sharp,

Tsung-Yi Lin,

Ming-Yu Liu,

Sanja Fidler,

James Lucas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lorraine_2023_ICCV, author = {Lorraine, Jonathan and Xie, Kevin and Zeng, Xiaohui and Lin, Chen-Hsuan and Takikawa, Towaki and Sharp, Nicholas and Lin, Tsung-Yi and Liu, Ming-Yu and Fidler, Sanja and Lucas, James}, title = {ATT3D: Amortized Text-to-3D Object Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17946-17956} }
Virtual Try-On with Pose-Garment Keypoints Guided Inpainting: Zhi Li,

Pengfei Wei,

Xiang Yin,

Zejun Ma,

Alex C. Kot; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Zhi and Wei, Pengfei and Yin, Xiang and Ma, Zejun and Kot, Alex C.}, title = {Virtual Try-On with Pose-Garment Keypoints Guided Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22788-22797} }
Learning by Sorting: Self-supervised Learning with Group Ordering Constraints: Nina Shvetsova,

Felix Petersen,

Anna Kukleva,

Bernt Schiele,

Hilde Kuehne; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shvetsova_2023_ICCV, author = {Shvetsova, Nina and Petersen, Felix and Kukleva, Anna and Schiele, Bernt and Kuehne, Hilde}, title = {Learning by Sorting: Self-supervised Learning with Group Ordering Constraints}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16453-16463} }
Cross Modal Transformer: Towards Fast and Robust 3D Object Detection: Junjie Yan,

Yingfei Liu,

Jianjian Sun,

Fan Jia,

Shuailin Li,

Tiancai Wang,

Xiangyu Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV, author = {Yan, Junjie and Liu, Yingfei and Sun, Jianjian and Jia, Fan and Li, Shuailin and Wang, Tiancai and Zhang, Xiangyu}, title = {Cross Modal Transformer: Towards Fast and Robust 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18268-18278} }
Perceptual Grouping in Contrastive Vision-Language Models: Kanchana Ranasinghe,

Brandon McKinzie,

Sachin Ravi,

Yinfei Yang,

Alexander Toshev,

Jonathon Shlens; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ranasinghe_2023_ICCV, author = {Ranasinghe, Kanchana and McKinzie, Brandon and Ravi, Sachin and Yang, Yinfei and Toshev, Alexander and Shlens, Jonathon}, title = {Perceptual Grouping in Contrastive Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5571-5584} }
Dynamic Perceiver for Efficient Visual Recognition: Yizeng Han,

Dongchen Han,

Zeyu Liu,

Yulin Wang,

Xuran Pan,

Yifan Pu,

Chao Deng,

Junlan Feng,

Shiji Song,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV, author = {Han, Yizeng and Han, Dongchen and Liu, Zeyu and Wang, Yulin and Pan, Xuran and Pu, Yifan and Deng, Chao and Feng, Junlan and Song, Shiji and Huang, Gao}, title = {Dynamic Perceiver for Efficient Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5992-6002} }
MoTIF: Learning Motion Trajectories with Local Implicit Neural Functions for Continuous Space-Time Video Super-Resolution: Yi-Hsin Chen,

Si-Cun Chen,

Yen-Yu Lin,

Wen-Hsiao Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Yi-Hsin and Chen, Si-Cun and Lin, Yen-Yu and Peng, Wen-Hsiao}, title = {MoTIF: Learning Motion Trajectories with Local Implicit Neural Functions for Continuous Space-Time Video Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23131-23141} }
CRN: Camera Radar Net for Accurate, Robust, Efficient 3D Perception: Youngseok Kim,

Juyeb Shin,

Sanmin Kim,

In-Jae Lee,

Jun Won Choi,

Dongsuk Kum; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV, author = {Kim, Youngseok and Shin, Juyeb and Kim, Sanmin and Lee, In-Jae and Choi, Jun Won and Kum, Dongsuk}, title = {CRN: Camera Radar Net for Accurate, Robust, Efficient 3D Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17615-17626} }
PromptStyler: Prompt-driven Style Generation for Source-free Domain Generalization: Junhyeong Cho,

Gilhyun Nam,

Sungyeon Kim,

Hunmin Yang,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2023_ICCV, author = {Cho, Junhyeong and Nam, Gilhyun and Kim, Sungyeon and Yang, Hunmin and Kwak, Suha}, title = {PromptStyler: Prompt-driven Style Generation for Source-free Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15702-15712} }
Phasic Content Fusing Diffusion Model with Directional Distribution Consistency for Few-Shot Model Adaption: Teng Hu,

Jiangning Zhang,

Liang Liu,

Ran Yi,

Siqi Kou,

Haokun Zhu,

Xu Chen,

Yabiao Wang,

Chengjie Wang,

Lizhuang Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV, author = {Hu, Teng and Zhang, Jiangning and Liu, Liang and Yi, Ran and Kou, Siqi and Zhu, Haokun and Chen, Xu and Wang, Yabiao and Wang, Chengjie and Ma, Lizhuang}, title = {Phasic Content Fusing Diffusion Model with Directional Distribution Consistency for Few-Shot Model Adaption}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2406-2415} }
SVQNet: Sparse Voxel-Adjacent Query Network for 4D Spatio-Temporal LiDAR Semantic Segmentation: Xuechao Chen,

Shuangjie Xu,

Xiaoyi Zou,

Tongyi Cao,

Dit-Yan Yeung,

Lu Fang; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Xuechao and Xu, Shuangjie and Zou, Xiaoyi and Cao, Tongyi and Yeung, Dit-Yan and Fang, Lu}, title = {SVQNet: Sparse Voxel-Adjacent Query Network for 4D Spatio-Temporal LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8569-8578} }
HAL3D: Hierarchical Active Learning for Fine-Grained 3D Part Labeling: Fenggen Yu,

Yiming Qian,

Francisca Gil-Ureta,

Brian Jackson,

Eric Bennett,

Hao Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV, author = {Yu, Fenggen and Qian, Yiming and Gil-Ureta, Francisca and Jackson, Brian and Bennett, Eric and Zhang, Hao}, title = {HAL3D: Hierarchical Active Learning for Fine-Grained 3D Part Labeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {865-875} }
MEFLUT: Unsupervised 1D Lookup Tables for Multi-exposure Image Fusion: Ting Jiang,

Chuan Wang,

Xinpeng Li,

Ru Li,

Haoqiang Fan,

Shuaicheng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Ting and Wang, Chuan and Li, Xinpeng and Li, Ru and Fan, Haoqiang and Liu, Shuaicheng}, title = {MEFLUT: Unsupervised 1D Lookup Tables for Multi-exposure Image Fusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10542-10551} }
FedPerfix: Towards Partial Model Personalization of Vision Transformers in Federated Learning: Guangyu Sun,

Matias Mendieta,

Jun Luo,

Shandong Wu,

Chen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV, author = {Sun, Guangyu and Mendieta, Matias and Luo, Jun and Wu, Shandong and Chen, Chen}, title = {FedPerfix: Towards Partial Model Personalization of Vision Transformers in Federated Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4988-4998} }
Conditional 360-degree Image Synthesis for Immersive Indoor Scene Decoration: Ka Chun Shum,

Hong-Wing Pang,

Binh-Son Hua,

Duc Thanh Nguyen,

Sai-Kit Yeung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shum_2023_ICCV, author = {Shum, Ka Chun and Pang, Hong-Wing and Hua, Binh-Son and Nguyen, Duc Thanh and Yeung, Sai-Kit}, title = {Conditional 360-degree Image Synthesis for Immersive Indoor Scene Decoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4478-4488} }
The Unreasonable Effectiveness of Large Language-Vision Models for Source-Free Video Domain Adaptation: Giacomo Zara,

Alessandro Conti,

Subhankar Roy,

Stéphane Lathuilière,

Paolo Rota,

Elisa Ricci; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zara_2023_ICCV, author = {Zara, Giacomo and Conti, Alessandro and Roy, Subhankar and Lathuili\`ere, St\'ephane and Rota, Paolo and Ricci, Elisa}, title = {The Unreasonable Effectiveness of Large Language-Vision Models for Source-Free Video Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10307-10317} }
SIDGAN: High-Resolution Dubbed Video Generation via Shift-Invariant Learning: Urwa Muaz,

Wondong Jang,

Rohun Tripathi,

Santhosh Mani,

Wenbin Ouyang,

Ravi Teja Gadde,

Baris Gecer,

Sergio Elizondo,

Reza Madad,

Naveen Nair; [pdf] [supp]
[bibtex]
@InProceedings{Muaz_2023_ICCV, author = {Muaz, Urwa and Jang, Wondong and Tripathi, Rohun and Mani, Santhosh and Ouyang, Wenbin and Gadde, Ravi Teja and Gecer, Baris and Elizondo, Sergio and Madad, Reza and Nair, Naveen}, title = {SIDGAN: High-Resolution Dubbed Video Generation via Shift-Invariant Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7833-7842} }
Meta-ZSDETR: Zero-shot DETR with Meta-learning: Lu Zhang,

Chenbo Zhang,

Jiajia Zhao,

Jihong Guan,

Shuigeng Zhou; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Lu and Zhang, Chenbo and Zhao, Jiajia and Guan, Jihong and Zhou, Shuigeng}, title = {Meta-ZSDETR: Zero-shot DETR with Meta-learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6845-6854} }
GaPro: Box-Supervised 3D Point Cloud Instance Segmentation Using Gaussian Processes as Pseudo Labelers: Tuan Duc Ngo,

Binh-Son Hua,

Khoi Nguyen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ngo_2023_ICCV, author = {Ngo, Tuan Duc and Hua, Binh-Son and Nguyen, Khoi}, title = {GaPro: Box-Supervised 3D Point Cloud Instance Segmentation Using Gaussian Processes as Pseudo Labelers}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17794-17803} }
STPrivacy: Spatio-Temporal Privacy-Preserving Action Recognition: Ming Li,

Xiangyu Xu,

Hehe Fan,

Pan Zhou,

Jun Liu,

Jia-Wei Liu,

Jiahe Li,

Jussi Keppo,

Mike Zheng Shou,

Shuicheng Yan; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Ming and Xu, Xiangyu and Fan, Hehe and Zhou, Pan and Liu, Jun and Liu, Jia-Wei and Li, Jiahe and Keppo, Jussi and Shou, Mike Zheng and Yan, Shuicheng}, title = {STPrivacy: Spatio-Temporal Privacy-Preserving Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5106-5115} }
Get the Best of Both Worlds: Improving Accuracy and Transferability by Grassmann Class Representation: Haoqi Wang,

Zhizhong Li,

Wayne Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Haoqi and Li, Zhizhong and Zhang, Wayne}, title = {Get the Best of Both Worlds: Improving Accuracy and Transferability by Grassmann Class Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22478-22487} }
Computationally-Efficient Neural Image Compression with Shallow Decoders: Yibo Yang,

Stephan Mandt; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Yibo and Mandt, Stephan}, title = {Computationally-Efficient Neural Image Compression with Shallow Decoders}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {530-540} }
ObjectSDF++: Improved Object-Compositional Neural Implicit Surfaces: Qianyi Wu,

Kaisiyuan Wang,

Kejie Li,

Jianmin Zheng,

Jianfei Cai; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Qianyi and Wang, Kaisiyuan and Li, Kejie and Zheng, Jianmin and Cai, Jianfei}, title = {ObjectSDF++: Improved Object-Compositional Neural Implicit Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21764-21774} }
Tracing the Origin of Adversarial Attack for Forensic Investigation and Deterrence: Han Fang,

Jiyi Zhang,

Yupeng Qiu,

Jiayang Liu,

Ke Xu,

Chengfang Fang,

Ee-Chien Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2023_ICCV, author = {Fang, Han and Zhang, Jiyi and Qiu, Yupeng and Liu, Jiayang and Xu, Ke and Fang, Chengfang and Chang, Ee-Chien}, title = {Tracing the Origin of Adversarial Attack for Forensic Investigation and Deterrence}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4335-4344} }
Sketch and Text Guided Diffusion Model for Colored Point Cloud Generation: Zijie Wu,

Yaonan Wang,

Mingtao Feng,

He Xie,

Ajmal Mian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Zijie and Wang, Yaonan and Feng, Mingtao and Xie, He and Mian, Ajmal}, title = {Sketch and Text Guided Diffusion Model for Colored Point Cloud Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8929-8939} }
Scenimefy: Learning to Craft Anime Scene via Semi-Supervised Image-to-Image Translation: Yuxin Jiang,

Liming Jiang,

Shuai Yang,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Yuxin and Jiang, Liming and Yang, Shuai and Loy, Chen Change}, title = {Scenimefy: Learning to Craft Anime Scene via Semi-Supervised Image-to-Image Translation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7357-7367} }
Towards Unsupervised Domain Generalization for Face Anti-Spoofing: Yuchen Liu,

Yabo Chen,

Mengran Gou,

Chun-Ting Huang,

Yaoming Wang,

Wenrui Dai,

Hongkai Xiong; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Yuchen and Chen, Yabo and Gou, Mengran and Huang, Chun-Ting and Wang, Yaoming and Dai, Wenrui and Xiong, Hongkai}, title = {Towards Unsupervised Domain Generalization for Face Anti-Spoofing}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20654-20664} }
DR-Tune: Improving Fine-tuning of Pretrained Visual Models by Distribution Regularization with Semantic Calibration: Nan Zhou,

Jiaxin Chen,

Di Huang; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV, author = {Zhou, Nan and Chen, Jiaxin and Huang, Di}, title = {DR-Tune: Improving Fine-tuning of Pretrained Visual Models by Distribution Regularization with Semantic Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1547-1556} }
MotionDeltaCNN: Sparse CNN Inference of Frame Differences in Moving Camera Videos with Spherical Buffers and Padded Convolutions: Mathias Parger,

Chengcheng Tang,

Thomas Neff,

Christopher D. Twigg,

Cem Keskin,

Robert Wang,

Markus Steinberger; [pdf] [supp]
[bibtex]
@InProceedings{Parger_2023_ICCV, author = {Parger, Mathias and Tang, Chengcheng and Neff, Thomas and Twigg, Christopher D. and Keskin, Cem and Wang, Robert and Steinberger, Markus}, title = {MotionDeltaCNN: Sparse CNN Inference of Frame Differences in Moving Camera Videos with Spherical Buffers and Padded Convolutions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17292-17301} }
General Image-to-Image Translation with One-Shot Image Guidance: Bin Cheng,

Zuhao Liu,

Yunbo Peng,

Yue Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV, author = {Cheng, Bin and Liu, Zuhao and Peng, Yunbo and Lin, Yue}, title = {General Image-to-Image Translation with One-Shot Image Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22736--22746} }
Dense 2D-3D Indoor Prediction with Sound via Aligned Cross-Modal Distillation: Heeseung Yun,

Joonil Na,

Gunhee Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yun_2023_ICCV, author = {Yun, Heeseung and Na, Joonil and Kim, Gunhee}, title = {Dense 2D-3D Indoor Prediction with Sound via Aligned Cross-Modal Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7863--7872} }
Leveraging SE(3) Equivariance for Learning 3D Geometric Shape Assembly: Ruihai Wu,

Chenrui Tie,

Yushi Du,

Yan Zhao,

Hao Dong; [pdf] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Ruihai and Tie, Chenrui and Du, Yushi and Zhao, Yan and Dong, Hao}, title = {Leveraging SE(3) Equivariance for Learning 3D Geometric Shape Assembly}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {14311--14320} }
Adversarial Bayesian Augmentation for Single-Source Domain Generalization: Sheng Cheng,

Tejas Gokhale,

Yezhou Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV, author = {Cheng, Sheng and Gokhale, Tejas and Yang, Yezhou}, title = {Adversarial Bayesian Augmentation for Single-Source Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11400--11410} }
Robust Geometry-Preserving Depth Estimation Using Differentiable Rendering: Chi Zhang,

Wei Yin,

Gang Yu,

Zhibin Wang,

Tao Chen,

Bin Fu,

Joey Tianyi Zhou,

Chunhua Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Chi and Yin, Wei and Yu, Gang and Wang, Zhibin and Chen, Tao and Fu, Bin and Zhou, Joey Tianyi and Shen, Chunhua}, title = {Robust Geometry-Preserving Depth Estimation Using Differentiable Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8951--8961} }
Self-regulating Prompts: Foundational Model Adaptation without Forgetting: Muhammad Uzair Khattak,

Syed Talal Wasim,

Muzammal Naseer,

Salman Khan,

Ming-Hsuan Yang,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Khattak_2023_ICCV, author = {Khattak, Muhammad Uzair and Wasim, Syed Talal and Naseer, Muzammal and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz}, title = {Self-regulating Prompts: Foundational Model Adaptation without Forgetting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15190--15200} }
ASM: Adaptive Skinning Model for High-Quality 3D Face Modeling: Kai Yang,

Hong Shang,

Tianyang Shi,

Xinghan Chen,

Jingkai Zhou,

Zhongqian Sun,

Wei Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Kai and Shang, Hong and Shi, Tianyang and Chen, Xinghan and Zhou, Jingkai and Sun, Zhongqian and Yang, Wei}, title = {ASM: Adaptive Skinning Model for High-Quality 3D Face Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20708--20717} }
EverLight: Indoor-Outdoor Editable HDR Lighting Estimation: Mohammad Reza Karimi Dastjerdi,

Jonathan Eisenmann,

Yannick Hold-Geoffroy,

Jean-François Lalonde; [pdf] [arXiv]
[bibtex]
@InProceedings{Dastjerdi_2023_ICCV, author = {Dastjerdi, Mohammad Reza Karimi and Eisenmann, Jonathan and Hold-Geoffroy, Yannick and Lalonde, Jean-Fran{\c{c}}ois}, title = {EverLight: Indoor-Outdoor Editable HDR Lighting Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7420--7429} }
MARS: Model-agnostic Biased Object Removal without Additional Supervision for Weakly-Supervised Semantic Segmentation: Sanghyun Jo,

In-Jae Yu,

Kyungsu Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jo_2023_ICCV, author = {Jo, Sanghyun and Yu, In-Jae and Kim, Kyungsu}, title = {MARS: Model-agnostic Biased Object Removal without Additional Supervision for Weakly-Supervised Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {614--623} }
CAFA: Class-Aware Feature Alignment for Test-Time Adaptation: Sanghun Jung,

Jungsoo Lee,

Nanhee Kim,

Amirreza Shaban,

Byron Boots,

Jaegul Choo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jung_2023_ICCV, author = {Jung, Sanghun and Lee, Jungsoo and Kim, Nanhee and Shaban, Amirreza and Boots, Byron and Choo, Jaegul}, title = {CAFA: Class-Aware Feature Alignment for Test-Time Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19060--19071} }
Learning Clothing and Pose Invariant 3D Shape Representation for Long-Term Person Re-Identification: Feng Liu,

Minchul Kim,

ZiAng Gu,

Anil Jain,

Xiaoming Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Feng and Kim, Minchul and Gu, ZiAng and Jain, Anil and Liu, Xiaoming}, title = {Learning Clothing and Pose Invariant 3D Shape Representation for Long-Term Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19617--19626} }
Agile Modeling: From Concept to Classifier in Minutes: Otilia Stretcu,

Edward Vendrow,

Kenji Hata,

Krishnamurthy Viswanathan,

Vittorio Ferrari,

Sasan Tavakkol,

Wenlei Zhou,

Aditya Avinash,

Emming Luo,

Neil Gordon Alldrin,

MohammadHossein Bateni,

Gabriel Berger,

Andrew Bunner,

Chun-Ta Lu,

Javier Rey,

Giulia DeSalvo,

Ranjay Krishna,

Ariel Fuxman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Stretcu_2023_ICCV, author = {Stretcu, Otilia and Vendrow, Edward and Hata, Kenji and Viswanathan, Krishnamurthy and Ferrari, Vittorio and Tavakkol, Sasan and Zhou, Wenlei and Avinash, Aditya and Luo, Emming and Alldrin, Neil Gordon and Bateni, MohammadHossein and Berger, Gabriel and Bunner, Andrew and Lu, Chun-Ta and Rey, Javier and DeSalvo, Giulia and Krishna, Ranjay and Fuxman, Ariel}, title = {Agile Modeling: From Concept to Classifier in Minutes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22323--22334} }
Improving Lens Flare Removal with General-Purpose Pipeline and Multiple Light Sources Recovery: Yuyan Zhou,

Dong Liang,

Songcan Chen,

Sheng-Jun Huang,

Shuo Yang,

Chongyi Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yuyan and Liang, Dong and Chen, Songcan and Huang, Sheng-Jun and Yang, Shuo and Li, Chongyi}, title = {Improving Lens Flare Removal with General-Purpose Pipeline and Multiple Light Sources Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12969--12979} }
FACET: Fairness in Computer Vision Evaluation Benchmark: Laura Gustafson,

Chloe Rolland,

Nikhila Ravi,

Quentin Duval,

Aaron Adcock,

Cheng-Yang Fu,

Melissa Hall,

Candace Ross; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gustafson_2023_ICCV, author = {Gustafson, Laura and Rolland, Chloe and Ravi, Nikhila and Duval, Quentin and Adcock, Aaron and Fu, Cheng-Yang and Hall, Melissa and Ross, Candace}, title = {FACET: Fairness in Computer Vision Evaluation Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20370--20382} }
Few-Shot Physically-Aware Articulated Mesh Generation via Hierarchical Deformation: Xueyi Liu,

Bin Wang,

He Wang,

Li Yi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Xueyi and Wang, Bin and Wang, He and Yi, Li}, title = {Few-Shot Physically-Aware Articulated Mesh Generation via Hierarchical Deformation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {854--864} }
Single-Stage Diffusion NeRF: A Unified Approach to 3D Generation and Reconstruction: Hansheng Chen,

Jiatao Gu,

Anpei Chen,

Wei Tian,

Zhuowen Tu,

Lingjie Liu,

Hao Su; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Hansheng and Gu, Jiatao and Chen, Anpei and Tian, Wei and Tu, Zhuowen and Liu, Lingjie and Su, Hao}, title = {Single-Stage Diffusion NeRF: A Unified Approach to 3D Generation and Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2416--2425} }
DCPB: Deformable Convolution Based on the Poincare Ball for Top-view Fisheye Cameras: Xuan Wei,

Zhidan Ran,

Xiaobo Lu; [pdf]
[bibtex]
@InProceedings{Wei_2023_ICCV, author = {Wei, Xuan and Ran, Zhidan and Lu, Xiaobo}, title = {DCPB: Deformable Convolution Based on the Poincare Ball for Top-view Fisheye Cameras}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13308--13317} }
Integrating Boxes and Masks: A Multi-Object Framework for Unified Visual Tracking and Segmentation: Yuanyou Xu,

Zongxin Yang,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Yuanyou and Yang, Zongxin and Yang, Yi}, title = {Integrating Boxes and Masks: A Multi-Object Framework for Unified Visual Tracking and Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9738--9751} }
One-Shot Generative Domain Adaptation: Ceyuan Yang,

Yujun Shen,

Zhiyi Zhang,

Yinghao Xu,

Jiapeng Zhu,

Zhirong Wu,

Bolei Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Ceyuan and Shen, Yujun and Zhang, Zhiyi and Xu, Yinghao and Zhu, Jiapeng and Wu, Zhirong and Zhou, Bolei}, title = {One-Shot Generative Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {7733--7742} }
Prototypes-oriented Transductive Few-shot Learning with Conditional Transport: Long Tian,

Jingyi Feng,

Xiaoqiang Chai,

Wenchao Chen,

Liming Wang,

Xiyang Liu,

Bo Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Tian_2023_ICCV, author = {Tian, Long and Feng, Jingyi and Chai, Xiaoqiang and Chen, Wenchao and Wang, Liming and Liu, Xiyang and Chen, Bo}, title = {Prototypes-oriented Transductive Few-shot Learning with Conditional Transport}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16317--16326} }
SparseFusion: Fusing Multi-Modal Sparse Representations for Multi-Sensor 3D Object Detection: Yichen Xie,

Chenfeng Xu,

Marie-Julie Rakotosaona,

Patrick Rim,

Federico Tombari,

Kurt Keutzer,

Masayoshi Tomizuka,

Wei Zhan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV, author = {Xie, Yichen and Xu, Chenfeng and Rakotosaona, Marie-Julie and Rim, Patrick and Tombari, Federico and Keutzer, Kurt and Tomizuka, Masayoshi and Zhan, Wei}, title = {SparseFusion: Fusing Multi-Modal Sparse Representations for Multi-Sensor 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17591--17602} }
DetermiNet: A Large-Scale Diagnostic Dataset for Complex Visually-Grounded Referencing using Determiners: Clarence Lee,

M Ganesh Kumar,

Cheston Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV, author = {Lee, Clarence and Kumar, M Ganesh and Tan, Cheston}, title = {DetermiNet: A Large-Scale Diagnostic Dataset for Complex Visually-Grounded Referencing using Determiners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20019--20028} }
3DMOTFormer: Graph Transformer for Online 3D Multi-Object Tracking: Shuxiao Ding,

Eike Rehder,

Lukas Schneider,

Marius Cordts,

Juergen Gall; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV, author = {Ding, Shuxiao and Rehder, Eike and Schneider, Lukas and Cordts, Marius and Gall, Juergen}, title = {3DMOTFormer: Graph Transformer for Online 3D Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9784--9794} }
ReGen: A good Generative Zero-Shot Video Classifier Should be Rewarded: Adrian Bulat,

Enrique Sanchez,

Brais Martinez,

Georgios Tzimiropoulos; [pdf] [supp]
[bibtex]
@InProceedings{Bulat_2023_ICCV, author = {Bulat, Adrian and Sanchez, Enrique and Martinez, Brais and Tzimiropoulos, Georgios}, title = {ReGen: A good Generative Zero-Shot Video Classifier Should be Rewarded}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13523--13533} }
Complementary Domain Adaptation and Generalization for Unsupervised Continual Domain Shift Learning: Wonguk Cho,

Jinha Park,

Taesup Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2023_ICCV, author = {Cho, Wonguk and Park, Jinha and Kim, Taesup}, title = {Complementary Domain Adaptation and Generalization for Unsupervised Continual Domain Shift Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11442--11452} }
RICO: Regularizing the Unobservable for Indoor Compositional Reconstruction: Zizhang Li,

Xiaoyang Lyu,

Yuanyuan Ding,

Mengmeng Wang,

Yiyi Liao,

Yong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Zizhang and Lyu, Xiaoyang and Ding, Yuanyuan and Wang, Mengmeng and Liao, Yiyi and Liu, Yong}, title = {RICO: Regularizing the Unobservable for Indoor Compositional Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17761--17771} }
Ordered Atomic Activity for Fine-grained Interactive Traffic Scenario Understanding: Nakul Agarwal,

Yi-Ting Chen; [pdf] [supp]
[bibtex]
@InProceedings{Agarwal_2023_ICCV, author = {Agarwal, Nakul and Chen, Yi-Ting}, title = {Ordered Atomic Activity for Fine-grained Interactive Traffic Scenario Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8624--8636} }
CO-PILOT: Dynamic Top-Down Point Cloud with Conditional Neighborhood Aggregation for Multi-Gigapixel Histopathology Image Representation: Ramin Nakhli,

Allen Zhang,

Ali Mirabadi,

Katherine Rich,

Maryam Asadi,

Blake Gilks,

Hossein Farahani,

Ali Bashashati; [pdf] [supp]
[bibtex]
@InProceedings{Nakhli_2023_ICCV, author = {Nakhli, Ramin and Zhang, Allen and Mirabadi, Ali and Rich, Katherine and Asadi, Maryam and Gilks, Blake and Farahani, Hossein and Bashashati, Ali}, title = {CO-PILOT: Dynamic Top-Down Point Cloud with Conditional Neighborhood Aggregation for Multi-Gigapixel Histopathology Image Representation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21063--21073} }
Troubleshooting Ethnic Quality Bias with Curriculum Domain Adaptation for Face Image Quality Assessment: Fu-Zhao Ou,

Baoliang Chen,

Chongyi Li,

Shiqi Wang,

Sam Kwong; [pdf]
[bibtex]
@InProceedings{Ou_2023_ICCV, author = {Ou, Fu-Zhao and Chen, Baoliang and Li, Chongyi and Wang, Shiqi and Kwong, Sam}, title = {Troubleshooting Ethnic Quality Bias with Curriculum Domain Adaptation for Face Image Quality Assessment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20718--20729} }
HybridAugment++: Unified Frequency Spectra Perturbations for Model Robustness: Mehmet Kerim Yucel,

Ramazan Gokberk Cinbis,

Pinar Duygulu; [pdf] [supp]
[bibtex]
@InProceedings{Yucel_2023_ICCV, author = {Yucel, Mehmet Kerim and Cinbis, Ramazan Gokberk and Duygulu, Pinar}, title = {HybridAugment++: Unified Frequency Spectra Perturbations for Model Robustness}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {5718--5728} }
CLR: Channel-wise Lightweight Reprogramming for Continual Learning: Yunhao Ge,

Yuecheng Li,

Shuo Ni,

Jiaping Zhao,

Ming-Hsuan Yang,

Laurent Itti; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ge_2023_ICCV, author = {Ge, Yunhao and Li, Yuecheng and Ni, Shuo and Zhao, Jiaping and Yang, Ming-Hsuan and Itti, Laurent}, title = {CLR: Channel-wise Lightweight Reprogramming for Continual Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18798--18808} }
IOMatch: Simplifying Open-Set Semi-Supervised Learning with Joint Inliers and Outliers Utilization: Zekun Li,

Lei Qi,

Yinghuan Shi,

Yang Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Zekun and Qi, Lei and Shi, Yinghuan and Gao, Yang}, title = {IOMatch: Simplifying Open-Set Semi-Supervised Learning with Joint Inliers and Outliers Utilization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15870--15879} }
Hierarchical Point-based Active Learning for Semi-supervised Point Cloud Semantic Segmentation: Zongyi Xu,

Bo Yuan,

Shanshan Zhao,

Qianni Zhang,

Xinbo Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Zongyi and Yuan, Bo and Zhao, Shanshan and Zhang, Qianni and Gao, Xinbo}, title = {Hierarchical Point-based Active Learning for Semi-supervised Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18098--18108} }
Doppelgangers: Learning to Disambiguate Images of Similar Structures: Ruojin Cai,

Joseph Tung,

Qianqian Wang,

Hadar Averbuch-Elor,

Bharath Hariharan,

Noah Snavely; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cai_2023_ICCV, author = {Cai, Ruojin and Tung, Joseph and Wang, Qianqian and Averbuch-Elor, Hadar and Hariharan, Bharath and Snavely, Noah}, title = {Doppelgangers: Learning to Disambiguate Images of Similar Structures}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {34--44} }
BEV-DG: Cross-Modal Learning under Bird's-Eye View for Domain Generalization of 3D Semantic Segmentation: Miaoyu Li,

Yachao Zhang,

Xu Ma,

Yanyun Qu,

Yun Fu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Miaoyu and Zhang, Yachao and Ma, Xu and Qu, Yanyun and Fu, Yun}, title = {BEV-DG: Cross-Modal Learning under Bird's-Eye View for Domain Generalization of 3D Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11632--11642} }
Grounded Entity-Landmark Adaptive Pre-Training for Vision-and-Language Navigation: Yibo Cui,

Liang Xie,

Yakun Zhang,

Meishan Zhang,

Ye Yan,

Erwei Yin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cui_2023_ICCV, author = {Cui, Yibo and Xie, Liang and Zhang, Yakun and Zhang, Meishan and Yan, Ye and Yin, Erwei}, title = {Grounded Entity-Landmark Adaptive Pre-Training for Vision-and-Language Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12043--12053} }
Lip Reading for Low-resource Languages by Learning and Combining General Speech Knowledge and Language-specific Knowledge: Minsu Kim,

Jeong Hun Yeo,

Jeongsoo Choi,

Yong Man Ro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV, author = {Kim, Minsu and Yeo, Jeong Hun and Choi, Jeongsoo and Ro, Yong Man}, title = {Lip Reading for Low-resource Languages by Learning and Combining General Speech Knowledge and Language-specific Knowledge}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15359--15371} }
Quality-Agnostic Deepfake Detection with Intra-model Collaborative Learning: Binh M. Le,

Simon S. Woo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Le_2023_ICCV, author = {Le, Binh M. and Woo, Simon S.}, title = {Quality-Agnostic Deepfake Detection with Intra-model Collaborative Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22378--22389} }
Object-Centric Multiple Object Tracking: Zixu Zhao,

Jiaze Wang,

Max Horn,

Yizhuo Ding,

Tong He,

Zechen Bai,

Dominik Zietlow,

Carl-Johann Simon-Gabriel,

Bing Shuai,

Zhuowen Tu,

Thomas Brox,

Bernt Schiele,

Yanwei Fu,

Francesco Locatello,

Zheng Zhang,

Tianjun Xiao; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV, author = {Zhao, Zixu and Wang, Jiaze and Horn, Max and Ding, Yizhuo and He, Tong and Bai, Zechen and Zietlow, Dominik and Simon-Gabriel, Carl-Johann and Shuai, Bing and Tu, Zhuowen and Brox, Thomas and Schiele, Bernt and Fu, Yanwei and Locatello, Francesco and Zhang, Zheng and Xiao, Tianjun}, title = {Object-Centric Multiple Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16601--16611} }
Point-TTA: Test-Time Adaptation for Point Cloud Registration Using Multitask Meta-Auxiliary Learning: Ahmed Hatem,

Yiming Qian,

Yang Wang; [pdf] [supp]
[bibtex]
@InProceedings{Hatem_2023_ICCV, author = {Hatem, Ahmed and Qian, Yiming and Wang, Yang}, title = {Point-TTA: Test-Time Adaptation for Point Cloud Registration Using Multitask Meta-Auxiliary Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16494--16504} }
HopFIR: Hop-wise GraphFormer with Intragroup Joint Refinement for 3D Human Pose Estimation: Kai Zhai,

Qiang Nie,

Bo Ouyang,

Xiang Li,

Shanlin Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV, author = {Zhai, Kai and Nie, Qiang and Ouyang, Bo and Li, Xiang and Yang, Shanlin}, title = {HopFIR: Hop-wise GraphFormer with Intragroup Joint Refinement for 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {14985--14995} }
Improving Generalization of Adversarial Training via Robust Critical Fine-Tuning: Kaijie Zhu,

Xixu Hu,

Jindong Wang,

Xing Xie,

Ge Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Kaijie and Hu, Xixu and Wang, Jindong and Xie, Xing and Yang, Ge}, title = {Improving Generalization of Adversarial Training via Robust Critical Fine-Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4424--4434} }
Minimal Solutions to Generalized Three-View Relative Pose Problem: Yaqing Ding,

Chiang-Heng Chien,

Viktor Larsson,

Karl Åström,

Benjamin Kimia; [pdf] [supp]
[bibtex]
@InProceedings{Ding_2023_ICCV, author = {Ding, Yaqing and Chien, Chiang-Heng and Larsson, Viktor and {\AA}str{\"o}m, Karl and Kimia, Benjamin}, title = {Minimal Solutions to Generalized Three-View Relative Pose Problem}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8156--8164} }
Trajectory Unified Transformer for Pedestrian Trajectory Prediction: Liushuai Shi,

Le Wang,

Sanping Zhou,

Gang Hua; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV, author = {Shi, Liushuai and Wang, Le and Zhou, Sanping and Hua, Gang}, title = {Trajectory Unified Transformer for Pedestrian Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9675--9684} }
Understanding the Feature Norm for Out-of-Distribution Detection: Jaewoo Park,

Jacky Chen Long Chai,

Jaeho Yoon,

Andrew Beng Jin Teoh; [pdf] [supp]
[bibtex]
@InProceedings{Park_2023_ICCV, author = {Park, Jaewoo and Chai, Jacky Chen Long and Yoon, Jaeho and Teoh, Andrew Beng Jin}, title = {Understanding the Feature Norm for Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1557--1567} }
MHEntropy: Entropy Meets Multiple Hypotheses for Pose and Shape Recovery: Rongyu Chen,

Linlin Yang,

Angela Yao; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Rongyu and Yang, Linlin and Yao, Angela}, title = {MHEntropy: Entropy Meets Multiple Hypotheses for Pose and Shape Recovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {14840--14849} }
uSplit: Image Decomposition for Fluorescence Microscopy: Ashesh Ashesh,

Alexander Krull,

Moises Di Sante,

Francesco Pasqualini,

Florian Jug; [pdf] [supp]
[bibtex]
@InProceedings{Ashesh_2023_ICCV, author = {Ashesh, Ashesh and Krull, Alexander and Di Sante, Moises and Pasqualini, Francesco and Jug, Florian}, title = {uSplit: Image Decomposition for Fluorescence Microscopy}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21219--21229} }
Modeling the Relative Visual Tempo for Self-supervised Skeleton-based Action Recognition: Yisheng Zhu,

Hu Han,

Zhengtao Yu,

Guangcan Liu; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Yisheng and Han, Hu and Yu, Zhengtao and Liu, Guangcan}, title = {Modeling the Relative Visual Tempo for Self-supervised Skeleton-based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13913--13922} }
LightGlue: Local Feature Matching at Light Speed: Philipp Lindenberger,

Paul-Edouard Sarlin,

Marc Pollefeys; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lindenberger_2023_ICCV, author = {Lindenberger, Philipp and Sarlin, Paul-Edouard and Pollefeys, Marc}, title = {LightGlue: Local Feature Matching at Light Speed}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17627--17638} }
Masked Autoencoders are Efficient Class Incremental Learners: Jiang-Tian Zhai,

Xialei Liu,

Andrew D. Bagdanov,

Ke Li,

Ming-Ming Cheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV, author = {Zhai, Jiang-Tian and Liu, Xialei and Bagdanov, Andrew D. and Li, Ke and Cheng, Ming-Ming}, title = {Masked Autoencoders are Efficient Class Incremental Learners}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19104--19113} }
Knowledge Proxy Intervention for Deconfounded Video Question Answering: Jiangtong Li,

Li Niu,

Liqing Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Jiangtong and Niu, Li and Zhang, Liqing}, title = {Knowledge Proxy Intervention for Deconfounded Video Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2782--2793} }
Towards Semi-supervised Learning with Non-random Missing Labels: Yue Duan,

Zhen Zhao,

Lei Qi,

Luping Zhou,

Lei Wang,

Yinghuan Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Duan_2023_ICCV, author = {Duan, Yue and Zhao, Zhen and Qi, Lei and Zhou, Luping and Wang, Lei and Shi, Yinghuan}, title = {Towards Semi-supervised Learning with Non-random Missing Labels}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16121--16131} }
DetZero: Rethinking Offboard 3D Object Detection with Long-term Sequential Point Clouds: Tao Ma,

Xuemeng Yang,

Hongbin Zhou,

Xin Li,

Botian Shi,

Junjie Liu,

Yuchen Yang,

Zhizheng Liu,

Liang He,

Yu Qiao,

Yikang Li,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_ICCV, author = {Ma, Tao and Yang, Xuemeng and Zhou, Hongbin and Li, Xin and Shi, Botian and Liu, Junjie and Yang, Yuchen and Liu, Zhizheng and He, Liang and Qiao, Yu and Li, Yikang and Li, Hongsheng}, title = {DetZero: Rethinking Offboard 3D Object Detection with Long-term Sequential Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6736--6747} }
ImbSAM: A Closer Look at Sharpness-Aware Minimization in Class-Imbalanced Recognition: Yixuan Zhou,

Yi Qu,

Xing Xu,

Hengtao Shen; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV, author = {Zhou, Yixuan and Qu, Yi and Xu, Xing and Shen, Hengtao}, title = {ImbSAM: A Closer Look at Sharpness-Aware Minimization in Class-Imbalanced Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11345--11355} }
Learning from Noisy Data for Semi-Supervised 3D Object Detection: Zehui Chen,

Zhenyu Li,

Shuo Wang,

Dengpan Fu,

Feng Zhao; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Zehui and Li, Zhenyu and Wang, Shuo and Fu, Dengpan and Zhao, Feng}, title = {Learning from Noisy Data for Semi-Supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6929--6939} }
NeRFrac: Neural Radiance Fields through Refractive Surface: Yifan Zhan,

Shohei Nobuhara,

Ko Nishino,

Yinqiang Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Zhan_2023_ICCV, author = {Zhan, Yifan and Nobuhara, Shohei and Nishino, Ko and Zheng, Yinqiang}, title = {NeRFrac: Neural Radiance Fields through Refractive Surface}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18402--18412} }
MonoDETR: Depth-guided Transformer for Monocular 3D Object Detection: Renrui Zhang,

Han Qiu,

Tai Wang,

Ziyu Guo,

Ziteng Cui,

Yu Qiao,

Hongsheng Li,

Peng Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Renrui and Qiu, Han and Wang, Tai and Guo, Ziyu and Cui, Ziteng and Qiao, Yu and Li, Hongsheng and Gao, Peng}, title = {MonoDETR: Depth-guided Transformer for Monocular 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9155--9166} }
Towards Authentic Face Restoration with Iterative Diffusion Models and Beyond: Yang Zhao,

Tingbo Hou,

Yu-Chuan Su,

Xuhui Jia,

Yandong Li,

Matthias Grundmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Yang and Hou, Tingbo and Su, Yu-Chuan and Jia, Xuhui and Li, Yandong and Grundmann, Matthias},
  title     = {Towards Authentic Face Restoration with Iterative Diffusion Models and Beyond},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7312--7322}
}
LivelySpeaker: Towards Semantic-Aware Co-Speech Gesture Generation: Yihao Zhi,

Xiaodong Cun,

Xuelin Chen,

Xi Shen,

Wen Guo,

Shaoli Huang,

Shenghua Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhi_2023_ICCV,
  author    = {Zhi, Yihao and Cun, Xiaodong and Chen, Xuelin and Shen, Xi and Guo, Wen and Huang, Shaoli and Gao, Shenghua},
  title     = {{LivelySpeaker}: Towards Semantic-Aware Co-Speech Gesture Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20807--20817}
}
Contrastive Feature Masking Open-Vocabulary Vision Transformer: Dahun Kim,

Anelia Angelova,

Weicheng Kuo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Dahun and Angelova, Anelia and Kuo, Weicheng},
  title     = {Contrastive Feature Masking Open-Vocabulary Vision Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15602--15612}
}
Group DETR: Fast DETR Training with Group-Wise One-to-Many Assignment: Qiang Chen,

Xiaokang Chen,

Jian Wang,

Shan Zhang,

Kun Yao,

Haocheng Feng,

Junyu Han,

Errui Ding,

Gang Zeng,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Qiang and Chen, Xiaokang and Wang, Jian and Zhang, Shan and Yao, Kun and Feng, Haocheng and Han, Junyu and Ding, Errui and Zeng, Gang and Wang, Jingdong},
  title     = {Group {DETR}: Fast {DETR} Training with Group-Wise One-to-Many Assignment},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6633--6642}
}
Preventing Zero-Shot Transfer Degradation in Continual Learning of Vision-Language Models: Zangwei Zheng,

Mingyuan Ma,

Kai Wang,

Ziheng Qin,

Xiangyu Yue,

Yang You; [pdf] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Zangwei and Ma, Mingyuan and Wang, Kai and Qin, Ziheng and Yue, Xiangyu and You, Yang},
  title     = {Preventing Zero-Shot Transfer Degradation in Continual Learning of Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19125--19136}
}
Personalized Image Generation for Color Vision Deficiency Population: Shuyi Jiang,

Daochang Liu,

Dingquan Li,

Chang Xu; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Shuyi and Liu, Daochang and Li, Dingquan and Xu, Chang},
  title     = {Personalized Image Generation for Color Vision Deficiency Population},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22571--22580}
}
EGC: Image Generation and Classification via a Diffusion Energy-Based Model: Qiushan Guo,

Chuofan Ma,

Yi Jiang,

Zehuan Yuan,

Yizhou Yu,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Qiushan and Ma, Chuofan and Jiang, Yi and Yuan, Zehuan and Yu, Yizhou and Luo, Ping},
  title     = {{EGC}: Image Generation and Classification via a Diffusion Energy-Based Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22952--22962}
}
OccFormer: Dual-path Transformer for Vision-based 3D Semantic Occupancy Prediction: Yunpeng Zhang,

Zheng Zhu,

Dalong Du; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yunpeng and Zhu, Zheng and Du, Dalong},
  title     = {{OccFormer}: Dual-path Transformer for Vision-based {3D} Semantic Occupancy Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9433--9443}
}
Probabilistic Triangulation for Uncalibrated Multi-View 3D Human Pose Estimation: Boyuan Jiang,

Lei Hu,

Shihong Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Boyuan and Hu, Lei and Xia, Shihong},
  title     = {Probabilistic Triangulation for Uncalibrated Multi-View {3D} Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14850--14860}
}
Joint Metrics Matter: A Better Standard for Trajectory Forecasting: Erica Weng,

Hana Hoshino,

Deva Ramanan,

Kris Kitani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Weng_2023_ICCV,
  author    = {Weng, Erica and Hoshino, Hana and Ramanan, Deva and Kitani, Kris},
  title     = {Joint Metrics Matter: A Better Standard for Trajectory Forecasting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20315--20326}
}
TORE: Token Reduction for Efficient Human Mesh Recovery with Transformer: Zhiyang Dou,

Qingxuan Wu,

Cheng Lin,

Zeyu Cao,

Qiangqiang Wu,

Weilin Wan,

Taku Komura,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dou_2023_ICCV,
  author    = {Dou, Zhiyang and Wu, Qingxuan and Lin, Cheng and Cao, Zeyu and Wu, Qiangqiang and Wan, Weilin and Komura, Taku and Wang, Wenping},
  title     = {{TORE}: Token Reduction for Efficient Human Mesh Recovery with Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15143--15155}
}
Test Time Adaptation for Blind Image Quality Assessment: Subhadeep Roy,

Shankhanil Mitra,

Soma Biswas,

Rajiv Soundararajan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Roy_2023_ICCV,
  author    = {Roy, Subhadeep and Mitra, Shankhanil and Biswas, Soma and Soundararajan, Rajiv},
  title     = {Test Time Adaptation for Blind Image Quality Assessment},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16742--16751}
}
GeT: Generative Target Structure Debiasing for Domain Adaptation: Can Zhang,

Gim Hee Lee; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Can and Lee, Gim Hee},
  title     = {{GeT}: Generative Target Structure Debiasing for Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23577--23588}
}
D3G: Exploring Gaussian Prior for Temporal Sentence Grounding with Glance Annotation: Hanjun Li,

Xiujun Shu,

Sunan He,

Ruizhi Qiao,

Wei Wen,

Taian Guo,

Bei Gan,

Xing Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Hanjun and Shu, Xiujun and He, Sunan and Qiao, Ruizhi and Wen, Wei and Guo, Taian and Gan, Bei and Sun, Xing},
  title     = {{D3G}: Exploring {Gaussian} Prior for Temporal Sentence Grounding with Glance Annotation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13734--13746}
}
GEDepth: Ground Embedding for Monocular Depth Estimation: Xiaodong Yang,

Zhuang Ma,

Zhiyu Ji,

Zhe Ren; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Xiaodong and Ma, Zhuang and Ji, Zhiyu and Ren, Zhe},
  title     = {{GEDepth}: Ground Embedding for Monocular Depth Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12719--12727}
}
DETRs with Collaborative Hybrid Assignments Training: Zhuofan Zong,

Guanglu Song,

Yu Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zong_2023_ICCV,
  author    = {Zong, Zhuofan and Song, Guanglu and Liu, Yu},
  title     = {{DETRs} with Collaborative Hybrid Assignments Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6748--6758}
}
Animal3D: A Comprehensive Dataset of 3D Animal Pose and Shape: Jiacong Xu,

Yi Zhang,

Jiawei Peng,

Wufei Ma,

Artur Jesslen,

Pengliang Ji,

Qixin Hu,

Jiehua Zhang,

Qihao Liu,

Jiahao Wang,

Wei Ji,

Chen Wang,

Xiaoding Yuan,

Prakhar Kaushik,

Guofeng Zhang,

Jie Liu,

Yushan Xie,

Yawen Cui,

Alan Yuille,

Adam Kortylewski; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Jiacong and Zhang, Yi and Peng, Jiawei and Ma, Wufei and Jesslen, Artur and Ji, Pengliang and Hu, Qixin and Zhang, Jiehua and Liu, Qihao and Wang, Jiahao and Ji, Wei and Wang, Chen and Yuan, Xiaoding and Kaushik, Prakhar and Zhang, Guofeng and Liu, Jie and Xie, Yushan and Cui, Yawen and Yuille, Alan and Kortylewski, Adam},
  title     = {{Animal3D}: A Comprehensive Dataset of {3D} Animal Pose and Shape},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9099--9109}
}
Rethinking Video Frame Interpolation from Shutter Mode Induced Degradation: Xiang Ji,

Zhixiang Wang,

Zhihang Zhong,

Yinqiang Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2023_ICCV,
  author    = {Ji, Xiang and Wang, Zhixiang and Zhong, Zhihang and Zheng, Yinqiang},
  title     = {Rethinking Video Frame Interpolation from Shutter Mode Induced Degradation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12259--12268}
}
Multi-Modal Neural Radiance Field for Monocular Dense SLAM with a Light-Weight ToF Sensor: Xinyang Liu,

Yijin Li,

Yanbin Teng,

Hujun Bao,

Guofeng Zhang,

Yinda Zhang,

Zhaopeng Cui; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): pages 1--11 is out of line with the other page ranges in this listing and looks like a placeholder; verify against the published proceedings.
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xinyang and Li, Yijin and Teng, Yanbin and Bao, Hujun and Zhang, Guofeng and Zhang, Yinda and Cui, Zhaopeng},
  title     = {Multi-Modal Neural Radiance Field for Monocular Dense {SLAM} with a Light-Weight {ToF} Sensor},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1--11}
}
MonoNeRD: NeRF-like Representations for Monocular 3D Object Detection: Junkai Xu,

Liang Peng,

Haoran Cheng,

Hao Li,

Wei Qian,

Ke Li,

Wenxiao Wang,

Deng Cai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Junkai and Peng, Liang and Cheng, Haoran and Li, Hao and Qian, Wei and Li, Ke and Wang, Wenxiao and Cai, Deng},
  title     = {{MonoNeRD}: {NeRF}-like Representations for Monocular {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6814--6824}
}
Monocular 3D Object Detection with Bounding Box Denoising in 3D by Perceiver: Xianpeng Liu,

Ce Zheng,

Kelvin B Cheng,

Nan Xue,

Guo-Jun Qi,

Tianfu Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xianpeng and Zheng, Ce and Cheng, Kelvin B and Xue, Nan and Qi, Guo-Jun and Wu, Tianfu},
  title     = {Monocular {3D} Object Detection with Bounding Box Denoising in {3D} by Perceiver},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6436--6446}
}
Point-SLAM: Dense Neural Point Cloud-based SLAM: Erik Sandström,

Yue Li,

Luc Van Gool,

Martin R. Oswald; [pdf] [supp]
[bibtex]
@InProceedings{Sandstrom_2023_ICCV,
  author    = {Sandstr{\"o}m, Erik and Li, Yue and Van Gool, Luc and Oswald, Martin R.},
  title     = {{Point-SLAM}: Dense Neural Point Cloud-based {SLAM}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18433--18444}
}
TrajectoryFormer: 3D Object Tracking Transformer with Predictive Trajectory Hypotheses: Xuesong Chen,

Shaoshuai Shi,

Chao Zhang,

Benjin Zhu,

Qiang Wang,

Ka Chun Cheung,

Simon See,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xuesong and Shi, Shaoshuai and Zhang, Chao and Zhu, Benjin and Wang, Qiang and Cheung, Ka Chun and See, Simon and Li, Hongsheng},
  title     = {{TrajectoryFormer}: {3D} Object Tracking Transformer with Predictive Trajectory Hypotheses},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18527--18536}
}
Semantic-Aware Dynamic Parameter for Video Inpainting Transformer: Eunhye Lee,

Jinsu Yoo,

Yunjeong Yang,

Sungyong Baik,

Tae Hyun Kim; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Eunhye and Yoo, Jinsu and Yang, Yunjeong and Baik, Sungyong and Kim, Tae Hyun},
  title     = {Semantic-Aware Dynamic Parameter for Video Inpainting Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12949--12958}
}
See More and Know More: Zero-shot Point Cloud Segmentation via Multi-modal Visual Data: Yuhang Lu,

Qi Jiang,

Runnan Chen,

Yuenan Hou,

Xinge Zhu,

Yuexin Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Yuhang and Jiang, Qi and Chen, Runnan and Hou, Yuenan and Zhu, Xinge and Ma, Yuexin},
  title     = {See More and Know More: Zero-shot Point Cloud Segmentation via Multi-modal Visual Data},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21674--21684}
}
SKED: Sketch-guided Text-based 3D Editing: Aryan Mikaeili,

Or Perel,

Mehdi Safaee,

Daniel Cohen-Or,

Ali Mahdavi-Amiri; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mikaeili_2023_ICCV,
  author    = {Mikaeili, Aryan and Perel, Or and Safaee, Mehdi and Cohen-Or, Daniel and Mahdavi-Amiri, Ali},
  title     = {{SKED}: Sketch-guided Text-based {3D} Editing},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14607--14619}
}
WaveIPT: Joint Attention and Flow Alignment in the Wavelet domain for Pose Transfer: Liyuan Ma,

Tingwei Gao,

Haitian Jiang,

Haibin Shen,

Kejie Huang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Liyuan and Gao, Tingwei and Jiang, Haitian and Shen, Haibin and Huang, Kejie},
  title     = {{WaveIPT}: Joint Attention and Flow Alignment in the Wavelet domain for Pose Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7215--7225}
}
Editable Image Geometric Abstraction via Neural Primitive Assembly: Ye Chen,

Bingbing Ni,

Xuanhong Chen,

Zhangli Hu; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ye and Ni, Bingbing and Chen, Xuanhong and Hu, Zhangli},
  title     = {Editable Image Geometric Abstraction via Neural Primitive Assembly},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23514--23523}
}
Homeomorphism Alignment for Unsupervised Domain Adaptation: Lihua Zhou,

Mao Ye,

Xiatian Zhu,

Siying Xiao,

Xu-Qian Fan,

Ferrante Neri; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Lihua and Ye, Mao and Zhu, Xiatian and Xiao, Siying and Fan, Xu-Qian and Neri, Ferrante},
  title     = {Homeomorphism Alignment for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18699--18710}
}
MBPTrack: Improving 3D Point Cloud Tracking with Memory Networks and Box Priors: Tian-Xing Xu,

Yuan-Chen Guo,

Yu-Kun Lai,

Song-Hai Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Tian-Xing and Guo, Yuan-Chen and Lai, Yu-Kun and Zhang, Song-Hai},
  title     = {{MBPTrack}: Improving {3D} Point Cloud Tracking with Memory Networks and Box Priors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9911--9920}
}
Novel-View Synthesis and Pose Estimation for Hand-Object Interaction from Sparse Views: Wentian Qu,

Zhaopeng Cui,

Yinda Zhang,

Chenyu Meng,

Cuixia Ma,

Xiaoming Deng,

Hongan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qu_2023_ICCV,
  author    = {Qu, Wentian and Cui, Zhaopeng and Zhang, Yinda and Meng, Chenyu and Ma, Cuixia and Deng, Xiaoming and Wang, Hongan},
  title     = {Novel-View Synthesis and Pose Estimation for Hand-Object Interaction from Sparse Views},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15100--15111}
}
EmoSet: A Large-scale Visual Emotion Dataset with Rich Attributes: Jingyuan Yang,

Qirui Huang,

Tingting Ding,

Dani Lischinski,

Danny Cohen-Or,

Hui Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Jingyuan and Huang, Qirui and Ding, Tingting and Lischinski, Dani and Cohen-Or, Danny and Huang, Hui},
  title     = {{EmoSet}: A Large-scale Visual Emotion Dataset with Rich Attributes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20383--20394}
}
Distilling from Similar Tasks for Transfer Learning on a Budget: Kenneth Borup,

Cheng Perng Phoo,

Bharath Hariharan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Borup_2023_ICCV,
  author    = {Borup, Kenneth and Phoo, Cheng Perng and Hariharan, Bharath},
  title     = {Distilling from Similar Tasks for Transfer Learning on a Budget},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11431--11441}
}
Self-Supervised Burst Super-Resolution: Goutam Bhat,

Michaël Gharbi,

Jiawen Chen,

Luc Van Gool,

Zhihao Xia; [pdf] [supp]
[bibtex]
@InProceedings{Bhat_2023_ICCV,
  author    = {Bhat, Goutam and Gharbi, Micha{\"e}l and Chen, Jiawen and Van Gool, Luc and Xia, Zhihao},
  title     = {Self-Supervised Burst Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10605--10614}
}
Class-relation Knowledge Distillation for Novel Class Discovery: Peiyan Gu,

Chuyu Zhang,

Ruijie Xu,

Xuming He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gu_2023_ICCV,
  author    = {Gu, Peiyan and Zhang, Chuyu and Xu, Ruijie and He, Xuming},
  title     = {Class-relation Knowledge Distillation for Novel Class Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16474--16483}
}
PARTNER: Level up the Polar Representation for LiDAR 3D Object Detection: Ming Nie,

Yujing Xue,

Chunwei Wang,

Chaoqiang Ye,

Hang Xu,

Xinge Zhu,

Qingqiu Huang,

Michael Bi Mi,

Xinchao Wang,

Li Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Nie_2023_ICCV,
  author    = {Nie, Ming and Xue, Yujing and Wang, Chunwei and Ye, Chaoqiang and Xu, Hang and Zhu, Xinge and Huang, Qingqiu and Mi, Michael Bi and Wang, Xinchao and Zhang, Li},
  title     = {{PARTNER}: Level up the Polar Representation for {LiDAR} {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3801--3813}
}
Data-Free Class-Incremental Hand Gesture Recognition: Shubhra Aich,

Jesus Ruiz-Santaquiteria,

Zhenyu Lu,

Prachi Garg,

K J Joseph,

Alvaro Fernandez Garcia,

Vineeth N Balasubramanian,

Kenrick Kin,

Chengde Wan,

Necati Cihan Camgoz,

Shugao Ma,

Fernando De la Torre; [pdf] [supp]
[bibtex]
@InProceedings{Aich_2023_ICCV,
  author    = {Aich, Shubhra and Ruiz-Santaquiteria, Jesus and Lu, Zhenyu and Garg, Prachi and Joseph, K J and Garcia, Alvaro Fernandez and Balasubramanian, Vineeth N and Kin, Kenrick and Wan, Chengde and Camgoz, Necati Cihan and Ma, Shugao and De la Torre, Fernando},
  title     = {Data-Free Class-Incremental Hand Gesture Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20958--20967}
}
Corrupting Neuron Explanations of Deep Visual Features: Divyansh Srivastava,

Tuomas Oikarinen,

Tsui-Wei Weng; [pdf] [supp]
[bibtex]
@InProceedings{Srivastava_2023_ICCV,
  author    = {Srivastava, Divyansh and Oikarinen, Tuomas and Weng, Tsui-Wei},
  title     = {Corrupting Neuron Explanations of Deep Visual Features},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1877--1886}
}
PNI : Industrial Anomaly Detection using Position and Neighborhood Information: Jaehyeok Bae,

Jae-Han Lee,

Seyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bae_2023_ICCV,
  author    = {Bae, Jaehyeok and Lee, Jae-Han and Kim, Seyun},
  title     = {{PNI} : Industrial Anomaly Detection using Position and Neighborhood Information},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6373--6383}
}
PC-Adapter: Topology-Aware Adapter for Efficient Domain Adaption on Point Clouds with Rectified Pseudo-label: Joonhyung Park,

Hyunjin Seo,

Eunho Yang; [pdf] [supp]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Joonhyung and Seo, Hyunjin and Yang, Eunho},
  title     = {{PC-Adapter}: Topology-Aware Adapter for Efficient Domain Adaption on Point Clouds with Rectified Pseudo-label},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11530--11540}
}
Cyclic Test-Time Adaptation on Monocular Video for 3D Human Mesh Reconstruction: Hyeongjin Nam,

Daniel Sungho Jung,

Yeonguk Oh,

Kyoung Mu Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nam_2023_ICCV,
  author    = {Nam, Hyeongjin and Jung, Daniel Sungho and Oh, Yeonguk and Lee, Kyoung Mu},
  title     = {Cyclic Test-Time Adaptation on Monocular Video for {3D} Human Mesh Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14829--14839}
}
2D3D-MATR: 2D-3D Matching Transformer for Detection-Free Registration Between Images and Point Clouds: Minhao Li,

Zheng Qin,

Zhirui Gao,

Renjiao Yi,

Chenyang Zhu,

Yulan Guo,

Kai Xu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Minhao and Qin, Zheng and Gao, Zhirui and Yi, Renjiao and Zhu, Chenyang and Guo, Yulan and Xu, Kai},
  title     = {{2D3D-MATR}: {2D-3D} Matching Transformer for Detection-Free Registration Between Images and Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14128--14138}
}
Mixed Neural Voxels for Fast Multi-view Video Synthesis: Feng Wang,

Sinan Tan,

Xinghang Li,

Zeyue Tian,

Yafei Song,

Huaping Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Feng and Tan, Sinan and Li, Xinghang and Tian, Zeyue and Song, Yafei and Liu, Huaping},
  title     = {Mixed Neural Voxels for Fast Multi-view Video Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19706--19716}
}
Bidirectionally Deformable Motion Modulation For Video-based Human Pose Transfer: Wing-Yin Yu,

Lai-Man Po,

Ray C.C. Cheung,

Yuzhi Zhao,

Yu Xue,

Kun Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Wing-Yin and Po, Lai-Man and Cheung, Ray C. C. and Zhao, Yuzhi and Xue, Yu and Li, Kun},
  title     = {Bidirectionally Deformable Motion Modulation For Video-based Human Pose Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7502--7512}
}
Harvard Glaucoma Detection and Progression: A Multimodal Multitask Dataset and Generalization-Reinforced Semi-Supervised Learning: Yan Luo,

Min Shi,

Yu Tian,

Tobias Elze,

Mengyu Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Yan and Shi, Min and Tian, Yu and Elze, Tobias and Wang, Mengyu},
  title     = {{Harvard} Glaucoma Detection and Progression: A Multimodal Multitask Dataset and Generalization-Reinforced Semi-Supervised Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20471--20482}
}
Tracking Everything Everywhere All at Once: Qianqian Wang,

Yen-Yu Chang,

Ruojin Cai,

Zhengqi Li,

Bharath Hariharan,

Aleksander Holynski,

Noah Snavely; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Qianqian and Chang, Yen-Yu and Cai, Ruojin and Li, Zhengqi and Hariharan, Bharath and Holynski, Aleksander and Snavely, Noah},
  title     = {Tracking Everything Everywhere All at Once},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19795--19806}
}
Group Pose: A Simple Baseline for End-to-End Multi-Person Pose Estimation: Huan Liu,

Qiang Chen,

Zichang Tan,

Jiang-Jiang Liu,

Jian Wang,

Xiangbo Su,

Xiaolong Li,

Kun Yao,

Junyu Han,

Errui Ding,

Yao Zhao,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Huan and Chen, Qiang and Tan, Zichang and Liu, Jiang-Jiang and Wang, Jian and Su, Xiangbo and Li, Xiaolong and Yao, Kun and Han, Junyu and Ding, Errui and Zhao, Yao and Wang, Jingdong},
  title     = {Group Pose: A Simple Baseline for End-to-End Multi-Person Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15029--15038}
}
Objects Do Not Disappear: Video Object Detection by Single-Frame Object Location Anticipation: Xin Liu,

Fatemeh Karimi Nejadasl,

Jan C. van Gemert,

Olaf Booij,

Silvia L. Pintea; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xin and Nejadasl, Fatemeh Karimi and van Gemert, Jan C. and Booij, Olaf and Pintea, Silvia L.},
  title     = {Objects Do Not Disappear: Video Object Detection by Single-Frame Object Location Anticipation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6950--6961}
}
CauSSL: Causality-inspired Semi-supervised Learning for Medical Image Segmentation: Juzheng Miao,

Cheng Chen,

Furui Liu,

Hao Wei,

Pheng-Ann Heng; [pdf] [supp]
[bibtex]
@InProceedings{Miao_2023_ICCV,
  author    = {Miao, Juzheng and Chen, Cheng and Liu, Furui and Wei, Hao and Heng, Pheng-Ann},
  title     = {{CauSSL}: Causality-inspired Semi-supervised Learning for Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21426--21437}
}
ChartReader: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules: Zhi-Qi Cheng,

Qi Dai,

Alexander G. Hauptmann; [pdf] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Zhi-Qi and Dai, Qi and Hauptmann, Alexander G.},
  title     = {{ChartReader}: A Unified Framework for Chart Derendering and Comprehension without Heuristic Rules},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22202--22213}
}
Learning from Semantic Alignment between Unpaired Multiviews for Egocentric Video Recognition: Qitong Wang,

Long Zhao,

Liangzhe Yuan,

Ting Liu,

Xi Peng; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Qitong and Zhao, Long and Yuan, Liangzhe and Liu, Ting and Peng, Xi},
  title     = {Learning from Semantic Alignment between Unpaired Multiviews for Egocentric Video Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3307--3317}
}
Neural LiDAR Fields for Novel View Synthesis: Shengyu Huang,

Zan Gojcic,

Zian Wang,

Francis Williams,

Yoni Kasten,

Sanja Fidler,

Konrad Schindler,

Or Litany; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Shengyu and Gojcic, Zan and Wang, Zian and Williams, Francis and Kasten, Yoni and Fidler, Sanja and Schindler, Konrad and Litany, Or},
  title     = {Neural {LiDAR} Fields for Novel View Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18236--18246}
}
Source-free Depth for Object Pop-out: Zongwei WU,

Danda Pani Paudel,

Deng-Ping Fan,

Jingjing Wang,

Shuo Wang,

Cédric Demonceaux,

Radu Timofte,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{WU_2023_ICCV,
  author    = {Wu, Zongwei and Paudel, Danda Pani and Fan, Deng-Ping and Wang, Jingjing and Wang, Shuo and Demonceaux, C{\'e}dric and Timofte, Radu and Van Gool, Luc},
  title     = {Source-free Depth for Object Pop-out},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1032--1042}
}
Token-Label Alignment for Vision Transformers: Han Xiao,

Wenzhao Zheng,

Zheng Zhu,

Jie Zhou,

Jiwen Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiao_2023_ICCV,
  author    = {Xiao, Han and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen},
  title     = {Token-Label Alignment for Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5495--5504}
}
Understanding 3D Object Interaction from a Single Image: Shengyi Qian,

David F. Fouhey; [pdf] [arXiv]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Shengyi and Fouhey, David F.},
  title     = {Understanding {3D} Object Interaction from a Single Image},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21753--21763}
}
SkeleTR: Towards Skeleton-based Action Recognition in the Wild: Haodong Duan,

Mingze Xu,

Bing Shuai,

Davide Modolo,

Zhuowen Tu,

Joseph Tighe,

Alessandro Bergamo; [pdf]
[bibtex]
@InProceedings{Duan_2023_ICCV,
  author    = {Duan, Haodong and Xu, Mingze and Shuai, Bing and Modolo, Davide and Tu, Zhuowen and Tighe, Joseph and Bergamo, Alessandro},
  title     = {{SkeleTR}: Towards Skeleton-based Action Recognition in the Wild},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13634--13644}
}
Learning Gabor Texture Features for Fine-Grained Recognition: Lanyun Zhu,

Tianrun Chen,

Jianxiong Yin,

Simon See,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Lanyun and Chen, Tianrun and Yin, Jianxiong and See, Simon and Liu, Jun},
  title     = {Learning {Gabor} Texture Features for Fine-Grained Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1621--1631}
}
Weakly-Supervised Action Localization by Hierarchically-Structured Latent Attention Modeling: Guiqin Wang,

Peng Zhao,

Cong Zhao,

Shusen Yang,

Jie Cheng,

Luziwei Leng,

Jianxing Liao,

Qinghai Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Guiqin and Zhao, Peng and Zhao, Cong and Yang, Shusen and Cheng, Jie and Leng, Luziwei and Liao, Jianxing and Guo, Qinghai},
  title     = {Weakly-Supervised Action Localization by Hierarchically-Structured Latent Attention Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10203--10213}
}
Get3DHuman: Lifting StyleGAN-Human into a 3D Generative Model Using Pixel-Aligned Reconstruction Priors: Zhangyang Xiong,

Di Kang,

Derong Jin,

Weikai Chen,

Linchao Bao,

Shuguang Cui,

Xiaoguang Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiong_2023_ICCV,
    author    = {Xiong, Zhangyang and Kang, Di and Jin, Derong and Chen, Weikai and Bao, Linchao and Cui, Shuguang and Han, Xiaoguang},
    title     = {{Get3DHuman}: Lifting {StyleGAN-Human} into a {3D} Generative Model Using Pixel-Aligned Reconstruction Priors},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9287--9297},
}
Query6DoF: Learning Sparse Queries as Implicit Shape Prior for Category-Level 6DoF Pose Estimation: Ruiqi Wang,

Xinggang Wang,

Te Li,

Rong Yang,

Minhong Wan,

Wenyu Liu; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Ruiqi and Wang, Xinggang and Li, Te and Yang, Rong and Wan, Minhong and Liu, Wenyu},
    title     = {{Query6DoF}: Learning Sparse Queries as Implicit Shape Prior for Category-Level {6DoF} Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14055--14064},
}
Towards High-Quality Specular Highlight Removal by Leveraging Large-Scale Synthetic Data: Gang Fu,

Qing Zhang,

Lei Zhu,

Chunxia Xiao,

Ping Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Fu_2023_ICCV,
    author    = {Fu, Gang and Zhang, Qing and Zhu, Lei and Xiao, Chunxia and Li, Ping},
    title     = {Towards High-Quality Specular Highlight Removal by Leveraging Large-Scale Synthetic Data},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12857--12865},
}
An Embarrassingly Simple Backdoor Attack on Self-supervised Learning: Changjiang Li,

Ren Pang,

Zhaohan Xi,

Tianyu Du,

Shouling Ji,

Yuan Yao,

Ting Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Changjiang and Pang, Ren and Xi, Zhaohan and Du, Tianyu and Ji, Shouling and Yao, Yuan and Wang, Ting},
    title     = {An Embarrassingly Simple Backdoor Attack on Self-supervised Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4367--4378},
}
Cross-Modal Translation and Alignment for Survival Analysis: Fengtao Zhou,

Hao Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Fengtao and Chen, Hao},
    title     = {Cross-Modal Translation and Alignment for Survival Analysis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21485--21494},
}
Chaotic World: A Large and Challenging Benchmark for Human Behavior Understanding in Chaotic Events: Kian Eng Ong,

Xun Long Ng,

Yanchao Li,

Wenjie Ai,

Kuangyi Zhao,

Si Yong Yeo,

Jun Liu; [pdf] [supp]
[bibtex]
@InProceedings{Ong_2023_ICCV,
    author    = {Ong, Kian Eng and Ng, Xun Long and Li, Yanchao and Ai, Wenjie and Zhao, Kuangyi and Yeo, Si Yong and Liu, Jun},
    title     = {{Chaotic World}: A Large and Challenging Benchmark for Human Behavior Understanding in Chaotic Events},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20213--20223},
}
Unsupervised 3D Perception with 2D Vision-Language Distillation for Autonomous Driving: Mahyar Najibi,

Jingwei Ji,

Yin Zhou,

Charles R. Qi,

Xinchen Yan,

Scott Ettinger,

Dragomir Anguelov; [pdf] [supp]
[bibtex]
@InProceedings{Najibi_2023_ICCV,
    author    = {Najibi, Mahyar and Ji, Jingwei and Zhou, Yin and Qi, Charles R. and Yan, Xinchen and Ettinger, Scott and Anguelov, Dragomir},
    title     = {Unsupervised {3D} Perception with {2D} Vision-Language Distillation for Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8602--8612},
}
Towards Grand Unified Representation Learning for Unsupervised Visible-Infrared Person Re-Identification: Bin Yang,

Jun Chen,

Mang Ye; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Bin and Chen, Jun and Ye, Mang},
    title     = {Towards Grand Unified Representation Learning for Unsupervised Visible-Infrared Person Re-Identification},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11069--11079},
}
Active Stereo Without Pattern Projector: Luca Bartolomei,

Matteo Poggi,

Fabio Tosi,

Andrea Conti,

Stefano Mattoccia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bartolomei_2023_ICCV,
    author    = {Bartolomei, Luca and Poggi, Matteo and Tosi, Fabio and Conti, Andrea and Mattoccia, Stefano},
    title     = {Active Stereo Without Pattern Projector},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18470--18482},
}
Partition Speeds Up Learning Implicit Neural Representations Based on Exponential-Increase Hypothesis: Ke Liu,

Feng Liu,

Haishuai Wang,

Ning Ma,

Jiajun Bu,

Bo Han; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Ke and Liu, Feng and Wang, Haishuai and Ma, Ning and Bu, Jiajun and Han, Bo},
    title     = {Partition Speeds Up Learning Implicit Neural Representations Based on Exponential-Increase Hypothesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5474--5483},
}
Uncertainty Guided Adaptive Warping for Robust and Efficient Stereo Matching: Junpeng Jing,

Jiankun Li,

Pengfei Xiong,

Jiangyu Liu,

Shuaicheng Liu,

Yichen Guo,

Xin Deng,

Mai Xu,

Lai Jiang,

Leonid Sigal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jing_2023_ICCV,
    author    = {Jing, Junpeng and Li, Jiankun and Xiong, Pengfei and Liu, Jiangyu and Liu, Shuaicheng and Guo, Yichen and Deng, Xin and Xu, Mai and Jiang, Lai and Sigal, Leonid},
    title     = {Uncertainty Guided Adaptive Warping for Robust and Efficient Stereo Matching},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3318--3327},
}
ReFit: Recurrent Fitting Network for 3D Human Recovery: Yufu Wang,

Kostas Daniilidis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Yufu and Daniilidis, Kostas},
    title     = {{ReFit}: Recurrent Fitting Network for {3D} Human Recovery},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14644--14654},
}
Towards Instance-adaptive Inference for Federated Learning: Chun-Mei Feng,

Kai Yu,

Nian Liu,

Xinxing Xu,

Salman Khan,

Wangmeng Zuo; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Chun-Mei and Yu, Kai and Liu, Nian and Xu, Xinxing and Khan, Salman and Zuo, Wangmeng},
    title     = {Towards Instance-adaptive Inference for Federated Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23287--23296},
}
CGBA: Curvature-aware Geometric Black-box Attack: Md Farhamdur Reza,

Ali Rahmati,

Tianfu Wu,

Huaiyu Dai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Reza_2023_ICCV,
    author    = {Reza, Md Farhamdur and Rahmati, Ali and Wu, Tianfu and Dai, Huaiyu},
    title     = {{CGBA}: Curvature-aware Geometric Black-box Attack},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {124--133},
}
Unsupervised Facial Performance Editing via Vector-Quantized StyleGAN Representations: Berkay Kicanaoglu,

Pablo Garrido,

Gaurav Bharaj; [pdf] [supp]
[bibtex]
@InProceedings{Kicanaoglu_2023_ICCV,
    author    = {Kicanaoglu, Berkay and Garrido, Pablo and Bharaj, Gaurav},
    title     = {Unsupervised Facial Performance Editing via Vector-Quantized {StyleGAN} Representations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2371--2382},
}
Online Clustered Codebook: Chuanxia Zheng,

Andrea Vedaldi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Chuanxia and Vedaldi, Andrea},
    title     = {Online Clustered Codebook},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22798--22807},
}
A Multidimensional Analysis of Social Biases in Vision Transformers: Jannik Brinkmann,

Paul Swoboda,

Christian Bartelt; [pdf] [arXiv]
[bibtex]
@InProceedings{Brinkmann_2023_ICCV,
    author    = {Brinkmann, Jannik and Swoboda, Paul and Bartelt, Christian},
    title     = {A Multidimensional Analysis of Social Biases in Vision Transformers},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4914--4923},
}
PGFed: Personalize Each Client's Global Objective for Federated Learning: Jun Luo,

Matias Mendieta,

Chen Chen,

Shandong Wu; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV,
    author    = {Luo, Jun and Mendieta, Matias and Chen, Chen and Wu, Shandong},
    title     = {{PGFed}: Personalize Each Client's Global Objective for Federated Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3946--3956},
}
Verbs in Action: Improving Verb Understanding in Video-Language Models: Liliane Momeni,

Mathilde Caron,

Arsha Nagrani,

Andrew Zisserman,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Momeni_2023_ICCV,
    author    = {Momeni, Liliane and Caron, Mathilde and Nagrani, Arsha and Zisserman, Andrew and Schmid, Cordelia},
    title     = {Verbs in Action: Improving Verb Understanding in Video-Language Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15579--15591},
}
Zero-Shot Point Cloud Segmentation by Semantic-Visual Aware Synthesis: Yuwei Yang,

Munawar Hayat,

Zhao Jin,

Hongyuan Zhu,

Yinjie Lei; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Yuwei and Hayat, Munawar and Jin, Zhao and Zhu, Hongyuan and Lei, Yinjie},
    title     = {Zero-Shot Point Cloud Segmentation by Semantic-Visual Aware Synthesis},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11586--11596},
}
Exploring Predicate Visual Context in Detecting of Human-Object Interactions: Frederic Z Zhang,

Yuhui Yuan,

Dylan Campbell,

Zhuoyao Zhong,

Stephen Gould; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Frederic Z and Yuan, Yuhui and Campbell, Dylan and Zhong, Zhuoyao and Gould, Stephen},
    title     = {Exploring Predicate Visual Context in Detecting of Human-Object Interactions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10411--10421},
}
Robo3D: Towards Robust and Reliable 3D Perception against Corruptions: Lingdong Kong,

Youquan Liu,

Xin Li,

Runnan Chen,

Wenwei Zhang,

Jiawei Ren,

Liang Pan,

Kai Chen,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Kong_2023_ICCV,
    author    = {Kong, Lingdong and Liu, Youquan and Li, Xin and Chen, Runnan and Zhang, Wenwei and Ren, Jiawei and Pan, Liang and Chen, Kai and Liu, Ziwei},
    title     = {{Robo3D}: Towards Robust and Reliable {3D} Perception against Corruptions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19994--20006},
}
Towards Saner Deep Image Registration: Bin Duan,

Ming Zhong,

Yan Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Duan_2023_ICCV,
    author    = {Duan, Bin and Zhong, Ming and Yan, Yan},
    title     = {Towards Saner Deep Image Registration},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12459--12468},
}
Instance and Category Supervision are Alternate Learners for Continual Learning: Xudong Tian,

Zhizhong Zhang,

Xin Tan,

Jun Liu,

Chengjie Wang,

Yanyun Qu,

Guannan Jiang,

Yuan Xie; [pdf] [supp]
[bibtex]
@InProceedings{Tian_2023_ICCV,
    author    = {Tian, Xudong and Zhang, Zhizhong and Tan, Xin and Liu, Jun and Wang, Chengjie and Qu, Yanyun and Jiang, Guannan and Xie, Yuan},
    title     = {Instance and Category Supervision are Alternate Learners for Continual Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5596--5605},
}
Diverse Data Augmentation with Diffusions for Effective Test-time Prompt Tuning: Chun-Mei Feng,

Kai Yu,

Yong Liu,

Salman Khan,

Wangmeng Zuo; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Chun-Mei and Yu, Kai and Liu, Yong and Khan, Salman and Zuo, Wangmeng},
    title     = {Diverse Data Augmentation with Diffusions for Effective Test-time Prompt Tuning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2704--2714},
}
Interaction-aware Joint Attention Estimation Using People Attributes: Chihiro Nakatani,

Hiroaki Kawashima,

Norimichi Ukita; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nakatani_2023_ICCV,
    author    = {Nakatani, Chihiro and Kawashima, Hiroaki and Ukita, Norimichi},
    title     = {Interaction-aware Joint Attention Estimation Using People Attributes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10224--10233},
}
GePSAn: Generative Procedure Step Anticipation in Cooking Videos: Mohamed A. Abdelsalam,

Samrudhdhi B. Rangrej,

Isma Hadji,

Nikita Dvornik,

Konstantinos G. Derpanis,

Afsaneh Fazly; [pdf] [supp]
[bibtex]
@InProceedings{Abdelsalam_2023_ICCV,
    author    = {Abdelsalam, Mohamed A. and Rangrej, Samrudhdhi B. and Hadji, Isma and Dvornik, Nikita and Derpanis, Konstantinos G. and Fazly, Afsaneh},
    title     = {{GePSAn}: Generative Procedure Step Anticipation in Cooking Videos},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2988--2997},
}
Gradient-based Sampling for Class Imbalanced Semi-supervised Object Detection: Jiaming Li,

Xiangru Lin,

Wei Zhang,

Xiao Tan,

Yingying Li,

Junyu Han,

Errui Ding,

Jingdong Wang,

Guanbin Li; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Jiaming and Lin, Xiangru and Zhang, Wei and Tan, Xiao and Li, Yingying and Han, Junyu and Ding, Errui and Wang, Jingdong and Li, Guanbin},
    title     = {Gradient-based Sampling for Class Imbalanced Semi-supervised Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16390--16400},
}
SLCA: Slow Learner with Classifier Alignment for Continual Learning on a Pre-trained Model: Gengwei Zhang,

Liyuan Wang,

Guoliang Kang,

Ling Chen,

Yunchao Wei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Gengwei and Wang, Liyuan and Kang, Guoliang and Chen, Ling and Wei, Yunchao},
    title     = {{SLCA}: Slow Learner with Classifier Alignment for Continual Learning on a Pre-trained Model},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19148--19158},
}
Implicit Temporal Modeling with Learnable Alignment for Video Recognition: Shuyuan Tu,

Qi Dai,

Zuxuan Wu,

Zhi-Qi Cheng,

Han Hu,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tu_2023_ICCV,
    author    = {Tu, Shuyuan and Dai, Qi and Wu, Zuxuan and Cheng, Zhi-Qi and Hu, Han and Jiang, Yu-Gang},
    title     = {Implicit Temporal Modeling with Learnable Alignment for Video Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19936--19947},
}
Non-Coaxial Event-Guided Motion Deblurring with Spatial Alignment: Hoonhee Cho,

Yuhwan Jeong,

Taewoo Kim,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Cho_2023_ICCV,
    author    = {Cho, Hoonhee and Jeong, Yuhwan and Kim, Taewoo and Yoon, Kuk-Jin},
    title     = {Non-Coaxial Event-Guided Motion Deblurring with Spatial Alignment},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12492--12503},
}
Fingerprinting Deep Image Restoration Models: Yuhui Quan,

Huan Teng,

Ruotao Xu,

Jun Huang,

Hui Ji; [pdf] [supp]
[bibtex]
@InProceedings{Quan_2023_ICCV,
    author    = {Quan, Yuhui and Teng, Huan and Xu, Ruotao and Huang, Jun and Ji, Hui},
    title     = {Fingerprinting Deep Image Restoration Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13285--13295},
}
AutoDiffusion: Training-Free Optimization of Time Steps and Architectures for Automated Diffusion Model Acceleration: Lijiang Li,

Huixia Li,

Xiawu Zheng,

Jie Wu,

Xuefeng Xiao,

Rui Wang,

Min Zheng,

Xin Pan,

Fei Chao,

Rongrong Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Lijiang and Li, Huixia and Zheng, Xiawu and Wu, Jie and Xiao, Xuefeng and Wang, Rui and Zheng, Min and Pan, Xin and Chao, Fei and Ji, Rongrong},
    title     = {{AutoDiffusion}: Training-Free Optimization of Time Steps and Architectures for Automated Diffusion Model Acceleration},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7105--7114},
}
SportsMOT: A Large Multi-Object Tracking Dataset in Multiple Sports Scenes: Yutao Cui,

Chenkai Zeng,

Xiaoyu Zhao,

Yichun Yang,

Gangshan Wu,

Limin Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Cui_2023_ICCV,
    author    = {Cui, Yutao and Zeng, Chenkai and Zhao, Xiaoyu and Yang, Yichun and Wu, Gangshan and Wang, Limin},
    title     = {{SportsMOT}: A Large Multi-Object Tracking Dataset in Multiple Sports Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9921--9931},
}
Localizing Moments in Long Video Via Multimodal Guidance: Wayner Barrios,

Mattia Soldan,

Alberto Mario Ceballos-Arroyo,

Fabian Caba Heilbron,

Bernard Ghanem; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Barrios_2023_ICCV,
    author    = {Barrios, Wayner and Soldan, Mattia and Ceballos-Arroyo, Alberto Mario and Caba Heilbron, Fabian and Ghanem, Bernard},
    title     = {Localizing Moments in Long Video Via Multimodal Guidance},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13667--13678},
}
Pixel-Aligned Recurrent Queries for Multi-View 3D Object Detection: Yiming Xie,

Huaizu Jiang,

Georgia Gkioxari,

Julian Straub; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_ICCV,
    author    = {Xie, Yiming and Jiang, Huaizu and Gkioxari, Georgia and Straub, Julian},
    title     = {Pixel-Aligned Recurrent Queries for Multi-View {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18370--18380},
}
Towards Universal Image Embeddings: A Large-Scale Dataset and Challenge for Generic Image Representations: Nikolaos-Antonios Ypsilantis,

Kaifeng Chen,

Bingyi Cao,

Mário Lipovský,

Pelin Dogan-Schönberger,

Grzegorz Makosa,

Boris Bluntschli,

Mojtaba Seyedhosseini,

Ondřej Chum,

André Araujo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ypsilantis_2023_ICCV,
    author    = {Ypsilantis, Nikolaos-Antonios and Chen, Kaifeng and Cao, Bingyi and Lipovsk{\'y}, M{\'a}rio and Dogan-Sch{\"o}nberger, Pelin and Makosa, Grzegorz and Bluntschli, Boris and Seyedhosseini, Mojtaba and Chum, Ond{\v{r}}ej and Araujo, Andr{\'e}},
    title     = {Towards Universal Image Embeddings: A Large-Scale Dataset and Challenge for Generic Image Representations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11290--11301},
}
SemARFlow: Injecting Semantics into Unsupervised Optical Flow Estimation for Autonomous Driving: Shuai Yuan,

Shuzhi Yu,

Hannah Kim,

Carlo Tomasi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
    author    = {Yuan, Shuai and Yu, Shuzhi and Kim, Hannah and Tomasi, Carlo},
    title     = {{SemARFlow}: Injecting Semantics into Unsupervised Optical Flow Estimation for Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9566--9577},
}
TiDAL: Learning Training Dynamics for Active Learning: Seong Min Kye,

Kwanghee Choi,

Hyeongmin Byun,

Buru Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kye_2023_ICCV,
    author    = {Kye, Seong Min and Choi, Kwanghee and Byun, Hyeongmin and Chang, Buru},
    title     = {{TiDAL}: Learning Training Dynamics for Active Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22335--22345},
}
Uncertainty-aware Unsupervised Multi-Object Tracking: Kai Liu,

Sheng Jin,

Zhihang Fu,

Ze Chen,

Rongxin Jiang,

Jieping Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Kai and Jin, Sheng and Fu, Zhihang and Chen, Ze and Jiang, Rongxin and Ye, Jieping},
    title     = {Uncertainty-aware Unsupervised Multi-Object Tracking},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9996--10005},
}
DPS-Net: Deep Polarimetric Stereo Depth Estimation: Chaoran Tian,

Weihong Pan,

Zimo Wang,

Mao Mao,

Guofeng Zhang,

Hujun Bao,

Ping Tan,

Zhaopeng Cui; [pdf] [supp]
[bibtex]
@InProceedings{Tian_2023_ICCV,
    author    = {Tian, Chaoran and Pan, Weihong and Wang, Zimo and Mao, Mao and Zhang, Guofeng and Bao, Hujun and Tan, Ping and Cui, Zhaopeng},
    title     = {{DPS-Net}: Deep Polarimetric Stereo Depth Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3569--3579},
}
Designing Phase Masks for Under-Display Cameras: Anqi Yang,

Eunhee Kang,

Hyong-Euk Lee,

Aswin C. Sankaranarayanan; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Anqi and Kang, Eunhee and Lee, Hyong-Euk and Sankaranarayanan, Aswin C.},
    title     = {Designing Phase Masks for Under-Display Cameras},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10637--10645},
}
Can Language Models Learn to Listen?: Evonne Ng,

Sanjay Subramanian,

Dan Klein,

Angjoo Kanazawa,

Trevor Darrell,

Shiry Ginosar; [pdf] [arXiv]
[bibtex]
@InProceedings{Ng_2023_ICCV,
    author    = {Ng, Evonne and Subramanian, Sanjay and Klein, Dan and Kanazawa, Angjoo and Darrell, Trevor and Ginosar, Shiry},
    title     = {Can Language Models Learn to Listen?},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10083--10093},
}
SpaceEvo: Hardware-Friendly Search Space Design for Efficient INT8 Inference: Xudong Wang,

Li Lyna Zhang,

Jiahang Xu,

Quanlu Zhang,

Yujing Wang,

Yuqing Yang,

Ningxin Zheng,

Ting Cao,

Mao Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Xudong and Zhang, Li Lyna and Xu, Jiahang and Zhang, Quanlu and Wang, Yujing and Yang, Yuqing and Zheng, Ningxin and Cao, Ting and Yang, Mao},
    title     = {{SpaceEvo}: Hardware-Friendly Search Space Design for Efficient {INT8} Inference},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5819--5828},
}
How Far Pre-trained Models Are from Neural Collapse on the Target Dataset Informs their Transferability: Zijian Wang,

Yadan Luo,

Liang Zheng,

Zi Huang,

Mahsa Baktashmotlagh; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Zijian and Luo, Yadan and Zheng, Liang and Huang, Zi and Baktashmotlagh, Mahsa},
    title     = {How Far Pre-trained Models Are from Neural Collapse on the Target Dataset Informs their Transferability},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5549--5558},
}
SurfsUP: Learning Fluid Simulation for Novel Surfaces: Arjun Mani,

Ishaan Preetam Chandratreya,

Elliot Creager,

Carl Vondrick,

Richard Zemel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mani_2023_ICCV,
    author    = {Mani, Arjun and Chandratreya, Ishaan Preetam and Creager, Elliot and Vondrick, Carl and Zemel, Richard},
    title     = {{SurfsUP}: Learning Fluid Simulation for Novel Surfaces},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14225--14235},
}
Convolutional Networks with Oriented 1D Kernels: Alexandre Kirchmeyer,

Jia Deng; [pdf] [supp]
[bibtex]
@InProceedings{Kirchmeyer_2023_ICCV,
    author    = {Kirchmeyer, Alexandre and Deng, Jia},
    title     = {Convolutional Networks with Oriented {1D} Kernels},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6222--6232},
}
Regularized Mask Tuning: Uncovering Hidden Knowledge in Pre-Trained Vision-Language Models: Kecheng Zheng,

Wei Wu,

Ruili Feng,

Kai Zhu,

Jiawei Liu,

Deli Zhao,

Zheng-Jun Zha,

Wei Chen,

Yujun Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Kecheng and Wu, Wei and Feng, Ruili and Zhu, Kai and Liu, Jiawei and Zhao, Deli and Zha, Zheng-Jun and Chen, Wei and Shen, Yujun},
    title     = {Regularized Mask Tuning: Uncovering Hidden Knowledge in Pre-Trained Vision-Language Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11663--11673},
}
Skill Transformer: A Monolithic Policy for Mobile Manipulation: Xiaoyu Huang,

Dhruv Batra,

Akshara Rai,

Andrew Szot; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Xiaoyu and Batra, Dhruv and Rai, Akshara and Szot, Andrew},
    title     = {{Skill Transformer}: A Monolithic Policy for Mobile Manipulation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10852--10862},
}
Adaptive and Background-Aware Vision Transformer for Real-Time UAV Tracking: Shuiwang Li,

Yangxiang Yang,

Dan Zeng,

Xucheng Wang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Shuiwang and Yang, Yangxiang and Zeng, Dan and Wang, Xucheng},
    title     = {Adaptive and Background-Aware Vision Transformer for Real-Time {UAV} Tracking},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13989--14000},
}
Improving Pixel-based MIM by Reducing Wasted Modeling Capability: Yuan Liu,

Songyang Zhang,

Jiacheng Chen,

Zhaohui Yu,

Kai Chen,

Dahua Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Yuan and Zhang, Songyang and Chen, Jiacheng and Yu, Zhaohui and Chen, Kai and Lin, Dahua},
    title     = {Improving Pixel-based {MIM} by Reducing Wasted Modeling Capability},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5361--5372},
}
Towards Memory- and Time-Efficient Backpropagation for Training Spiking Neural Networks: Qingyan Meng,

Mingqing Xiao,

Shen Yan,

Yisen Wang,

Zhouchen Lin,

Zhi-Quan Luo; [pdf] [supp]
[bibtex]
@InProceedings{Meng_2023_ICCV,
    author    = {Meng, Qingyan and Xiao, Mingqing and Yan, Shen and Wang, Yisen and Lin, Zhouchen and Luo, Zhi-Quan},
    title     = {Towards Memory- and Time-Efficient Backpropagation for Training Spiking Neural Networks},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6166--6176},
}
Persistent-Transient Duality: A Multi-Mechanism Approach for Modeling Human-Object Interaction: Hung Tran,

Vuong Le,

Svetha Venkatesh,

Truyen Tran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tran_2023_ICCV,
    author    = {Tran, Hung and Le, Vuong and Venkatesh, Svetha and Tran, Truyen},
    title     = {Persistent-Transient Duality: A Multi-Mechanism Approach for Modeling Human-Object Interaction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9858--9867},
}
When to Learn What: Model-Adaptive Data Augmentation Curriculum: Chengkai Hou,

Jieyu Zhang,

Tianyi Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hou_2023_ICCV,
    author    = {Hou, Chengkai and Zhang, Jieyu and Zhou, Tianyi},
    title     = {When to Learn What: Model-Adaptive Data Augmentation Curriculum},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1717--1728},
}
DiffPose: Multi-hypothesis Human Pose Estimation using Diffusion Models: Karl Holmquist,

Bastian Wandt; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Holmquist_2023_ICCV,
    author    = {Holmquist, Karl and Wandt, Bastian},
    title     = {{DiffPose}: Multi-hypothesis Human Pose Estimation using Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15977--15987},
}
AesPA-Net: Aesthetic Pattern-Aware Style Transfer Networks: Kibeom Hong,

Seogkyu Jeon,

Junsoo Lee,

Namhyuk Ahn,

Kunhee Kim,

Pilhyeon Lee,

Daesik Kim,

Youngjung Uh,

Hyeran Byun; [pdf] [supp]
[bibtex]
@InProceedings{Hong_2023_ICCV,
    author    = {Hong, Kibeom and Jeon, Seogkyu and Lee, Junsoo and Ahn, Namhyuk and Kim, Kunhee and Lee, Pilhyeon and Kim, Daesik and Uh, Youngjung and Byun, Hyeran},
    title     = {{AesPA-Net}: Aesthetic Pattern-Aware Style Transfer Networks},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22758--22767},
}
COPILOT: Human-Environment Collision Prediction and Localization from Egocentric Videos: Boxiao Pan,

Bokui Shen,

Davis Rempe,

Despoina Paschalidou,

Kaichun Mo,

Yanchao Yang,

Leonidas J. Guibas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
    author    = {Pan, Boxiao and Shen, Bokui and Rempe, Davis and Paschalidou, Despoina and Mo, Kaichun and Yang, Yanchao and Guibas, Leonidas J.},
    title     = {{COPILOT}: Human-Environment Collision Prediction and Localization from Egocentric Videos},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5262--5272},
}
EGformer: Equirectangular Geometry-biased Transformer for 360 Depth Estimation: Ilwi Yun,

Chanyong Shin,

Hyunku Lee,

Hyuk-Jae Lee,

Chae Eun Rhee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yun_2023_ICCV,
    author    = {Yun, Ilwi and Shin, Chanyong and Lee, Hyunku and Lee, Hyuk-Jae and Rhee, Chae Eun},
    title     = {{EGformer}: Equirectangular Geometry-biased Transformer for 360 Depth Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6101--6112},
}
Size Does Matter: Size-aware Virtual Try-on via Clothing-oriented Transformation Try-on Network: Chieh-Yun Chen,

Yi-Chung Chen,

Hong-Han Shuai,

Wen-Huang Cheng; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Chieh-Yun and Chen, Yi-Chung and Shuai, Hong-Han and Cheng, Wen-Huang}, title = {Size Does Matter: Size-aware Virtual Try-on via Clothing-oriented Transformation Try-on Network}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7513-7522} }
Generating Realistic Images from In-the-wild Sounds: Taegyeong Lee,

Jeonghun Kang,

Hyeonyu Kim,

Taehwan Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV, author = {Lee, Taegyeong and Kang, Jeonghun and Kim, Hyeonyu and Kim, Taehwan}, title = {Generating Realistic Images from In-the-wild Sounds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7160-7170} }
DDS2M: Self-Supervised Denoising Diffusion Spatio-Spectral Model for Hyperspectral Image Restoration: Yuchun Miao,

Lefei Zhang,

Liangpei Zhang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Miao_2023_ICCV, author = {Miao, Yuchun and Zhang, Lefei and Zhang, Liangpei and Tao, Dacheng}, title = {DDS2M: Self-Supervised Denoising Diffusion Spatio-Spectral Model for Hyperspectral Image Restoration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12086-12096} }
Candidate-aware Selective Disambiguation Based On Normalized Entropy for Instance-dependent Partial-label Learning: Shuo He,

Guowu Yang,

Lei Feng; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV, author = {He, Shuo and Yang, Guowu and Feng, Lei}, title = {Candidate-aware Selective Disambiguation Based On Normalized Entropy for Instance-dependent Partial-label Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1792-1801} }
Open-vocabulary Video Question Answering: A New Benchmark for Evaluating the Generalizability of Video Question Answering Models: Dohwan Ko,

Ji Soo Lee,

Miso Choi,

Jaewon Chu,

Jihwan Park,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ko_2023_ICCV, author = {Ko, Dohwan and Lee, Ji Soo and Choi, Miso and Chu, Jaewon and Park, Jihwan and Kim, Hyunwoo J.}, title = {Open-vocabulary Video Question Answering: A New Benchmark for Evaluating the Generalizability of Video Question Answering Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3101-3112} }
Using a Waffle Iron for Automotive Point Cloud Semantic Segmentation: Gilles Puy,

Alexandre Boulch,

Renaud Marlet; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Puy_2023_ICCV, author = {Puy, Gilles and Boulch, Alexandre and Marlet, Renaud}, title = {Using a Waffle Iron for Automotive Point Cloud Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3379-3389} }
AutoReP: Automatic ReLU Replacement for Fast Private Network Inference: Hongwu Peng,

Shaoyi Huang,

Tong Zhou,

Yukui Luo,

Chenghong Wang,

Zigeng Wang,

Jiahui Zhao,

Xi Xie,

Ang Li,

Tony Geng,

Kaleel Mahmood,

Wujie Wen,

Xiaolin Xu,

Caiwen Ding; [pdf] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV, author = {Peng, Hongwu and Huang, Shaoyi and Zhou, Tong and Luo, Yukui and Wang, Chenghong and Wang, Zigeng and Zhao, Jiahui and Xie, Xi and Li, Ang and Geng, Tony and Mahmood, Kaleel and Wen, Wujie and Xu, Xiaolin and Ding, Caiwen}, title = {AutoReP: Automatic ReLU Replacement for Fast Private Network Inference}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5178-5188} }
MotionLM: Multi-Agent Motion Forecasting as Language Modeling: Ari Seff,

Brian Cera,

Dian Chen,

Mason Ng,

Aurick Zhou,

Nigamaa Nayakanti,

Khaled S. Refaat,

Rami Al-Rfou,

Benjamin Sapp; [pdf] [supp]
[bibtex]
@InProceedings{Seff_2023_ICCV, author = {Seff, Ari and Cera, Brian and Chen, Dian and Ng, Mason and Zhou, Aurick and Nayakanti, Nigamaa and Refaat, Khaled S. and Al-Rfou, Rami and Sapp, Benjamin}, title = {MotionLM: Multi-Agent Motion Forecasting as Language Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8579-8590} }
Black Box Few-Shot Adaptation for Vision-Language Models: Yassine Ouali,

Adrian Bulat,

Brais Martinez,

Georgios Tzimiropoulos; [pdf] [supp]
[bibtex]
@InProceedings{Ouali_2023_ICCV, author = {Ouali, Yassine and Bulat, Adrian and Martinez, Brais and Tzimiropoulos, Georgios}, title = {Black Box Few-Shot Adaptation for Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15534-15546} }
Center-Based Decoupled Point-cloud Registration for 6D Object Pose Estimation: Haobo Jiang,

Zheng Dang,

Shuo Gu,

Jin Xie,

Mathieu Salzmann,

Jian Yang; [pdf]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Haobo and Dang, Zheng and Gu, Shuo and Xie, Jin and Salzmann, Mathieu and Yang, Jian}, title = {Center-Based Decoupled Point-cloud Registration for 6D Object Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3427-3437} }
Self-Ordering Point Clouds: Pengwan Yang,

Cees G. M. Snoek,

Yuki M. Asano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Pengwan and Snoek, Cees G. M. and Asano, Yuki M.}, title = {Self-Ordering Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15813-15822} }
Continual Segment: Towards a Single, Unified and Non-forgetting Continual Segmentation Model of 143 Whole-body Organs in CT Scans: Zhanghexuan Ji,

Dazhou Guo,

Puyang Wang,

Ke Yan,

Le Lu,

Minfeng Xu,

Qifeng Wang,

Jia Ge,

Mingchen Gao,

Xianghua Ye,

Dakai Jin; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2023_ICCV, author = {Ji, Zhanghexuan and Guo, Dazhou and Wang, Puyang and Yan, Ke and Lu, Le and Xu, Minfeng and Wang, Qifeng and Ge, Jia and Gao, Mingchen and Ye, Xianghua and Jin, Dakai}, title = {Continual Segment: Towards a Single, Unified and Non-forgetting Continual Segmentation Model of 143 Whole-body Organs in CT Scans}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21140-21151} }
Enhancing Modality-Agnostic Representations via Meta-Learning for Brain Tumor Segmentation: Aishik Konwer,

Xiaoling Hu,

Joseph Bae,

Xuan Xu,

Chao Chen,

Prateek Prasanna; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Konwer_2023_ICCV, author = {Konwer, Aishik and Hu, Xiaoling and Bae, Joseph and Xu, Xuan and Chen, Chao and Prasanna, Prateek}, title = {Enhancing Modality-Agnostic Representations via Meta-Learning for Brain Tumor Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21415-21425} }
Zero-1-to-3: Zero-shot One Image to 3D Object: Ruoshi Liu,

Rundi Wu,

Basile Van Hoorick,

Pavel Tokmakov,

Sergey Zakharov,

Carl Vondrick; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Ruoshi and Wu, Rundi and Van Hoorick, Basile and Tokmakov, Pavel and Zakharov, Sergey and Vondrick, Carl}, title = {Zero-1-to-3: Zero-shot One Image to 3D Object}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9298-9309} }
3D Distillation: Improving Self-Supervised Monocular Depth Estimation on Reflective Surfaces: Xuepeng Shi,

Georgi Dikov,

Gerhard Reitmayr,

Tae-Kyun Kim,

Mohsen Ghafoorian; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV, author = {Shi, Xuepeng and Dikov, Georgi and Reitmayr, Gerhard and Kim, Tae-Kyun and Ghafoorian, Mohsen}, title = {3D Distillation: Improving Self-Supervised Monocular Depth Estimation on Reflective Surfaces}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9133-9143} }
GAIT: Generating Aesthetic Indoor Tours with Deep Reinforcement Learning: Desai Xie,

Ping Hu,

Xin Sun,

Soren Pirk,

Jianming Zhang,

Radomir Mech,

Arie E. Kaufman; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_ICCV, author = {Xie, Desai and Hu, Ping and Sun, Xin and Pirk, Soren and Zhang, Jianming and Mech, Radomir and Kaufman, Arie E.}, title = {GAIT: Generating Aesthetic Indoor Tours with Deep Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7409-7419} }
Low-Light Image Enhancement with Multi-Stage Residue Quantization and Brightness-Aware Attention: Yunlong Liu,

Tao Huang,

Weisheng Dong,

Fangfang Wu,

Xin Li,

Guangming Shi; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Yunlong and Huang, Tao and Dong, Weisheng and Wu, Fangfang and Li, Xin and Shi, Guangming}, title = {Low-Light Image Enhancement with Multi-Stage Residue Quantization and Brightness-Aware Attention}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12140-12149} }
Hierarchically Decomposed Graph Convolutional Networks for Skeleton-Based Action Recognition: Jungho Lee,

Minhyeok Lee,

Dogyoon Lee,

Sangyoun Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV, author = {Lee, Jungho and Lee, Minhyeok and Lee, Dogyoon and Lee, Sangyoun}, title = {Hierarchically Decomposed Graph Convolutional Networks for Skeleton-Based Action Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10444-10453} }
LIST: Learning Implicitly from Spatial Transformers for Single-View 3D Reconstruction: Mohammad Samiul Arshad,

William J. Beksi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Arshad_2023_ICCV, author = {Arshad, Mohammad Samiul and Beksi, William J.}, title = {LIST: Learning Implicitly from Spatial Transformers for Single-View 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9321-9330} }
Rethinking Mobile Block for Efficient Attention-based Models: Jiangning Zhang,

Xiangtai Li,

Jian Li,

Liang Liu,

Zhucun Xue,

Boshen Zhang,

Zhengkai Jiang,

Tianxin Huang,

Yabiao Wang,

Chengjie Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Jiangning and Li, Xiangtai and Li, Jian and Liu, Liang and Xue, Zhucun and Zhang, Boshen and Jiang, Zhengkai and Huang, Tianxin and Wang, Yabiao and Wang, Chengjie}, title = {Rethinking Mobile Block for Efficient Attention-based Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1389-1400} }
REAP: A Large-Scale Realistic Adversarial Patch Benchmark: Nabeel Hingun,

Chawin Sitawarin,

Jerry Li,

David Wagner; [pdf] [arXiv]
[bibtex]
@InProceedings{Hingun_2023_ICCV, author = {Hingun, Nabeel and Sitawarin, Chawin and Li, Jerry and Wagner, David}, title = {REAP: A Large-Scale Realistic Adversarial Patch Benchmark}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4640-4651} }
LRRU: Long-short Range Recurrent Updating Networks for Depth Completion: Yufei Wang,

Bo Li,

Ge Zhang,

Qi Liu,

Tao Gao,

Yuchao Dai; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Yufei and Li, Bo and Zhang, Ge and Liu, Qi and Gao, Tao and Dai, Yuchao}, title = {LRRU: Long-short Range Recurrent Updating Networks for Depth Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9422-9432} }
MetaBEV: Solving Sensor Failures for 3D Detection and Map Segmentation: Chongjian Ge,

Junsong Chen,

Enze Xie,

Zhongdao Wang,

Lanqing Hong,

Huchuan Lu,

Zhenguo Li,

Ping Luo; [pdf] [supp]
[bibtex]
@InProceedings{Ge_2023_ICCV, author = {Ge, Chongjian and Chen, Junsong and Xie, Enze and Wang, Zhongdao and Hong, Lanqing and Lu, Huchuan and Li, Zhenguo and Luo, Ping}, title = {MetaBEV: Solving Sensor Failures for 3D Detection and Map Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8721-8731} }
DNA-Rendering: A Diverse Neural Actor Repository for High-Fidelity Human-Centric Rendering: Wei Cheng,

Ruixiang Chen,

Siming Fan,

Wanqi Yin,

Keyu Chen,

Zhongang Cai,

Jingbo Wang,

Yang Gao,

Zhengming Yu,

Zhengyu Lin,

Daxuan Ren,

Lei Yang,

Ziwei Liu,

Chen Change Loy,

Chen Qian,

Wayne Wu,

Dahua Lin,

Bo Dai,

Kwan-Yee Lin; [pdf] [supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV, author = {Cheng, Wei and Chen, Ruixiang and Fan, Siming and Yin, Wanqi and Chen, Keyu and Cai, Zhongang and Wang, Jingbo and Gao, Yang and Yu, Zhengming and Lin, Zhengyu and Ren, Daxuan and Yang, Lei and Liu, Ziwei and Loy, Chen Change and Qian, Chen and Wu, Wayne and Lin, Dahua and Dai, Bo and Lin, Kwan-Yee}, title = {DNA-Rendering: A Diverse Neural Actor Repository for High-Fidelity Human-Centric Rendering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19982-19993} }
Exploring Temporal Concurrency for Video-Language Representation Learning: Heng Zhang,

Daqing Liu,

Zezhong Lv,

Bing Su,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Heng and Liu, Daqing and Lv, Zezhong and Su, Bing and Tao, Dacheng}, title = {Exploring Temporal Concurrency for Video-Language Representation Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15568-15578} }
StegaNeRF: Embedding Invisible Information within Neural Radiance Fields: Chenxin Li,

Brandon Y. Feng,

Zhiwen Fan,

Panwang Pan,

Zhangyang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Chenxin and Feng, Brandon Y. and Fan, Zhiwen and Pan, Panwang and Wang, Zhangyang}, title = {StegaNeRF: Embedding Invisible Information within Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {441-453} }
DynamicISP: Dynamically Controlled Image Signal Processor for Image Recognition: Masakazu Yoshimura,

Junji Otsuka,

Atsushi Irie,

Takeshi Ohashi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yoshimura_2023_ICCV, author = {Yoshimura, Masakazu and Otsuka, Junji and Irie, Atsushi and Ohashi, Takeshi}, title = {DynamicISP: Dynamically Controlled Image Signal Processor for Image Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12866-12876} }
R-Pred: Two-Stage Motion Prediction Via Tube-Query Attention-Based Trajectory Refinement: Sehwan Choi,

Jungho Kim,

Junyong Yun,

Jun Won Choi; [pdf] [supp]
[bibtex]
@InProceedings{Choi_2023_ICCV, author = {Choi, Sehwan and Kim, Jungho and Yun, Junyong and Choi, Jun Won}, title = {R-Pred: Two-Stage Motion Prediction Via Tube-Query Attention-Based Trajectory Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8525-8535} }
A step towards understanding why classification helps regression: Silvia L. Pintea,

Yancong Lin,

Jouke Dijkstra,

Jan C. van Gemert; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pintea_2023_ICCV, author = {Pintea, Silvia L. and Lin, Yancong and Dijkstra, Jouke and van Gemert, Jan C.}, title = {A step towards understanding why classification helps regression}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19972-19981} }
Robust Evaluation of Diffusion-Based Adversarial Purification: Minjong Lee,

Dongwoo Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV, author = {Lee, Minjong and Kim, Dongwoo}, title = {Robust Evaluation of Diffusion-Based Adversarial Purification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {134-144} }
Hyperbolic Audio-visual Zero-shot Learning: Jie Hong,

Zeeshan Hayder,

Junlin Han,

Pengfei Fang,

Mehrtash Harandi,

Lars Petersson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV, author = {Hong, Jie and Hayder, Zeeshan and Han, Junlin and Fang, Pengfei and Harandi, Mehrtash and Petersson, Lars}, title = {Hyperbolic Audio-visual Zero-shot Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7873-7883} }
CTP: Towards Vision-Language Continual Pretraining via Compatible Momentum Contrast and Topology Preservation: Hongguang Zhu,

Yunchao Wei,

Xiaodan Liang,

Chunjie Zhang,

Yao Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Hongguang and Wei, Yunchao and Liang, Xiaodan and Zhang, Chunjie and Zhao, Yao}, title = {CTP: Towards Vision-Language Continual Pretraining via Compatible Momentum Contrast and Topology Preservation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22257-22267} }
Aggregating Feature Point Cloud for Depth Completion: Zhu Yu,

Zehua Sheng,

Zili Zhou,

Lun Luo,

Si-Yuan Cao,

Hong Gu,

Huaqi Zhang,

Hui-Liang Shen; [pdf] [supp]
[bibtex]
@InProceedings{Yu_2023_ICCV, author = {Yu, Zhu and Sheng, Zehua and Zhou, Zili and Luo, Lun and Cao, Si-Yuan and Gu, Hong and Zhang, Huaqi and Shen, Hui-Liang}, title = {Aggregating Feature Point Cloud for Depth Completion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8732-8743} }
FLIP: Cross-domain Face Anti-spoofing with Language Guidance: Koushik Srivatsan,

Muzammal Naseer,

Karthik Nandakumar; [pdf] [supp]
[bibtex]
@InProceedings{Srivatsan_2023_ICCV, author = {Srivatsan, Koushik and Naseer, Muzammal and Nandakumar, Karthik}, title = {FLIP: Cross-domain Face Anti-spoofing with Language Guidance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19685-19696} }
Distribution Shift Matters for Knowledge Distillation with Webly Collected Images: Jialiang Tang,

Shuo Chen,

Gang Niu,

Masashi Sugiyama,

Chen Gong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV, author = {Tang, Jialiang and Chen, Shuo and Niu, Gang and Sugiyama, Masashi and Gong, Chen}, title = {Distribution Shift Matters for Knowledge Distillation with Webly Collected Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17470-17480} }
Reconstructed Convolution Module Based Look-Up Tables for Efficient Image Super-Resolution: Guandu Liu,

Yukang Ding,

Mading Li,

Ming Sun,

Xing Wen,

Bin Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Guandu and Ding, Yukang and Li, Mading and Sun, Ming and Wen, Xing and Wang, Bin}, title = {Reconstructed Convolution Module Based Look-Up Tables for Efficient Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12217-12226} }
Action Sensitivity Learning for Temporal Action Localization: Jiayi Shao,

Xiaohan Wang,

Ruijie Quan,

Junjun Zheng,

Jiang Yang,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV, author = {Shao, Jiayi and Wang, Xiaohan and Quan, Ruijie and Zheng, Junjun and Yang, Jiang and Yang, Yi}, title = {Action Sensitivity Learning for Temporal Action Localization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13457-13469} }
Gram-based Attentive Neural Ordinary Differential Equations Network for Video Nystagmography Classification: Xihe Qiu,

Shaojie Shi,

Xiaoyu Tan,

Chao Qu,

Zhijun Fang,

Hailing Wang,

Yongbin Gao,

Peixia Wu,

Huawei Li; [pdf]
[bibtex]
@InProceedings{Qiu_2023_ICCV, author = {Qiu, Xihe and Shi, Shaojie and Tan, Xiaoyu and Qu, Chao and Fang, Zhijun and Wang, Hailing and Gao, Yongbin and Wu, Peixia and Li, Huawei}, title = {Gram-based Attentive Neural Ordinary Differential Equations Network for Video Nystagmography Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21339-21348} }
PEANUT: Predicting and Navigating to Unseen Targets: Albert J. Zhai,

Shenlong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhai_2023_ICCV, author = {Zhai, Albert J. and Wang, Shenlong}, title = {PEANUT: Predicting and Navigating to Unseen Targets}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10926-10935} }
Pluralistic Aging Diffusion Autoencoder: Peipei Li,

Rui Wang,

Huaibo Huang,

Ran He,

Zhaofeng He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Peipei and Wang, Rui and Huang, Huaibo and He, Ran and He, Zhaofeng}, title = {Pluralistic Aging Diffusion Autoencoder}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22613-22623} }
ModelGiF: Gradient Fields for Model Functional Distance: Jie Song,

Zhengqi Xu,

Sai Wu,

Gang Chen,

Mingli Song; [pdf] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV, author = {Song, Jie and Xu, Zhengqi and Wu, Sai and Chen, Gang and Song, Mingli}, title = {ModelGiF: Gradient Fields for Model Functional Distance}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6125-6135} }
PoseDiffusion: Solving Pose Estimation via Diffusion-aided Bundle Adjustment: Jianyuan Wang,

Christian Rupprecht,

David Novotny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Jianyuan and Rupprecht, Christian and Novotny, David}, title = {PoseDiffusion: Solving Pose Estimation via Diffusion-aided Bundle Adjustment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9773-9783} }
TIFA: Accurate and Interpretable Text-to-Image Faithfulness Evaluation with Question Answering: Yushi Hu,

Benlin Liu,

Jungo Kasai,

Yizhong Wang,

Mari Ostendorf,

Ranjay Krishna,

Noah A. Smith; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV, author = {Hu, Yushi and Liu, Benlin and Kasai, Jungo and Wang, Yizhong and Ostendorf, Mari and Krishna, Ranjay and Smith, Noah A.}, title = {TIFA: Accurate and Interpretable Text-to-Image Faithfulness Evaluation with Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20406-20417} }
SIGMA: Scale-Invariant Global Sparse Shape Matching: Maolin Gao,

Paul Roetzer,

Marvin Eisenberger,

Zorah Lähner,

Michael Moeller,

Daniel Cremers,

Florian Bernard; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV, author = {Gao, Maolin and Roetzer, Paul and Eisenberger, Marvin and L\"ahner, Zorah and Moeller, Michael and Cremers, Daniel and Bernard, Florian}, title = {SIGMA: Scale-Invariant Global Sparse Shape Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {645-654} }
CORE: Cooperative Reconstruction for Multi-Agent Perception: Binglu Wang,

Lei Zhang,

Zhaozhong Wang,

Yongqiang Zhao,

Tianfei Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Binglu and Zhang, Lei and Wang, Zhaozhong and Zhao, Yongqiang and Zhou, Tianfei}, title = {CORE: Cooperative Reconstruction for Multi-Agent Perception}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8710-8720} }
VidStyleODE: Disentangled Video Editing via StyleGAN and NeuralODEs: Moayed Haji Ali,

Andrew Bond,

Tolga Birdal,

Duygu Ceylan,

Levent Karacan,

Erkut Erdem,

Aykut Erdem; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ali_2023_ICCV, author = {Ali, Moayed Haji and Bond, Andrew and Birdal, Tolga and Ceylan, Duygu and Karacan, Levent and Erdem, Erkut and Erdem, Aykut}, title = {VidStyleODE: Disentangled Video Editing via StyleGAN and NeuralODEs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7523-7534} }
SEFD: Learning to Distill Complex Pose and Occlusion: ChangHee Yang,

Kyeongbo Kong,

SungJun Min,

Dongyoon Wee,

Ho-Deok Jang,

Geonho Cha,

SukJu Kang; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, ChangHee and Kong, Kyeongbo and Min, SungJun and Wee, Dongyoon and Jang, Ho-Deok and Cha, Geonho and Kang, SukJu}, title = {SEFD: Learning to Distill Complex Pose and Occlusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14941-14952} }
CiT: Curation in Training for Effective Vision-Language Data: Hu Xu,

Saining Xie,

Po-Yao Huang,

Licheng Yu,

Russell Howes,

Gargi Ghosh,

Luke Zettlemoyer,

Christoph Feichtenhofer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Hu and Xie, Saining and Huang, Po-Yao and Yu, Licheng and Howes, Russell and Ghosh, Gargi and Zettlemoyer, Luke and Feichtenhofer, Christoph}, title = {CiT: Curation in Training for Effective Vision-Language Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15180-15189} }
SparseNeRF: Distilling Depth Ranking for Few-shot Novel View Synthesis: Guangcong Wang,

Zhaoxi Chen,

Chen Change Loy,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Guangcong and Chen, Zhaoxi and Loy, Chen Change and Liu, Ziwei}, title = {SparseNeRF: Distilling Depth Ranking for Few-shot Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9065-9076} }
Towards Models that Can See and Read: Roy Ganz,

Oren Nuriel,

Aviad Aberdam,

Yair Kittenplon,

Shai Mazor,

Ron Litman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ganz_2023_ICCV, author = {Ganz, Roy and Nuriel, Oren and Aberdam, Aviad and Kittenplon, Yair and Mazor, Shai and Litman, Ron}, title = {Towards Models that Can See and Read}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21718-21728} }
ProPainter: Improving Propagation and Transformer for Video Inpainting: Shangchen Zhou,

Chongyi Li,

Kelvin C.K. Chan,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV, author = {Zhou, Shangchen and Li, Chongyi and Chan, Kelvin C.K. and Loy, Chen Change}, title = {ProPainter: Improving Propagation and Transformer for Video Inpainting}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10477-10486} }
Query Refinement Transformer for 3D Instance Segmentation: Jiahao Lu,

Jiacheng Deng,

Chuxin Wang,

Jianfeng He,

Tianzhu Zhang; [pdf]
[bibtex]
@InProceedings{Lu_2023_ICCV, author = {Lu, Jiahao and Deng, Jiacheng and Wang, Chuxin and He, Jianfeng and Zhang, Tianzhu}, title = {Query Refinement Transformer for 3D Instance Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18516-18526} }
Root Pose Decomposition Towards Generic Non-rigid 3D Reconstruction with Monocular Videos: Yikai Wang,

Yinpeng Dong,

Fuchun Sun,

Xiao Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Yikai and Dong, Yinpeng and Sun, Fuchun and Yang, Xiao}, title = {Root Pose Decomposition Towards Generic Non-rigid 3D Reconstruction with Monocular Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13890-13900} }
3DHumanGAN: 3D-Aware Human Image Generation with 3D Pose Mapping: Zhuoqian Yang,

Shikai Li,

Wayne Wu,

Bo Dai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Zhuoqian and Li, Shikai and Wu, Wayne and Dai, Bo}, title = {3DHumanGAN: 3D-Aware Human Image Generation with 3D Pose Mapping}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23008-23019} }
LeaF: Learning Frames for 4D Point Cloud Sequence Understanding: Yunze Liu,

Junyu Chen,

Zekai Zhang,

Jingwei Huang,

Li Yi; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Yunze and Chen, Junyu and Zhang, Zekai and Huang, Jingwei and Yi, Li}, title = {LeaF: Learning Frames for 4D Point Cloud Sequence Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {604-613} }
GLA-GCN: Global-local Adaptive Graph Convolutional Network for 3D Human Pose Estimation from Monocular Video: Bruce X.B. Yu,

Zhi Zhang,

Yongxu Liu,

Sheng-hua Zhong,

Yan Liu,

Chang Wen Chen; [pdf]
[bibtex]
@InProceedings{Yu_2023_ICCV, author = {Yu, Bruce X.B. and Zhang, Zhi and Liu, Yongxu and Zhong, Sheng-hua and Liu, Yan and Chen, Chang Wen}, title = {GLA-GCN: Global-local Adaptive Graph Convolutional Network for 3D Human Pose Estimation from Monocular Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8818-8829} }
Snow Removal in Video: A New Dataset and A Novel Method: Haoyu Chen,

Jingjing Ren,

Jinjin Gu,

Hongtao Wu,

Xuequan Lu,

Haoming Cai,

Lei Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Haoyu and Ren, Jingjing and Gu, Jinjin and Wu, Hongtao and Lu, Xuequan and Cai, Haoming and Zhu, Lei}, title = {Snow Removal in Video: A New Dataset and A Novel Method}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13211-13222} }
Degradation-Resistant Unfolding Network for Heterogeneous Image Fusion: Chunming He,

Kai Li,

Guoxia Xu,

Yulun Zhang,

Runze Hu,

Zhenhua Guo,

Xiu Li; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Chunming and Li, Kai and Xu, Guoxia and Zhang, Yulun and Hu, Runze and Guo, Zhenhua and Li, Xiu},
  title     = {Degradation-Resistant Unfolding Network for Heterogeneous Image Fusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12611--12621}
}
Priority-Centric Human Motion Generation in Discrete Latent Space: Hanyang Kong,

Kehong Gong,

Dongze Lian,

Michael Bi Mi,

Xinchao Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Kong_2023_ICCV,
  author    = {Kong, Hanyang and Gong, Kehong and Lian, Dongze and Mi, Michael Bi and Wang, Xinchao},
  title     = {Priority-Centric Human Motion Generation in Discrete Latent Space},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14806--14816}
}
Domain-Specificity Inducing Transformers for Source-Free Domain Adaptation: Sunandini Sanyal,

Ashish Ramayee Asokan,

Suvaansh Bhambri,

Akshay Kulkarni,

Jogendra Nath Kundu,

R Venkatesh Babu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sanyal_2023_ICCV,
  author    = {Sanyal, Sunandini and Asokan, Ashish Ramayee and Bhambri, Suvaansh and Kulkarni, Akshay and Kundu, Jogendra Nath and Babu, R Venkatesh},
  title     = {Domain-Specificity Inducing Transformers for Source-Free Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18928--18937}
}
Towards Improved Input Masking for Convolutional Neural Networks: Sriram Balasubramanian,

Soheil Feizi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Balasubramanian_2023_ICCV,
  author    = {Balasubramanian, Sriram and Feizi, Soheil},
  title     = {Towards Improved Input Masking for Convolutional Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1855--1865}
}
3DHacker: Spectrum-based Decision Boundary Generation for Hard-label 3D Point Cloud Attack: Yunbo Tao,

Daizong Liu,

Pan Zhou,

Yulai Xie,

Wei Du,

Wei Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tao_2023_ICCV,
  author    = {Tao, Yunbo and Liu, Daizong and Zhou, Pan and Xie, Yulai and Du, Wei and Hu, Wei},
  title     = {{3DHacker}: Spectrum-based Decision Boundary Generation for Hard-label {3D} Point Cloud Attack},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14340--14350}
}
Exploring Lightweight Hierarchical Vision Transformers for Efficient Visual Tracking: Ben Kang,

Xin Chen,

Dong Wang,

Houwen Peng,

Huchuan Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Kang_2023_ICCV,
  author    = {Kang, Ben and Chen, Xin and Wang, Dong and Peng, Houwen and Lu, Huchuan},
  title     = {Exploring Lightweight Hierarchical Vision Transformers for Efficient Visual Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9612--9621}
}
MiniROAD: Minimal RNN Framework for Online Action Detection: Joungbin An,

Hyolim Kang,

Su Ho Han,

Ming-Hsuan Yang,

Seon Joo Kim; [pdf] [supp]
[bibtex]
@InProceedings{An_2023_ICCV,
  author    = {An, Joungbin and Kang, Hyolim and Han, Su Ho and Yang, Ming-Hsuan and Kim, Seon Joo},
  title     = {{MiniROAD}: Minimal {RNN} Framework for Online Action Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10341--10350}
}
Efficient Emotional Adaptation for Audio-Driven Talking-Head Generation: Yuan Gan,

Zongxin Yang,

Xihang Yue,

Lingyun Sun,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gan_2023_ICCV,
  author    = {Gan, Yuan and Yang, Zongxin and Yue, Xihang and Sun, Lingyun and Yang, Yi},
  title     = {Efficient Emotional Adaptation for Audio-Driven Talking-Head Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22634--22645}
}
Object-aware Gaze Target Detection: Francesco Tonini,

Nicola Dall'Asen,

Cigdem Beyan,

Elisa Ricci; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tonini_2023_ICCV,
  author    = {Tonini, Francesco and Dall'Asen, Nicola and Beyan, Cigdem and Ricci, Elisa},
  title     = {Object-aware Gaze Target Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21860--21869}
}
Gramian Attention Heads are Strong yet Efficient Vision Learners: Jongbin Ryu,

Dongyoon Han,

Jongwoo Lim; [pdf] [supp]
[bibtex]
@InProceedings{Ryu_2023_ICCV,
  author    = {Ryu, Jongbin and Han, Dongyoon and Lim, Jongwoo},
  title     = {Gramian Attention Heads are Strong yet Efficient Vision Learners},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5841--5851}
}
VADER: Video Alignment Differencing and Retrieval: Alexander Black,

Simon Jenni,

Tu Bui,

Md. Mehrab Tanjim,

Stefano Petrangeli,

Ritwik Sinha,

Viswanathan Swaminathan,

John Collomosse; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Black_2023_ICCV,
  author    = {Black, Alexander and Jenni, Simon and Bui, Tu and Tanjim, Md. Mehrab and Petrangeli, Stefano and Sinha, Ritwik and Swaminathan, Viswanathan and Collomosse, John},
  title     = {{VADER}: Video Alignment Differencing and Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22357--22367}
}
MI-GAN: A Simple Baseline for Image Inpainting on Mobile Devices: Andranik Sargsyan,

Shant Navasardyan,

Xingqian Xu,

Humphrey Shi; [pdf] [supp]
[bibtex]
@InProceedings{Sargsyan_2023_ICCV,
  author    = {Sargsyan, Andranik and Navasardyan, Shant and Xu, Xingqian and Shi, Humphrey},
  title     = {{MI-GAN}: A Simple Baseline for Image Inpainting on Mobile Devices},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7335--7345}
}
HiLo: Exploiting High Low Frequency Relations for Unbiased Panoptic Scene Graph Generation: Zijian Zhou,

Miaojing Shi,

Holger Caesar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Zijian and Shi, Miaojing and Caesar, Holger},
  title     = {{HiLo}: Exploiting High Low Frequency Relations for Unbiased Panoptic Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21637--21648}
}
Chop & Learn: Recognizing and Generating Object-State Compositions: Nirat Saini,

Hanyu Wang,

Archana Swaminathan,

Vinoj Jayasundara,

Bo He,

Kamal Gupta,

Abhinav Shrivastava; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saini_2023_ICCV,
  author    = {Saini, Nirat and Wang, Hanyu and Swaminathan, Archana and Jayasundara, Vinoj and He, Bo and Gupta, Kamal and Shrivastava, Abhinav},
  title     = {{Chop \& Learn}: Recognizing and Generating Object-State Compositions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20247--20258}
}
Automatic Animation of Hair Blowing in Still Portrait Photos: Wenpeng Xiao,

Wentao Liu,

Yitong Wang,

Bernard Ghanem,

Bing Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiao_2023_ICCV,
  author    = {Xiao, Wenpeng and Liu, Wentao and Wang, Yitong and Ghanem, Bernard and Li, Bing},
  title     = {Automatic Animation of Hair Blowing in Still Portrait Photos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22963--22975}
}
A Large-Scale Outdoor Multi-Modal Dataset and Benchmark for Novel View Synthesis and Implicit Scene Reconstruction: Chongshan Lu,

Fukun Yin,

Xin Chen,

Wen Liu,

Tao Chen,

Gang Yu,

Jiayuan Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Chongshan and Yin, Fukun and Chen, Xin and Liu, Wen and Chen, Tao and Yu, Gang and Fan, Jiayuan},
  title     = {A Large-Scale Outdoor Multi-Modal Dataset and Benchmark for Novel View Synthesis and Implicit Scene Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7557--7567}
}
4D Panoptic Segmentation as Invariant and Equivariant Field Prediction: Minghan Zhu,

Shizhong Han,

Hong Cai,

Shubhankar Borse,

Maani Ghaffari,

Fatih Porikli; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Minghan and Han, Shizhong and Cai, Hong and Borse, Shubhankar and Ghaffari, Maani and Porikli, Fatih},
  title     = {{4D} Panoptic Segmentation as Invariant and Equivariant Field Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22488--22498}
}
Unleashing Vanilla Vision Transformer with Masked Image Modeling for Object Detection: Yuxin Fang,

Shusheng Yang,

Shijie Wang,

Yixiao Ge,

Ying Shan,

Xinggang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Yuxin and Yang, Shusheng and Wang, Shijie and Ge, Yixiao and Shan, Ying and Wang, Xinggang},
  title     = {Unleashing Vanilla Vision Transformer with Masked Image Modeling for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6244--6253}
}
NDC-Scene: Boost Monocular 3D Semantic Scene Completion in Normalized Device Coordinates Space: Jiawei Yao,

Chuming Li,

Keqiang Sun,

Yingjie Cai,

Hao Li,

Wanli Ouyang,

Hongsheng Li; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Jiawei and Li, Chuming and Sun, Keqiang and Cai, Yingjie and Li, Hao and Ouyang, Wanli and Li, Hongsheng},
  title     = {{NDC-Scene}: Boost Monocular {3D} Semantic Scene Completion in Normalized Device Coordinates Space},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9455--9465}
}
Spatio-Temporal Crop Aggregation for Video Representation Learning: Sepehr Sameni,

Simon Jenni,

Paolo Favaro; [pdf] [arXiv]
[bibtex]
@InProceedings{Sameni_2023_ICCV,
  author    = {Sameni, Sepehr and Jenni, Simon and Favaro, Paolo},
  title     = {Spatio-Temporal Crop Aggregation for Video Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5664--5674}
}
Zip-NeRF: Anti-Aliased Grid-Based Neural Radiance Fields: Jonathan T. Barron,

Ben Mildenhall,

Dor Verbin,

Pratul P. Srinivasan,

Peter Hedman; [pdf] [supp]
[bibtex]
@InProceedings{Barron_2023_ICCV,
  author    = {Barron, Jonathan T. and Mildenhall, Ben and Verbin, Dor and Srinivasan, Pratul P. and Hedman, Peter},
  title     = {{Zip-NeRF}: Anti-Aliased Grid-Based Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19697--19705}
}
Neural-PBIR Reconstruction of Shape, Material, and Illumination: Cheng Sun,

Guangyan Cai,

Zhengqin Li,

Kai Yan,

Cheng Zhang,

Carl Marshall,

Jia-Bin Huang,

Shuang Zhao,

Zhao Dong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Cheng and Cai, Guangyan and Li, Zhengqin and Yan, Kai and Zhang, Cheng and Marshall, Carl and Huang, Jia-Bin and Zhao, Shuang and Dong, Zhao},
  title     = {{Neural-PBIR} Reconstruction of Shape, Material, and Illumination},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18046--18056}
}
Fg-T2M: Fine-Grained Text-Driven Human Motion Generation via Diffusion Model: Yin Wang,

Zhiying Leng,

Frederick W. B. Li,

Shun-Cheng Wu,

Xiaohui Liang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yin and Leng, Zhiying and Li, Frederick W. B. and Wu, Shun-Cheng and Liang, Xiaohui},
  title     = {{Fg-T2M}: Fine-Grained Text-Driven Human Motion Generation via Diffusion Model},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22035--22044}
}
BlindHarmony: "Blind" Harmonization for MR Images via Flow Model: Hwihun Jeong,

Heejoon Byun,

Dong Un Kang,

Jongho Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jeong_2023_ICCV,
  author    = {Jeong, Hwihun and Byun, Heejoon and Kang, Dong Un and Lee, Jongho},
  title     = {{BlindHarmony}: {``Blind''} Harmonization for {MR} Images via Flow Model},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21129--21139}
}
Zero-guidance Segmentation Using Zero Segment Labels: Pitchaporn Rewatbowornwong,

Nattanat Chatthee,

Ekapol Chuangsuwanich,

Supasorn Suwajanakorn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rewatbowornwong_2023_ICCV,
  author    = {Rewatbowornwong, Pitchaporn and Chatthee, Nattanat and Chuangsuwanich, Ekapol and Suwajanakorn, Supasorn},
  title     = {Zero-guidance Segmentation Using Zero Segment Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1162--1172}
}
Efficient LiDAR Point Cloud Oversegmentation Network: Le Hui,

Linghua Tang,

Yuchao Dai,

Jin Xie,

Jian Yang; [pdf] [supp]
[bibtex]
@InProceedings{Hui_2023_ICCV,
  author    = {Hui, Le and Tang, Linghua and Dai, Yuchao and Xie, Jin and Yang, Jian},
  title     = {Efficient {LiDAR} Point Cloud Oversegmentation Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18003--18012}
}
Communication-efficient Federated Learning with Single-Step Synthetic Features Compressor for Faster Convergence: Yuhao Zhou,

Mingjia Shi,

Yuanxi Li,

Yanan Sun,

Qing Ye,

Jiancheng Lv; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yuhao and Shi, Mingjia and Li, Yuanxi and Sun, Yanan and Ye, Qing and Lv, Jiancheng},
  title     = {Communication-efficient Federated Learning with Single-Step Synthetic Features Compressor for Faster Convergence},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5031--5040}
}
SVDFormer: Complementing Point Cloud via Self-view Augmentation and Self-structure Dual-generator: Zhe Zhu,

Honghua Chen,

Xing He,

Weiming Wang,

Jing Qin,

Mingqiang Wei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zhe and Chen, Honghua and He, Xing and Wang, Weiming and Qin, Jing and Wei, Mingqiang},
  title     = {{SVDFormer}: Complementing Point Cloud via Self-view Augmentation and Self-structure Dual-generator},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14508--14518}
}
Few-Shot Video Classification via Representation Fusion and Promotion Learning: Haifeng Xia,

Kai Li,

Martin Renqiang Min,

Zhengming Ding; [pdf]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Haifeng and Li, Kai and Min, Martin Renqiang and Ding, Zhengming},
  title     = {Few-Shot Video Classification via Representation Fusion and Promotion Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19311--19320}
}
E3Sym: Leveraging E(3) Invariance for Unsupervised 3D Planar Reflective Symmetry Detection: Ren-Wu Li,

Ling-Xiao Zhang,

Chunpeng Li,

Yu-Kun Lai,

Lin Gao; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Ren-Wu and Zhang, Ling-Xiao and Li, Chunpeng and Lai, Yu-Kun and Gao, Lin},
  title     = {{E3Sym}: Leveraging {E(3)} Invariance for Unsupervised {3D} Planar Reflective Symmetry Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14543--14553}
}
CTVIS: Consistent Training for Online Video Instance Segmentation: Kaining Ying,

Qing Zhong,

Weian Mao,

Zhenhua Wang,

Hao Chen,

Lin Yuanbo Wu,

Yifan Liu,

Chengxiang Fan,

Yunzhi Zhuge,

Chunhua Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ying_2023_ICCV,
  author    = {Ying, Kaining and Zhong, Qing and Mao, Weian and Wang, Zhenhua and Chen, Hao and Wu, Lin Yuanbo and Liu, Yifan and Fan, Chengxiang and Zhuge, Yunzhi and Shen, Chunhua},
  title     = {{CTVIS}: Consistent Training for Online Video Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {899--908}
}
Unsupervised Video Object Segmentation with Online Adversarial Self-Tuning: Tiankang Su,

Huihui Song,

Dong Liu,

Bo Liu,

Qingshan Liu; [pdf]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Tiankang and Song, Huihui and Liu, Dong and Liu, Bo and Liu, Qingshan},
  title     = {Unsupervised Video Object Segmentation with Online Adversarial Self-Tuning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {688--698}
}
Hallucination Improves the Performance of Unsupervised Visual Representation Learning: Jing Wu,

Jennifer Hobbs,

Naira Hovakimyan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jing and Hobbs, Jennifer and Hovakimyan, Naira},
  title     = {Hallucination Improves the Performance of Unsupervised Visual Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16132--16143}
}
S3IM: Stochastic Structural SIMilarity and Its Unreasonable Effectiveness for Neural Fields: Zeke Xie,

Xindi Yang,

Yujie Yang,

Qi Sun,

Yixiang Jiang,

Haoran Wang,

Yunfeng Cai,

Mingming Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Zeke and Yang, Xindi and Yang, Yujie and Sun, Qi and Jiang, Yixiang and Wang, Haoran and Cai, Yunfeng and Sun, Mingming},
  title     = {{S3IM}: Stochastic Structural {SIMilarity} and Its Unreasonable Effectiveness for Neural Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18024--18034}
}
GlobalMapper: Arbitrary-Shaped Urban Layout Generation: Liu He,

Daniel Aliaga; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Liu and Aliaga, Daniel},
  title     = {{GlobalMapper}: Arbitrary-Shaped Urban Layout Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {454--464}
}
Membrane Potential Batch Normalization for Spiking Neural Networks: Yufei Guo,

Yuhan Zhang,

Yuanpei Chen,

Weihang Peng,

Xiaode Liu,

Liwen Zhang,

Xuhui Huang,

Zhe Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yufei and Zhang, Yuhan and Chen, Yuanpei and Peng, Weihang and Liu, Xiaode and Zhang, Liwen and Huang, Xuhui and Ma, Zhe},
  title     = {Membrane Potential Batch Normalization for Spiking Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19420--19430}
}
Enhancing Sample Utilization through Sample Adaptive Augmentation in Semi-Supervised Learning: Guan Gui,

Zhen Zhao,

Lei Qi,

Luping Zhou,

Lei Wang,

Yinghuan Shi; [pdf] [arXiv]
[bibtex]
@InProceedings{Gui_2023_ICCV,
  author    = {Gui, Guan and Zhao, Zhen and Qi, Lei and Zhou, Luping and Wang, Lei and Shi, Yinghuan},
  title     = {Enhancing Sample Utilization through Sample Adaptive Augmentation in Semi-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15880--15889}
}
Imitator: Personalized Speech-driven 3D Facial Animation: Balamurugan Thambiraja,

Ikhsanul Habibie,

Sadegh Aliakbarian,

Darren Cosker,

Christian Theobalt,

Justus Thies; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Thambiraja_2023_ICCV,
  author    = {Thambiraja, Balamurugan and Habibie, Ikhsanul and Aliakbarian, Sadegh and Cosker, Darren and Theobalt, Christian and Thies, Justus},
  title     = {Imitator: Personalized Speech-driven {3D} Facial Animation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20621--20631}
}
Unified Coarse-to-Fine Alignment for Video-Text Retrieval: Ziyang Wang,

Yi-Lin Sung,

Feng Cheng,

Gedas Bertasius,

Mohit Bansal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ziyang and Sung, Yi-Lin and Cheng, Feng and Bertasius, Gedas and Bansal, Mohit},
  title     = {Unified Coarse-to-Fine Alignment for Video-Text Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2816--2827}
}
Seeing Beyond the Patch: Scale-Adaptive Semantic Segmentation of High-resolution Remote Sensing Imagery based on Reinforcement Learning: Yinhe Liu,

Sunan Shi,

Junjue Wang,

Yanfei Zhong; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yinhe and Shi, Sunan and Wang, Junjue and Zhong, Yanfei},
  title     = {Seeing Beyond the Patch: Scale-Adaptive Semantic Segmentation of High-resolution Remote Sensing Imagery based on Reinforcement Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16868--16878}
}
Gradient-Regulated Meta-Prompt Learning for Generalizable Vision-Language Models: Juncheng Li,

Minghe Gao,

Longhui Wei,

Siliang Tang,

Wenqiao Zhang,

Mengze Li,

Wei Ji,

Qi Tian,

Tat-Seng Chua,

Yueting Zhuang; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Juncheng and Gao, Minghe and Wei, Longhui and Tang, Siliang and Zhang, Wenqiao and Li, Mengze and Ji, Wei and Tian, Qi and Chua, Tat-Seng and Zhuang, Yueting},
  title     = {Gradient-Regulated Meta-Prompt Learning for Generalizable Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2551--2562}
}
Zero-Shot Composed Image Retrieval with Textual Inversion: Alberto Baldrati,

Lorenzo Agnolucci,

Marco Bertini,

Alberto Del Bimbo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Baldrati_2023_ICCV,
  author    = {Baldrati, Alberto and Agnolucci, Lorenzo and Bertini, Marco and Del Bimbo, Alberto},
  title     = {Zero-Shot Composed Image Retrieval with Textual Inversion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15338--15347}
}
MUter: Machine Unlearning on Adversarially Trained Models: Junxu Liu,

Mingsheng Xue,

Jian Lou,

Xiaoyu Zhang,

Li Xiong,

Zhan Qin; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Junxu and Xue, Mingsheng and Lou, Jian and Zhang, Xiaoyu and Xiong, Li and Qin, Zhan},
  title     = {{MUter}: Machine Unlearning on Adversarially Trained Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4892--4902}
}
WALDO: Future Video Synthesis Using Object Layer Decomposition and Parametric Flow Prediction: Guillaume Le Moing,

Jean Ponce,

Cordelia Schmid; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Le_Moing_2023_ICCV,
  author    = {Le Moing, Guillaume and Ponce, Jean and Schmid, Cordelia},
  title     = {{WALDO}: Future Video Synthesis Using Object Layer Decomposition and Parametric Flow Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23229--23241}
}
ParCNetV2: Oversized Kernel with Enhanced Attention: Ruihan Xu,

Haokui Zhang,

Wenze Hu,

Shiliang Zhang,

Xiaoyu Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Ruihan and Zhang, Haokui and Hu, Wenze and Zhang, Shiliang and Wang, Xiaoyu},
  title     = {{ParCNetV2}: Oversized Kernel with Enhanced Attention},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5752--5762}
}
BiFF: Bi-level Future Fusion with Polyline-based Coordinate for Interactive Trajectory Prediction: Yiyao Zhu,

Di Luan,

Shaojie Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Yiyao and Luan, Di and Shen, Shaojie},
  title     = {{BiFF}: Bi-level Future Fusion with Polyline-based Coordinate for Interactive Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8260--8271}
}
RealGraph: A Multiview Dataset for 4D Real-world Context Graph Generation: Haozhe Lin,

Zequn Chen,

Jinzhi Zhang,

Bing Bai,

Yu Wang,

Ruqi Huang,

Lu Fang; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Haozhe and Chen, Zequn and Zhang, Jinzhi and Bai, Bing and Wang, Yu and Huang, Ruqi and Fang, Lu},
  title     = {{RealGraph}: A Multiview Dataset for {4D} Real-world Context Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3758--3768}
}
COOL-CHIC: Coordinate-based Low Complexity Hierarchical Image Codec: Théo Ladune,

Pierrick Philippe,

Félix Henry,

Gordon Clare,

Thomas Leguay; [pdf]
[bibtex]
@InProceedings{Ladune_2023_ICCV,
  author    = {Ladune, Th{\'e}o and Philippe, Pierrick and Henry, F{\'e}lix and Clare, Gordon and Leguay, Thomas},
  title     = {{COOL-CHIC}: Coordinate-based Low Complexity Hierarchical Image Codec},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13515--13522}
}
Normalizing Flows for Human Pose Anomaly Detection: Or Hirschorn,

Shai Avidan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hirschorn_2023_ICCV,
  author    = {Hirschorn, Or and Avidan, Shai},
  title     = {Normalizing Flows for Human Pose Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13545--13554}
}
Reconstructing Groups of People with Hypergraph Relational Reasoning: Buzhen Huang,

Jingyi Ju,

Zhihao Li,

Yangang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Buzhen and Ju, Jingyi and Li, Zhihao and Wang, Yangang},
  title     = {Reconstructing Groups of People with Hypergraph Relational Reasoning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14873--14883}
}
PivotNet: Vectorized Pivot Learning for End-to-end HD Map Construction: Wenjie Ding,

Limeng Qiao,

Xi Qiu,

Chi Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Wenjie and Qiao, Limeng and Qiu, Xi and Zhang, Chi},
  title     = {{PivotNet}: Vectorized Pivot Learning for End-to-end {HD} Map Construction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3672--3682}
}
Universal Domain Adaptation via Compressive Attention Matching: Didi Zhu,

Yinchuan Li,

Junkun Yuan,

Zexi Li,

Kun Kuang,

Chao Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Didi and Li, Yinchuan and Yuan, Junkun and Li, Zexi and Kuang, Kun and Wu, Chao},
  title     = {Universal Domain Adaptation via Compressive Attention Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6974--6985}
}
Contactless Pulse Estimation Leveraging Pseudo Labels and Self-Supervision: Zhihua Li,

Lijun Yin; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zhihua and Yin, Lijun},
  title     = {Contactless Pulse Estimation Leveraging Pseudo Labels and Self-Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20588--20597}
}
Instruct-NeRF2NeRF: Editing 3D Scenes with Instructions: Ayaan Haque,

Matthew Tancik,

Alexei A. Efros,

Aleksander Holynski,

Angjoo Kanazawa; [pdf] [supp]
[bibtex]
@InProceedings{Haque_2023_ICCV,
  author    = {Haque, Ayaan and Tancik, Matthew and Efros, Alexei A. and Holynski, Aleksander and Kanazawa, Angjoo},
  title     = {{Instruct-NeRF2NeRF}: Editing {3D} Scenes with Instructions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19740--19750}
}
Point2Mask: Point-supervised Panoptic Segmentation via Optimal Transport: Wentong Li,

Yuqian Yuan,

Song Wang,

Jianke Zhu,

Jianshu Li,

Jian Liu,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Wentong and Yuan, Yuqian and Wang, Song and Zhu, Jianke and Li, Jianshu and Liu, Jian and Zhang, Lei},
  title     = {{Point2Mask}: Point-supervised Panoptic Segmentation via Optimal Transport},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {572--581}
}
Multi-Task Learning with Knowledge Distillation for Dense Prediction: Yangyang Xu,

Yibo Yang,

Lefei Zhang; [pdf]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yangyang and Yang, Yibo and Zhang, Lefei},
  title     = {Multi-Task Learning with Knowledge Distillation for Dense Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21550--21559}
}
What Does a Platypus Look Like? Generating Customized Prompts for Zero-Shot Image Classification: Sarah Pratt,

Ian Covert,

Rosanne Liu,

Ali Farhadi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pratt_2023_ICCV,
  author    = {Pratt, Sarah and Covert, Ian and Liu, Rosanne and Farhadi, Ali},
  title     = {What Does a Platypus Look Like? {Generating} Customized Prompts for Zero-Shot Image Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15691--15701}
}
Scene as Occupancy: Wenwen Tong,

Chonghao Sima,

Tai Wang,

Li Chen,

Silei Wu,

Hanming Deng,

Yi Gu,

Lewei Lu,

Ping Luo,

Dahua Lin,

Hongyang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tong_2023_ICCV,
  author    = {Tong, Wenwen and Sima, Chonghao and Wang, Tai and Chen, Li and Wu, Silei and Deng, Hanming and Gu, Yi and Lu, Lewei and Luo, Ping and Lin, Dahua and Li, Hongyang},
  title     = {Scene as Occupancy},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8406--8415}
}
U-RED: Unsupervised 3D Shape Retrieval and Deformation for Partial Point Clouds: Yan Di,

Chenyangguang Zhang,

Ruida Zhang,

Fabian Manhardt,

Yongzhi Su,

Jason Rambach,

Didier Stricker,

Xiangyang Ji,

Federico Tombari; [pdf] [supp]
[bibtex]
@InProceedings{Di_2023_ICCV,
  author    = {Di, Yan and Zhang, Chenyangguang and Zhang, Ruida and Manhardt, Fabian and Su, Yongzhi and Rambach, Jason and Stricker, Didier and Ji, Xiangyang and Tombari, Federico},
  title     = {{U-RED}: Unsupervised {3D} Shape Retrieval and Deformation for Partial Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8884--8895}
}
RFLA: A Stealthy Reflected Light Adversarial Attack in the Physical World: Donghua Wang,

Wen Yao,

Tingsong Jiang,

Chao Li,

Xiaoqian Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Donghua and Yao, Wen and Jiang, Tingsong and Li, Chao and Chen, Xiaoqian},
    title     = {{RFLA}: A Stealthy Reflected Light Adversarial Attack in the Physical World},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4455--4465},
}
Nearest Neighbor Guidance for Out-of-Distribution Detection: Jaewoo Park,

Yoon Gyo Jung,

Andrew Beng Jin Teoh; [pdf] [supp]
[bibtex]
@InProceedings{Park_2023_ICCV,
    author    = {Park, Jaewoo and Jung, Yoon Gyo and Teoh, Andrew Beng Jin},
    title     = {Nearest Neighbor Guidance for Out-of-Distribution Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1686--1695},
}
PatchCT: Aligning Patch Set and Label Set with Conditional Transport for Multi-Label Image Classification: Miaoge Li,

Dongsheng Wang,

Xinyang Liu,

Zequn Zeng,

Ruiying Lu,

Bo Chen,

Mingyuan Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Miaoge and Wang, Dongsheng and Liu, Xinyang and Zeng, Zequn and Lu, Ruiying and Chen, Bo and Zhou, Mingyuan},
    title     = {{PatchCT}: Aligning Patch Set and Label Set with Conditional Transport for Multi-Label Image Classification},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15348--15358},
}
VI-Net: Boosting Category-level 6D Object Pose Estimation via Learning Decoupled Rotations on the Spherical Representations: Jiehong Lin,

Zewei Wei,

Yabin Zhang,

Kui Jia; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Jiehong and Wei, Zewei and Zhang, Yabin and Jia, Kui},
    title     = {{VI-Net}: Boosting Category-level {6D} Object Pose Estimation via Learning Decoupled Rotations on the Spherical Representations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14001--14011},
}
ICD-Face: Intra-class Compactness Distillation for Face Recognition: Zhipeng Yu,

Jiaheng Liu,

Haoyu Qin,

Yichao Wu,

Kun Hu,

Jiayi Tian,

Ding Liang; [pdf]
[bibtex]
@InProceedings{Yu_2023_ICCV,
    author    = {Yu, Zhipeng and Liu, Jiaheng and Qin, Haoyu and Wu, Yichao and Hu, Kun and Tian, Jiayi and Liang, Ding},
    title     = {{ICD-Face}: Intra-class Compactness Distillation for Face Recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21042--21052},
}
Diffusion-SDF: Conditional Generative Modeling of Signed Distance Functions: Gene Chou,

Yuval Bahat,

Felix Heide; [pdf]
[bibtex]
@InProceedings{Chou_2023_ICCV,
    author    = {Chou, Gene and Bahat, Yuval and Heide, Felix},
    title     = {{Diffusion-SDF}: Conditional Generative Modeling of Signed Distance Functions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2262--2272},
}
Open-Vocabulary Object Detection With an Open Corpus: Jiong Wang,

Huiming Zhang,

Haiwen Hong,

Xuan Jin,

Yuan He,

Hui Xue,

Zhou Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jiong and Zhang, Huiming and Hong, Haiwen and Jin, Xuan and He, Yuan and Xue, Hui and Zhao, Zhou},
    title     = {Open-Vocabulary Object Detection With an Open Corpus},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6759--6769},
}
Long-range Multimodal Pretraining for Movie Understanding: Dawit Mureja Argaw,

Joon-Young Lee,

Markus Woodson,

In So Kweon,

Fabian Caba Heilbron; [pdf] [arXiv]
[bibtex]
@InProceedings{Argaw_2023_ICCV,
    author    = {Argaw, Dawit Mureja and Lee, Joon-Young and Woodson, Markus and Kweon, In So and Heilbron, Fabian Caba},
    title     = {Long-range Multimodal Pretraining for Movie Understanding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13392--13403},
}
MRM: Masked Relation Modeling for Medical Image Pre-Training with Genetics: Qiushi Yang,

Wuyang Li,

Baopu Li,

Yixuan Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Qiushi and Li, Wuyang and Li, Baopu and Yuan, Yixuan},
    title     = {{MRM}: Masked Relation Modeling for Medical Image Pre-Training with Genetics},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21452--21462},
}
Adverse Weather Removal with Codebook Priors: Tian Ye,

Sixiang Chen,

Jinbin Bai,

Jun Shi,

Chenghao Xue,

Jingxia Jiang,

Junjie Yin,

Erkang Chen,

Yun Liu; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_ICCV,
    author    = {Ye, Tian and Chen, Sixiang and Bai, Jinbin and Shi, Jun and Xue, Chenghao and Jiang, Jingxia and Yin, Junjie and Chen, Erkang and Liu, Yun},
    title     = {Adverse Weather Removal with Codebook Priors},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12653--12664},
}
Spectrum-guided Multi-granularity Referring Video Object Segmentation: Bo Miao,

Mohammed Bennamoun,

Yongsheng Gao,

Ajmal Mian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Miao_2023_ICCV,
    author    = {Miao, Bo and Bennamoun, Mohammed and Gao, Yongsheng and Mian, Ajmal},
    title     = {Spectrum-guided Multi-granularity Referring Video Object Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {920--930},
}
Sound Source Localization is All about Cross-Modal Alignment: Arda Senocak,

Hyeonggon Ryu,

Junsik Kim,

Tae-Hyun Oh,

Hanspeter Pfister,

Joon Son Chung; [pdf] [arXiv]
[bibtex]
@InProceedings{Senocak_2023_ICCV,
    author    = {Senocak, Arda and Ryu, Hyeonggon and Kim, Junsik and Oh, Tae-Hyun and Pfister, Hanspeter and Chung, Joon Son},
    title     = {Sound Source Localization is All about Cross-Modal Alignment},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7777--7787},
}
MAP: Towards Balanced Generalization of IID and OOD through Model-Agnostic Adapters: Min Zhang,

Junkun Yuan,

Yue He,

Wenbin Li,

Zhengyu Chen,

Kun Kuang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Min and Yuan, Junkun and He, Yue and Li, Wenbin and Chen, Zhengyu and Kuang, Kun},
    title     = {{MAP}: Towards Balanced Generalization of {IID} and {OOD} through Model-Agnostic Adapters},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11921--11931},
}
Exploring Group Video Captioning with Efficient Relational Approximation: Wang Lin,

Tao Jin,

Ye Wang,

Wenwen Pan,

Linjun Li,

Xize Cheng,

Zhou Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Wang and Jin, Tao and Wang, Ye and Pan, Wenwen and Li, Linjun and Cheng, Xize and Zhao, Zhou},
    title     = {Exploring Group Video Captioning with Efficient Relational Approximation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15281--15290},
}
ADAPT: Efficient Multi-Agent Trajectory Prediction with Adaptation: Görkay Aydemir,

Adil Kaan Akan,

Fatma Güney; [pdf] [supp]
[bibtex]
@InProceedings{Aydemir_2023_ICCV,
    author    = {Aydemir, G{\"o}rkay and Akan, Adil Kaan and G{\"u}ney, Fatma},
    title     = {{ADAPT}: Efficient Multi-Agent Trajectory Prediction with Adaptation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8295--8305},
}
TaskExpert: Dynamically Assembling Multi-Task Representations with Memorial Mixture-of-Experts: Hanrong Ye,

Dan Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
    author    = {Ye, Hanrong and Xu, Dan},
    title     = {{TaskExpert}: Dynamically Assembling Multi-Task Representations with Memorial Mixture-of-Experts},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {21828--21837},
}
Meta OOD Learning For Continuously Adaptive OOD Detection: Xinheng Wu,

Jie Lu,

Zhen Fang,

Guangquan Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Xinheng and Lu, Jie and Fang, Zhen and Zhang, Guangquan},
    title     = {Meta {OOD} Learning For Continuously Adaptive {OOD} Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19353--19364},
}
MAPConNet: Self-supervised 3D Pose Transfer with Mesh and Point Contrastive Learning: Jiaze Sun,

Zhixiang Chen,

Tae-Kyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
    author    = {Sun, Jiaze and Chen, Zhixiang and Kim, Tae-Kyun},
    title     = {{MAPConNet}: Self-supervised {3D} Pose Transfer with Mesh and Point Contrastive Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14452--14462},
}
BlendFace: Re-designing Identity Encoders for Face-Swapping: Kaede Shiohara,

Xingchao Yang,

Takafumi Taketomi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shiohara_2023_ICCV,
    author    = {Shiohara, Kaede and Yang, Xingchao and Taketomi, Takafumi},
    title     = {{BlendFace}: Re-designing Identity Encoders for Face-Swapping},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7634--7644},
}
Test-time Personalizable Forecasting of 3D Human Poses: Qiongjie Cui,

Huaijiang Sun,

Jianfeng Lu,

Weiqing Li,

Bin Li,

Hongwei Yi,

Haofan Wang; [pdf] [supp]
[bibtex]
@InProceedings{Cui_2023_ICCV,
    author    = {Cui, Qiongjie and Sun, Huaijiang and Lu, Jianfeng and Li, Weiqing and Li, Bin and Yi, Hongwei and Wang, Haofan},
    title     = {Test-time Personalizable Forecasting of {3D} Human Poses},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {274--283},
}
Few-shot Continual Infomax Learning: Ziqi Gu,

Chunyan Xu,

Jian Yang,

Zhen Cui; [pdf] [supp]
[bibtex]
@InProceedings{Gu_2023_ICCV,
    author    = {Gu, Ziqi and Xu, Chunyan and Yang, Jian and Cui, Zhen},
    title     = {Few-shot Continual Infomax Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19224--19233},
}
A Parse-Then-Place Approach for Generating Graphic Layouts from Textual Descriptions: Jiawei Lin,

Jiaqi Guo,

Shizhao Sun,

Weijiang Xu,

Ting Liu,

Jian-Guang Lou,

Dongmei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Jiawei and Guo, Jiaqi and Sun, Shizhao and Xu, Weijiang and Liu, Ting and Lou, Jian-Guang and Zhang, Dongmei},
    title     = {A Parse-Then-Place Approach for Generating Graphic Layouts from Textual Descriptions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23622--23631},
}
DreamBooth3D: Subject-Driven Text-to-3D Generation: Amit Raj,

Srinivas Kaza,

Ben Poole,

Michael Niemeyer,

Nataniel Ruiz,

Ben Mildenhall,

Shiran Zada,

Kfir Aberman,

Michael Rubinstein,

Jonathan Barron,

Yuanzhen Li,

Varun Jampani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Raj_2023_ICCV,
    author    = {Raj, Amit and Kaza, Srinivas and Poole, Ben and Niemeyer, Michael and Ruiz, Nataniel and Mildenhall, Ben and Zada, Shiran and Aberman, Kfir and Rubinstein, Michael and Barron, Jonathan and Li, Yuanzhen and Jampani, Varun},
    title     = {{DreamBooth3D}: Subject-Driven Text-to-{3D} Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2349--2359},
}
DARTH: Holistic Test-time Adaptation for Multiple Object Tracking: Mattia Segu,

Bernt Schiele,

Fisher Yu; [pdf] [supp]
[bibtex]
@InProceedings{Segu_2023_ICCV,
    author    = {Segu, Mattia and Schiele, Bernt and Yu, Fisher},
    title     = {{DARTH}: Holistic Test-time Adaptation for Multiple Object Tracking},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9717--9727},
}
Multi-interactive Feature Learning and a Full-time Multi-modality Benchmark for Image Fusion and Segmentation: Jinyuan Liu,

Zhu Liu,

Guanyao Wu,

Long Ma,

Risheng Liu,

Wei Zhong,

Zhongxuan Luo,

Xin Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Jinyuan and Liu, Zhu and Wu, Guanyao and Ma, Long and Liu, Risheng and Zhong, Wei and Luo, Zhongxuan and Fan, Xin},
    title     = {Multi-interactive Feature Learning and a Full-time Multi-modality Benchmark for Image Fusion and Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8115--8124},
}
BaRe-ESA: A Riemannian Framework for Unregistered Human Body Shapes: Emmanuel Hartman,

Emery Pierson,

Martin Bauer,

Nicolas Charon,

Mohamed Daoudi; [pdf] [supp]
[bibtex]
@InProceedings{Hartman_2023_ICCV,
    author    = {Hartman, Emmanuel and Pierson, Emery and Bauer, Martin and Charon, Nicolas and Daoudi, Mohamed},
    title     = {{BaRe-ESA}: A {Riemannian} Framework for Unregistered Human Body Shapes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14181--14191},
}
Skip-Plan: Procedure Planning in Instructional Videos via Condensed Action Space Learning: Zhiheng Li,

Wenjia Geng,

Muheng Li,

Lei Chen,

Yansong Tang,

Jiwen Lu,

Jie Zhou; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Zhiheng and Geng, Wenjia and Li, Muheng and Chen, Lei and Tang, Yansong and Lu, Jiwen and Zhou, Jie},
    title     = {{Skip-Plan}: Procedure Planning in Instructional Videos via Condensed Action Space Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10297--10306},
}
A Retrospect to Multi-prompt Learning across Vision and Language: Ziliang Chen,

Xin Huang,

Quanlong Guan,

Liang Lin,

Weiqi Luo; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Ziliang and Huang, Xin and Guan, Quanlong and Lin, Liang and Luo, Weiqi},
    title     = {A Retrospect to Multi-prompt Learning across Vision and Language},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22190--22201},
}
Sparse Instance Conditioned Multimodal Trajectory Prediction: Yonghao Dong,

Le Wang,

Sanping Zhou,

Gang Hua; [pdf]
[bibtex]
@InProceedings{Dong_2023_ICCV,
    author    = {Dong, Yonghao and Wang, Le and Zhou, Sanping and Hua, Gang},
    title     = {Sparse Instance Conditioned Multimodal Trajectory Prediction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9763--9772},
}
Label Shift Adapter for Test-Time Adaptation under Covariate and Label Shifts: Sunghyun Park,

Seunghan Yang,

Jaegul Choo,

Sungrack Yun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
    author    = {Park, Sunghyun and Yang, Seunghan and Choo, Jaegul and Yun, Sungrack},
    title     = {Label Shift Adapter for Test-Time Adaptation under Covariate and Label Shifts},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16421--16431},
}
NAPA-VQ: Neighborhood-Aware Prototype Augmentation with Vector Quantization for Continual Learning: Tamasha Malepathirana,

Damith Senanayake,

Saman Halgamuge; [pdf] [supp]
[bibtex]
@InProceedings{Malepathirana_2023_ICCV,
    author    = {Malepathirana, Tamasha and Senanayake, Damith and Halgamuge, Saman},
    title     = {{NAPA-VQ}: Neighborhood-Aware Prototype Augmentation with Vector Quantization for Continual Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11674--11684},
}
Dynamic Snake Convolution Based on Topological Geometric Constraints for Tubular Structure Segmentation: Yaolei Qi,

Yuting He,

Xiaoming Qi,

Yuan Zhang,

Guanyu Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qi_2023_ICCV,
    author    = {Qi, Yaolei and He, Yuting and Qi, Xiaoming and Zhang, Yuan and Yang, Guanyu},
    title     = {Dynamic Snake Convolution Based on Topological Geometric Constraints for Tubular Structure Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6070--6079},
}
Unsupervised Open-Vocabulary Object Localization in Videos: Ke Fan,

Zechen Bai,

Tianjun Xiao,

Dominik Zietlow,

Max Horn,

Zixu Zhao,

Carl-Johann Simon-Gabriel,

Mike Zheng Shou,

Francesco Locatello,

Bernt Schiele,

Thomas Brox,

Zheng Zhang,

Yanwei Fu,

Tong He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
    author    = {Fan, Ke and Bai, Zechen and Xiao, Tianjun and Zietlow, Dominik and Horn, Max and Zhao, Zixu and Simon-Gabriel, Carl-Johann and Shou, Mike Zheng and Locatello, Francesco and Schiele, Bernt and Brox, Thomas and Zhang, Zheng and Fu, Yanwei and He, Tong},
    title     = {Unsupervised Open-Vocabulary Object Localization in Videos},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13747--13755},
}
Dataset Quantization: Daquan Zhou,

Kai Wang,

Jianyang Gu,

Xiangyu Peng,

Dongze Lian,

Yifan Zhang,

Yang You,

Jiashi Feng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Daquan and Wang, Kai and Gu, Jianyang and Peng, Xiangyu and Lian, Dongze and Zhang, Yifan and You, Yang and Feng, Jiashi},
    title     = {Dataset Quantization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17205--17216},
}
Unsupervised Video Deraining with An Event Camera: Jin Wang,

Wenming Weng,

Yueyi Zhang,

Zhiwei Xiong; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Jin and Weng, Wenming and Zhang, Yueyi and Xiong, Zhiwei},
    title     = {Unsupervised Video Deraining with An Event Camera},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10831--10840},
}
Overcoming Forgetting Catastrophe in Quantization-Aware Training: Ting-An Chen,

De-Nian Yang,

Ming-Syan Chen; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Ting-An and Yang, De-Nian and Chen, Ming-Syan},
    title     = {Overcoming Forgetting Catastrophe in Quantization-Aware Training},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17358--17367},
}
DIME-FM : DIstilling Multimodal and Efficient Foundation Models: Ximeng Sun,

Pengchuan Zhang,

Peizhao Zhang,

Hardik Shah,

Kate Saenko,

Xide Xia; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
    author    = {Sun, Ximeng and Zhang, Pengchuan and Zhang, Peizhao and Shah, Hardik and Saenko, Kate and Xia, Xide},
    title     = {{DIME-FM} : {DIstilling} Multimodal and Efficient Foundation Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15521--15533},
}
Boosting Single Image Super-Resolution via Partial Channel Shifting: Xiaoming Zhang,

Tianrui Li,

Xiaole Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Xiaoming and Li, Tianrui and Zhao, Xiaole},
    title     = {Boosting Single Image Super-Resolution via Partial Channel Shifting},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13223--13232},
}
Learning to Upsample by Learning to Sample: Wenze Liu,

Hao Lu,

Hongtao Fu,

Zhiguo Cao; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Wenze and Lu, Hao and Fu, Hongtao and Cao, Zhiguo},
    title     = {Learning to Upsample by Learning to Sample},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6027--6037},
}
LayoutDiffusion: Improving Graphic Layout Generation by Discrete Diffusion Probabilistic Models: Junyi Zhang,

Jiaqi Guo,

Shizhao Sun,

Jian-Guang Lou,

Dongmei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Junyi and Guo, Jiaqi and Sun, Shizhao and Lou, Jian-Guang and Zhang, Dongmei},
    title     = {{LayoutDiffusion}: Improving Graphic Layout Generation by Discrete Diffusion Probabilistic Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7226--7236},
}
Efficiently Robustify Pre-Trained Models: Nishant Jain,

Harkirat Behl,

Yogesh Singh Rawat,

Vibhav Vineet; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jain_2023_ICCV,
    author    = {Jain, Nishant and Behl, Harkirat and Rawat, Yogesh Singh and Vineet, Vibhav},
    title     = {Efficiently Robustify Pre-Trained Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5505--5515},
}
Efficient Video Prediction via Sparsely Conditioned Flow Matching: Aram Davtyan,

Sepehr Sameni,

Paolo Favaro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Davtyan_2023_ICCV,
    author    = {Davtyan, Aram and Sameni, Sepehr and Favaro, Paolo},
    title     = {Efficient Video Prediction via Sparsely Conditioned Flow Matching},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23263--23274},
}
Surface Normal Clustering for Implicit Representation of Manhattan Scenes: Nikola Popovic,

Danda Pani Paudel,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Popovic_2023_ICCV,
    author    = {Popovic, Nikola and Paudel, Danda Pani and Van Gool, Luc},
    title     = {Surface Normal Clustering for Implicit Representation of {Manhattan} Scenes},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17860--17870},
}
Distracting Downpour: Adversarial Weather Attacks for Motion Estimation: Jenny Schmalfuss,

Lukas Mehl,

Andrés Bruhn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Schmalfuss_2023_ICCV,
    author    = {Schmalfuss, Jenny and Mehl, Lukas and Bruhn, Andr{\'e}s},
    title     = {Distracting Downpour: Adversarial Weather Attacks for Motion Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10106--10116},
}
Adaptive Similarity Bootstrapping for Self-Distillation Based Representation Learning: Tim Lebailly,

Thomas Stegmüller,

Behzad Bozorgtabar,

Jean-Philippe Thiran,

Tinne Tuytelaars; [pdf] [supp]
[bibtex]
@InProceedings{Lebailly_2023_ICCV,
    author    = {Lebailly, Tim and Stegm{\"u}ller, Thomas and Bozorgtabar, Behzad and Thiran, Jean-Philippe and Tuytelaars, Tinne},
    title     = {Adaptive Similarity Bootstrapping for Self-Distillation Based Representation Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16505--16514},
}
Generalized Differentiable RANSAC: Tong Wei,

Yash Patel,

Alexander Shekhovtsov,

Jiri Matas,

Daniel Barath; [pdf] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
    author    = {Wei, Tong and Patel, Yash and Shekhovtsov, Alexander and Matas, Jiri and Barath, Daniel},
    title     = {Generalized Differentiable {RANSAC}},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17649--17660},
}
Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging: Siming Zheng,

Xin Yuan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Siming and Yuan, Xin},
    title     = {Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12738--12749},
}
Non-Semantics Suppressed Mask Learning for Unsupervised Video Semantic Compression: Yuan Tian,

Guo Lu,

Guangtao Zhai,

Zhiyong Gao; [pdf]
[bibtex]
@InProceedings{Tian_2023_ICCV,
    author    = {Tian, Yuan and Lu, Guo and Zhai, Guangtao and Gao, Zhiyong},
    title     = {Non-Semantics Suppressed Mask Learning for Unsupervised Video Semantic Compression},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13610--13622},
}
ResQ: Residual Quantization for Video Perception: Davide Abati,

Haitam Ben Yahia,

Markus Nagel,

Amirhossein Habibian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Abati_2023_ICCV,
    author    = {Abati, Davide and Ben Yahia, Haitam and Nagel, Markus and Habibian, Amirhossein},
    title     = {{ResQ}: Residual Quantization for Video Perception},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17119--17129},
}
Inverse Compositional Learning for Weakly-supervised Relation Grounding: Huan Li,

Ping Wei,

Zeyu Ma,

Nanning Zheng; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Huan and Wei, Ping and Ma, Zeyu and Zheng, Nanning},
    title     = {Inverse Compositional Learning for Weakly-supervised Relation Grounding},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15477--15487},
}
XMem++: Production-level Video Segmentation From Few Annotated Frames: Maksym Bekuzarov,

Ariana Bermudez,

Joon-Young Lee,

Hao Li; [pdf] [supp]
[bibtex]
@InProceedings{Bekuzarov_2023_ICCV,
    author    = {Bekuzarov, Maksym and Bermudez, Ariana and Lee, Joon-Young and Li, Hao},
    title     = {{XMem++}: Production-level Video Segmentation From Few Annotated Frames},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {635--644},
}
MHCN: A Hyperbolic Neural Network Model for Multi-view Hierarchical Clustering: Fangfei Lin,

Bing Bai,

Yiwen Guo,

Hao Chen,

Yazhou Ren,

Zenglin Xu; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_ICCV,
    author    = {Lin, Fangfei and Bai, Bing and Guo, Yiwen and Chen, Hao and Ren, Yazhou and Xu, Zenglin},
    title     = {{MHCN}: A Hyperbolic Neural Network Model for Multi-view Hierarchical Clustering},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16525--16535},
}
End-to-End Diffusion Latent Optimization Improves Classifier Guidance: Bram Wallace,

Akash Gokul,

Stefano Ermon,

Nikhil Naik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wallace_2023_ICCV,
    author    = {Wallace, Bram and Gokul, Akash and Ermon, Stefano and Naik, Nikhil},
    title     = {End-to-End Diffusion Latent Optimization Improves Classifier Guidance},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7280--7290},
}
FineRecon: Depth-aware Feed-forward Network for Detailed 3D Reconstruction: Noah Stier,

Anurag Ranjan,

Alex Colburn,

Yajie Yan,

Liang Yang,

Fangchang Ma,

Baptiste Angles; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Stier_2023_ICCV,
    author    = {Stier, Noah and Ranjan, Anurag and Colburn, Alex and Yan, Yajie and Yang, Liang and Ma, Fangchang and Angles, Baptiste},
    title     = {{FineRecon}: Depth-aware Feed-forward Network for Detailed {3D} Reconstruction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18423--18432},
}
Navigating to Objects Specified by Images: Jacob Krantz,

Theophile Gervet,

Karmesh Yadav,

Austin Wang,

Chris Paxton,

Roozbeh Mottaghi,

Dhruv Batra,

Jitendra Malik,

Stefan Lee,

Devendra Singh Chaplot; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Krantz_2023_ICCV,
    author    = {Krantz, Jacob and Gervet, Theophile and Yadav, Karmesh and Wang, Austin and Paxton, Chris and Mottaghi, Roozbeh and Batra, Dhruv and Malik, Jitendra and Lee, Stefan and Chaplot, Devendra Singh},
    title     = {Navigating to Objects Specified by Images},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10916--10925},
}
TRM-UAP: Enhancing the Transferability of Data-Free Universal Adversarial Perturbation via Truncated Ratio Maximization: Yiran Liu,

Xin Feng,

Yunlong Wang,

Wu Yang,

Di Ming; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Yiran and Feng, Xin and Wang, Yunlong and Yang, Wu and Ming, Di},
    title     = {{TRM-UAP}: Enhancing the Transferability of Data-Free Universal Adversarial Perturbation via Truncated Ratio Maximization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4762--4771},
}
LATR: 3D Lane Detection from Monocular Images with Transformer: Yueru Luo,

Chaoda Zheng,

Xu Yan,

Tang Kun,

Chao Zheng,

Shuguang Cui,

Zhen Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
    author    = {Luo, Yueru and Zheng, Chaoda and Yan, Xu and Kun, Tang and Zheng, Chao and Cui, Shuguang and Li, Zhen},
    title     = {{LATR}: {3D} Lane Detection from Monocular Images with Transformer},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7941--7952},
}
Scratching Visual Transformer's Back with Uniform Attention: Nam Hyeon-Woo,

Kim Yu-Ji,

Byeongho Heo,

Dongyoon Han,

Seong Joon Oh,

Tae-Hyun Oh; [pdf] [supp]
[bibtex]
@InProceedings{Hyeon-Woo_2023_ICCV,
    author    = {Hyeon-Woo, Nam and Yu-Ji, Kim and Heo, Byeongho and Han, Dongyoon and Oh, Seong Joon and Oh, Tae-Hyun},
    title     = {Scratching Visual Transformer's Back with Uniform Attention},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5807--5818},
}
Tune-A-Video: One-Shot Tuning of Image Diffusion Models for Text-to-Video Generation: Jay Zhangjie Wu,

Yixiao Ge,

Xintao Wang,

Stan Weixian Lei,

Yuchao Gu,

Yufei Shi,

Wynne Hsu,

Ying Shan,

Xiaohu Qie,

Mike Zheng Shou; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Jay Zhangjie and Ge, Yixiao and Wang, Xintao and Lei, Stan Weixian and Gu, Yuchao and Shi, Yufei and Hsu, Wynne and Shan, Ying and Qie, Xiaohu and Shou, Mike Zheng},
    title     = {{Tune-A-Video}: One-Shot Tuning of Image Diffusion Models for Text-to-Video Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7623--7633},
}
Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection: Yilong Lv,

Min Li,

Yujie He,

Shaopeng Li,

Zhuzhen He,

Aitao Yang; [pdf]
[bibtex]
@InProceedings{Lv_2023_ICCV,
    author    = {Lv, Yilong and Li, Min and He, Yujie and Li, Shaopeng and He, Zhuzhen and Yang, Aitao},
    title     = {Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6275--6284},
}
Environment-Invariant Curriculum Relation Learning for Fine-Grained Scene Graph Generation: Yukuan Min,

Aming Wu,

Cheng Deng; [pdf] [arXiv]
[bibtex]
@InProceedings{Min_2023_ICCV,
  author    = {Min, Yukuan and Wu, Aming and Deng, Cheng},
  title     = {Environment-Invariant Curriculum Relation Learning for Fine-Grained Scene Graph Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13296--13307}
}
Extensible and Efficient Proxy for Neural Architecture Search: Yuhong Li,

Jiajie Li,

Cong Hao,

Pan Li,

Jinjun Xiong,

Deming Chen; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yuhong and Li, Jiajie and Hao, Cong and Li, Pan and Xiong, Jinjun and Chen, Deming},
  title     = {Extensible and Efficient Proxy for Neural Architecture Search},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6199--6210}
}
Zenseact Open Dataset: A Large-Scale and Diverse Multimodal Dataset for Autonomous Driving: Mina Alibeigi,

William Ljungbergh,

Adam Tonderski,

Georg Hess,

Adam Lilja,

Carl Lindström,

Daria Motorniuk,

Junsheng Fu,

Jenny Widahl,

Christoffer Petersson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alibeigi_2023_ICCV,
  author    = {Alibeigi, Mina and Ljungbergh, William and Tonderski, Adam and Hess, Georg and Lilja, Adam and Lindstr{\"o}m, Carl and Motorniuk, Daria and Fu, Junsheng and Widahl, Jenny and Petersson, Christoffer},
  title     = {{Zenseact} Open Dataset: A Large-Scale and Diverse Multimodal Dataset for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20178--20188}
}
MAAL: Multimodality-Aware Autoencoder-Based Affordance Learning for 3D Articulated Objects: Yuanzhi Liang,

Xiaohan Wang,

Linchao Zhu,

Yi Yang; [pdf] [supp]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Yuanzhi and Wang, Xiaohan and Zhu, Linchao and Yang, Yi},
  title     = {{MAAL}: Multimodality-Aware Autoencoder-Based Affordance Learning for {3D} Articulated Objects},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {217--227}
}
Generalizable Decision Boundaries: Dualistic Meta-Learning for Open Set Domain Generalization: Xiran Wang,

Jian Zhang,

Lei Qi,

Yinghuan Shi; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiran and Zhang, Jian and Qi, Lei and Shi, Yinghuan},
  title     = {Generalizable Decision Boundaries: Dualistic Meta-Learning for Open Set Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11564--11573}
}
Benchmarking and Analyzing Robust Point Cloud Recognition: Bag of Tricks for Defending Adversarial Examples: Qiufan Ji,

Lin Wang,

Cong Shi,

Shengshan Hu,

Yingying Chen,

Lichao Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ji_2023_ICCV,
  author    = {Ji, Qiufan and Wang, Lin and Shi, Cong and Hu, Shengshan and Chen, Yingying and Sun, Lichao},
  title     = {Benchmarking and Analyzing Robust Point Cloud Recognition: Bag of Tricks for Defending Adversarial Examples},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4295--4304}
}
Weakly Supervised Referring Image Segmentation with Intra-Chunk and Inter-Chunk Consistency: Jungbeom Lee,

Sungjin Lee,

Jinseok Nam,

Seunghak Yu,

Jaeyoung Do,

Tara Taghavi; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jungbeom and Lee, Sungjin and Nam, Jinseok and Yu, Seunghak and Do, Jaeyoung and Taghavi, Tara},
  title     = {Weakly Supervised Referring Image Segmentation with Intra-Chunk and Inter-Chunk Consistency},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21870--21881}
}
Poincare ResNet: Max van Spengler,

Erwin Berkhout,

Pascal Mettes; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{van_Spengler_2023_ICCV,
  author    = {van Spengler, Max and Berkhout, Erwin and Mettes, Pascal},
  title     = {{Poincare} {ResNet}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5419--5428}
}
Parameterized Cost Volume for Stereo Matching: Jiaxi Zeng,

Chengtang Yao,

Lidong Yu,

Yuwei Wu,

Yunde Jia; [pdf] [supp]
[bibtex]
@InProceedings{Zeng_2023_ICCV,
  author    = {Zeng, Jiaxi and Yao, Chengtang and Yu, Lidong and Wu, Yuwei and Jia, Yunde},
  title     = {Parameterized Cost Volume for Stereo Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18347--18357}
}
SAFE: Sensitivity-Aware Features for Out-of-Distribution Object Detection: Samuel Wilson,

Tobias Fischer,

Feras Dayoub,

Dimity Miller,

Niko Sünderhauf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wilson_2023_ICCV,
  author    = {Wilson, Samuel and Fischer, Tobias and Dayoub, Feras and Miller, Dimity and S{\"u}nderhauf, Niko},
  title     = {{SAFE}: Sensitivity-Aware Features for Out-of-Distribution Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23565--23576}
}
SimFIR: A Simple Framework for Fisheye Image Rectification with Self-supervised Representation Learning: Hao Feng,

Wendi Wang,

Jiajun Deng,

Wengang Zhou,

Li Li,

Houqiang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Hao and Wang, Wendi and Deng, Jiajun and Zhou, Wengang and Li, Li and Li, Houqiang},
  title     = {{SimFIR}: A Simple Framework for Fisheye Image Rectification with Self-supervised Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12418--12427}
}
Subclass-balancing Contrastive Learning for Long-tailed Recognition: Chengkai Hou,

Jieyu Zhang,

Haonan Wang,

Tianyi Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hou_2023_ICCV,
  author    = {Hou, Chengkai and Zhang, Jieyu and Wang, Haonan and Zhou, Tianyi},
  title     = {Subclass-balancing Contrastive Learning for Long-tailed Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5395--5407}
}
Generalized Lightness Adaptation with Channel Selective Normalization: Mingde Yao,

Jie Huang,

Xin Jin,

Ruikang Xu,

Shenglong Zhou,

Man Zhou,

Zhiwei Xiong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Mingde and Huang, Jie and Jin, Xin and Xu, Ruikang and Zhou, Shenglong and Zhou, Man and Xiong, Zhiwei},
  title     = {Generalized Lightness Adaptation with Channel Selective Normalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10668--10679}
}
Omnidirectional Information Gathering for Knowledge Transfer-Based Audio-Visual Navigation: Jinyu Chen,

Wenguan Wang,

Si Liu,

Hongsheng Li,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Jinyu and Wang, Wenguan and Liu, Si and Li, Hongsheng and Yang, Yi},
  title     = {Omnidirectional Information Gathering for Knowledge Transfer-Based Audio-Visual Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10993--11003}
}
Multi-Scale Bidirectional Recurrent Network with Hybrid Correlation for Point Cloud Based Scene Flow Estimation: Wencan Cheng,

Jong Hwan Ko; [pdf]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Wencan and Ko, Jong Hwan},
  title     = {Multi-Scale Bidirectional Recurrent Network with Hybrid Correlation for Point Cloud Based Scene Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10041--10050}
}
Dynamic Mesh-Aware Radiance Fields: Yi-Ling Qiao,

Alexander Gao,

Yiran Xu,

Yue Feng,

Jia-Bin Huang,

Ming C. Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qiao_2023_ICCV,
  author    = {Qiao, Yi-Ling and Gao, Alexander and Xu, Yiran and Feng, Yue and Huang, Jia-Bin and Lin, Ming C.},
  title     = {Dynamic Mesh-Aware Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {385--396}
}
Learning Support and Trivial Prototypes for Interpretable Image Classification: Chong Wang,

Yuyuan Liu,

Yuanhong Chen,

Fengbei Liu,

Yu Tian,

Davis McCarthy,

Helen Frazer,

Gustavo Carneiro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Chong and Liu, Yuyuan and Chen, Yuanhong and Liu, Fengbei and Tian, Yu and McCarthy, Davis and Frazer, Helen and Carneiro, Gustavo},
  title     = {Learning Support and Trivial Prototypes for Interpretable Image Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2062--2072}
}
Decoupled DETR: Spatially Disentangling Localization and Classification for Improved End-to-End Object Detection: Manyuan Zhang,

Guanglu Song,

Yu Liu,

Hongsheng Li; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Manyuan and Song, Guanglu and Liu, Yu and Li, Hongsheng},
  title     = {Decoupled {DETR}: Spatially Disentangling Localization and Classification for Improved End-to-End Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6601--6610}
}
GIFD: A Generative Gradient Inversion Method with Feature Domain Optimization: Hao Fang,

Bin Chen,

Xuan Wang,

Zhi Wang,

Shu-Tao Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Hao and Chen, Bin and Wang, Xuan and Wang, Zhi and Xia, Shu-Tao},
  title     = {{GIFD}: A Generative Gradient Inversion Method with Feature Domain Optimization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4967--4976}
}
VLN-PETL: Parameter-Efficient Transfer Learning for Vision-and-Language Navigation: Yanyuan Qiao,

Zheng Yu,

Qi Wu; [pdf] [supp]
[bibtex]
@InProceedings{Qiao_2023_ICCV,
  author    = {Qiao, Yanyuan and Yu, Zheng and Wu, Qi},
  title     = {{VLN-PETL}: Parameter-Efficient Transfer Learning for Vision-and-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15443--15452}
}
Generalized Sum Pooling for Metric Learning: Yeti Z. Gürbüz,

Ozan Sener,

A. Aydin Alatan; [pdf] [supp]
[bibtex]
@InProceedings{Gurbuz_2023_ICCV,
  author    = {G{\"u}rb{\"u}z, Yeti Z. and Sener, Ozan and Alatan, A. Aydin},
  title     = {Generalized Sum Pooling for Metric Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5462--5473}
}
AlignDet: Aligning Pre-training and Fine-tuning in Object Detection: Ming Li,

Jie Wu,

Xionghui Wang,

Chen Chen,

Jie Qin,

Xuefeng Xiao,

Rui Wang,

Min Zheng,

Xin Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Ming and Wu, Jie and Wang, Xionghui and Chen, Chen and Qin, Jie and Xiao, Xuefeng and Wang, Rui and Zheng, Min and Pan, Xin},
  title     = {{AlignDet}: Aligning Pre-training and Fine-tuning in Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6866--6876}
}
Learning Continuous Exposure Value Representations for Single-Image HDR Reconstruction: Su-Kai Chen,

Hung-Lin Yen,

Yu-Lun Liu,

Min-Hung Chen,

Hou-Ning Hu,

Wen-Hsiao Peng,

Yen-Yu Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Su-Kai and Yen, Hung-Lin and Liu, Yu-Lun and Chen, Min-Hung and Hu, Hou-Ning and Peng, Wen-Hsiao and Lin, Yen-Yu},
  title     = {Learning Continuous Exposure Value Representations for Single-Image {HDR} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12990--13000}
}
DREAM: Efficient Dataset Distillation by Representative Matching: Yanqing Liu,

Jianyang Gu,

Kai Wang,

Zheng Zhu,

Wei Jiang,

Yang You; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yanqing and Gu, Jianyang and Wang, Kai and Zhu, Zheng and Jiang, Wei and You, Yang},
  title     = {{DREAM}: Efficient Dataset Distillation by Representative Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17314--17324}
}
MixSynthFormer: A Transformer Encoder-like Structure with Mixed Synthetic Self-attention for Efficient Human Pose Estimation: Yuran Sun,

Alan William Dougherty,

Zhuoying Zhang,

Yi King Choi,

Chuan Wu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Yuran and Dougherty, Alan William and Zhang, Zhuoying and Choi, Yi King and Wu, Chuan},
  title     = {{MixSynthFormer}: A Transformer Encoder-like Structure with Mixed Synthetic Self-attention for Efficient Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14884--14893}
}
Focus on Your Target: A Dual Teacher-Student Framework for Domain-Adaptive Semantic Segmentation: Xinyue Huo,

Lingxi Xie,

Wengang Zhou,

Houqiang Li,

Qi Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huo_2023_ICCV,
  author    = {Huo, Xinyue and Xie, Lingxi and Zhou, Wengang and Li, Houqiang and Tian, Qi},
  title     = {Focus on Your Target: A Dual Teacher-Student Framework for Domain-Adaptive Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19027--19038}
}
Enhanced Meta Label Correction for Coping with Label Corruption: Mitchell Keren Taraday,

Chaim Baskin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Taraday_2023_ICCV,
  author    = {Taraday, Mitchell Keren and Baskin, Chaim},
  title     = {Enhanced Meta Label Correction for Coping with Label Corruption},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16295--16304}
}
Dense Text-to-Image Generation with Attention Modulation: Yunji Kim,

Jiyoung Lee,

Jin-Hwa Kim,

Jung-Woo Ha,

Jun-Yan Zhu; [pdf] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Yunji and Lee, Jiyoung and Kim, Jin-Hwa and Ha, Jung-Woo and Zhu, Jun-Yan},
  title     = {Dense Text-to-Image Generation with Attention Modulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7701--7711}
}
HumanMAC: Masked Motion Completion for Human Motion Prediction: Ling-Hao Chen,

JiaWei Zhang,

Yewen Li,

Yiren Pang,

Xiaobo Xia,

Tongliang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ling-Hao and Zhang, JiaWei and Li, Yewen and Pang, Yiren and Xia, Xiaobo and Liu, Tongliang},
  title     = {{HumanMAC}: Masked Motion Completion for Human Motion Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9544--9555}
}
Will Large-scale Generative Models Corrupt Future Datasets?: Ryuichiro Hataya,

Han Bao,

Hiromi Arai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hataya_2023_ICCV,
  author    = {Hataya, Ryuichiro and Bao, Han and Arai, Hiromi},
  title     = {Will Large-scale Generative Models Corrupt Future Datasets?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20555--20565}
}
SHACIRA: Scalable HAsh-grid Compression for Implicit Neural Representations: Sharath Girish,

Abhinav Shrivastava,

Kamal Gupta; [pdf] [supp]
[bibtex]
@InProceedings{Girish_2023_ICCV,
  author    = {Girish, Sharath and Shrivastava, Abhinav and Gupta, Kamal},
  title     = {{SHACIRA}: Scalable {HAsh-grid} Compression for Implicit Neural Representations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17513--17524}
}
Prompt Switch: Efficient CLIP Adaptation for Text-Video Retrieval: Chaorui Deng,

Qi Chen,

Pengda Qin,

Da Chen,

Qi Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Chaorui and Chen, Qi and Qin, Pengda and Chen, Da and Wu, Qi},
  title     = {Prompt Switch: Efficient {CLIP} Adaptation for Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15648--15658}
}
Video Action Recognition with Attentive Semantic Units: Yifei Chen,

Dapeng Chen,

Ruijin Liu,

Hao Li,

Wei Peng; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yifei and Chen, Dapeng and Liu, Ruijin and Li, Hao and Peng, Wei},
  title     = {Video Action Recognition with Attentive Semantic Units},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10170--10180}
}
Sentence Attention Blocks for Answer Grounding: Seyedalireza Khoshsirat,

Chandra Kambhamettu; [pdf] [arXiv]
[bibtex]
@InProceedings{Khoshsirat_2023_ICCV,
  author    = {Khoshsirat, Seyedalireza and Kambhamettu, Chandra},
  title     = {Sentence Attention Blocks for Answer Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6080--6090}
}
Scanning Only Once: An End-to-end Framework for Fast Temporal Grounding in Long Videos: Yulin Pan,

Xiangteng He,

Biao Gong,

Yiliang Lv,

Yujun Shen,

Yuxin Peng,

Deli Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Yulin and He, Xiangteng and Gong, Biao and Lv, Yiliang and Shen, Yujun and Peng, Yuxin and Zhao, Deli},
  title     = {Scanning Only Once: An End-to-end Framework for Fast Temporal Grounding in Long Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13767--13777}
}
A Low-Shot Object Counting Network With Iterative Prototype Adaptation: Nikola Đukić,

Alan Lukežič,

Vitjan Zavrtanik,

Matej Kristan; [pdf]
[bibtex]
@InProceedings{Dukic_2023_ICCV,
  author    = {{\DJ}uki{\'c}, Nikola and Luke{\v{z}}i{\v{c}}, Alan and Zavrtanik, Vitjan and Kristan, Matej},
  title     = {A Low-Shot Object Counting Network With Iterative Prototype Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18872--18881}
}
Towards Fairness-aware Adversarial Network Pruning: Lei Zhang,

Zhibo Wang,

Xiaowei Dong,

Yunhe Feng,

Xiaoyi Pang,

Zhifei Zhang,

Kui Ren; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Lei and Wang, Zhibo and Dong, Xiaowei and Feng, Yunhe and Pang, Xiaoyi and Zhang, Zhifei and Ren, Kui},
  title     = {Towards Fairness-aware Adversarial Network Pruning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5168--5177}
}
VoroMesh: Learning Watertight Surface Meshes with Voronoi Diagrams: Nissim Maruani,

Roman Klokov,

Maks Ovsjanikov,

Pierre Alliez,

Mathieu Desbrun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Maruani_2023_ICCV,
  author    = {Maruani, Nissim and Klokov, Roman and Ovsjanikov, Maks and Alliez, Pierre and Desbrun, Mathieu},
  title     = {{VoroMesh}: Learning Watertight Surface Meshes with {Voronoi} Diagrams},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14565--14574}
}
Breaking Temporal Consistency: Generating Video Universal Adversarial Perturbations Using Image Models: Hee-Seon Kim,

Minji Son,

Minbeom Kim,

Myung-Joon Kwon,

Changick Kim; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hee-Seon and Son, Minji and Kim, Minbeom and Kwon, Myung-Joon and Kim, Changick},
  title     = {Breaking Temporal Consistency: Generating Video Universal Adversarial Perturbations Using Image Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4325--4334}
}
Smoothness Similarity Regularization for Few-Shot GAN Adaptation: Vadim Sushko,

Ruyu Wang,

Juergen Gall; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sushko_2023_ICCV,
  author    = {Sushko, Vadim and Wang, Ruyu and Gall, Juergen},
  title     = {Smoothness Similarity Regularization for Few-Shot {GAN} Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7073--7082}
}
Distilling Coarse-to-Fine Semantic Matching Knowledge for Weakly Supervised 3D Visual Grounding: Zehan Wang,

Haifeng Huang,

Yang Zhao,

Linjun Li,

Xize Cheng,

Yichen Zhu,

Aoxiong Yin,

Zhou Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zehan and Huang, Haifeng and Zhao, Yang and Li, Linjun and Cheng, Xize and Zhu, Yichen and Yin, Aoxiong and Zhao, Zhou},
  title     = {Distilling Coarse-to-Fine Semantic Matching Knowledge for Weakly Supervised {3D} Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2662--2671}
}
What does CLIP know about a red circle? Visual prompt engineering for VLMs: Aleksandar Shtedritski,

Christian Rupprecht,

Andrea Vedaldi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shtedritski_2023_ICCV,
  author    = {Shtedritski, Aleksandar and Rupprecht, Christian and Vedaldi, Andrea},
  title     = {What does {CLIP} know about a red circle? Visual prompt engineering for {VLMs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11987--11997}
}
MEGA: Multimodal Alignment Aggregation and Distillation For Cinematic Video Segmentation: Najmeh Sadoughi,

Xinyu Li,

Avijit Vajpayee,

David Fan,

Bing Shuai,

Hector Santos-Villalobos,

Vimal Bhat,

Rohith MV; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sadoughi_2023_ICCV,
  author    = {Sadoughi, Najmeh and Li, Xinyu and Vajpayee, Avijit and Fan, David and Shuai, Bing and Santos-Villalobos, Hector and Bhat, Vimal and MV, Rohith},
  title     = {{MEGA}: Multimodal Alignment Aggregation and Distillation For Cinematic Video Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23331--23340}
}
DiffRate : Differentiable Compression Rate for Efficient Vision Transformers: Mengzhao Chen,

Wenqi Shao,

Peng Xu,

Mingbao Lin,

Kaipeng Zhang,

Fei Chao,

Rongrong Ji,

Yu Qiao,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Mengzhao and Shao, Wenqi and Xu, Peng and Lin, Mingbao and Zhang, Kaipeng and Chao, Fei and Ji, Rongrong and Qiao, Yu and Luo, Ping},
  title     = {{DiffRate} : Differentiable Compression Rate for Efficient Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17164--17174}
}
zPROBE: Zero Peek Robustness Checks for Federated Learning: Zahra Ghodsi,

Mojan Javaheripi,

Nojan Sheybani,

Xinqiao Zhang,

Ke Huang,

Farinaz Koushanfar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ghodsi_2023_ICCV,
  author    = {Ghodsi, Zahra and Javaheripi, Mojan and Sheybani, Nojan and Zhang, Xinqiao and Huang, Ke and Koushanfar, Farinaz},
  title     = {{zPROBE}: Zero Peek Robustness Checks for Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4860--4870}
}
LoLep: Single-View View Synthesis with Locally-Learned Planes and Self-Attention Occlusion Inference: Cong Wang,

Yu-Ping Wang,

Dinesh Manocha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Cong and Wang, Yu-Ping and Manocha, Dinesh},
  title     = {{LoLep}: Single-View View Synthesis with Locally-Learned Planes and Self-Attention Occlusion Inference},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10841--10851}
}
Multi-Modal Continual Test-Time Adaptation for 3D Semantic Segmentation: Haozhi Cao,

Yuecong Xu,

Jianfei Yang,

Pengyu Yin,

Shenghai Yuan,

Lihua Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Haozhi and Xu, Yuecong and Yang, Jianfei and Yin, Pengyu and Yuan, Shenghai and Xie, Lihua},
  title     = {Multi-Modal Continual Test-Time Adaptation for {3D} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18809--18819}
}
Exploring Positional Characteristics of Dual-Pixel Data for Camera Autofocus: Myungsub Choi,

Hana Lee,

Hyong-euk Lee; [pdf] [supp]
[bibtex]
@InProceedings{Choi_2023_ICCV,
  author    = {Choi, Myungsub and Lee, Hana and Lee, Hyong-euk},
  title     = {Exploring Positional Characteristics of Dual-Pixel Data for Camera Autofocus},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13158--13168}
}
Heterogeneous Forgetting Compensation for Class-Incremental Learning: Jiahua Dong,

Wenqi Liang,

Yang Cong,

Gan Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Jiahua and Liang, Wenqi and Cong, Yang and Sun, Gan},
  title     = {Heterogeneous Forgetting Compensation for Class-Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11742--11751}
}
FemtoDet: An Object Detection Baseline for Energy Versus Performance Tradeoffs: Peng Tu,

Xu Xie,

Guo Ai,

Yuexiang Li,

Yawen Huang,

Yefeng Zheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Tu_2023_ICCV,
  author    = {Tu, Peng and Xie, Xu and Ai, Guo and Li, Yuexiang and Huang, Yawen and Zheng, Yefeng},
  title     = {{FemtoDet}: An Object Detection Baseline for Energy Versus Performance Tradeoffs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13318--13327}
}
Generative Prompt Model for Weakly Supervised Object Localization: Yuzhong Zhao,

Qixiang Ye,

Weijia Wu,

Chunhua Shen,

Fang Wan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Yuzhong and Ye, Qixiang and Wu, Weijia and Shen, Chunhua and Wan, Fang},
  title     = {Generative Prompt Model for Weakly Supervised Object Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6351--6361}
}
ActFormer: A GAN-based Transformer towards General Action-Conditioned 3D Human Motion Generation: Liang Xu,

Ziyang Song,

Dongliang Wang,

Jing Su,

Zhicheng Fang,

Chenjing Ding,

Weihao Gan,

Yichao Yan,

Xin Jin,

Xiaokang Yang,

Wenjun Zeng,

Wei Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Liang and Song, Ziyang and Wang, Dongliang and Su, Jing and Fang, Zhicheng and Ding, Chenjing and Gan, Weihao and Yan, Yichao and Jin, Xin and Yang, Xiaokang and Zeng, Wenjun and Wu, Wei},
  title     = {{ActFormer}: A {GAN}-based Transformer towards General Action-Conditioned {3D} Human Motion Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2228--2238}
}
Hiding Visual Information via Obfuscating Adversarial Perturbations: Zhigang Su,

Dawei Zhou,

Nannan Wang,

Decheng Liu,

Zhen Wang,

Xinbo Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Zhigang and Zhou, Dawei and Wang, Nannan and Liu, Decheng and Wang, Zhen and Gao, Xinbo},
  title     = {Hiding Visual Information via Obfuscating Adversarial Perturbations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4356--4366}
}
Category-aware Allocation Transformer for Weakly Supervised Object Localization: Zhiwei Chen,

Jinren Ding,

Liujuan Cao,

Yunhang Shen,

Shengchuan Zhang,

Guannan Jiang,

Rongrong Ji; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhiwei and Ding, Jinren and Cao, Liujuan and Shen, Yunhang and Zhang, Shengchuan and Jiang, Guannan and Ji, Rongrong},
  title     = {Category-aware Allocation Transformer for Weakly Supervised Object Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6643--6652}
}
Domain Specified Optimization for Deployment Authorization: Haotian Wang,

Haoang Chi,

Wenjing Yang,

Zhipeng Lin,

Mingyang Geng,

Long Lan,

Jing Zhang,

Dacheng Tao; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Haotian and Chi, Haoang and Yang, Wenjing and Lin, Zhipeng and Geng, Mingyang and Lan, Long and Zhang, Jing and Tao, Dacheng},
  title     = {Domain Specified Optimization for Deployment Authorization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5095--5105}
}
Iterative Prompt Learning for Unsupervised Backlit Image Enhancement: Zhexin Liang,

Chongyi Li,

Shangchen Zhou,

Ruicheng Feng,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Zhexin and Li, Chongyi and Zhou, Shangchen and Feng, Ruicheng and Loy, Chen Change},
  title     = {Iterative Prompt Learning for Unsupervised Backlit Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8094--8103}
}
UMIFormer: Mining the Correlations between Similar Tokens for Multi-View 3D Reconstruction: Zhenwei Zhu,

Liying Yang,

Ning Li,

Chaohao Jiang,

Yanyan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Zhenwei and Yang, Liying and Li, Ning and Jiang, Chaohao and Liang, Yanyan},
  title     = {{UMIFormer}: Mining the Correlations between Similar Tokens for Multi-View {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18226--18235}
}
Improved Knowledge Transfer for Semi-Supervised Domain Adaptation via Trico Training Strategy: Ba Hung Ngo,

Yeon Jeong Chae,

Jung Eun Kwon,

Jae Hyeon Park,

Sung In Cho; [pdf] [supp]
[bibtex]
@InProceedings{Ngo_2023_ICCV,
  author    = {Ngo, Ba Hung and Chae, Yeon Jeong and Kwon, Jung Eun and Park, Jae Hyeon and Cho, Sung In},
  title     = {Improved Knowledge Transfer for Semi-Supervised Domain Adaptation via Trico Training Strategy},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19214--19223}
}
Locally Stylized Neural Radiance Fields: Hong-Wing Pang,

Binh-Son Hua,

Sai-Kit Yeung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pang_2023_ICCV,
  author    = {Pang, Hong-Wing and Hua, Binh-Son and Yeung, Sai-Kit},
  title     = {Locally Stylized Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {307--316}
}
InterFormer: Real-time Interactive Image Segmentation: You Huang,

Hao Yang,

Ke Sun,

Shengchuan Zhang,

Liujuan Cao,

Guannan Jiang,

Rongrong Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, You and Yang, Hao and Sun, Ke and Zhang, Shengchuan and Cao, Liujuan and Jiang, Guannan and Ji, Rongrong},
  title     = {{InterFormer}: Real-time Interactive Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22301--22311}
}
Confidence-aware Pseudo-label Learning for Weakly Supervised Visual Grounding: Yang Liu,

Jiahua Zhang,

Qingchao Chen,

Yuxin Peng; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yang and Zhang, Jiahua and Chen, Qingchao and Peng, Yuxin},
  title     = {Confidence-aware Pseudo-label Learning for Weakly Supervised Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2828--2838}
}
Luminance-aware Color Transform for Multiple Exposure Correction: Jong-Hyeon Baek,

DaeHyun Kim,

Su-Min Choi,

Hyo-jun Lee,

Hanul Kim,

Yeong Jun Koh; [pdf] [supp]
[bibtex]
@InProceedings{Baek_2023_ICCV,
  author    = {Baek, Jong-Hyeon and Kim, DaeHyun and Choi, Su-Min and Lee, Hyo-jun and Kim, Hanul and Koh, Yeong Jun},
  title     = {Luminance-aware Color Transform for Multiple Exposure Correction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6156--6165}
}
A Simple Framework for Open-Vocabulary Segmentation and Detection: Hao Zhang,

Feng Li,

Xueyan Zou,

Shilong Liu,

Chunyuan Li,

Jianwei Yang,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Hao and Li, Feng and Zou, Xueyan and Liu, Shilong and Li, Chunyuan and Yang, Jianwei and Zhang, Lei},
  title     = {A Simple Framework for Open-Vocabulary Segmentation and Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1020--1031}
}
Alignment Before Aggregation: Trajectory Memory Retrieval Network for Video Object Segmentation: Rui Sun,

Yuan Wang,

Huayu Mai,

Tianzhu Zhang,

Feng Wu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Rui and Wang, Yuan and Mai, Huayu and Zhang, Tianzhu and Wu, Feng},
  title     = {Alignment Before Aggregation: Trajectory Memory Retrieval Network for Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1218--1228}
}
UATVR: Uncertainty-Adaptive Text-Video Retrieval: Bo Fang,

Wenhao Wu,

Chang Liu,

Yu Zhou,

Yuxin Song,

Weiping Wang,

Xiangbo Shu,

Xiangyang Ji,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Bo and Wu, Wenhao and Liu, Chang and Zhou, Yu and Song, Yuxin and Wang, Weiping and Shu, Xiangbo and Ji, Xiangyang and Wang, Jingdong},
  title     = {{UATVR}: Uncertainty-Adaptive Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13723--13733}
}
Deep Directly-Trained Spiking Neural Networks for Object Detection: Qiaoyi Su,

Yuhong Chou,

Yifan Hu,

Jianing Li,

Shijie Mei,

Ziyang Zhang,

Guoqi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Qiaoyi and Chou, Yuhong and Hu, Yifan and Li, Jianing and Mei, Shijie and Zhang, Ziyang and Li, Guoqi},
  title     = {Deep Directly-Trained Spiking Neural Networks for Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6555--6565}
}
Online Prototype Learning for Online Continual Learning: Yujie Wei,

Jiaxin Ye,

Zhizhong Huang,

Junping Zhang,

Hongming Shan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yujie and Ye, Jiaxin and Huang, Zhizhong and Zhang, Junping and Shan, Hongming},
  title     = {Online Prototype Learning for Online Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18764--18774}
}
Robust e-NeRF: NeRF from Sparse & Noisy Events under Non-Uniform Motion: Weng Fei Low,

Gim Hee Lee; [pdf] [supp]
[bibtex]
@InProceedings{Low_2023_ICCV,
  author    = {Low, Weng Fei and Lee, Gim Hee},
  title     = {Robust {e-NeRF}: {NeRF} from Sparse \& Noisy Events under Non-Uniform Motion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18335--18346}
}
ActorsNeRF: Animatable Few-shot Human Rendering with Generalizable NeRFs: Jiteng Mu,

Shen Sang,

Nuno Vasconcelos,

Xiaolong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mu_2023_ICCV,
  author    = {Mu, Jiteng and Sang, Shen and Vasconcelos, Nuno and Wang, Xiaolong},
  title     = {{ActorsNeRF}: Animatable Few-shot Human Rendering with Generalizable {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18391--18401}
}
SALAD: Part-Level Latent Diffusion for 3D Shape Generation and Manipulation: Juil Koo,

Seungwoo Yoo,

Minh Hieu Nguyen,

Minhyuk Sung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Koo_2023_ICCV,
  author    = {Koo, Juil and Yoo, Seungwoo and Nguyen, Minh Hieu and Sung, Minhyuk},
  title     = {{SALAD}: Part-Level Latent Diffusion for {3D} Shape Generation and Manipulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14441--14451}
}
COMPASS: High-Efficiency Deep Image Compression with Arbitrary-scale Spatial Scalability: Jongmin Park,

Jooyoung Lee,

Munchurl Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Jongmin and Lee, Jooyoung and Kim, Munchurl},
  title     = {{COMPASS}: High-Efficiency Deep Image Compression with Arbitrary-scale Spatial Scalability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12826--12835}
}
Masked Autoencoders Are Stronger Knowledge Distillers: Shanshan Lao,

Guanglu Song,

Boxiao Liu,

Yu Liu,

Yujiu Yang; [pdf] [supp]
[bibtex]
@InProceedings{Lao_2023_ICCV,
  author    = {Lao, Shanshan and Song, Guanglu and Liu, Boxiao and Liu, Yu and Yang, Yujiu},
  title     = {Masked Autoencoders Are Stronger Knowledge Distillers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6384--6393}
}
Score-Based Diffusion Models as Principled Priors for Inverse Imaging: Berthy T. Feng,

Jamie Smith,

Michael Rubinstein,

Huiwen Chang,

Katherine L. Bouman,

William T. Freeman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Berthy T. and Smith, Jamie and Rubinstein, Michael and Chang, Huiwen and Bouman, Katherine L. and Freeman, William T.},
  title     = {Score-Based Diffusion Models as Principled Priors for Inverse Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10520--10531}
}
Multiscale Structure Guided Diffusion for Image Deblurring: Mengwei Ren,

Mauricio Delbracio,

Hossein Talebi,

Guido Gerig,

Peyman Milanfar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Mengwei and Delbracio, Mauricio and Talebi, Hossein and Gerig, Guido and Milanfar, Peyman},
  title     = {Multiscale Structure Guided Diffusion for Image Deblurring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10721--10733}
}
Multiple Planar Object Tracking: Zhicheng Zhang,

Shengzhe Liu,

Jufeng Yang; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zhicheng and Liu, Shengzhe and Yang, Jufeng},
  title     = {Multiple Planar Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23460--23470}
}
CheckerPose: Progressive Dense Keypoint Localization for Object Pose Estimation with Graph Neural Network: Ruyi Lian,

Haibin Ling; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lian_2023_ICCV,
  author    = {Lian, Ruyi and Ling, Haibin},
  title     = {{CheckerPose}: Progressive Dense Keypoint Localization for Object Pose Estimation with Graph Neural Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14022--14033}
}
ASIC: Aligning Sparse in-the-wild Image Collections: Kamal Gupta,

Varun Jampani,

Carlos Esteves,

Abhinav Shrivastava,

Ameesh Makadia,

Noah Snavely,

Abhishek Kar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gupta_2023_ICCV,
  author    = {Gupta, Kamal and Jampani, Varun and Esteves, Carlos and Shrivastava, Abhinav and Makadia, Ameesh and Snavely, Noah and Kar, Abhishek},
  title     = {{ASIC}: Aligning Sparse in-the-wild Image Collections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4134--4145}
}
Residual Pattern Learning for Pixel-Wise Out-of-Distribution Detection in Semantic Segmentation: Yuyuan Liu,

Choubo Ding,

Yu Tian,

Guansong Pang,

Vasileios Belagiannis,

Ian Reid,

Gustavo Carneiro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yuyuan and Ding, Choubo and Tian, Yu and Pang, Guansong and Belagiannis, Vasileios and Reid, Ian and Carneiro, Gustavo},
  title     = {Residual Pattern Learning for Pixel-Wise Out-of-Distribution Detection in Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1151--1161}
}
Hierarchical Visual Primitive Experts for Compositional Zero-Shot Learning: Hanjae Kim,

Jiyoung Lee,

Seongheon Park,

Kwanghoon Sohn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hanjae and Lee, Jiyoung and Park, Seongheon and Sohn, Kwanghoon},
  title     = {Hierarchical Visual Primitive Experts for Compositional Zero-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5675--5685}
}
Event Camera Data Pre-training: Yan Yang,

Liyuan Pan,

Liu Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yan and Pan, Liyuan and Liu, Liu},
  title     = {Event Camera Data Pre-training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10699--10709}
}
Segment Every Reference Object in Spatial and Temporal Spaces: Jiannan Wu,

Yi Jiang,

Bin Yan,

Huchuan Lu,

Zehuan Yuan,

Ping Luo; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jiannan and Jiang, Yi and Yan, Bin and Lu, Huchuan and Yuan, Zehuan and Luo, Ping},
  title     = {Segment Every Reference Object in Spatial and Temporal Spaces},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2538--2550}
}
Unified Out-Of-Distribution Detection: A Model-Specific Perspective: Reza Averly,

Wei-Lun Chao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Averly_2023_ICCV,
  author    = {Averly, Reza and Chao, Wei-Lun},
  title     = {Unified Out-Of-Distribution Detection: A Model-Specific Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1453--1463}
}
One-shot Implicit Animatable Avatars with Model-based Priors: Yangyi Huang,

Hongwei Yi,

Weiyang Liu,

Haofan Wang,

Boxi Wu,

Wenxiao Wang,

Binbin Lin,

Debing Zhang,

Deng Cai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Yangyi and Yi, Hongwei and Liu, Weiyang and Wang, Haofan and Wu, Boxi and Wang, Wenxiao and Lin, Binbin and Zhang, Debing and Cai, Deng},
  title     = {One-shot Implicit Animatable Avatars with Model-based Priors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8974--8985}
}
Unsupervised Feature Representation Learning for Domain-generalized Cross-domain Image Retrieval: Conghui Hu,

Can Zhang,

Gim Hee Lee; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Conghui and Zhang, Can and Lee, Gim Hee},
  title     = {Unsupervised Feature Representation Learning for Domain-generalized Cross-domain Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11016--11025}
}
RankMatch: Fostering Confidence and Consistency in Learning with Noisy Labels: Ziyi Zhang,

Weikai Chen,

Chaowei Fang,

Zhen Li,

Lechao Chen,

Liang Lin,

Guanbin Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Ziyi and Chen, Weikai and Fang, Chaowei and Li, Zhen and Chen, Lechao and Lin, Liang and Li, Guanbin},
  title     = {{RankMatch}: Fostering Confidence and Consistency in Learning with Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1644--1654}
}
Dec-Adapter: Exploring Efficient Decoder-Side Adapter for Bridging Screen Content and Natural Image Compression: Sheng Shen,

Huanjing Yue,

Jingyu Yang; [pdf] [supp]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Sheng and Yue, Huanjing and Yang, Jingyu},
  title     = {{Dec-Adapter}: Exploring Efficient Decoder-Side Adapter for Bridging Screen Content and Natural Image Compression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12887--12896}
}
MixReorg: Cross-Modal Mixed Patch Reorganization is a Good Mask Learner for Open-World Semantic Segmentation: Kaixin Cai,

Pengzhen Ren,

Yi Zhu,

Hang Xu,

Jianzhuang Liu,

Changlin Li,

Guangrun Wang,

Xiaodan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Kaixin and Ren, Pengzhen and Zhu, Yi and Xu, Hang and Liu, Jianzhuang and Li, Changlin and Wang, Guangrun and Liang, Xiaodan},
  title     = {{MixReorg}: Cross-Modal Mixed Patch Reorganization is a Good Mask Learner for Open-World Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1196--1205}
}
Preface: A Data-driven Volumetric Prior for Few-shot Ultra High-resolution Face Synthesis: Marcel C. Bühler,

Kripasindhu Sarkar,

Tanmay Shah,

Gengyan Li,

Daoye Wang,

Leonhard Helminger,

Sergio Orts-Escolano,

Dmitry Lagun,

Otmar Hilliges,

Thabo Beeler,

Abhimitra Meka; [pdf] [supp]
[bibtex]
@InProceedings{Buhler_2023_ICCV,
  author    = {B{\"u}hler, Marcel C. and Sarkar, Kripasindhu and Shah, Tanmay and Li, Gengyan and Wang, Daoye and Helminger, Leonhard and Orts-Escolano, Sergio and Lagun, Dmitry and Hilliges, Otmar and Beeler, Thabo and Meka, Abhimitra},
  title     = {Preface: A Data-driven Volumetric Prior for Few-shot Ultra High-resolution Face Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3402--3413}
}
Label-Guided Knowledge Distillation for Continual Semantic Segmentation on 2D Images and 3D Point Clouds: Ze Yang,

Ruibo Li,

Evan Ling,

Chi Zhang,

Yiming Wang,

Dezhao Huang,

Keng Teck Ma,

Minhoe Hur,

Guosheng Lin; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Ze and Li, Ruibo and Ling, Evan and Zhang, Chi and Wang, Yiming and Huang, Dezhao and Ma, Keng Teck and Hur, Minhoe and Lin, Guosheng},
  title     = {Label-Guided Knowledge Distillation for Continual Semantic Segmentation on {2D} Images and {3D} Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18601--18612}
}
Under-Display Camera Image Restoration with Scattering Effect: Binbin Song,

Xiangyu Chen,

Shuning Xu,

Jiantao Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Binbin and Chen, Xiangyu and Xu, Shuning and Zhou, Jiantao},
  title     = {Under-Display Camera Image Restoration with Scattering Effect},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12580--12589}
}
PRANC: Pseudo RAndom Networks for Compacting Deep Models: Parsa Nooralinejad,

Ali Abbasi,

Soroush Abbasi Koohpayegani,

Kossar Pourahmadi Meibodi,

Rana Muhammad Shahroz Khan,

Soheil Kolouri,

Hamed Pirsiavash; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nooralinejad_2023_ICCV,
  author    = {Nooralinejad, Parsa and Abbasi, Ali and Koohpayegani, Soroush Abbasi and Meibodi, Kossar Pourahmadi and Khan, Rana Muhammad Shahroz and Kolouri, Soheil and Pirsiavash, Hamed},
  title     = {{PRANC}: Pseudo {RAndom} Networks for Compacting Deep Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17021--17031}
}
ICICLE: Interpretable Class Incremental Continual Learning: Dawid Rymarczyk,

Joost van de Weijer,

Bartosz Zieliński,

Bartlomiej Twardowski; [pdf] [supp]
[bibtex]
@InProceedings{Rymarczyk_2023_ICCV,
  author    = {Rymarczyk, Dawid and van de Weijer, Joost and Zieli{\'n}ski, Bartosz and Twardowski, Bartlomiej},
  title     = {{ICICLE}: Interpretable Class Incremental Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1887--1898}
}
Clutter Detection and Removal in 3D Scenes with View-Consistent Inpainting: Fangyin Wei,

Thomas Funkhouser,

Szymon Rusinkiewicz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Fangyin and Funkhouser, Thomas and Rusinkiewicz, Szymon},
  title     = {Clutter Detection and Removal in {3D} Scenes with View-Consistent Inpainting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18131--18141}
}
PointCLIP V2: Prompting CLIP and GPT for Powerful 3D Open-world Learning: Xiangyang Zhu,

Renrui Zhang,

Bowei He,

Ziyu Guo,

Ziyao Zeng,

Zipeng Qin,

Shanghang Zhang,

Peng Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Xiangyang and Zhang, Renrui and He, Bowei and Guo, Ziyu and Zeng, Ziyao and Qin, Zipeng and Zhang, Shanghang and Gao, Peng},
  title     = {{PointCLIP} {V2}: Prompting {CLIP} and {GPT} for Powerful {3D} Open-world Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2639--2650}
}
VideoFlow: Exploiting Temporal Cues for Multi-frame Optical Flow Estimation: Xiaoyu Shi,

Zhaoyang Huang,

Weikang Bian,

Dasong Li,

Manyuan Zhang,

Ka Chun Cheung,

Simon See,

Hongwei Qin,

Jifeng Dai,

Hongsheng Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Xiaoyu and Huang, Zhaoyang and Bian, Weikang and Li, Dasong and Zhang, Manyuan and Cheung, Ka Chun and See, Simon and Qin, Hongwei and Dai, Jifeng and Li, Hongsheng},
  title     = {{VideoFlow}: Exploiting Temporal Cues for Multi-frame Optical Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12469--12480}
}
3DMiner: Discovering Shapes from Large-Scale Unannotated Image Datasets: Ta-Ying Cheng,

Matheus Gadelha,

Sören Pirk,

Thibault Groueix,

Radomír Měch,

Andrew Markham,

Niki Trigoni; [pdf]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Ta-Ying and Gadelha, Matheus and Pirk, S{\"o}ren and Groueix, Thibault and M{\v{e}}ch, Radom{\'\i}r and Markham, Andrew and Trigoni, Niki},
  title     = {{3DMiner}: Discovering Shapes from Large-Scale Unannotated Image Datasets},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9331--9341}
}
Identification of Systematic Errors of Image Classifiers on Rare Subgroups: Jan Hendrik Metzen,

Robin Hutmacher,

N. Grace Hua,

Valentyn Boreiko,

Dan Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Metzen_2023_ICCV,
  author    = {Metzen, Jan Hendrik and Hutmacher, Robin and Hua, N. Grace and Boreiko, Valentyn and Zhang, Dan},
  title     = {Identification of Systematic Errors of Image Classifiers on Rare Subgroups},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5064--5073}
}
Hierarchical Spatio-Temporal Representation Learning for Gait Recognition: Lei Wang,

Bo Liu,

Fangfang Liang,

Bincheng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Lei and Liu, Bo and Liang, Fangfang and Wang, Bincheng},
  title     = {Hierarchical Spatio-Temporal Representation Learning for Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19639--19649}
}
Order-Prompted Tag Sequence Generation for Video Tagging: Zongyang Ma,

Ziqi Zhang,

Yuxin Chen,

Zhongang Qi,

Yingmin Luo,

Zekun Li,

Chunfeng Yuan,

Bing Li,

Xiaohu Qie,

Ying Shan,

Weiming Hu; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Zongyang and Zhang, Ziqi and Chen, Yuxin and Qi, Zhongang and Luo, Yingmin and Li, Zekun and Yuan, Chunfeng and Li, Bing and Qie, Xiaohu and Shan, Ying and Hu, Weiming},
  title     = {Order-Prompted Tag Sequence Generation for Video Tagging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15681--15690}
}
XVO: Generalized Visual Odometry via Cross-Modal Self-Training: Lei Lai,

Zhongkai Shangguan,

Jimuyang Zhang,

Eshed Ohn-Bar; [pdf]
[bibtex]
@InProceedings{Lai_2023_ICCV,
  author    = {Lai, Lei and Shangguan, Zhongkai and Zhang, Jimuyang and Ohn-Bar, Eshed},
  title     = {{XVO}: Generalized Visual Odometry via Cross-Modal Self-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10094--10105}
}
Weakly Supervised Learning of Semantic Correspondence through Cascaded Online Correspondence Refinement: Yiwen Huang,

Yixuan Sun,

Chenghang Lai,

Qing Xu,

Xiaomei Wang,

Xuli Shen,

Weifeng Ge; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Yiwen and Sun, Yixuan and Lai, Chenghang and Xu, Qing and Wang, Xiaomei and Shen, Xuli and Ge, Weifeng},
  title     = {Weakly Supervised Learning of Semantic Correspondence through Cascaded Online Correspondence Refinement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16254--16263}
}
Clusterformer: Cluster-based Transformer for 3D Object Detection in Point Clouds: Yu Pei,

Xian Zhao,

Hao Li,

Jingyuan Ma,

Jingwei Zhang,

Shiliang Pu; [pdf]
[bibtex]
@InProceedings{Pei_2023_ICCV,
  author    = {Pei, Yu and Zhao, Xian and Li, Hao and Ma, Jingyuan and Zhang, Jingwei and Pu, Shiliang},
  title     = {Clusterformer: Cluster-based Transformer for {3D} Object Detection in Point Clouds},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6664--6673}
}
HMD-NeMo: Online 3D Avatar Motion Generation From Sparse Observations: Sadegh Aliakbarian,

Fatemeh Saleh,

David Collier,

Pashmina Cameron,

Darren Cosker; [pdf] [supp]
[bibtex]
@InProceedings{Aliakbarian_2023_ICCV,
  author    = {Aliakbarian, Sadegh and Saleh, Fatemeh and Collier, David and Cameron, Pashmina and Cosker, Darren},
  title     = {{HMD-NeMo}: Online {3D} Avatar Motion Generation From Sparse Observations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9622--9631}
}
NaviNeRF: NeRF-based 3D Representation Disentanglement by Latent Semantic Navigation: Baao Xie,

Bohan Li,

Zequn Zhang,

Junting Dong,

Xin Jin,

Jingyu Yang,

Wenjun Zeng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Baao and Li, Bohan and Zhang, Zequn and Dong, Junting and Jin, Xin and Yang, Jingyu and Zeng, Wenjun},
  title     = {{NaviNeRF}: {NeRF}-based {3D} Representation Disentanglement by Latent Semantic Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17992--18002}
}
Adaptive Illumination Mapping for Shadow Detection in Raw Images: Jiayu Sun,

Ke Xu,

Youwei Pang,

Lihe Zhang,

Huchuan Lu,

Gerhard Hancke,

Rynson Lau; [pdf]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Jiayu and Xu, Ke and Pang, Youwei and Zhang, Lihe and Lu, Huchuan and Hancke, Gerhard and Lau, Rynson},
  title     = {Adaptive Illumination Mapping for Shadow Detection in Raw Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12709--12718}
}
CDUL: CLIP-Driven Unsupervised Learning for Multi-Label Image Classification: Rabab Abdelfattah,

Qing Guo,

Xiaoguang Li,

Xiaofeng Wang,

Song Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Abdelfattah_2023_ICCV,
  author    = {Abdelfattah, Rabab and Guo, Qing and Li, Xiaoguang and Wang, Xiaofeng and Wang, Song},
  title     = {{CDUL}: {CLIP}-Driven Unsupervised Learning for Multi-Label Image Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1348--1357}
}
Your Diffusion Model is Secretly a Zero-Shot Classifier: Alexander C. Li,

Mihir Prabhudesai,

Shivam Duggal,

Ellis Brown,

Deepak Pathak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Alexander C. and Prabhudesai, Mihir and Duggal, Shivam and Brown, Ellis and Pathak, Deepak},
  title     = {Your Diffusion Model is Secretly a Zero-Shot Classifier},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2206--2217}
}
Backpropagation Path Search On Adversarial Transferability: Zhuoer Xu,

Zhangxuan Gu,

Jianping Zhang,

Shiwen Cui,

Changhua Meng,

Weiqiang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Zhuoer and Gu, Zhangxuan and Zhang, Jianping and Cui, Shiwen and Meng, Changhua and Wang, Weiqiang},
  title     = {Backpropagation Path Search On Adversarial Transferability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4663--4673}
}
Boosting Adversarial Transferability via Gradient Relevance Attack: Hegui Zhu,

Yuchen Ren,

Xiaoyan Sui,

Lianping Yang,

Wuming Jiang; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Hegui and Ren, Yuchen and Sui, Xiaoyan and Yang, Lianping and Jiang, Wuming},
  title     = {Boosting Adversarial Transferability via Gradient Relevance Attack},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4741--4750}
}
Image-Free Classifier Injection for Zero-Shot Classification: Anders Christensen,

Massimiliano Mancini,

A. Sophia Koepke,

Ole Winther,

Zeynep Akata; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Christensen_2023_ICCV,
  author    = {Christensen, Anders and Mancini, Massimiliano and Koepke, A. Sophia and Winther, Ole and Akata, Zeynep},
  title     = {Image-Free Classifier Injection for Zero-Shot Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19072--19081}
}
CLIPN for Zero-Shot OOD Detection: Teaching CLIP to Say No: Hualiang Wang,

Yi Li,

Huifeng Yao,

Xiaomeng Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Hualiang and Li, Yi and Yao, Huifeng and Li, Xiaomeng},
  title     = {{CLIPN} for Zero-Shot {OOD} Detection: Teaching {CLIP} to Say No},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1802--1812}
}
CO-Net: Learning Multiple Point Cloud Tasks at Once with A Cohesive Network: Tao Xie,

Ke Wang,

Siyi Lu,

Yukun Zhang,

Kun Dai,

Xiaoyu Li,

Jie Xu,

Li Wang,

Lijun Zhao,

Xinyu Zhang,

Ruifeng Li; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Tao and Wang, Ke and Lu, Siyi and Zhang, Yukun and Dai, Kun and Li, Xiaoyu and Xu, Jie and Wang, Li and Zhao, Lijun and Zhang, Xinyu and Li, Ruifeng},
  title     = {{CO-Net}: Learning Multiple Point Cloud Tasks at Once with A Cohesive Network},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3523--3533}
}
Quality Diversity for Visual Pre-Training: Ruchika Chavhan,

Henry Gouk,

Da Li,

Timothy Hospedales; [pdf] [supp]
[bibtex]
@InProceedings{Chavhan_2023_ICCV,
  author    = {Chavhan, Ruchika and Gouk, Henry and Li, Da and Hospedales, Timothy},
  title     = {Quality Diversity for Visual Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5384--5394}
}
UniDexGrasp++: Improving Dexterous Grasping Policy Learning via Geometry-Aware Curriculum and Iterative Generalist-Specialist Learning: Weikang Wan,

Haoran Geng,

Yun Liu,

Zikang Shan,

Yaodong Yang,

Li Yi,

He Wang; [pdf] [supp]
[bibtex]
@InProceedings{Wan_2023_ICCV,
  author    = {Wan, Weikang and Geng, Haoran and Liu, Yun and Shan, Zikang and Yang, Yaodong and Yi, Li and Wang, He},
  title     = {{UniDexGrasp++}: Improving Dexterous Grasping Policy Learning via Geometry-Aware Curriculum and Iterative Generalist-Specialist Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3891--3902}
}
Multi-Scale Residual Low-Pass Filter Network for Image Deblurring: Jiangxin Dong,

Jinshan Pan,

Zhongbao Yang,

Jinhui Tang; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Jiangxin and Pan, Jinshan and Yang, Zhongbao and Tang, Jinhui},
  title     = {Multi-Scale Residual Low-Pass Filter Network for Image Deblurring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12345--12354}
}
FerKD: Surgical Label Adaptation for Efficient Distillation: Zhiqiang Shen; [pdf] [supp]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Zhiqiang},
  title     = {{FerKD}: Surgical Label Adaptation for Efficient Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1666--1675}
}
Neural Fields for Structured Lighting: Aarrushi Shandilya,

Benjamin Attal,

Christian Richardt,

James Tompkin,

Matthew O'Toole; [pdf] [supp]
[bibtex]
@InProceedings{Shandilya_2023_ICCV,
  author    = {Shandilya, Aarrushi and Attal, Benjamin and Richardt, Christian and Tompkin, James and O'Toole, Matthew},
  title     = {Neural Fields for Structured Lighting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3512--3522},
}
ClothPose: A Real-world Benchmark for Visual Analysis of Garment Pose via An Indirect Recording Solution: Wenqiang Xu,

Wenxin Du,

Han Xue,

Yutong Li,

Ruolin Ye,

Yan-Feng Wang,

Cewu Lu; [pdf]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Wenqiang and Du, Wenxin and Xue, Han and Li, Yutong and Ye, Ruolin and Wang, Yan-Feng and Lu, Cewu},
  title     = {{ClothPose}: A Real-world Benchmark for Visual Analysis of Garment Pose via An Indirect Recording Solution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {58--68},
}
Semantically Structured Image Compression via Irregular Group-Based Decoupling: Ruoyu Feng,

Yixin Gao,

Xin Jin,

Runsen Feng,

Zhibo Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Ruoyu and Gao, Yixin and Jin, Xin and Feng, Runsen and Chen, Zhibo},
  title     = {Semantically Structured Image Compression via Irregular Group-Based Decoupling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17237--17247},
}
PhaseMP: Robust 3D Pose Estimation via Phase-conditioned Human Motion Prior: Mingyi Shi,

Sebastian Starke,

Yuting Ye,

Taku Komura,

Jungdam Won; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Mingyi and Starke, Sebastian and Ye, Yuting and Komura, Taku and Won, Jungdam},
  title     = {{PhaseMP}: Robust {3D} Pose Estimation via Phase-conditioned Human Motion Prior},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14725--14737},
}
NLOS-NeuS: Non-line-of-sight Neural Implicit Surface: Yuki Fujimura,

Takahiro Kushida,

Takuya Funatomi,

Yasuhiro Mukaigawa; [pdf] [supp]
[bibtex]
@InProceedings{Fujimura_2023_ICCV,
  author    = {Fujimura, Yuki and Kushida, Takahiro and Funatomi, Takuya and Mukaigawa, Yasuhiro},
  title     = {{NLOS-NeuS}: Non-line-of-sight Neural Implicit Surface},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10532--10541},
}
Unsupervised Object Localization with Representer Point Selection: Yeonghwan Song,

Seokwoo Jang,

Dina Katabi,

Jeany Son; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Yeonghwan and Jang, Seokwoo and Katabi, Dina and Son, Jeany},
  title     = {Unsupervised Object Localization with Representer Point Selection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6534--6544},
}
SEMPART: Self-supervised Multi-resolution Partitioning of Image Semantics: Sriram Ravindran,

Debraj Basu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ravindran_2023_ICCV,
  author    = {Ravindran, Sriram and Basu, Debraj},
  title     = {{SEMPART}: Self-supervised Multi-resolution Partitioning of Image Semantics},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {723--733},
}
Flatness-Aware Minimization for Domain Generalization: Xingxuan Zhang,

Renzhe Xu,

Han Yu,

Yancheng Dong,

Pengfei Tian,

Peng Cui; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xingxuan and Xu, Renzhe and Yu, Han and Dong, Yancheng and Tian, Pengfei and Cui, Peng},
  title     = {Flatness-Aware Minimization for Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5189--5202},
}
ProtoFL: Unsupervised Federated Learning via Prototypical Distillation: Hansol Kim,

Youngjun Kwak,

Minyoung Jung,

Jinho Shin,

Youngsung Kim,

Changick Kim; [pdf] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hansol and Kwak, Youngjun and Jung, Minyoung and Shin, Jinho and Kim, Youngsung and Kim, Changick},
  title     = {{ProtoFL}: Unsupervised Federated Learning via Prototypical Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6470--6479},
}
Augmenting and Aligning Snippets for Few-Shot Video Domain Adaptation: Yuecong Xu,

Jianfei Yang,

Yunjiao Zhou,

Zhenghua Chen,

Min Wu,

Xiaoli Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yuecong and Yang, Jianfei and Zhou, Yunjiao and Chen, Zhenghua and Wu, Min and Li, Xiaoli},
  title     = {Augmenting and Aligning Snippets for Few-Shot Video Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13445--13456},
}
Self-Organizing Pathway Expansion for Non-Exemplar Class-Incremental Learning: Kai Zhu,

Kecheng Zheng,

Ruili Feng,

Deli Zhao,

Yang Cao,

Zheng-Jun Zha; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Kai and Zheng, Kecheng and Feng, Ruili and Zhao, Deli and Cao, Yang and Zha, Zheng-Jun},
  title     = {Self-Organizing Pathway Expansion for Non-Exemplar Class-Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19204--19213},
}
Preserving Tumor Volumes for Unsupervised Medical Image Registration: Qihua Dong,

Hao Du,

Ying Song,

Yan Xu,

Jing Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Qihua and Du, Hao and Song, Ying and Xu, Yan and Liao, Jing},
  title     = {Preserving Tumor Volumes for Unsupervised Medical Image Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21208--21218},
}
Multi-label Affordance Mapping from Egocentric Vision: Lorenzo Mur-Labadia,

Jose J. Guerrero,

Ruben Martinez-Cantin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mur-Labadia_2023_ICCV,
  author    = {Mur-Labadia, Lorenzo and Guerrero, Jose J. and Martinez-Cantin, Ruben},
  title     = {Multi-label Affordance Mapping from Egocentric Vision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5238--5249},
}
Towards Real-World Burst Image Super-Resolution: Benchmark and Method: Pengxu Wei,

Yujing Sun,

Xingbei Guo,

Chang Liu,

Guanbin Li,

Jie Chen,

Xiangyang Ji,

Liang Lin; [pdf] [supp]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Pengxu and Sun, Yujing and Guo, Xingbei and Liu, Chang and Li, Guanbin and Chen, Jie and Ji, Xiangyang and Lin, Liang},
  title     = {Towards Real-World Burst Image Super-Resolution: Benchmark and Method},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13233--13242},
}
Unified Adversarial Patch for Cross-Modal Attacks in the Physical World: Xingxing Wei,

Yao Huang,

Yitong Sun,

Jie Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Xingxing and Huang, Yao and Sun, Yitong and Yu, Jie},
  title     = {Unified Adversarial Patch for Cross-Modal Attacks in the Physical World},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4445--4454},
}
Unsupervised Accuracy Estimation of Deep Visual Models using Domain-Adaptive Adversarial Perturbation without Source Samples: JoonHo Lee,

Jae Oh Woo,

Hankyu Moon,

Kwonho Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, JoonHo and Woo, Jae Oh and Moon, Hankyu and Lee, Kwonho},
  title     = {Unsupervised Accuracy Estimation of Deep Visual Models using Domain-Adaptive Adversarial Perturbation without Source Samples},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16443--16452},
}
Misalign, Contrast then Distill: Rethinking Misalignments in Language-Image Pre-training: Bumsoo Kim,

Yeonsik Jo,

Jinhyung Kim,

Seunghwan Kim; [pdf]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Bumsoo and Jo, Yeonsik and Kim, Jinhyung and Kim, Seunghwan},
  title     = {Misalign, Contrast then Distill: Rethinking Misalignments in Language-Image Pre-training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2563--2572},
}
SYENet: A Simple Yet Effective Network for Multiple Low-Level Vision Tasks with Real-Time Performance on Mobile Device: Weiran Gou,

Ziyao Yi,

Yan Xiang,

Shaoqing Li,

Zibin Liu,

Dehui Kong,

Ke Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gou_2023_ICCV,
  author    = {Gou, Weiran and Yi, Ziyao and Xiang, Yan and Li, Shaoqing and Liu, Zibin and Kong, Dehui and Xu, Ke},
  title     = {{SYENet}: A Simple Yet Effective Network for Multiple Low-Level Vision Tasks with Real-Time Performance on Mobile Device},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12182--12195},
}
MATE: Masked Autoencoders are Online 3D Test-Time Learners: M. Jehanzeb Mirza,

Inkyu Shin,

Wei Lin,

Andreas Schriebl,

Kunyang Sun,

Jaesung Choe,

Mateusz Kozinski,

Horst Possegger,

In So Kweon,

Kuk-Jin Yoon,

Horst Bischof; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mirza_2023_ICCV,
  author    = {Mirza, M. Jehanzeb and Shin, Inkyu and Lin, Wei and Schriebl, Andreas and Sun, Kunyang and Choe, Jaesung and Kozinski, Mateusz and Possegger, Horst and Kweon, In So and Yoon, Kuk-Jin and Bischof, Horst},
  title     = {{MATE}: Masked Autoencoders are Online {3D} Test-Time Learners},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16709--16718},
}
EdaDet: Open-Vocabulary Object Detection Using Early Dense Alignment: Cheng Shi,

Sibei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Cheng and Yang, Sibei},
  title     = {{EdaDet}: Open-Vocabulary Object Detection Using Early Dense Alignment},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15724--15734},
}
MixPath: A Unified Approach for One-shot Neural Architecture Search: Xiangxiang Chu,

Shun Lu,

Xudong Li,

Bo Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chu_2023_ICCV,
  author    = {Chu, Xiangxiang and Lu, Shun and Li, Xudong and Zhang, Bo},
  title     = {{MixPath}: A Unified Approach for One-shot Neural Architecture Search},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5972--5981},
}
Enhancing NeRF akin to Enhancing LLMs: Generalizable NeRF Transformer with Mixture-of-View-Experts: Wenyan Cong,

Hanxue Liang,

Peihao Wang,

Zhiwen Fan,

Tianlong Chen,

Mukund Varma,

Yi Wang,

Zhangyang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cong_2023_ICCV,
  author    = {Cong, Wenyan and Liang, Hanxue and Wang, Peihao and Fan, Zhiwen and Chen, Tianlong and Varma, Mukund and Wang, Yi and Wang, Zhangyang},
  title     = {Enhancing {NeRF} akin to Enhancing {LLMs}: Generalizable {NeRF} Transformer with Mixture-of-View-Experts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3193--3204},
}
Task-aware Adaptive Learning for Cross-domain Few-shot Learning: Yurong Guo,

Ruoyi Du,

Yuan Dong,

Timothy Hospedales,

Yi-Zhe Song,

Zhanyu Ma; [pdf]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yurong and Du, Ruoyi and Dong, Yuan and Hospedales, Timothy and Song, Yi-Zhe and Ma, Zhanyu},
  title     = {Task-aware Adaptive Learning for Cross-domain Few-shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1590--1599},
}
Two Birds, One Stone: A Unified Framework for Joint Learning of Image and Video Style Transfers: Bohai Gu,

Heng Fan,

Libo Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gu_2023_ICCV,
  author    = {Gu, Bohai and Fan, Heng and Zhang, Libo},
  title     = {Two Birds, One Stone: A Unified Framework for Joint Learning of Image and Video Style Transfers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23545--23554},
}
Revisiting Domain-Adaptive 3D Object Detection by Reliable, Diverse and Class-balanced Pseudo-Labeling: Zhuoxiao Chen,

Yadan Luo,

Zheng Wang,

Mahsa Baktashmotlagh,

Zi Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhuoxiao and Luo, Yadan and Wang, Zheng and Baktashmotlagh, Mahsa and Huang, Zi},
  title     = {Revisiting Domain-Adaptive {3D} Object Detection by Reliable, Diverse and Class-balanced Pseudo-Labeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3714--3726},
}
Task-Oriented Multi-Modal Mutual Leaning for Vision-Language Models: Sifan Long,

Zhen Zhao,

Junkun Yuan,

Zichang Tan,

Jiangjiang Liu,

Luping Zhou,

Shengsheng Wang,

Jingdong Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Long_2023_ICCV,
  author    = {Long, Sifan and Zhao, Zhen and Yuan, Junkun and Tan, Zichang and Liu, Jiangjiang and Zhou, Luping and Wang, Shengsheng and Wang, Jingdong},
  title     = {Task-Oriented Multi-Modal Mutual Leaning for Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21959--21969},
}
Efficient Adaptive Human-Object Interaction Detection with Concept-guided Memory: Ting Lei,

Fabian Caba,

Qingchao Chen,

Hailin Jin,

Yuxin Peng,

Yang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lei_2023_ICCV,
  author    = {Lei, Ting and Caba, Fabian and Chen, Qingchao and Jin, Hailin and Peng, Yuxin and Liu, Yang},
  title     = {Efficient Adaptive Human-Object Interaction Detection with Concept-guided Memory},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6480--6490},
}
NeMF: Inverse Volume Rendering with Neural Microflake Field: Youjia Zhang,

Teng Xu,

Junqing Yu,

Yuteng Ye,

Yanqing Jing,

Junle Wang,

Jingyi Yu,

Wei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Youjia and Xu, Teng and Yu, Junqing and Ye, Yuteng and Jing, Yanqing and Wang, Junle and Yu, Jingyi and Yang, Wei},
  title     = {{NeMF}: Inverse Volume Rendering with Neural Microflake Field},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22919--22929},
}
Attentive Mask CLIP: Yifan Yang,

Weiquan Huang,

Yixuan Wei,

Houwen Peng,

Xinyang Jiang,

Huiqiang Jiang,

Fangyun Wei,

Yin Wang,

Han Hu,

Lili Qiu,

Yuqing Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yifan and Huang, Weiquan and Wei, Yixuan and Peng, Houwen and Jiang, Xinyang and Jiang, Huiqiang and Wei, Fangyun and Wang, Yin and Hu, Han and Qiu, Lili and Yang, Yuqing},
  title     = {Attentive Mask {CLIP}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2771--2781},
}
DOLCE: A Model-Based Probabilistic Diffusion Framework for Limited-Angle CT Reconstruction: Jiaming Liu,

Rushil Anirudh,

Jayaraman J. Thiagarajan,

Stewart He,

K Aditya Mohan,

Ulugbek S. Kamilov,

Hyojin Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jiaming and Anirudh, Rushil and Thiagarajan, Jayaraman J. and He, Stewart and Mohan, K Aditya and Kamilov, Ulugbek S. and Kim, Hyojin},
  title     = {{DOLCE}: A Model-Based Probabilistic Diffusion Framework for Limited-Angle {CT} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10498--10508},
}
Beyond Image Borders: Learning Feature Extrapolation for Unbounded Image Composition: Xiaoyu Liu,

Ming Liu,

Junyi Li,

Shuai Liu,

Xiaotao Wang,

Lei Lei,

Wangmeng Zuo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xiaoyu and Liu, Ming and Li, Junyi and Liu, Shuai and Wang, Xiaotao and Lei, Lei and Zuo, Wangmeng},
  title     = {Beyond Image Borders: Learning Feature Extrapolation for Unbounded Image Composition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13023--13032},
}
MasaCtrl: Tuning-Free Mutual Self-Attention Control for Consistent Image Synthesis and Editing: Mingdeng Cao,

Xintao Wang,

Zhongang Qi,

Ying Shan,

Xiaohu Qie,

Yinqiang Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Mingdeng and Wang, Xintao and Qi, Zhongang and Shan, Ying and Qie, Xiaohu and Zheng, Yinqiang},
  title     = {{MasaCtrl}: Tuning-Free Mutual Self-Attention Control for Consistent Image Synthesis and Editing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22560--22570},
}
Understanding Hessian Alignment for Domain Generalization: Sobhan Hemati,

Guojun Zhang,

Amir Estiri,

Xi Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hemati_2023_ICCV,
  author    = {Hemati, Sobhan and Zhang, Guojun and Estiri, Amir and Chen, Xi},
  title     = {Understanding {Hessian} Alignment for Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19004--19014},
}
DeepChange: A Long-Term Person Re-Identification Benchmark with Clothes Change: Peng Xu,

Xiatian Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Peng and Zhu, Xiatian},
  title     = {{DeepChange}: A Long-Term Person Re-Identification Benchmark with Clothes Change},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11196--11205},
}
Preserve Your Own Correlation: A Noise Prior for Video Diffusion Models: Songwei Ge,

Seungjun Nah,

Guilin Liu,

Tyler Poon,

Andrew Tao,

Bryan Catanzaro,

David Jacobs,

Jia-Bin Huang,

Ming-Yu Liu,

Yogesh Balaji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ge_2023_ICCV,
  author    = {Ge, Songwei and Nah, Seungjun and Liu, Guilin and Poon, Tyler and Tao, Andrew and Catanzaro, Bryan and Jacobs, David and Huang, Jia-Bin and Liu, Ming-Yu and Balaji, Yogesh},
  title     = {Preserve Your Own Correlation: A Noise Prior for Video Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22930--22941},
}
Discrepant and Multi-Instance Proxies for Unsupervised Person Re-Identification: Chang Zou,

Zeqi Chen,

Zhichao Cui,

Yuehu Liu,

Chi Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Zou_2023_ICCV,
  author    = {Zou, Chang and Chen, Zeqi and Cui, Zhichao and Liu, Yuehu and Zhang, Chi},
  title     = {Discrepant and Multi-Instance Proxies for Unsupervised Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11058--11068},
}
Joint-Relation Transformer for Multi-Person Motion Prediction: Qingyao Xu,

Weibo Mao,

Jingze Gong,

Chenxin Xu,

Siheng Chen,

Weidi Xie,

Ya Zhang,

Yanfeng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Qingyao and Mao, Weibo and Gong, Jingze and Xu, Chenxin and Chen, Siheng and Xie, Weidi and Zhang, Ya and Wang, Yanfeng},
  title     = {Joint-Relation Transformer for Multi-Person Motion Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9816--9826},
}
Revisiting Vision Transformer from the View of Path Ensemble: Shuning Chang,

Pichao Wang,

Hao Luo,

Fan Wang,

Mike Zheng Shou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chang_2023_ICCV,
  author    = {Chang, Shuning and Wang, Pichao and Luo, Hao and Wang, Fan and Shou, Mike Zheng},
  title     = {Revisiting Vision Transformer from the View of Path Ensemble},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19889--19899},
}
Tetra-NeRF: Representing Neural Radiance Fields Using Tetrahedra: Jonas Kulhanek,

Torsten Sattler; [pdf] [supp]
[bibtex]
@InProceedings{Kulhanek_2023_ICCV,
  author    = {Kulhanek, Jonas and Sattler, Torsten},
  title     = {{Tetra-NeRF}: Representing Neural Radiance Fields Using Tetrahedra},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18458--18469},
}
TMA: Temporal Motion Aggregation for Event-based Optical Flow: Haotian Liu,

Guang Chen,

Sanqing Qu,

Yanping Zhang,

Zhijun Li,

Alois Knoll,

Changjun Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Haotian and Chen, Guang and Qu, Sanqing and Zhang, Yanping and Li, Zhijun and Knoll, Alois and Jiang, Changjun},
  title     = {{TMA}: Temporal Motion Aggregation for Event-based Optical Flow},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9685--9694},
}
Ablating Concepts in Text-to-Image Diffusion Models: Nupur Kumari,

Bingliang Zhang,

Sheng-Yu Wang,

Eli Shechtman,

Richard Zhang,

Jun-Yan Zhu; [pdf] [arXiv]
[bibtex]
@InProceedings{Kumari_2023_ICCV,
  author    = {Kumari, Nupur and Zhang, Bingliang and Wang, Sheng-Yu and Shechtman, Eli and Zhang, Richard and Zhu, Jun-Yan},
  title     = {Ablating Concepts in Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22691--22702},
}
Motion-Guided Masking for Spatiotemporal Representation Learning: David Fan,

Jue Wang,

Shuai Liao,

Yi Zhu,

Vimal Bhat,

Hector Santos-Villalobos,

Rohith MV,

Xinyu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, David and Wang, Jue and Liao, Shuai and Zhu, Yi and Bhat, Vimal and Santos-Villalobos, Hector and MV, Rohith and Li, Xinyu},
  title     = {Motion-Guided Masking for Spatiotemporal Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5619--5629},
}
MapFormer: Boosting Change Detection by Using Pre-change Information: Maximilian Bernhard,

Niklas Strauß,

Matthias Schubert; [pdf] [supp]
[bibtex]
@InProceedings{Bernhard_2023_ICCV,
  author    = {Bernhard, Maximilian and Strau{\ss}, Niklas and Schubert, Matthias},
  title     = {{MapFormer}: Boosting Change Detection by Using Pre-change Information},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16837--16846},
}
Masked Diffusion Transformer is a Strong Image Synthesizer: Shanghua Gao,

Pan Zhou,

Ming-Ming Cheng,

Shuicheng Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Shanghua and Zhou, Pan and Cheng, Ming-Ming and Yan, Shuicheng},
  title     = {Masked Diffusion Transformer is a Strong Image Synthesizer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23164--23173},
}
LightDepth: Single-View Depth Self-Supervision from Illumination Decline: Javier Rodríguez-Puigvert,

Víctor M. Batlle,

J.M.M. Montiel,

Ruben Martinez-Cantin,

Pascal Fua,

Juan D. Tardós,

Javier Civera; [pdf] [supp]
[bibtex]
@InProceedings{Rodriguez-Puigvert_2023_ICCV,
  author    = {Rodr{\'\i}guez-Puigvert, Javier and Batlle, V{\'\i}ctor M. and Montiel, J. M. M. and Martinez-Cantin, Ruben and Fua, Pascal and Tard{\'o}s, Juan D. and Civera, Javier},
  title     = {{LightDepth}: Single-View Depth Self-Supervision from Illumination Decline},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21273--21283},
}
Urban Radiance Field Representation with Deformable Neural Mesh Primitives: Fan Lu,

Yan Xu,

Guang Chen,

Hongsheng Li,

Kwan-Yee Lin,

Changjun Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Fan and Xu, Yan and Chen, Guang and Li, Hongsheng and Lin, Kwan-Yee and Jiang, Changjun},
  title     = {Urban Radiance Field Representation with Deformable Neural Mesh Primitives},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {465--476},
}
Adaptive Frequency Filters As Efficient Global Token Mixers: Zhipeng Huang,

Zhizheng Zhang,

Cuiling Lan,

Zheng-Jun Zha,

Yan Lu,

Baining Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhipeng and Zhang, Zhizheng and Lan, Cuiling and Zha, Zheng-Jun and Lu, Yan and Guo, Baining},
  title     = {Adaptive Frequency Filters As Efficient Global Token Mixers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6049--6059},
}
Referring Image Segmentation Using Text Supervision: Fang Liu,

Yuhao Liu,

Yuqiu Kong,

Ke Xu,

Lihe Zhang,

Baocai Yin,

Gerhard Hancke,

Rynson Lau; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Fang and Liu, Yuhao and Kong, Yuqiu and Xu, Ke and Zhang, Lihe and Yin, Baocai and Hancke, Gerhard and Lau, Rynson},
  title     = {Referring Image Segmentation Using Text Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22124--22134},
}
Zolly: Zoom Focal Length Correctly for Perspective-Distorted Human Mesh Reconstruction: Wenjia Wang,

Yongtao Ge,

Haiyi Mei,

Zhongang Cai,

Qingping Sun,

Yanjun Wang,

Chunhua Shen,

Lei Yang,

Taku Komura; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Wenjia and Ge, Yongtao and Mei, Haiyi and Cai, Zhongang and Sun, Qingping and Wang, Yanjun and Shen, Chunhua and Yang, Lei and Komura, Taku},
  title     = {Zolly: Zoom Focal Length Correctly for Perspective-Distorted Human Mesh Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3925--3935},
}
Once Detected, Never Lost: Surpassing Human Performance in Offline LiDAR based 3D Object Detection: Lue Fan,

Yuxue Yang,

Yiming Mao,

Feng Wang,

Yuntao Chen,

Naiyan Wang,

Zhaoxiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Lue and Yang, Yuxue and Mao, Yiming and Wang, Feng and Chen, Yuntao and Wang, Naiyan and Zhang, Zhaoxiang},
  title     = {Once Detected, Never Lost: Surpassing Human Performance in Offline {LiDAR} based {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19820--19829},
}
Building a Winning Team: Selecting Source Model Ensembles using a Submodular Transferability Estimation Approach: Vimal K B,

Saketh Bachu,

Tanmay Garg,

Niveditha Lakshmi Narasimhan,

Raghavan Konuru,

Vineeth N Balasubramanian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{B_2023_ICCV,
  author    = {B, Vimal K and Bachu, Saketh and Garg, Tanmay and Narasimhan, Niveditha Lakshmi and Konuru, Raghavan and Balasubramanian, Vineeth N},
  title     = {Building a Winning Team: Selecting Source Model Ensembles using a Submodular Transferability Estimation Approach},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11609--11620},
}
Eventful Transformers: Leveraging Temporal Redundancy in Vision Transformers: Matthew Dutson,

Yin Li,

Mohit Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dutson_2023_ICCV,
  author    = {Dutson, Matthew and Li, Yin and Gupta, Mohit},
  title     = {Eventful Transformers: Leveraging Temporal Redundancy in Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16911--16923},
}
Plausible Uncertainties for Human Pose Regression: Lennart Bramlage,

Michelle Karg,

Cristóbal Curio; [pdf] [supp]
[bibtex]
@InProceedings{Bramlage_2023_ICCV,
  author    = {Bramlage, Lennart and Karg, Michelle and Curio, Crist{\'o}bal},
  title     = {Plausible Uncertainties for Human Pose Regression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15133--15142},
}
Beyond One-to-One: Rethinking the Referring Image Segmentation: Yutao Hu,

Qixiong Wang,

Wenqi Shao,

Enze Xie,

Zhenguo Li,

Jungong Han,

Ping Luo; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Yutao and Wang, Qixiong and Shao, Wenqi and Xie, Enze and Li, Zhenguo and Han, Jungong and Luo, Ping},
  title     = {Beyond One-to-One: Rethinking the Referring Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4067--4077},
}
Robust Referring Video Object Segmentation with Cyclic Structural Consensus: Xiang Li,

Jinglu Wang,

Xiaohao Xu,

Xiao Li,

Bhiksha Raj,

Yan Lu; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiang and Wang, Jinglu and Xu, Xiaohao and Li, Xiao and Raj, Bhiksha and Lu, Yan},
  title     = {Robust Referring Video Object Segmentation with Cyclic Structural Consensus},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22236--22245},
}
DiffIR: Efficient Diffusion Model for Image Restoration: Bin Xia,

Yulun Zhang,

Shiyin Wang,

Yitong Wang,

Xinglong Wu,

Yapeng Tian,

Wenming Yang,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Bin and Zhang, Yulun and Wang, Shiyin and Wang, Yitong and Wu, Xinglong and Tian, Yapeng and Yang, Wenming and Van Gool, Luc},
  title     = {{DiffIR}: Efficient Diffusion Model for Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13095--13105},
}
MoreauGrad: Sparse and Robust Interpretation of Neural Networks via Moreau Envelope: Jingwei Zhang,

Farzan Farnia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jingwei and Farnia, Farzan},
  title     = {{MoreauGrad}: Sparse and Robust Interpretation of Neural Networks via {Moreau} Envelope},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2021--2030},
}
Building Bridge Across the Time: Disruption and Restoration of Murals In the Wild: Huiyang Shao,

Qianqian Xu,

Peisong Wen,

Peifeng Gao,

Zhiyong Yang,

Qingming Huang; [pdf] [supp]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Huiyang and Xu, Qianqian and Wen, Peisong and Gao, Peifeng and Yang, Zhiyong and Huang, Qingming},
  title     = {Building Bridge Across the Time: Disruption and Restoration of Murals In the Wild},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20259--20269}
}
Class-Incremental Grouping Network for Continual Audio-Visual Learning: Shentong Mo,

Weiguo Pian,

Yapeng Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mo_2023_ICCV,
  author    = {Mo, Shentong and Pian, Weiguo and Tian, Yapeng},
  title     = {Class-Incremental Grouping Network for Continual Audio-Visual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7788--7798}
}
Neural Haircut: Prior-Guided Strand-Based Hair Reconstruction: Vanessa Sklyarova,

Jenya Chelishev,

Andreea Dogaru,

Igor Medvedev,

Victor Lempitsky,

Egor Zakharov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sklyarova_2023_ICCV,
  author    = {Sklyarova, Vanessa and Chelishev, Jenya and Dogaru, Andreea and Medvedev, Igor and Lempitsky, Victor and Zakharov, Egor},
  title     = {Neural Haircut: Prior-Guided Strand-Based Hair Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19762--19773}
}
Improving Sample Quality of Diffusion Models Using Self-Attention Guidance: Susung Hong,

Gyuseong Lee,

Wooseok Jang,

Seungryong Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Susung and Lee, Gyuseong and Jang, Wooseok and Kim, Seungryong},
  title     = {Improving Sample Quality of Diffusion Models Using Self-Attention Guidance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7462--7471}
}
Evaluating Data Attribution for Text-to-Image Models: Sheng-Yu Wang,

Alexei A. Efros,

Jun-Yan Zhu,

Richard Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Sheng-Yu and Efros, Alexei A. and Zhu, Jun-Yan and Zhang, Richard},
  title     = {Evaluating Data Attribution for Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7192--7203}
}
Delta Denoising Score: Amir Hertz,

Kfir Aberman,

Daniel Cohen-Or; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hertz_2023_ICCV,
  author    = {Hertz, Amir and Aberman, Kfir and Cohen-Or, Daniel},
  title     = {Delta Denoising Score},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2328--2337}
}
Hierarchical Prior Mining for Non-local Multi-View Stereo: Chunlin Ren,

Qingshan Xu,

Shikun Zhang,

Jiaqi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Chunlin and Xu, Qingshan and Zhang, Shikun and Yang, Jiaqi},
  title     = {Hierarchical Prior Mining for Non-local Multi-View Stereo},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3611--3620}
}
Generative Multiplane Neural Radiance for 3D-Aware Image Generation: Amandeep Kumar,

Ankan Kumar Bhunia,

Sanath Narayan,

Hisham Cholakkal,

Rao Muhammad Anwer,

Salman Khan,

Ming-Hsuan Yang,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kumar_2023_ICCV,
  author    = {Kumar, Amandeep and Bhunia, Ankan Kumar and Narayan, Sanath and Cholakkal, Hisham and Anwer, Rao Muhammad and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz},
  title     = {Generative Multiplane Neural Radiance for {3D}-Aware Image Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7388--7398}
}
DG-Recon: Depth-Guided Neural 3D Scene Reconstruction: Jihong Ju,

Ching Wei Tseng,

Oleksandr Bailo,

Georgi Dikov,

Mohsen Ghafoorian; [pdf] [supp]
[bibtex]
@InProceedings{Ju_2023_ICCV,
  author    = {Ju, Jihong and Tseng, Ching Wei and Bailo, Oleksandr and Dikov, Georgi and Ghafoorian, Mohsen},
  title     = {{DG-Recon}: Depth-Guided Neural {3D} Scene Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18184--18194}
}
Simple Baselines for Interactive Video Retrieval with Questions and Answers: Kaiqu Liang,

Samuel Albanie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Kaiqu and Albanie, Samuel},
  title     = {Simple Baselines for Interactive Video Retrieval with Questions and Answers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11091--11101}
}
The Stable Signature: Rooting Watermarks in Latent Diffusion Models: Pierre Fernandez,

Guillaume Couairon,

Hervé Jégou,

Matthijs Douze,

Teddy Furon; [pdf] [supp]
[bibtex]
@InProceedings{Fernandez_2023_ICCV,
  author    = {Fernandez, Pierre and Couairon, Guillaume and J{\'e}gou, Herv{\'e} and Douze, Matthijs and Furon, Teddy},
  title     = {The Stable Signature: Rooting Watermarks in Latent Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22466--22477}
}
Boosting Semantic Segmentation from the Perspective of Explicit Class Embeddings: Yuhe Liu,

Chuanjian Liu,

Kai Han,

Quan Tang,

Zengchang Qin; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yuhe and Liu, Chuanjian and Han, Kai and Tang, Quan and Qin, Zengchang},
  title     = {Boosting Semantic Segmentation from the Perspective of Explicit Class Embeddings},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {821--831}
}
Going Denser with Open-Vocabulary Part Segmentation: Peize Sun,

Shoufa Chen,

Chenchen Zhu,

Fanyi Xiao,

Ping Luo,

Saining Xie,

Zhicheng Yan; [pdf] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Peize and Chen, Shoufa and Zhu, Chenchen and Xiao, Fanyi and Luo, Ping and Xie, Saining and Yan, Zhicheng},
  title     = {Going Denser with Open-Vocabulary Part Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15453--15465}
}
Learning to Identify Critical States for Reinforcement Learning from Videos: Haozhe Liu,

Mingchen Zhuge,

Bing Li,

Yuhui Wang,

Francesco Faccio,

Bernard Ghanem,

Jürgen Schmidhuber; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Haozhe and Zhuge, Mingchen and Li, Bing and Wang, Yuhui and Faccio, Francesco and Ghanem, Bernard and Schmidhuber, J{\"u}rgen},
  title     = {Learning to Identify Critical States for Reinforcement Learning from Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1955--1965}
}
Editing Implicit Assumptions in Text-to-Image Diffusion Models: Hadas Orgad,

Bahjat Kawar,

Yonatan Belinkov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Orgad_2023_ICCV,
  author    = {Orgad, Hadas and Kawar, Bahjat and Belinkov, Yonatan},
  title     = {Editing Implicit Assumptions in Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7053--7061}
}
OCHID-Fi: Occlusion-Robust Hand Pose Estimation in 3D via RF-Vision: Shujie Zhang,

Tianyue Zheng,

Zhe Chen,

Jingzhi Hu,

Abdelwahed Khamis,

Jiajun Liu,

Jun Luo; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Shujie and Zheng, Tianyue and Chen, Zhe and Hu, Jingzhi and Khamis, Abdelwahed and Liu, Jiajun and Luo, Jun},
  title     = {{OCHID-Fi}: Occlusion-Robust Hand Pose Estimation in {3D} via {RF}-Vision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15112--15121}
}
Conceptual and Hierarchical Latent Space Decomposition for Face Editing: Savas Ozkan,

Mete Ozay,

Tom Robinson; [pdf] [supp]
[bibtex]
@InProceedings{Ozkan_2023_ICCV,
  author    = {Ozkan, Savas and Ozay, Mete and Robinson, Tom},
  title     = {Conceptual and Hierarchical Latent Space Decomposition for Face Editing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7248--7257}
}
VL-Match: Enhancing Vision-Language Pretraining with Token-Level and Instance-Level Matching: Junyu Bi,

Daixuan Cheng,

Ping Yao,

Bochen Pang,

Yuefeng Zhan,

Chuanguang Yang,

Yujing Wang,

Hao Sun,

Weiwei Deng,

Qi Zhang; [pdf]
[bibtex]
@InProceedings{Bi_2023_ICCV,
  author    = {Bi, Junyu and Cheng, Daixuan and Yao, Ping and Pang, Bochen and Zhan, Yuefeng and Yang, Chuanguang and Wang, Yujing and Sun, Hao and Deng, Weiwei and Zhang, Qi},
  title     = {{VL-Match}: Enhancing Vision-Language Pretraining with Token-Level and Instance-Level Matching},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2584--2593}
}
Reconstructing Interacting Hands with Interaction Prior from Monocular Images: Binghui Zuo,

Zimeng Zhao,

Wenqian Sun,

Wei Xie,

Zhou Xue,

Yangang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zuo_2023_ICCV,
  author    = {Zuo, Binghui and Zhao, Zimeng and Sun, Wenqian and Xie, Wei and Xue, Zhou and Wang, Yangang},
  title     = {Reconstructing Interacting Hands with Interaction Prior from Monocular Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9054--9064}
}
Towards Realistic Evaluation of Industrial Continual Learning Scenarios with an Emphasis on Energy Consumption and Computational Footprint: Vivek Chavan,

Paul Koch,

Marian Schlüter,

Clemens Briese; [pdf] [supp]
[bibtex]
@InProceedings{Chavan_2023_ICCV,
  author    = {Chavan, Vivek and Koch, Paul and Schl{\"u}ter, Marian and Briese, Clemens},
  title     = {Towards Realistic Evaluation of Industrial Continual Learning Scenarios with an Emphasis on Energy Consumption and Computational Footprint},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11506--11518}
}
Translating Images to Road Network: A Non-Autoregressive Sequence-to-Sequence Approach: Jiachen Lu,

Renyuan Peng,

Xinyue Cai,

Hang Xu,

Hongyang Li,

Feng Wen,

Wei Zhang,

Li Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Jiachen and Peng, Renyuan and Cai, Xinyue and Xu, Hang and Li, Hongyang and Wen, Feng and Zhang, Wei and Zhang, Li},
  title     = {Translating Images to Road Network: A Non-Autoregressive Sequence-to-Sequence Approach},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23--33}
}
How Much Temporal Long-Term Context is Needed for Action Segmentation?: Emad Bahrami,

Gianpiero Francesca,

Juergen Gall; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bahrami_2023_ICCV,
  author    = {Bahrami, Emad and Francesca, Gianpiero and Gall, Juergen},
  title     = {How Much Temporal Long-Term Context is Needed for Action Segmentation?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10351--10361}
}
3D VR Sketch Guided 3D Shape Prototyping and Exploration: Ling Luo,

Pinaki Nath Chowdhury,

Tao Xiang,

Yi-Zhe Song,

Yulia Gryaditskaya; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Ling and Chowdhury, Pinaki Nath and Xiang, Tao and Song, Yi-Zhe and Gryaditskaya, Yulia},
  title     = {{3D} {VR} Sketch Guided {3D} Shape Prototyping and Exploration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9267--9276}
}
Seal-3D: Interactive Pixel-Level Editing for Neural Radiance Fields: Xiangyu Wang,

Jingsen Zhu,

Qi Ye,

Yuchi Huo,

Yunlong Ran,

Zhihua Zhong,

Jiming Chen; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiangyu and Zhu, Jingsen and Ye, Qi and Huo, Yuchi and Ran, Yunlong and Zhong, Zhihua and Chen, Jiming},
  title     = {{Seal-3D}: Interactive Pixel-Level Editing for Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17683--17693}
}
Generative Novel View Synthesis with 3D-Aware Diffusion Models: Eric R. Chan,

Koki Nagano,

Matthew A. Chan,

Alexander W. Bergman,

Jeong Joon Park,

Axel Levy,

Miika Aittala,

Shalini De Mello,

Tero Karras,

Gordon Wetzstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chan_2023_ICCV,
  author    = {Chan, Eric R. and Nagano, Koki and Chan, Matthew A. and Bergman, Alexander W. and Park, Jeong Joon and Levy, Axel and Aittala, Miika and De Mello, Shalini and Karras, Tero and Wetzstein, Gordon},
  title     = {Generative Novel View Synthesis with {3D}-Aware Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4217--4229}
}
MDCS: More Diverse Experts with Consistency Self-distillation for Long-tailed Recognition: Qihao Zhao,

Chen Jiang,

Wei Hu,

Fan Zhang,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Qihao and Jiang, Chen and Hu, Wei and Zhang, Fan and Liu, Jun},
  title     = {{MDCS}: More Diverse Experts with Consistency Self-distillation for Long-tailed Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11597--11608}
}
Similarity Min-Max: Zero-Shot Day-Night Domain Adaptation: Rundong Luo,

Wenjing Wang,

Wenhan Yang,

Jiaying Liu; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Rundong and Wang, Wenjing and Yang, Wenhan and Liu, Jiaying},
  title     = {Similarity Min-Max: Zero-Shot Day-Night Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8104--8114}
}
Dark Side Augmentation: Generating Diverse Night Examples for Metric Learning: Albert Mohwald,

Tomas Jenicek,

Ondřej Chum; [pdf] [supp]
[bibtex]
@InProceedings{Mohwald_2023_ICCV,
  author    = {Mohwald, Albert and Jenicek, Tomas and Chum, Ond{\v{r}}ej},
  title     = {Dark Side Augmentation: Generating Diverse Night Examples for Metric Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11153--11163}
}
NeRF-MS: Neural Radiance Fields with Multi-Sequence: Peihao Li,

Shaohui Wang,

Chen Yang,

Bingbing Liu,

Weichao Qiu,

Haoqian Wang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Peihao and Wang, Shaohui and Yang, Chen and Liu, Bingbing and Qiu, Weichao and Wang, Haoqian},
  title     = {{NeRF-MS}: Neural Radiance Fields with Multi-Sequence},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18591--18600}
}
LVOS: A Benchmark for Long-term Video Object Segmentation: Lingyi Hong,

Wenchao Chen,

Zhongying Liu,

Wei Zhang,

Pinxue Guo,

Zhaoyu Chen,

Wenqiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Lingyi and Chen, Wenchao and Liu, Zhongying and Zhang, Wei and Guo, Pinxue and Chen, Zhaoyu and Zhang, Wenqiang},
  title     = {{LVOS}: A Benchmark for Long-term Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13480--13492}
}
Diffusion Model as Representation Learner: Xingyi Yang,

Xinchao Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Xingyi and Wang, Xinchao},
  title     = {Diffusion Model as Representation Learner},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18938--18949}
}
Nerfbusters: Removing Ghostly Artifacts from Casually Captured NeRFs: Frederik Warburg,

Ethan Weber,

Matthew Tancik,

Aleksander Holynski,

Angjoo Kanazawa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Warburg_2023_ICCV,
  author    = {Warburg, Frederik and Weber, Ethan and Tancik, Matthew and Holynski, Aleksander and Kanazawa, Angjoo},
  title     = {Nerfbusters: Removing Ghostly Artifacts from Casually Captured {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18120--18130}
}
Document Understanding Dataset and Evaluation (DUDE): Jordy Van Landeghem,

Rubèn Tito,

Łukasz Borchmann,

Michał Pietruszka,

Pawel Joziak,

Rafal Powalski,

Dawid Jurkiewicz,

Mickael Coustaty,

Bertrand Anckaert,

Ernest Valveny,

Matthew Blaschko,

Sien Moens,

Tomasz Stanislawek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Van_Landeghem_2023_ICCV,
  author    = {Van Landeghem, Jordy and Tito, Rub{\`e}n and Borchmann, {\L}ukasz and Pietruszka, Micha{\l} and Joziak, Pawel and Powalski, Rafal and Jurkiewicz, Dawid and Coustaty, Mickael and Anckaert, Bertrand and Valveny, Ernest and Blaschko, Matthew and Moens, Sien and Stanislawek, Tomasz},
  title     = {Document Understanding Dataset and Evaluation ({DUDE})},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19528--19540}
}
ALWOD: Active Learning for Weakly-Supervised Object Detection: Yuting Wang,

Velibor Ilic,

Jiatong Li,

Branislav Kisačanin,

Vladimir Pavlovic; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yuting and Ilic, Velibor and Li, Jiatong and Kisa{\v{c}}anin, Branislav and Pavlovic, Vladimir},
  title     = {{ALWOD}: Active Learning for Weakly-Supervised Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6459--6469}
}
Prototypical Kernel Learning and Open-set Foreground Perception for Generalized Few-shot Semantic Segmentation: Kai Huang,

Feigege Wang,

Ye Xi,

Yutao Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Kai and Wang, Feigege and Xi, Ye and Gao, Yutao},
  title     = {Prototypical Kernel Learning and Open-set Foreground Perception for Generalized Few-shot Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19256--19265}
}
Simple and Effective Out-of-Distribution Detection via Cosine-based Softmax Loss: SoonCheol Noh,

DongEon Jeong,

Jee-Hyong Lee; [pdf] [supp]
[bibtex]
@InProceedings{Noh_2023_ICCV,
  author    = {Noh, SoonCheol and Jeong, DongEon and Lee, Jee-Hyong},
  title     = {Simple and Effective Out-of-Distribution Detection via Cosine-based Softmax Loss},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16560--16569}
}
CFCG: Semi-Supervised Semantic Segmentation via Cross-Fusion and Contour Guidance Supervision: Shuo Li,

Yue He,

Weiming Zhang,

Wei Zhang,

Xiao Tan,

Junyu Han,

Errui Ding,

Jingdong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Shuo and He, Yue and Zhang, Weiming and Zhang, Wei and Tan, Xiao and Han, Junyu and Ding, Errui and Wang, Jingdong},
  title     = {{CFCG}: Semi-Supervised Semantic Segmentation via Cross-Fusion and Contour Guidance Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16348--16358}
}
CHAMPAGNE: Learning Real-world Conversation from Large-Scale Web Videos: Seungju Han,

Jack Hessel,

Nouha Dziri,

Yejin Choi,

Youngjae Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Seungju and Hessel, Jack and Dziri, Nouha and Choi, Yejin and Yu, Youngjae},
  title     = {{CHAMPAGNE}: Learning Real-world Conversation from Large-Scale Web Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15498--15509}
}
SLAN: Self-Locator Aided Network for Vision-Language Understanding: Jiang-Tian Zhai,

Qi Zhang,

Tong Wu,

Xing-Yu Chen,

Jiang-Jiang Liu,

Ming-Ming Cheng; [pdf]
[bibtex]
@InProceedings{Zhai_2023_ICCV,
  author    = {Zhai, Jiang-Tian and Zhang, Qi and Wu, Tong and Chen, Xing-Yu and Liu, Jiang-Jiang and Cheng, Ming-Ming},
  title     = {{SLAN}: Self-Locator Aided Network for Vision-Language Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21949--21958}
}
S-VolSDF: Sparse Multi-View Stereo Regularization of Neural Implicit Surfaces: Haoyu Wu,

Alexandros Graikos,

Dimitris Samaras; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Haoyu and Graikos, Alexandros and Samaras, Dimitris},
  title     = {{S-VolSDF}: Sparse Multi-View Stereo Regularization of Neural Implicit Surfaces},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3556--3568}
}
Anomaly Detection using Score-based Perturbation Resilience: Woosang Shin,

Jonghyeon Lee,

Taehan Lee,

Sangmoon Lee,

Jong Pil Yun; [pdf] [supp]
[bibtex]
@InProceedings{Shin_2023_ICCV,
  author    = {Shin, Woosang and Lee, Jonghyeon and Lee, Taehan and Lee, Sangmoon and Yun, Jong Pil},
  title     = {Anomaly Detection using Score-based Perturbation Resilience},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23372--23382}
}
Generating Visual Scenes from Touch: Fengyu Yang,

Jiacheng Zhang,

Andrew Owens; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Fengyu and Zhang, Jiacheng and Owens, Andrew},
  title     = {Generating Visual Scenes from Touch},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22070--22080}
}
DeformToon3D: Deformable Neural Radiance Fields for 3D Toonification: Junzhe Zhang,

Yushi Lan,

Shuai Yang,

Fangzhou Hong,

Quan Wang,

Chai Kiat Yeo,

Ziwei Liu,

Chen Change Loy; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Junzhe and Lan, Yushi and Yang, Shuai and Hong, Fangzhou and Wang, Quan and Yeo, Chai Kiat and Liu, Ziwei and Loy, Chen Change},
  title     = {{DeformToon3D}: Deformable Neural Radiance Fields for {3D} Toonification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9144--9154}
}
SatlasPretrain: A Large-Scale Dataset for Remote Sensing Image Understanding: Favyen Bastani,

Piper Wolters,

Ritwik Gupta,

Joe Ferdinando,

Aniruddha Kembhavi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bastani_2023_ICCV,
  author    = {Bastani, Favyen and Wolters, Piper and Gupta, Ritwik and Ferdinando, Joe and Kembhavi, Aniruddha},
  title     = {{SatlasPretrain}: A Large-Scale Dataset for Remote Sensing Image Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16772--16782}
}
Empowering Low-Light Image Enhancer through Customized Learnable Priors: Naishan Zheng,

Man Zhou,

Yanmeng Dong,

Xiangyu Rui,

Jie Huang,

Chongyi Li,

Feng Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Naishan and Zhou, Man and Dong, Yanmeng and Rui, Xiangyu and Huang, Jie and Li, Chongyi and Zhao, Feng},
  title     = {Empowering Low-Light Image Enhancer through Customized Learnable Priors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12559--12569}
}
TextManiA: Enriching Visual Feature by Text-driven Manifold Augmentation: Moon Ye-Bin,

Jisoo Kim,

Hongyeob Kim,

Kilho Son,

Tae-Hyun Oh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye-Bin_2023_ICCV,
  author    = {Ye-Bin, Moon and Kim, Jisoo and Kim, Hongyeob and Son, Kilho and Oh, Tae-Hyun},
  title     = {{TextManiA}: Enriching Visual Feature by Text-driven Manifold Augmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2526--2537}
}
Guiding Image Captioning Models Toward More Specific Captions: Simon Kornblith,

Lala Li,

Zirui Wang,

Thao Nguyen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kornblith_2023_ICCV,
  author    = {Kornblith, Simon and Li, Lala and Wang, Zirui and Nguyen, Thao},
  title     = {Guiding Image Captioning Models Toward More Specific Captions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15259--15269}
}
Breaking Common Sense: WHOOPS! A Vision-and-Language Benchmark of Synthetic and Compositional Images: Nitzan Bitton-Guetta,

Yonatan Bitton,

Jack Hessel,

Ludwig Schmidt,

Yuval Elovici,

Gabriel Stanovsky,

Roy Schwartz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bitton-Guetta_2023_ICCV,
  author    = {Bitton-Guetta, Nitzan and Bitton, Yonatan and Hessel, Jack and Schmidt, Ludwig and Elovici, Yuval and Stanovsky, Gabriel and Schwartz, Roy},
  title     = {Breaking Common Sense: {WHOOPS}! A Vision-and-Language Benchmark of Synthetic and Compositional Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2616--2627}
}
Consistent Depth Prediction for Transparent Object Reconstruction from RGB-D Camera: Yuxiang Cai,

Yifan Zhu,

Haiwei Zhang,

Bo Ren; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Yuxiang and Zhu, Yifan and Zhang, Haiwei and Ren, Bo},
  title     = {Consistent Depth Prediction for Transparent Object Reconstruction from {RGB-D} Camera},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3459--3468}
}
DReg-NeRF: Deep Registration for Neural Radiance Fields: Yu Chen,

Gim Hee Lee; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yu and Lee, Gim Hee},
  title     = {{DReg-NeRF}: Deep Registration for Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22703--22713}
}
DETR Does Not Need Multi-Scale or Locality Design: Yutong Lin,

Yuhui Yuan,

Zheng Zhang,

Chen Li,

Nanning Zheng,

Han Hu; [pdf] [supp]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Yutong and Yuan, Yuhui and Zhang, Zheng and Li, Chen and Zheng, Nanning and Hu, Han},
  title     = {{DETR} Does Not Need Multi-Scale or Locality Design},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6545--6554}
}
Towards Effective Instance Discrimination Contrastive Loss for Unsupervised Domain Adaptation: Yixin Zhang,

Zilei Wang,

Junjie Li,

Jiafan Zhuang,

Zihan Lin; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yixin and Wang, Zilei and Li, Junjie and Zhuang, Jiafan and Lin, Zihan},
  title     = {Towards Effective Instance Discrimination Contrastive Loss for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11388--11399}
}
ClusT3: Information Invariant Test-Time Training: Gustavo A. Vargas Hakim,

David Osowiechi,

Mehrdad Noori,

Milad Cheraghalikhani,

Ali Bahri,

Ismail Ben Ayed,

Christian Desrosiers; [pdf] [supp]
[bibtex]
@InProceedings{Hakim_2023_ICCV,
  author    = {Hakim, Gustavo A. Vargas and Osowiechi, David and Noori, Mehrdad and Cheraghalikhani, Milad and Bahri, Ali and Ben Ayed, Ismail and Desrosiers, Christian},
  title     = {{ClusT3}: Information Invariant Test-Time Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6136--6145}
}
FrozenRecon: Pose-free 3D Scene Reconstruction with Frozen Depth Models: Guangkai Xu,

Wei Yin,

Hao Chen,

Chunhua Shen,

Kai Cheng,

Feng Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Guangkai and Yin, Wei and Chen, Hao and Shen, Chunhua and Cheng, Kai and Zhao, Feng},
  title     = {{FrozenRecon}: Pose-free {3D} Scene Reconstruction with Frozen Depth Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9310--9320}
}
Affective Image Filter: Reflecting Emotions from Text to Images: Shuchen Weng,

Peixuan Zhang,

Zheng Chang,

Xinlong Wang,

Si Li,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Weng_2023_ICCV,
  author    = {Weng, Shuchen and Zhang, Peixuan and Chang, Zheng and Wang, Xinlong and Li, Si and Shi, Boxin},
  title     = {Affective Image Filter: Reflecting Emotions from Text to Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10810--10819}
}
Content-Aware Local GAN for Photo-Realistic Super-Resolution: JoonKyu Park,

Sanghyun Son,

Kyoung Mu Lee; [pdf] [supp]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, JoonKyu and Son, Sanghyun and Lee, Kyoung Mu},
  title     = {Content-Aware Local {GAN} for Photo-Realistic Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10585--10594}
}
Structure-Aware Surface Reconstruction via Primitive Assembly: Jingen Jiang,

Mingyang Zhao,

Shiqing Xin,

Yanchao Yang,

Hanxiao Wang,

Xiaohong Jia,

Dong-Ming Yan; [pdf]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Jingen and Zhao, Mingyang and Xin, Shiqing and Yang, Yanchao and Wang, Hanxiao and Jia, Xiaohong and Yan, Dong-Ming},
  title     = {Structure-Aware Surface Reconstruction via Primitive Assembly},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14171--14180}
}
FineDance: A Fine-grained Choreography Dataset for 3D Full Body Dance Generation: Ronghui Li,

Junfan Zhao,

Yachao Zhang,

Mingyang Su,

Zeping Ren,

Han Zhang,

Yansong Tang,

Xiu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Ronghui and Zhao, Junfan and Zhang, Yachao and Su, Mingyang and Ren, Zeping and Zhang, Han and Tang, Yansong and Li, Xiu},
  title     = {{FineDance}: A Fine-grained Choreography Dataset for {3D} Full Body Dance Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10234--10243}
}
AssetField: Assets Mining and Reconfiguration in Ground Feature Plane Representation: Yuanbo Xiangli,

Linning Xu,

Xingang Pan,

Nanxuan Zhao,

Bo Dai,

Dahua Lin; [pdf] [arXiv]
[bibtex]
@InProceedings{Xiangli_2023_ICCV,
  author    = {Xiangli, Yuanbo and Xu, Linning and Pan, Xingang and Zhao, Nanxuan and Dai, Bo and Lin, Dahua},
  title     = {{AssetField}: Assets Mining and Reconfiguration in Ground Feature Plane Representation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3251--3261}
}
Improving Online Lane Graph Extraction by Object-Lane Clustering: Yigit Baran Can,

Alexander Liniger,

Danda Pani Paudel,

Luc Van Gool; [pdf] [arXiv]
[bibtex]
@InProceedings{Can_2023_ICCV,
  author    = {Can, Yigit Baran and Liniger, Alexander and Paudel, Danda Pani and Van Gool, Luc},
  title     = {Improving Online Lane Graph Extraction by Object-Lane Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8591--8601},
}
SAGA: Spectral Adversarial Geometric Attack on 3D Meshes: Tomer Stolik,

Itai Lang,

Shai Avidan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Stolik_2023_ICCV,
  author    = {Stolik, Tomer and Lang, Itai and Avidan, Shai},
  title     = {{SAGA}: Spectral Adversarial Geometric Attack on {3D} Meshes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4284--4294},
}
All in Tokens: Unifying Output Space of Visual Tasks via Soft Token: Jia Ning,

Chen Li,

Zheng Zhang,

Chunyu Wang,

Zigang Geng,

Qi Dai,

Kun He,

Han Hu; [pdf] [arXiv]
[bibtex]
@InProceedings{Ning_2023_ICCV,
  author    = {Ning, Jia and Li, Chen and Zhang, Zheng and Wang, Chunyu and Geng, Zigang and Dai, Qi and He, Kun and Hu, Han},
  title     = {All in Tokens: Unifying Output Space of Visual Tasks via Soft Token},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19900--19910},
}
Learning Navigational Visual Representations with Semantic Map Supervision: Yicong Hong,

Yang Zhou,

Ruiyi Zhang,

Franck Dernoncourt,

Trung Bui,

Stephen Gould,

Hao Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Yicong and Zhou, Yang and Zhang, Ruiyi and Dernoncourt, Franck and Bui, Trung and Gould, Stephen and Tan, Hao},
  title     = {Learning Navigational Visual Representations with Semantic Map Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3055--3067},
}
LDL: Line Distance Functions for Panoramic Localization: Junho Kim,

Changwoon Choi,

Hojun Jang,

Young Min Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Junho and Choi, Changwoon and Jang, Hojun and Kim, Young Min},
  title     = {{LDL}: Line Distance Functions for Panoramic Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17882--17892},
}
TransTIC: Transferring Transformer-based Image Compression from Human Perception to Machine Perception: Yi-Hsin Chen,

Ying-Chieh Weng,

Chia-Hao Kao,

Cheng Chien,

Wei-Chen Chiu,

Wen-Hsiao Peng; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Chen_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yi-Hsin and Weng, Ying-Chieh and Kao, Chia-Hao and Chien, Cheng and Chiu, Wei-Chen and Peng, Wen-Hsiao},
  title     = {{TransTIC}: Transferring Transformer-based Image Compression from Human Perception to Machine Perception},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23297--23307},
}
CHORUS : Learning Canonicalized 3D Human-Object Spatial Relations from Unbounded Synthesized Images: Sookwan Han,

Hanbyul Joo; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Han_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Han_2023_ICCV,
  author    = {Han, Sookwan and Joo, Hanbyul},
  title     = {{CHORUS} : Learning Canonicalized {3D} Human-Object Spatial Relations from Unbounded Synthesized Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15835--15846},
}
Shortcut-V2V: Compression Framework for Video-to-Video Translation Based on Temporal Redundancy Reduction: Chaeyeon Chung,

Yeojeong Park,

Seunghwan Choi,

Munkhsoyol Ganbat,

Jaegul Choo; [pdf] [supp]
[bibtex]
@InProceedings{Chung_2023_ICCV,
  author    = {Chung, Chaeyeon and Park, Yeojeong and Choi, Seunghwan and Ganbat, Munkhsoyol and Choo, Jaegul},
  title     = {{Shortcut-V2V}: Compression Framework for Video-to-Video Translation Based on Temporal Redundancy Reduction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7612--7622},
}
ViLLA: Fine-Grained Vision-Language Representation Learning from Real-World Data: Maya Varma,

Jean-Benoit Delbrouck,

Sarah Hooper,

Akshay Chaudhari,

Curtis Langlotz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Varma_2023_ICCV,
  author    = {Varma, Maya and Delbrouck, Jean-Benoit and Hooper, Sarah and Chaudhari, Akshay and Langlotz, Curtis},
  title     = {{ViLLA}: Fine-Grained Vision-Language Representation Learning from Real-World Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22225--22235},
}
SG-Former: Self-guided Transformer with Evolving Token Reallocation: Sucheng Ren,

Xingyi Yang,

Songhua Liu,

Xinchao Wang; [pdf]
[bibtex]
@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Sucheng and Yang, Xingyi and Liu, Songhua and Wang, Xinchao},
  title     = {{SG-Former}: Self-guided Transformer with Evolving Token Reallocation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6003--6014},
}
Towards Unifying Medical Vision-and-Language Pre-Training via Soft Prompts: Zhihong Chen,

Shizhe Diao,

Benyou Wang,

Guanbin Li,

Xiang Wan; [pdf] [arXiv]
[bibtex]
% NOTE(review): citation key Chen_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhihong and Diao, Shizhe and Wang, Benyou and Li, Guanbin and Wan, Xiang},
  title     = {Towards Unifying Medical Vision-and-Language Pre-Training via Soft Prompts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23403--23413},
}
A Large-scale Study of Spatiotemporal Representation Learning with a New Benchmark on Action Recognition: Andong Deng,

Taojiannan Yang,

Chen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Andong and Yang, Taojiannan and Chen, Chen},
  title     = {A Large-scale Study of Spatiotemporal Representation Learning with a New Benchmark on Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20519--20531},
}
Video Background Music Generation: Dataset, Method and Evaluation: Le Zhuo,

Zhaokai Wang,

Baisen Wang,

Yue Liao,

Chenxi Bao,

Stanley Peng,

Songhao Han,

Aixi Zhang,

Fei Fang,

Si Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhuo_2023_ICCV,
  author    = {Zhuo, Le and Wang, Zhaokai and Wang, Baisen and Liao, Yue and Bao, Chenxi and Peng, Stanley and Han, Songhao and Zhang, Aixi and Fang, Fei and Liu, Si},
  title     = {Video Background Music Generation: Dataset, Method and Evaluation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15637--15647},
}
HoloFusion: Towards Photo-realistic 3D Generative Modeling: Animesh Karnewar,

Niloy J. Mitra,

Andrea Vedaldi,

David Novotny; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Karnewar_2023_ICCV,
  author    = {Karnewar, Animesh and Mitra, Niloy J. and Vedaldi, Andrea and Novotny, David},
  title     = {{HoloFusion}: Towards Photo-realistic {3D} Generative Modeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22976--22985},
}
ProtoTransfer: Cross-Modal Prototype Transfer for Point Cloud Segmentation: Pin Tang,

Hai-Ming Xu,

Chao Ma; [pdf] [supp]
[bibtex]
% NOTE(review): citation key Tang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Pin and Xu, Hai-Ming and Ma, Chao},
  title     = {{ProtoTransfer}: Cross-Modal Prototype Transfer for Point Cloud Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3337--3347},
}
Improving Continuous Sign Language Recognition with Cross-Lingual Signs: Fangyun Wei,

Yutong Chen; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Wei_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Fangyun and Chen, Yutong},
  title     = {Improving Continuous Sign Language Recognition with Cross-Lingual Signs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23612--23621},
}
Markov Game Video Augmentation for Action Segmentation: Nicolas Aziere,

Sinisa Todorovic; [pdf] [supp]
[bibtex]
@InProceedings{Aziere_2023_ICCV,
  author    = {Aziere, Nicolas and Todorovic, Sinisa},
  title     = {Markov Game Video Augmentation for Action Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13505--13514},
}
Deep Image Harmonization with Globally Guided Feature Transformation and Relation Distillation: Li Niu,

Linfeng Tan,

Xinhao Tao,

Junyan Cao,

Fengjun Guo,

Teng Long,

Liqing Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Li and Tan, Linfeng and Tao, Xinhao and Cao, Junyan and Guo, Fengjun and Long, Teng and Zhang, Liqing},
  title     = {Deep Image Harmonization with Globally Guided Feature Transformation and Relation Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7723--7732},
}
TransIFF: An Instance-Level Feature Fusion Framework for Vehicle-Infrastructure Cooperative 3D Detection with Transformers: Ziming Chen,

Yifeng Shi,

Jinrang Jia; [pdf] [supp]
[bibtex]
% NOTE(review): citation key Chen_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ziming and Shi, Yifeng and Jia, Jinrang},
  title     = {{TransIFF}: An Instance-Level Feature Fusion Framework for Vehicle-Infrastructure Cooperative {3D} Detection with Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18205--18214},
}
RegFormer: An Efficient Projection-Aware Transformer Network for Large-Scale Point Cloud Registration: Jiuming Liu,

Guangming Wang,

Zhe Liu,

Chaokang Jiang,

Marc Pollefeys,

Hesheng Wang; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Liu_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jiuming and Wang, Guangming and Liu, Zhe and Jiang, Chaokang and Pollefeys, Marc and Wang, Hesheng},
  title     = {{RegFormer}: An Efficient Projection-Aware Transformer Network for Large-Scale Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8451--8460},
}
Masked Retraining Teacher-Student Framework for Domain Adaptive Object Detection: Zijing Zhao,

Sitong Wei,

Qingchao Chen,

Dehui Li,

Yifan Yang,

Yuxin Peng,

Yang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Zijing and Wei, Sitong and Chen, Qingchao and Li, Dehui and Yang, Yifan and Peng, Yuxin and Liu, Yang},
  title     = {Masked Retraining Teacher-Student Framework for Domain Adaptive Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19039--19049},
}
Prune Spatio-temporal Tokens by Semantic-aware Temporal Accumulation: Shuangrui Ding,

Peisen Zhao,

Xiaopeng Zhang,

Rui Qian,

Hongkai Xiong,

Qi Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ding_2023_ICCV,
  author    = {Ding, Shuangrui and Zhao, Peisen and Zhang, Xiaopeng and Qian, Rui and Xiong, Hongkai and Tian, Qi},
  title     = {Prune Spatio-temporal Tokens by Semantic-aware Temporal Accumulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16945--16956},
}
VQ3D: Learning a 3D-Aware Generative Model on ImageNet: Kyle Sargent,

Jing Yu Koh,

Han Zhang,

Huiwen Chang,

Charles Herrmann,

Pratul Srinivasan,

Jiajun Wu,

Deqing Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sargent_2023_ICCV,
  author    = {Sargent, Kyle and Koh, Jing Yu and Zhang, Han and Chang, Huiwen and Herrmann, Charles and Srinivasan, Pratul and Wu, Jiajun and Sun, Deqing},
  title     = {{VQ3D}: Learning a {3D}-Aware Generative Model on {ImageNet}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4240--4250},
}
Growing a Brain with Sparsity-Inducing Generation for Continual Learning: Hyundong Jin,

Gyeong-hyeon Kim,

Chanho Ahn,

Eunwoo Kim; [pdf]
[bibtex]
@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Hyundong and Kim, Gyeong-hyeon and Ahn, Chanho and Kim, Eunwoo},
  title     = {Growing a Brain with Sparsity-Inducing Generation for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18961--18970},
}
Cross-Ray Neural Radiance Fields for Novel-View Synthesis from Unconstrained Image Collections: Yifan Yang,

Shuhai Zhang,

Zixiong Huang,

Yubing Zhang,

Mingkui Tan; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Yang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yifan and Zhang, Shuhai and Huang, Zixiong and Zhang, Yubing and Tan, Mingkui},
  title     = {Cross-Ray Neural Radiance Fields for Novel-View Synthesis from Unconstrained Image Collections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15901--15911},
}
Graphics2RAW: Mapping Computer Graphics Images to Sensor RAW Images: Donghwan Seo,

Abhijith Punnappurath,

Luxi Zhao,

Abdelrahman Abdelhamed,

Sai Kiran Tedla,

Sanguk Park,

Jihwan Choe,

Michael S. Brown; [pdf] [supp]
[bibtex]
@InProceedings{Seo_2023_ICCV,
  author    = {Seo, Donghwan and Punnappurath, Abhijith and Zhao, Luxi and Abdelhamed, Abdelrahman and Tedla, Sai Kiran and Park, Sanguk and Choe, Jihwan and Brown, Michael S.},
  title     = {{Graphics2RAW}: Mapping Computer Graphics Images to Sensor {RAW} Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12622--12631},
}
SPACE: Speech-driven Portrait Animation with Controllable Expression: Siddharth Gururani,

Arun Mallya,

Ting-Chun Wang,

Rafael Valle,

Ming-Yu Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gururani_2023_ICCV,
  author    = {Gururani, Siddharth and Mallya, Arun and Wang, Ting-Chun and Valle, Rafael and Liu, Ming-Yu},
  title     = {{SPACE}: Speech-driven Portrait Animation with Controllable Expression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20914--20923},
}
2D-3D Interlaced Transformer for Point Cloud Segmentation with Scene-Level Supervision: Cheng-Kun Yang,

Min-Hung Chen,

Yung-Yu Chuang,

Yen-Yu Lin; [pdf] [supp]
[bibtex]
% NOTE(review): citation key Yang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Cheng-Kun and Chen, Min-Hung and Chuang, Yung-Yu and Lin, Yen-Yu},
  title     = {{2D-3D} Interlaced Transformer for Point Cloud Segmentation with Scene-Level Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {977--987},
}
Collecting The Puzzle Pieces: Disentangled Self-Driven Human Pose Transfer by Permuting Textures: Nannan Li,

Kevin J Shih,

Bryan A. Plummer; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Li_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Li_2023_ICCV,
  author    = {Li, Nannan and Shih, Kevin J and Plummer, Bryan A.},
  title     = {Collecting The Puzzle Pieces: Disentangled Self-Driven Human Pose Transfer by Permuting Textures},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7126--7137},
}
VAD: Vectorized Scene Representation for Efficient Autonomous Driving: Bo Jiang,

Shaoyu Chen,

Qing Xu,

Bencheng Liao,

Jiajie Chen,

Helong Zhou,

Qian Zhang,

Wenyu Liu,

Chang Huang,

Xinggang Wang; [pdf] [arXiv]
[bibtex]
% NOTE(review): citation key Jiang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Bo and Chen, Shaoyu and Xu, Qing and Liao, Bencheng and Chen, Jiajie and Zhou, Helong and Zhang, Qian and Liu, Wenyu and Huang, Chang and Wang, Xinggang},
  title     = {{VAD}: Vectorized Scene Representation for Efficient Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8340--8350},
}
End-to-end 3D Tracking with Decoupled Queries: Yanwei Li,

Zhiding Yu,

Jonah Philion,

Anima Anandkumar,

Sanja Fidler,

Jiaya Jia,

Jose Alvarez; [pdf]
[bibtex]
% NOTE(review): citation key Li_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yanwei and Yu, Zhiding and Philion, Jonah and Anandkumar, Anima and Fidler, Sanja and Jia, Jiaya and Alvarez, Jose},
  title     = {End-to-end {3D} Tracking with Decoupled Queries},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18302--18311},
}
Sound Localization from Motion: Jointly Learning Sound Direction and Camera Rotation: Ziyang Chen,

Shengyi Qian,

Andrew Owens; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Chen_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ziyang and Qian, Shengyi and Owens, Andrew},
  title     = {Sound Localization from Motion: Jointly Learning Sound Direction and Camera Rotation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7897--7908},
}
Batch-based Model Registration for Fast 3D Sherd Reconstruction: Jiepeng Wang,

Congyi Zhang,

Peng Wang,

Xin Li,

Peter J. Cobb,

Christian Theobalt,

Wenping Wang; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Wang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiepeng and Zhang, Congyi and Wang, Peng and Li, Xin and Cobb, Peter J. and Theobalt, Christian and Wang, Wenping},
  title     = {Batch-based Model Registration for Fast {3D} Sherd Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14519--14529},
}
HiFace: High-Fidelity 3D Face Reconstruction by Learning Static and Dynamic Details: Zenghao Chai,

Tianke Zhang,

Tianyu He,

Xu Tan,

Tadas Baltrusaitis,

HsiangTao Wu,

Runnan Li,

Sheng Zhao,

Chun Yuan,

Jiang Bian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chai_2023_ICCV,
  author    = {Chai, Zenghao and Zhang, Tianke and He, Tianyu and Tan, Xu and Baltrusaitis, Tadas and Wu, HsiangTao and Li, Runnan and Zhao, Sheng and Yuan, Chun and Bian, Jiang},
  title     = {{HiFace}: High-Fidelity {3D} Face Reconstruction by Learning Static and Dynamic Details},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9087--9098},
}
Fast and Accurate Transferability Measurement by Evaluating Intra-class Feature Variance: Huiwen Xu,

U Kang; [pdf] [arXiv]
[bibtex]
% NOTE(review): citation key Xu_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Huiwen and Kang, U},
  title     = {Fast and Accurate Transferability Measurement by Evaluating Intra-class Feature Variance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11474--11482},
}
Deformable Model-Driven Neural Rendering for High-Fidelity 3D Reconstruction of Human Heads Under Low-View Settings: Baixin Xu,

Jiarui Zhang,

Kwan-Yee Lin,

Chen Qian,

Ying He; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Xu_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Baixin and Zhang, Jiarui and Lin, Kwan-Yee and Qian, Chen and He, Ying},
  title     = {Deformable Model-Driven Neural Rendering for High-Fidelity {3D} Reconstruction of Human Heads Under Low-View Settings},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17924--17934},
}
Algebraically Rigorous Quaternion Framework for the Neural Network Pose Estimation Problem: Chen Lin,

Andrew J. Hanson,

Sonya M. Hanson; [pdf]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Chen and Hanson, Andrew J. and Hanson, Sonya M.},
  title     = {Algebraically Rigorous Quaternion Framework for the Neural Network Pose Estimation Problem},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14097--14106},
}
Prompt Tuning Inversion for Text-driven Image Editing Using Diffusion Models: Wenkai Dong,

Song Xue,

Xiaoyue Duan,

Shumin Han; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Dong_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Wenkai and Xue, Song and Duan, Xiaoyue and Han, Shumin},
  title     = {Prompt Tuning Inversion for Text-driven Image Editing Using Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7430--7440},
}
CVSformer: Cross-View Synthesis Transformer for Semantic Scene Completion: Haotian Dong,

Enhui Ma,

Lubo Wang,

Miaohui Wang,

Wuyuan Xie,

Qing Guo,

Ping Li,

Lingyu Liang,

Kairui Yang,

Di Lin; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Dong_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Haotian and Ma, Enhui and Wang, Lubo and Wang, Miaohui and Xie, Wuyuan and Guo, Qing and Li, Ping and Liang, Lingyu and Yang, Kairui and Lin, Di},
  title     = {{CVSformer}: Cross-View Synthesis Transformer for Semantic Scene Completion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8874--8883},
}
UrbanGIRAFFE: Representing Urban Scenes as Compositional Generative Neural Feature Fields: Yuanbo Yang,

Yifei Yang,

Hanlei Guo,

Rong Xiong,

Yue Wang,

Yiyi Liao; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Yang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yuanbo and Yang, Yifei and Guo, Hanlei and Xiong, Rong and Wang, Yue and Liao, Yiyi},
  title     = {{UrbanGIRAFFE}: Representing Urban Scenes as Compositional Generative Neural Feature Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9199--9210},
}
UnitedHuman: Harnessing Multi-Source Data for High-Resolution Human Generation: Jianglin Fu,

Shikai Li,

Yuming Jiang,

Kwan-Yee Lin,

Wayne Wu,

Ziwei Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Jianglin and Li, Shikai and Jiang, Yuming and Lin, Kwan-Yee and Wu, Wayne and Liu, Ziwei},
  title     = {{UnitedHuman}: Harnessing Multi-Source Data for High-Resolution Human Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7301--7311},
}
Active Neural Mapping: Zike Yan,

Haoxiang Yang,

Hongbin Zha; [pdf] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Zike and Yang, Haoxiang and Zha, Hongbin},
  title     = {Active Neural Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10981--10992},
}
Density-invariant Features for Distant Point Cloud Registration: Quan Liu,

Hongzi Zhu,

Yunsong Zhou,

Hongyang Li,

Shan Chang,

Minyi Guo; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Liu_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Quan and Zhu, Hongzi and Zhou, Yunsong and Li, Hongyang and Chang, Shan and Guo, Minyi},
  title     = {Density-invariant Features for Distant Point Cloud Registration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18215--18225},
}
UniverSeg: Universal Medical Image Segmentation: Victor Ion Butoi,

Jose Javier Gonzalez Ortiz,

Tianyu Ma,

Mert R. Sabuncu,

John Guttag,

Adrian V. Dalca; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Butoi_2023_ICCV,
  author    = {Butoi, Victor Ion and Ortiz, Jose Javier Gonzalez and Ma, Tianyu and Sabuncu, Mert R. and Guttag, John and Dalca, Adrian V.},
  title     = {{UniverSeg}: Universal Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21438--21451},
}
RecRecNet: Rectangling Rectified Wide-Angle Images by Thin-Plate Spline Model and DoF-based Curriculum Learning: Kang Liao,

Lang Nie,

Chunyu Lin,

Zishuo Zheng,

Yao Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liao_2023_ICCV,
  author    = {Liao, Kang and Nie, Lang and Lin, Chunyu and Zheng, Zishuo and Zhao, Yao},
  title     = {{RecRecNet}: Rectangling Rectified Wide-Angle Images by Thin-Plate Spline Model and {DoF}-based Curriculum Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10800--10809},
}
Neural Microfacet Fields for Inverse Rendering: Alexander Mai,

Dor Verbin,

Falko Kuester,

Sara Fridovich-Keil; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mai_2023_ICCV,
  author    = {Mai, Alexander and Verbin, Dor and Kuester, Falko and Fridovich-Keil, Sara},
  title     = {Neural Microfacet Fields for Inverse Rendering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {408--418},
}
Understanding Self-attention Mechanism via Dynamical System Perspective: Zhongzhan Huang,

Mingfu Liang,

Jinghui Qin,

Shanshan Zhong,

Liang Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhongzhan and Liang, Mingfu and Qin, Jinghui and Zhong, Shanshan and Lin, Liang},
  title     = {Understanding Self-attention Mechanism via Dynamical System Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1412--1422},
}
Learning Versatile 3D Shape Generation with Improved Auto-regressive Models: Simian Luo,

Xuelin Qian,

Yanwei Fu,

Yinda Zhang,

Ying Tai,

Zhenyu Zhang,

Chengjie Wang,

Xiangyang Xue; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Simian and Qian, Xuelin and Fu, Yanwei and Zhang, Yinda and Tai, Ying and Zhang, Zhenyu and Wang, Chengjie and Xue, Xiangyang},
  title     = {Learning Versatile {3D} Shape Generation with Improved Auto-regressive Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14139--14149},
}
DETA: Denoised Task Adaptation for Few-Shot Learning: Ji Zhang,

Lianli Gao,

Xu Luo,

Hengtao Shen,

Jingkuan Song; [pdf] [arXiv]
[bibtex]
% NOTE(review): citation key Zhang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Ji and Gao, Lianli and Luo, Xu and Shen, Hengtao and Song, Jingkuan},
  title     = {{DETA}: Denoised Task Adaptation for Few-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11541--11551},
}
DDG-Net: Discriminability-Driven Graph Network for Weakly-supervised Temporal Action Localization: Xiaojun Tang,

Junsong Fan,

Chuanchen Luo,

Zhaoxiang Zhang,

Man Zhang,

Zongyuan Yang; [pdf] [supp]
[bibtex]
% NOTE(review): citation key Tang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Xiaojun and Fan, Junsong and Luo, Chuanchen and Zhang, Zhaoxiang and Zhang, Man and Yang, Zongyuan},
  title     = {{DDG-Net}: Discriminability-Driven Graph Network for Weakly-supervised Temporal Action Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6622--6632},
}
Diffusion Models as Masked Autoencoders: Chen Wei,

Karttikeya Mangalam,

Po-Yao Huang,

Yanghao Li,

Haoqi Fan,

Hu Xu,

Huiyu Wang,

Cihang Xie,

Alan Yuille,

Christoph Feichtenhofer; [pdf] [supp] [arXiv]
[bibtex]
% NOTE(review): citation key Wei_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Chen and Mangalam, Karttikeya and Huang, Po-Yao and Li, Yanghao and Fan, Haoqi and Xu, Hu and Wang, Huiyu and Xie, Cihang and Yuille, Alan and Feichtenhofer, Christoph},
  title     = {Diffusion Models as Masked Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16284--16294},
}
Robust Frame-to-Frame Camera Rotation Estimation in Crowded Scenes: Fabien Delattre,

David Dirnfeld,

Phat Nguyen,

Stephen K Scarano,

Michael J Jones,

Pedro Miraldo,

Erik Learned-Miller; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Delattre_2023_ICCV,
  author    = {Delattre, Fabien and Dirnfeld, David and Nguyen, Phat and Scarano, Stephen K and Jones, Michael J and Miraldo, Pedro and Learned-Miller, Erik},
  title     = {Robust Frame-to-Frame Camera Rotation Estimation in Crowded Scenes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9752--9762},
}
Bayesian Prompt Learning for Image-Language Model Generalization: Mohammad Mahdi Derakhshani,

Enrique Sanchez,

Adrian Bulat,

Victor G. Turrisi da Costa,

Cees G.M. Snoek,

Georgios Tzimiropoulos,

Brais Martinez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Derakhshani_2023_ICCV,
  author    = {Derakhshani, Mohammad Mahdi and Sanchez, Enrique and Bulat, Adrian and da Costa, Victor G. Turrisi and Snoek, Cees G. M. and Tzimiropoulos, Georgios and Martinez, Brais},
  title     = {Bayesian Prompt Learning for Image-Language Model Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15237--15246},
}
One-Shot Recognition of Any Material Anywhere Using Contrastive Learning with Physics-Based Rendering: Manuel S. Drehwald,

Sagi Eppel,

Jolina Li,

Han Hao,

Alan Aspuru-Guzik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Drehwald_2023_ICCV,
  author    = {Drehwald, Manuel S. and Eppel, Sagi and Li, Jolina and Hao, Han and Aspuru-Guzik, Alan},
  title     = {One-Shot Recognition of Any Material Anywhere Using Contrastive Learning with Physics-Based Rendering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23524--23533},
}
DiLiGenT-Pi: Photometric Stereo for Planar Surfaces with Rich Details - Benchmark Dataset and Beyond: Feishi Wang,

Jieji Ren,

Heng Guo,

Mingjun Ren,

Boxin Shi; [pdf] [supp]
[bibtex]
% NOTE(review): citation key Wang_2023_ICCV is shared with other entries in this file; make it unique before citing.
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Feishi and Ren, Jieji and Guo, Heng and Ren, Mingjun and Shi, Boxin},
  title     = {{DiLiGenT-Pi}: Photometric Stereo for Planar Surfaces with Rich Details - Benchmark Dataset and Beyond},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9477--9487},
}
Rethinking Data Distillation: Do Not Overlook Calibration: Dongyao Zhu,

Bowen Lei,

Jie Zhang,

Yanbo Fang,

Yiqun Xie,

Ruqi Zhang,

Dongkuan Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Dongyao and Lei, Bowen and Zhang, Jie and Fang, Yanbo and Xie, Yiqun and Zhang, Ruqi and Xu, Dongkuan},
  title     = {Rethinking Data Distillation: Do Not Overlook Calibration},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4935--4945},
}
Accurate and Fast Compressed Video Captioning: Yaojie Shen,

Xin Gu,

Kai Xu,

Heng Fan,

Longyin Wen,

Libo Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Yaojie and Gu, Xin and Xu, Kai and Fan, Heng and Wen, Longyin and Zhang, Libo},
  title     = {Accurate and Fast Compressed Video Captioning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15558--15567},
}
Building Vision Transformers with Hierarchy Aware Feature Aggregation: Yongjie Chen,

Hongmin Liu,

Haoran Yin,

Bin Fan; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
    author    = {Chen, Yongjie and Liu, Hongmin and Yin, Haoran and Fan, Bin},
    title     = {Building Vision Transformers with Hierarchy Aware Feature Aggregation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {5908--5918}
}
Visible-Infrared Person Re-Identification via Semantic Alignment and Affinity Inference: Xingye Fang,

Yang Yang,

Ying Fu; [pdf] [supp]
[bibtex]
@InProceedings{Fang_2023_ICCV,
    author    = {Fang, Xingye and Yang, Yang and Fu, Ying},
    title     = {Visible-Infrared Person Re-Identification via Semantic Alignment and Affinity Inference},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11270--11279}
}
SAL-ViT: Towards Latency Efficient Private Inference on ViT using Selective Attention Search with a Learnable Softmax Approximation: Yuke Zhang,

Dake Chen,

Souvik Kundu,

Chenghao Li,

Peter A. Beerel; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Yuke and Chen, Dake and Kundu, Souvik and Li, Chenghao and Beerel, Peter A.},
    title     = {{SAL-ViT}: Towards Latency Efficient Private Inference on {ViT} using Selective Attention Search with a Learnable Softmax Approximation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {5116--5125}
}
TIJO: Trigger Inversion with Joint Optimization for Defending Multimodal Backdoored Models: Indranil Sur,

Karan Sikka,

Matthew Walmer,

Kaushik Koneripalli,

Anirban Roy,

Xiao Lin,

Ajay Divakaran,

Susmit Jha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sur_2023_ICCV,
    author    = {Sur, Indranil and Sikka, Karan and Walmer, Matthew and Koneripalli, Kaushik and Roy, Anirban and Lin, Xiao and Divakaran, Ajay and Jha, Susmit},
    title     = {{TIJO}: Trigger Inversion with Joint Optimization for Defending Multimodal Backdoored Models},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {165--175}
}
DG3D: Generating High Quality 3D Textured Shapes by Learning to Discriminate Multi-Modal Diffusion-Renderings: Qi Zuo,

Yafei Song,

Jianfang Li,

Lin Liu,

Liefeng Bo; [pdf] [supp]
[bibtex]
@InProceedings{Zuo_2023_ICCV,
    author    = {Zuo, Qi and Song, Yafei and Li, Jianfang and Liu, Lin and Bo, Liefeng},
    title     = {{DG3D}: Generating High Quality {3D} Textured Shapes by Learning to Discriminate Multi-Modal Diffusion-Renderings},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {14575--14584}
}
Improving Adversarial Robustness of Masked Autoencoders via Test-time Frequency-domain Prompting: Qidong Huang,

Xiaoyi Dong,

Dongdong Chen,

Yinpeng Chen,

Lu Yuan,

Gang Hua,

Weiming Zhang,

Nenghai Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Qidong and Dong, Xiaoyi and Chen, Dongdong and Chen, Yinpeng and Yuan, Lu and Hua, Gang and Zhang, Weiming and Yu, Nenghai},
    title     = {Improving Adversarial Robustness of Masked Autoencoders via Test-time Frequency-domain Prompting},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {1600--1610}
}
HairCLIPv2: Unifying Hair Editing via Proxy Feature Blending: Tianyi Wei,

Dongdong Chen,

Wenbo Zhou,

Jing Liao,

Weiming Zhang,

Gang Hua,

Nenghai Yu; [pdf] [supp]
[bibtex]
@InProceedings{Wei_2023_ICCV,
    author    = {Wei, Tianyi and Chen, Dongdong and Zhou, Wenbo and Liao, Jing and Zhang, Weiming and Hua, Gang and Yu, Nenghai},
    title     = {{HairCLIPv2}: Unifying Hair Editing via Proxy Feature Blending},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {23589--23599}
}
VLSlice: Interactive Vision-and-Language Slice Discovery: Eric Slyman,

Minsuk Kahng,

Stefan Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Slyman_2023_ICCV,
    author    = {Slyman, Eric and Kahng, Minsuk and Lee, Stefan},
    title     = {{VLSlice}: Interactive Vision-and-Language Slice Discovery},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {15291--15301}
}
Learning to Ground Instructional Articles in Videos through Narrations: Effrosyni Mavroudi,

Triantafyllos Afouras,

Lorenzo Torresani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mavroudi_2023_ICCV,
    author    = {Mavroudi, Effrosyni and Afouras, Triantafyllos and Torresani, Lorenzo},
    title     = {Learning to Ground Instructional Articles in Videos through Narrations},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {15201--15213}
}
DocTr: Document Transformer for Structured Information Extraction in Documents: Haofu Liao,

Aruni RoyChowdhury,

Weijian Li,

Ankan Bansal,

Yuting Zhang,

Zhuowen Tu,

Ravi Kumar Satzoda,

R. Manmatha,

Vijay Mahadevan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liao_2023_ICCV,
    author    = {Liao, Haofu and RoyChowdhury, Aruni and Li, Weijian and Bansal, Ankan and Zhang, Yuting and Tu, Zhuowen and Satzoda, Ravi Kumar and Manmatha, R. and Mahadevan, Vijay},
    title     = {{DocTr}: Document Transformer for Structured Information Extraction in Documents},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {19584--19594}
}
The Making and Breaking of Camouflage: Hala Lamdouar,

Weidi Xie,

Andrew Zisserman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lamdouar_2023_ICCV,
    author    = {Lamdouar, Hala and Xie, Weidi and Zisserman, Andrew},
    title     = {The Making and Breaking of Camouflage},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {832--842}
}
Role-Aware Interaction Generation from Textual Description: Mikihiro Tanaka,

Kent Fujiwara; [pdf] [supp]
[bibtex]
@InProceedings{Tanaka_2023_ICCV,
    author    = {Tanaka, Mikihiro and Fujiwara, Kent},
    title     = {Role-Aware Interaction Generation from Textual Description},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {15999--16009}
}
MAMo: Leveraging Memory and Attention for Monocular Video Depth Estimation: Rajeev Yasarla,

Hong Cai,

Jisoo Jeong,

Yunxiao Shi,

Risheek Garrepalli,

Fatih Porikli; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yasarla_2023_ICCV,
    author    = {Yasarla, Rajeev and Cai, Hong and Jeong, Jisoo and Shi, Yunxiao and Garrepalli, Risheek and Porikli, Fatih},
    title     = {{MAMo}: Leveraging Memory and Attention for Monocular Video Depth Estimation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {8754--8764}
}
Continual Learning for Personalized Co-speech Gesture Generation: Chaitanya Ahuja,

Pratik Joshi,

Ryo Ishii,

Louis-Philippe Morency; [pdf] [supp]
[bibtex]
@InProceedings{Ahuja_2023_ICCV,
    author    = {Ahuja, Chaitanya and Joshi, Pratik and Ishii, Ryo and Morency, Louis-Philippe},
    title     = {Continual Learning for Personalized Co-speech Gesture Generation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {20893--20903}
}
Object as Query: Lifting Any 2D Object Detector to 3D Detection: Zitian Wang,

Zehao Huang,

Jiahui Fu,

Naiyan Wang,

Si Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Zitian and Huang, Zehao and Fu, Jiahui and Wang, Naiyan and Liu, Si},
    title     = {Object as Query: Lifting Any {2D} Object Detector to {3D} Detection},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {3791--3800}
}
HDG-ODE: A Hierarchical Continuous-Time Model for Human Pose Forecasting: Yucheng Xing,

Xin Wang; [pdf]
[bibtex]
@InProceedings{Xing_2023_ICCV,
    author    = {Xing, Yucheng and Wang, Xin},
    title     = {{HDG-ODE}: A Hierarchical Continuous-Time Model for Human Pose Forecasting},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {14700--14712}
}
Versatile Diffusion: Text, Images and Variations All in One Diffusion Model: Xingqian Xu,

Zhangyang Wang,

Gong Zhang,

Kai Wang,

Humphrey Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Xingqian and Wang, Zhangyang and Zhang, Gong and Wang, Kai and Shi, Humphrey},
    title     = {Versatile Diffusion: Text, Images and Variations All in One Diffusion Model},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {7754--7765}
}
DreamTeacher: Pretraining Image Backbones with Deep Generative Models: Daiqing Li,

Huan Ling,

Amlan Kar,

David Acuna,

Seung Wook Kim,

Karsten Kreis,

Antonio Torralba,

Sanja Fidler; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Daiqing and Ling, Huan and Kar, Amlan and Acuna, David and Kim, Seung Wook and Kreis, Karsten and Torralba, Antonio and Fidler, Sanja},
    title     = {{DreamTeacher}: Pretraining Image Backbones with Deep Generative Models},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {16698--16708}
}
Decomposition-Based Variational Network for Multi-Contrast MRI Super-Resolution and Reconstruction: Pengcheng Lei,

Faming Fang,

Guixu Zhang,

Tieyong Zeng; [pdf] [supp]
[bibtex]
@InProceedings{Lei_2023_ICCV,
    author    = {Lei, Pengcheng and Fang, Faming and Zhang, Guixu and Zeng, Tieyong},
    title     = {Decomposition-Based Variational Network for Multi-Contrast {MRI} Super-Resolution and Reconstruction},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {21296--21306}
}
Self-supervised Monocular Underwater Depth Recovery, Image Restoration, and a Real-sea Video Dataset: Nisha Varghese,

Ashish Kumar,

A. N. Rajagopalan; [pdf] [supp]
[bibtex]
@InProceedings{Varghese_2023_ICCV,
    author    = {Varghese, Nisha and Kumar, Ashish and Rajagopalan, A. N.},
    title     = {Self-supervised Monocular Underwater Depth Recovery, Image Restoration, and a Real-sea Video Dataset},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {12248--12258}
}
Geometrized Transformer for Self-Supervised Homography Estimation: Jiazhen Liu,

Xirong Li; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Jiazhen and Li, Xirong},
    title     = {Geometrized Transformer for Self-Supervised Homography Estimation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {9556--9565}
}
Sat2Density: Faithful Density Learning from Satellite-Ground Image Pairs: Ming Qian,

Jincheng Xiong,

Gui-Song Xia,

Nan Xue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qian_2023_ICCV,
    author    = {Qian, Ming and Xiong, Jincheng and Xia, Gui-Song and Xue, Nan},
    title     = {{Sat2Density}: Faithful Density Learning from Satellite-Ground Image Pairs},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {3683--3692}
}
TiDy-PSFs: Computational Imaging with Time-Averaged Dynamic Point-Spread-Functions: Sachin Shah,

Sakshum Kulshrestha,

Christopher A. Metzler; [pdf] [supp]
[bibtex]
@InProceedings{Shah_2023_ICCV,
    author    = {Shah, Sachin and Kulshrestha, Sakshum and Metzler, Christopher A.},
    title     = {{TiDy-PSFs}: Computational Imaging with Time-Averaged Dynamic Point-Spread-Functions},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {10657--10667}
}
Expressive Text-to-Image Generation with Rich Text: Songwei Ge,

Taesung Park,

Jun-Yan Zhu,

Jia-Bin Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ge_2023_ICCV,
    author    = {Ge, Songwei and Park, Taesung and Zhu, Jun-Yan and Huang, Jia-Bin},
    title     = {Expressive Text-to-Image Generation with Rich Text},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {7545--7556}
}
Learning Fine-Grained Features for Pixel-Wise Video Correspondences: Rui Li,

Shenglong Zhou,

Dong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Rui and Zhou, Shenglong and Liu, Dong},
    title     = {Learning Fine-Grained Features for Pixel-Wise Video Correspondences},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {9632--9641}
}
FS-DETR: Few-Shot DEtection TRansformer with Prompting and without Re-Training: Adrian Bulat,

Ricardo Guerrero,

Brais Martinez,

Georgios Tzimiropoulos; [pdf] [supp]
[bibtex]
@InProceedings{Bulat_2023_ICCV,
    author    = {Bulat, Adrian and Guerrero, Ricardo and Martinez, Brais and Tzimiropoulos, Georgios},
    title     = {{FS-DETR}: Few-Shot {DEtection} {TRansformer} with Prompting and without Re-Training},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11793--11802}
}
Semi-supervised Speech-driven 3D Facial Animation via Cross-modal Encoding: Peiji Yang,

Huawei Wei,

Yicheng Zhong,

Zhisheng Wang; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Peiji and Wei, Huawei and Zhong, Yicheng and Wang, Zhisheng},
    title     = {Semi-supervised Speech-driven {3D} Facial Animation via Cross-modal Encoding},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {21032--21041}
}
Learning to Learn: How to Continuously Teach Humans and Machines: Parantak Singh,

You Li,

Ankur Sikarwar,

Stan Weixian Lei,

Difei Gao,

Morgan B. Talbot,

Ying Sun,

Mike Zheng Shou,

Gabriel Kreiman,

Mengmi Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Singh_2023_ICCV,
    author    = {Singh, Parantak and Li, You and Sikarwar, Ankur and Lei, Stan Weixian and Gao, Difei and Talbot, Morgan B. and Sun, Ying and Shou, Mike Zheng and Kreiman, Gabriel and Zhang, Mengmi},
    title     = {Learning to Learn: How to Continuously Teach Humans and Machines},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11708--11719}
}
Text-Driven Generative Domain Adaptation with Spectral Consistency Regularization: Zhenhuan Liu,

Liang Li,

Jiayu Xiao,

Zheng-Jun Zha,

Qingming Huang; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Zhenhuan and Li, Liang and Xiao, Jiayu and Zha, Zheng-Jun and Huang, Qingming},
    title     = {Text-Driven Generative Domain Adaptation with Spectral Consistency Regularization},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {7019--7029}
}
A 5-Point Minimal Solver for Event Camera Relative Motion Estimation: Ling Gao,

Hang Su,

Daniel Gehrig,

Marco Cannici,

Davide Scaramuzza,

Laurent Kneip; [pdf]
[bibtex]
@InProceedings{Gao_2023_ICCV,
    author    = {Gao, Ling and Su, Hang and Gehrig, Daniel and Cannici, Marco and Scaramuzza, Davide and Kneip, Laurent},
    title     = {A 5-Point Minimal Solver for Event Camera Relative Motion Estimation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {8049--8059}
}
TM2D: Bimodality Driven 3D Dance Generation via Music-Text Integration: Kehong Gong,

Dongze Lian,

Heng Chang,

Chuan Guo,

Zihang Jiang,

Xinxin Zuo,

Michael Bi Mi,

Xinchao Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gong_2023_ICCV,
    author    = {Gong, Kehong and Lian, Dongze and Chang, Heng and Guo, Chuan and Jiang, Zihang and Zuo, Xinxin and Mi, Michael Bi and Wang, Xinchao},
    title     = {{TM2D}: Bimodality Driven {3D} Dance Generation via Music-Text Integration},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {9942--9952}
}
Bootstrap Motion Forecasting With Self-Consistent Constraints: Maosheng Ye,

Jiamiao Xu,

Xunnong Xu,

Tengfei Wang,

Tongyi Cao,

Qifeng Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
    author    = {Ye, Maosheng and Xu, Jiamiao and Xu, Xunnong and Wang, Tengfei and Cao, Tongyi and Chen, Qifeng},
    title     = {Bootstrap Motion Forecasting With Self-Consistent Constraints},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {8504--8514}
}
CDAC: Cross-domain Attention Consistency in Transformer for Domain Adaptive Semantic Segmentation: Kaihong Wang,

Donghyun Kim,

Rogerio Feris,

Margrit Betke; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Kaihong and Kim, Donghyun and Feris, Rogerio and Betke, Margrit},
    title     = {{CDAC}: Cross-domain Attention Consistency in Transformer for Domain Adaptive Semantic Segmentation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11519--11529}
}
WaveNeRF: Wavelet-based Generalizable Neural Radiance Fields: Muyu Xu,

Fangneng Zhan,

Jiahui Zhang,

Yingchen Yu,

Xiaoqin Zhang,

Christian Theobalt,

Ling Shao,

Shijian Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Muyu and Zhan, Fangneng and Zhang, Jiahui and Yu, Yingchen and Zhang, Xiaoqin and Theobalt, Christian and Shao, Ling and Lu, Shijian},
    title     = {{WaveNeRF}: Wavelet-based Generalizable Neural Radiance Fields},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {18195--18204}
}
LoCUS: Learning Multiscale 3D-consistent Features from Posed Images: Dominik A. Kloepfer,

Dylan Campbell,

João F. Henriques; [pdf] [supp]
[bibtex]
@InProceedings{Kloepfer_2023_ICCV,
    author    = {Kloepfer, Dominik A. and Campbell, Dylan and Henriques, Jo{\~a}o F.},
    title     = {{LoCUS}: Learning Multiscale {3D-consistent} Features from Posed Images},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {16634--16644}
}
Neural Reconstruction of Relightable Human Model from Monocular Video: Wenzhang Sun,

Yunlong Che,

Han Huang,

Yandong Guo; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
    author    = {Sun, Wenzhang and Che, Yunlong and Huang, Han and Guo, Yandong},
    title     = {Neural Reconstruction of Relightable Human Model from Monocular Video},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {397--407}
}
FB-BEV: BEV Representation from Forward-Backward View Transformations: Zhiqi Li,

Zhiding Yu,

Wenhai Wang,

Anima Anandkumar,

Tong Lu,

Jose M. Alvarez; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Zhiqi and Yu, Zhiding and Wang, Wenhai and Anandkumar, Anima and Lu, Tong and Alvarez, Jose M.},
    title     = {{FB-BEV}: {BEV} Representation from Forward-Backward View Transformations},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {6919--6928}
}
BoxSnake: Polygonal Instance Segmentation with Box Supervision: Rui Yang,

Lin Song,

Yixiao Ge,

Xiu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
    author    = {Yang, Rui and Song, Lin and Ge, Yixiao and Li, Xiu},
    title     = {{BoxSnake}: Polygonal Instance Segmentation with Box Supervision},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {766--776}
}
Confidence-based Visual Dispersal for Few-shot Unsupervised Domain Adaptation: Yizhe Xiong,

Hui Chen,

Zijia Lin,

Sicheng Zhao,

Guiguang Ding; [pdf] [supp]
[bibtex]
@InProceedings{Xiong_2023_ICCV,
    author    = {Xiong, Yizhe and Chen, Hui and Lin, Zijia and Zhao, Sicheng and Ding, Guiguang},
    title     = {Confidence-based Visual Dispersal for Few-shot Unsupervised Domain Adaptation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11621--11631}
}
Event-Guided Procedure Planning from Instructional Videos with Text Supervision: An-Lan Wang,

Kun-Yu Lin,

Jia-Run Du,

Jingke Meng,

Wei-Shi Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, An-Lan and Lin, Kun-Yu and Du, Jia-Run and Meng, Jingke and Zheng, Wei-Shi},
    title     = {Event-Guided Procedure Planning from Instructional Videos with Text Supervision},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {13565--13575}
}
Foreground Object Search by Distilling Composite Image Feature: Bo Zhang,

Jiacheng Sui,

Li Niu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Bo and Sui, Jiacheng and Niu, Li},
    title     = {Foreground Object Search by Distilling Composite Image Feature},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {22986--22995}
}
Multimodal Motion Conditioned Diffusion Model for Skeleton-based Video Anomaly Detection: Alessandro Flaborea,

Luca Collorone,

Guido Maria D'Amely di Melendugno,

Stefano D'Arrigo,

Bardh Prenkaj,

Fabio Galasso; [pdf] [supp]
[bibtex]
@InProceedings{Flaborea_2023_ICCV,
    author    = {Flaborea, Alessandro and Collorone, Luca and di Melendugno, Guido Maria D'Amely and D'Arrigo, Stefano and Prenkaj, Bardh and Galasso, Fabio},
    title     = {Multimodal Motion Conditioned Diffusion Model for Skeleton-based Video Anomaly Detection},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {10318--10329}
}
ClimateNeRF: Extreme Weather Synthesis in Neural Radiance Field: Yuan Li,

Zhi-Hao Lin,

David Forsyth,

Jia-Bin Huang,

Shenlong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Yuan and Lin, Zhi-Hao and Forsyth, David and Huang, Jia-Bin and Wang, Shenlong},
    title     = {{ClimateNeRF}: Extreme Weather Synthesis in Neural Radiance Field},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {3227--3238}
}
CDFSL-V: Cross-Domain Few-Shot Learning for Videos: Sarinda Samarasinghe,

Mamshad Nayeem Rizve,

Navid Kardan,

Mubarak Shah; [pdf] [supp]
[bibtex]
@InProceedings{Samarasinghe_2023_ICCV,
    author    = {Samarasinghe, Sarinda and Rizve, Mamshad Nayeem and Kardan, Navid and Shah, Mubarak},
    title     = {{CDFSL-V}: Cross-Domain Few-Shot Learning for Videos},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {11643--11652}
}
Generalized Few-Shot Point Cloud Segmentation via Geometric Words: Yating Xu,

Conghui Hu,

Na Zhao,

Gim Hee Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Yating and Hu, Conghui and Zhao, Na and Lee, Gim Hee},
    title     = {Generalized Few-Shot Point Cloud Segmentation via Geometric Words},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {21506--21515}
}
Monte Carlo Linear Clustering with Single-Point Supervision is Enough for Infrared Small Target Detection: Boyang Li,

Yingqian Wang,

Longguang Wang,

Fei Zhang,

Ting Liu,

Zaiping Lin,

Wei An,

Yulan Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Boyang and Wang, Yingqian and Wang, Longguang and Zhang, Fei and Liu, Ting and Lin, Zaiping and An, Wei and Guo, Yulan},
    title     = {{Monte Carlo} Linear Clustering with Single-Point Supervision is Enough for Infrared Small Target Detection},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {1009--1019}
}
Practical Membership Inference Attacks Against Large-Scale Multi-Modal Models: A Pilot Study: Myeongseob Ko,

Ming Jin,

Chenguang Wang,

Ruoxi Jia; [pdf] [supp]
[bibtex]
@InProceedings{Ko_2023_ICCV,
    author    = {Ko, Myeongseob and Jin, Ming and Wang, Chenguang and Jia, Ruoxi},
    title     = {Practical Membership Inference Attacks Against Large-Scale Multi-Modal Models: A Pilot Study},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {4871--4881}
}
TCOVIS: Temporally Consistent Online Video Instance Segmentation: Junlong Li,

Bingyao Yu,

Yongming Rao,

Jie Zhou,

Jiwen Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Junlong and Yu, Bingyao and Rao, Yongming and Zhou, Jie and Lu, Jiwen},
    title     = {{TCOVIS}: Temporally Consistent Online Video Instance Segmentation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {1097--1107}
}
Towards Viewpoint Robustness in Bird's Eye View Segmentation: Tzofi Klinghoffer,

Jonah Philion,

Wenzheng Chen,

Or Litany,

Zan Gojcic,

Jungseock Joo,

Ramesh Raskar,

Sanja Fidler,

Jose M. Alvarez; [pdf] [supp]
[bibtex]
@InProceedings{Klinghoffer_2023_ICCV,
    author    = {Klinghoffer, Tzofi and Philion, Jonah and Chen, Wenzheng and Litany, Or and Gojcic, Zan and Joo, Jungseock and Raskar, Ramesh and Fidler, Sanja and Alvarez, Jose M.},
    title     = {Towards Viewpoint Robustness in Bird's Eye View Segmentation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {8515--8524}
}
Long-Term Photometric Consistent Novel View Synthesis with Diffusion Models: Jason J. Yu,

Fereshteh Forghani,

Konstantinos G. Derpanis,

Marcus A. Brubaker; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
    author    = {Yu, Jason J. and Forghani, Fereshteh and Derpanis, Konstantinos G. and Brubaker, Marcus A.},
    title     = {Long-Term Photometric Consistent Novel View Synthesis with Diffusion Models},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {7094--7104}
}
What Can a Cook in Italy Teach a Mechanic in India? Action Recognition Generalisation Over Scenarios and Locations: Chiara Plizzari,

Toby Perrett,

Barbara Caputo,

Dima Damen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Plizzari_2023_ICCV,
    author    = {Plizzari, Chiara and Perrett, Toby and Caputo, Barbara and Damen, Dima},
    title     = {What Can a Cook in {Italy} Teach a Mechanic in {India}? Action Recognition Generalisation Over Scenarios and Locations},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {13656--13666}
}
EMDB: The Electromagnetic Database of Global 3D Human Pose and Shape in the Wild: Manuel Kaufmann,

Jie Song,

Chen Guo,

Kaiyue Shen,

Tianjian Jiang,

Chengcheng Tang,

Juan José Zárate,

Otmar Hilliges; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kaufmann_2023_ICCV,
    author    = {Kaufmann, Manuel and Song, Jie and Guo, Chen and Shen, Kaiyue and Jiang, Tianjian and Tang, Chengcheng and Z{\'a}rate, Juan Jos{\'e} and Hilliges, Otmar},
    title     = {{EMDB}: The Electromagnetic Database of Global {3D} Human Pose and Shape in the Wild},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {14632--14643}
}
STEERER: Resolving Scale Variations for Counting and Localization via Selective Inheritance Learning: Tao Han,

Lei Bai,

Lingbo Liu,

Wanli Ouyang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
    author    = {Han, Tao and Bai, Lei and Liu, Lingbo and Ouyang, Wanli},
    title     = {{STEERER}: Resolving Scale Variations for Counting and Localization via Selective Inheritance Learning},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {21848--21859}
}
Benchmarking Algorithmic Bias in Face Recognition: An Experimental Approach Using Synthetic Faces and Human Evaluation: Hao Liang,

Pietro Perona,

Guha Balakrishnan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
    author    = {Liang, Hao and Perona, Pietro and Balakrishnan, Guha},
    title     = {Benchmarking Algorithmic Bias in Face Recognition: An Experimental Approach Using Synthetic Faces and Human Evaluation},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {4977--4987}
}
Spatial-Aware Token for Weakly Supervised Object Localization: Pingyu Wu,

Wei Zhai,

Yang Cao,

Jiebo Luo,

Zheng-Jun Zha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Pingyu and Zhai, Wei and Cao, Yang and Luo, Jiebo and Zha, Zheng-Jun},
    title     = {Spatial-Aware Token for Weakly Supervised Object Localization},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {1844--1854}
}
Harnessing the Spatial-Temporal Attention of Diffusion Models for High-Fidelity Text-to-Image Synthesis: Qiucheng Wu,

Yujian Liu,

Handong Zhao,

Trung Bui,

Zhe Lin,

Yang Zhang,

Shiyu Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Qiucheng and Liu, Yujian and Zhao, Handong and Bui, Trung and Lin, Zhe and Zhang, Yang and Chang, Shiyu},
    title     = {Harnessing the Spatial-Temporal Attention of Diffusion Models for High-Fidelity Text-to-Image Synthesis},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {7766--7776}
}
GraphAlign: Enhancing Accurate Feature Alignment by Graph matching for Multi-Modal 3D Object Detection: Ziying Song,

Haiyue Wei,

Lin Bai,

Lei Yang,

Caiyan Jia; [pdf]
[bibtex]
@InProceedings{Song_2023_ICCV,
    author    = {Song, Ziying and Wei, Haiyue and Bai, Lin and Yang, Lei and Jia, Caiyan},
    title     = {{GraphAlign}: Enhancing Accurate Feature Alignment by Graph matching for Multi-Modal {3D} Object Detection},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {3358--3369}
}
Weakly-Supervised Action Segmentation and Unseen Error Detection in Anomalous Instructional Videos: Reza Ghoddoosian,

Isht Dwivedi,

Nakul Agarwal,

Behzad Dariush; [pdf] [supp]
[bibtex]
@InProceedings{Ghoddoosian_2023_ICCV,
    author    = {Ghoddoosian, Reza and Dwivedi, Isht and Agarwal, Nakul and Dariush, Behzad},
    title     = {Weakly-Supervised Action Segmentation and Unseen Error Detection in Anomalous Instructional Videos},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {10128--10138}
}
NEMTO: Neural Environment Matting for Novel View and Relighting Synthesis of Transparent Objects: Dongqing Wang,

Tong Zhang,

Sabine Süsstrunk; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Dongqing and Zhang, Tong and S{\"u}sstrunk, Sabine},
  title     = {{NEMTO}: Neural Environment Matting for Novel View and Relighting Synthesis of Transparent Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {317--327},
}
Geometric Viewpoint Learning with Hyper-Rays and Harmonics Encoding: Zhixiang Min,

Juan Carlos Dibene,

Enrique Dunn; [pdf] [supp]
[bibtex]
@InProceedings{Min_2023_ICCV,
  author    = {Min, Zhixiang and Dibene, Juan Carlos and Dunn, Enrique},
  title     = {Geometric Viewpoint Learning with Hyper-Rays and Harmonics Encoding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22520--22530},
}
C2F2NeUS: Cascade Cost Frustum Fusion for High Fidelity and Generalizable Neural Surface Reconstruction: Luoyuan Xu,

Tao Guan,

Yuesong Wang,

Wenkai Liu,

Zhaojie Zeng,

Junle Wang,

Wei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Luoyuan and Guan, Tao and Wang, Yuesong and Liu, Wenkai and Zeng, Zhaojie and Wang, Junle and Yang, Wei},
  title     = {{C2F2NeUS}: Cascade Cost Frustum Fusion for High Fidelity and Generalizable Neural Surface Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18291--18301},
}
Mesh2Tex: Generating Mesh Textures from Image Queries: Alexey Bokhovkin,

Shubham Tulsiani,

Angela Dai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bokhovkin_2023_ICCV,
  author    = {Bokhovkin, Alexey and Tulsiani, Shubham and Dai, Angela},
  title     = {{Mesh2Tex}: Generating Mesh Textures from Image Queries},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8918--8928},
}
USAGE: A Unified Seed Area Generation Paradigm for Weakly Supervised Semantic Segmentation: Zelin Peng,

Guanchun Wang,

Lingxi Xie,

Dongsheng Jiang,

Wei Shen,

Qi Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Zelin and Wang, Guanchun and Xie, Lingxi and Jiang, Dongsheng and Shen, Wei and Tian, Qi},
  title     = {{USAGE}: A Unified Seed Area Generation Paradigm for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {624--634},
}
NeuS2: Fast Learning of Neural Implicit Surfaces for Multi-view Reconstruction: Yiming Wang,

Qin Han,

Marc Habermann,

Kostas Daniilidis,

Christian Theobalt,

Lingjie Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yiming and Han, Qin and Habermann, Marc and Daniilidis, Kostas and Theobalt, Christian and Liu, Lingjie},
  title     = {{NeuS2}: Fast Learning of Neural Implicit Surfaces for Multi-view Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3295--3306},
}
Deep Feature Deblurring Diffusion for Detecting Out-of-Distribution Objects: Aming Wu,

Da Chen,

Cheng Deng; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Aming and Chen, Da and Deng, Cheng},
  title     = {Deep Feature Deblurring Diffusion for Detecting Out-of-Distribution Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13381--13391},
}
Fast Full-frame Video Stabilization with Iterative Optimization: Weiyue Zhao,

Xin Li,

Zhan Peng,

Xianrui Luo,

Xinyi Ye,

Hao Lu,

Zhiguo Cao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Weiyue and Li, Xin and Peng, Zhan and Luo, Xianrui and Ye, Xinyi and Lu, Hao and Cao, Zhiguo},
  title     = {Fast Full-frame Video Stabilization with Iterative Optimization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23534--23544},
}
Gender Artifacts in Visual Datasets: Nicole Meister,

Dora Zhao,

Angelina Wang,

Vikram V. Ramaswamy,

Ruth Fong,

Olga Russakovsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Meister_2023_ICCV,
  author    = {Meister, Nicole and Zhao, Dora and Wang, Angelina and Ramaswamy, Vikram V. and Fong, Ruth and Russakovsky, Olga},
  title     = {Gender Artifacts in Visual Datasets},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4837--4848},
}
Learning Semi-supervised Gaussian Mixture Models for Generalized Category Discovery: Bingchen Zhao,

Xin Wen,

Kai Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Bingchen and Wen, Xin and Han, Kai},
  title     = {Learning Semi-supervised {Gaussian} Mixture Models for Generalized Category Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16623--16633},
}
SuS-X: Training-Free Name-Only Transfer of Vision-Language Models: Vishaal Udandarao,

Ankush Gupta,

Samuel Albanie; [pdf] [supp]
[bibtex]
@InProceedings{Udandarao_2023_ICCV,
  author    = {Udandarao, Vishaal and Gupta, Ankush and Albanie, Samuel},
  title     = {{SuS-X}: Training-Free Name-Only Transfer of Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2725--2736},
}
Rethinking Point Cloud Registration as Masking and Reconstruction: Guangyan Chen,

Meiling Wang,

Li Yuan,

Yi Yang,

Yufeng Yue; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Guangyan and Wang, Meiling and Yuan, Li and Yang, Yi and Yue, Yufeng},
  title     = {Rethinking Point Cloud Registration as Masking and Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17717--17727},
}
Beating Backdoor Attack at Its Own Game: Min Liu,

Alberto Sangiovanni-Vincentelli,

Xiangyu Yue; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Min and Sangiovanni-Vincentelli, Alberto and Yue, Xiangyu},
  title     = {Beating Backdoor Attack at Its Own Game},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4620--4629},
}
Introducing Language Guidance in Prompt-based Continual Learning: Muhammad Gul Zain Ali Khan,

Muhammad Ferjad Naeem,

Luc Van Gool,

Didier Stricker,

Federico Tombari,

Muhammad Zeshan Afzal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Khan_2023_ICCV,
  author    = {Khan, Muhammad Gul Zain Ali and Naeem, Muhammad Ferjad and Van Gool, Luc and Stricker, Didier and Tombari, Federico and Afzal, Muhammad Zeshan},
  title     = {Introducing Language Guidance in Prompt-based Continual Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11463--11473},
}
Invariant Training 2D-3D Joint Hard Samples for Few-Shot Point Cloud Recognition: Xuanyu Yi,

Jiajun Deng,

Qianru Sun,

Xian-Sheng Hua,

Joo-Hwee Lim,

Hanwang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yi_2023_ICCV,
  author    = {Yi, Xuanyu and Deng, Jiajun and Sun, Qianru and Hua, Xian-Sheng and Lim, Joo-Hwee and Zhang, Hanwang},
  title     = {Invariant Training {2D-3D} Joint Hard Samples for Few-Shot Point Cloud Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14463--14474},
}
EigenPlaces: Training Viewpoint Robust Models for Visual Place Recognition: Gabriele Berton,

Gabriele Trivigno,

Barbara Caputo,

Carlo Masone; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Berton_2023_ICCV,
  author    = {Berton, Gabriele and Trivigno, Gabriele and Caputo, Barbara and Masone, Carlo},
  title     = {{EigenPlaces}: Training Viewpoint Robust Models for Visual Place Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11080--11090},
}
Do DALL-E and Flamingo Understand Each Other?: Hang Li,

Jindong Gu,

Rajat Koner,

Sahand Sharifzadeh,

Volker Tresp; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Hang and Gu, Jindong and Koner, Rajat and Sharifzadeh, Sahand and Tresp, Volker},
  title     = {Do {DALL-E} and {Flamingo} Understand Each Other?},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1999--2010},
}
CIRI: Curricular Inactivation for Residue-aware One-shot Video Inpainting: Weiying Zheng,

Cheng Xu,

Xuemiao Xu,

Wenxi Liu,

Shengfeng He; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Weiying and Xu, Cheng and Xu, Xuemiao and Liu, Wenxi and He, Shengfeng},
  title     = {{CIRI}: Curricular Inactivation for Residue-aware One-shot Video Inpainting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13012--13022},
}
Prototype-based Dataset Comparison: Nanne van Noord; [pdf] [supp]
[bibtex]
@InProceedings{van_Noord_2023_ICCV,
  author    = {van Noord, Nanne},
  title     = {Prototype-based Dataset Comparison},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1944--1954},
}
FreeCOS: Self-Supervised Learning from Fractals and Unlabeled Images for Curvilinear Object Segmentation: Tianyi Shi,

Xiaohuan Ding,

Liang Zhang,

Xin Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Tianyi and Ding, Xiaohuan and Zhang, Liang and Yang, Xin},
  title     = {{FreeCOS}: Self-Supervised Learning from Fractals and Unlabeled Images for Curvilinear Object Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {876--886},
}
Generating Dynamic Kernels via Transformers for Lane Detection: Ziye Chen,

Yu Liu,

Mingming Gong,

Bo Du,

Guoqi Qian,

Kate Smith-Miles; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Ziye and Liu, Yu and Gong, Mingming and Du, Bo and Qian, Guoqi and Smith-Miles, Kate},
  title     = {Generating Dynamic Kernels via Transformers for Lane Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6835--6844},
}
RSFNet: A White-Box Image Retouching Approach using Region-Specific Color Filters: Wenqi Ouyang,

Yi Dong,

Xiaoyang Kang,

Peiran Ren,

Xin Xu,

Xuansong Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ouyang_2023_ICCV,
  author    = {Ouyang, Wenqi and Dong, Yi and Kang, Xiaoyang and Ren, Peiran and Xu, Xin and Xie, Xuansong},
  title     = {{RSFNet}: A White-Box Image Retouching Approach using Region-Specific Color Filters},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12160--12169},
}
Tem-Adapter: Adapting Image-Text Pretraining for Video Question Answer: Guangyi Chen,

Xiao Liu,

Guangrun Wang,

Kun Zhang,

Philip H.S. Torr,

Xiao-Ping Zhang,

Yansong Tang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Guangyi and Liu, Xiao and Wang, Guangrun and Zhang, Kun and Torr, Philip H. S. and Zhang, Xiao-Ping and Tang, Yansong},
  title     = {{Tem-Adapter}: Adapting Image-Text Pretraining for Video Question Answer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13945--13955},
}
Boosting Long-tailed Object Detection via Step-wise Learning on Smooth-tail Data: Na Dong,

Yongqiang Zhang,

Mingli Ding,

Gim Hee Lee; [pdf] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Na and Zhang, Yongqiang and Ding, Mingli and Lee, Gim Hee},
  title     = {Boosting Long-tailed Object Detection via Step-wise Learning on Smooth-tail Data},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6940--6949},
}
Talking Head Generation with Probabilistic Audio-to-Visual Diffusion Priors: Zhentao Yu,

Zixin Yin,

Deyu Zhou,

Duomin Wang,

Finn Wong,

Baoyuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Zhentao and Yin, Zixin and Zhou, Deyu and Wang, Duomin and Wong, Finn and Wang, Baoyuan},
  title     = {Talking Head Generation with Probabilistic Audio-to-Visual Diffusion Priors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7645--7655},
}
Learning Cross-Modal Affinity for Referring Video Object Segmentation Targeting Limited Samples: Guanghui Li,

Mingqi Gao,

Heng Liu,

Xiantong Zhen,

Feng Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Guanghui and Gao, Mingqi and Liu, Heng and Zhen, Xiantong and Zheng, Feng},
  title     = {Learning Cross-Modal Affinity for Referring Video Object Segmentation Targeting Limited Samples},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2684--2693},
}
Human Part-wise 3D Motion Context Learning for Sign Language Recognition: Taeryung Lee,

Yeonguk Oh,

Kyoung Mu Lee; [pdf] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Taeryung and Oh, Yeonguk and Lee, Kyoung Mu},
  title     = {Human Part-wise {3D} Motion Context Learning for Sign Language Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20740--20750},
}
Remembering Normality: Memory-guided Knowledge Distillation for Unsupervised Anomaly Detection: Zhihao Gu,

Liang Liu,

Xu Chen,

Ran Yi,

Jiangning Zhang,

Yabiao Wang,

Chengjie Wang,

Annan Shu,

Guannan Jiang,

Lizhuang Ma; [pdf] [supp]
[bibtex]
@InProceedings{Gu_2023_ICCV,
  author    = {Gu, Zhihao and Liu, Liang and Chen, Xu and Yi, Ran and Zhang, Jiangning and Wang, Yabiao and Wang, Chengjie and Shu, Annan and Jiang, Guannan and Ma, Lizhuang},
  title     = {Remembering Normality: Memory-guided Knowledge Distillation for Unsupervised Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16401--16409},
}
Coordinate Quantized Neural Implicit Representations for Multi-view Reconstruction: Sijia Jiang,

Jing Hua,

Zhizhong Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Sijia and Hua, Jing and Han, Zhizhong},
  title     = {Coordinate Quantized Neural Implicit Representations for Multi-view Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18358--18369},
}
Unleashing the Potential of Spiking Neural Networks with Dynamic Confidence: Chen Li,

Edward G Jones,

Steve Furber; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Chen and Jones, Edward G and Furber, Steve},
  title     = {Unleashing the Potential of Spiking Neural Networks with Dynamic Confidence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13350--13360},
}
TeD-SPAD: Temporal Distinctiveness for Self-Supervised Privacy-Preservation for Video Anomaly Detection: Joseph Fioresi,

Ishan Rajendrakumar Dave,

Mubarak Shah; [pdf] [supp]
[bibtex]
@InProceedings{Fioresi_2023_ICCV,
  author    = {Fioresi, Joseph and Dave, Ishan Rajendrakumar and Shah, Mubarak},
  title     = {{TeD-SPAD}: Temporal Distinctiveness for Self-Supervised Privacy-Preservation for Video Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13598--13609},
}
MAS: Towards Resource-Efficient Federated Multiple-Task Learning: Weiming Zhuang,

Yonggang Wen,

Lingjuan Lyu,

Shuai Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhuang_2023_ICCV,
  author    = {Zhuang, Weiming and Wen, Yonggang and Lyu, Lingjuan and Zhang, Shuai},
  title     = {{MAS}: Towards Resource-Efficient Federated Multiple-Task Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23414--23424},
}
Bridging Cross-task Protocol Inconsistency for Distillation in Dense Object Detection: Longrong Yang,

Xianpan Zhou,

Xuewei Li,

Liang Qiao,

Zheyang Li,

Ziwei Yang,

Gaoang Wang,

Xi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Longrong and Zhou, Xianpan and Li, Xuewei and Qiao, Liang and Li, Zheyang and Yang, Ziwei and Wang, Gaoang and Li, Xi},
  title     = {Bridging Cross-task Protocol Inconsistency for Distillation in Dense Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17175--17184},
}
Divide and Conquer: a Two-Step Method for High Quality Face De-identification with Model Explainability: Yunqian Wen,

Bo Liu,

Jingyi Cao,

Rong Xie,

Li Song; [pdf]
[bibtex]
@InProceedings{Wen_2023_ICCV,
  author    = {Wen, Yunqian and Liu, Bo and Cao, Jingyi and Xie, Rong and Song, Li},
  title     = {Divide and Conquer: a Two-Step Method for High Quality Face De-identification with Model Explainability},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5148--5157},
}
HiTeA: Hierarchical Temporal-Aware Video-Language Pre-training: Qinghao Ye,

Guohai Xu,

Ming Yan,

Haiyang Xu,

Qi Qian,

Ji Zhang,

Fei Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Qinghao and Xu, Guohai and Yan, Ming and Xu, Haiyang and Qian, Qi and Zhang, Ji and Huang, Fei},
  title     = {{HiTeA}: Hierarchical Temporal-Aware Video-Language Pre-training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15405--15416},
}
VAPCNet: Viewpoint-Aware 3D Point Cloud Completion: Zhiheng Fu,

Longguang Wang,

Lian Xu,

Zhiyong Wang,

Hamid Laga,

Yulan Guo,

Farid Boussaid,

Mohammed Bennamoun; [pdf]
[bibtex]
@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Zhiheng and Wang, Longguang and Xu, Lian and Wang, Zhiyong and Laga, Hamid and Guo, Yulan and Boussaid, Farid and Bennamoun, Mohammed},
  title     = {{VAPCNet}: Viewpoint-Aware {3D} Point Cloud Completion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12108--12118},
}
Set-level Guidance Attack: Boosting Adversarial Transferability of Vision-Language Pre-training Models: Dong Lu,

Zhiqiang Wang,

Teng Wang,

Weili Guan,

Hongchang Gao,

Feng Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Dong and Wang, Zhiqiang and Wang, Teng and Guan, Weili and Gao, Hongchang and Zheng, Feng},
  title     = {Set-level Guidance Attack: Boosting Adversarial Transferability of Vision-Language Pre-training Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {102--111},
}
AutoSynth: Learning to Generate 3D Training Data for Object Point Cloud Registration: Zheng Dang,

Mathieu Salzmann; [pdf] [arXiv]
[bibtex]
@InProceedings{Dang_2023_ICCV,
  author    = {Dang, Zheng and Salzmann, Mathieu},
  title     = {{AutoSynth}: Learning to Generate {3D} Training Data for Object Point Cloud Registration},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9009--9019},
}
Multimodal Distillation for Egocentric Action Recognition: Gorjan Radevski,

Dusan Grujicic,

Matthew Blaschko,

Marie-Francine Moens,

Tinne Tuytelaars; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Radevski_2023_ICCV,
  author    = {Radevski, Gorjan and Grujicic, Dusan and Blaschko, Matthew and Moens, Marie-Francine and Tuytelaars, Tinne},
  title     = {Multimodal Distillation for Egocentric Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5213--5224},
}
Self-supervised Learning of Implicit Shape Representation with Dense Correspondence for Deformable Objects: Baowen Zhang,

Jiahe Li,

Xiaoming Deng,

Yinda Zhang,

Cuixia Ma,

Hongan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Baowen and Li, Jiahe and Deng, Xiaoming and Zhang, Yinda and Ma, Cuixia and Wang, Hongan},
  title     = {Self-supervised Learning of Implicit Shape Representation with Dense Correspondence for Deformable Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14268--14278},
}
Perceptual Artifacts Localization for Image Synthesis Tasks: Lingzhi Zhang,

Zhengjie Xu,

Connelly Barnes,

Yuqian Zhou,

Qing Liu,

He Zhang,

Sohrab Amirghodsi,

Zhe Lin,

Eli Shechtman,

Jianbo Shi; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Lingzhi and Xu, Zhengjie and Barnes, Connelly and Zhou, Yuqian and Liu, Qing and Zhang, He and Amirghodsi, Sohrab and Lin, Zhe and Shechtman, Eli and Shi, Jianbo},
  title     = {Perceptual Artifacts Localization for Image Synthesis Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7579--7590},
}
Narrator: Towards Natural Control of Human-Scene Interaction Generation via Relationship Reasoning: Haibiao Xuan,

Xiongzheng Li,

Jinsong Zhang,

Hongwen Zhang,

Yebin Liu,

Kun Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xuan_2023_ICCV,
  author    = {Xuan, Haibiao and Li, Xiongzheng and Zhang, Jinsong and Zhang, Hongwen and Liu, Yebin and Li, Kun},
  title     = {Narrator: Towards Natural Control of Human-Scene Interaction Generation via Relationship Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22268--22278},
}
Vision Relation Transformer for Unbiased Scene Graph Generation: Gopika Sudhakaran,

Devendra Singh Dhami,

Kristian Kersting,

Stefan Roth; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sudhakaran_2023_ICCV,
  author    = {Sudhakaran, Gopika and Dhami, Devendra Singh and Kersting, Kristian and Roth, Stefan},
  title     = {Vision Relation Transformer for Unbiased Scene Graph Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21882--21893},
}
Scaling Data Generation in Vision-and-Language Navigation: Zun Wang,

Jialu Li,

Yicong Hong,

Yi Wang,

Qi Wu,

Mohit Bansal,

Stephen Gould,

Hao Tan,

Yu Qiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zun and Li, Jialu and Hong, Yicong and Wang, Yi and Wu, Qi and Bansal, Mohit and Gould, Stephen and Tan, Hao and Qiao, Yu},
  title     = {Scaling Data Generation in Vision-and-Language Navigation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12009--12020},
}
Better May Not Be Fairer: A Study on Subgroup Discrepancy in Image Classification: Ming-Chang Chiu,

Pin-Yu Chen,

Xuezhe Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chiu_2023_ICCV,
  author    = {Chiu, Ming-Chang and Chen, Pin-Yu and Ma, Xuezhe},
  title     = {Better May Not Be Fairer: A Study on Subgroup Discrepancy in Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4956--4966},
}
3D Implicit Transporter for Temporally Consistent Keypoint Discovery: Chengliang Zhong,

Yuhang Zheng,

Yupeng Zheng,

Hao Zhao,

Li Yi,

Xiaodong Mu,

Ling Wang,

Pengfei Li,

Guyue Zhou,

Chao Yang,

Xinliang Zhang,

Jian Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Chengliang and Zheng, Yuhang and Zheng, Yupeng and Zhao, Hao and Yi, Li and Mu, Xiaodong and Wang, Ling and Li, Pengfei and Zhou, Guyue and Yang, Chao and Zhang, Xinliang and Zhao, Jian},
  title     = {{3D} Implicit Transporter for Temporally Consistent Keypoint Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3869--3880},
}
Adaptive Rotated Convolution for Rotated Object Detection: Yifan Pu,

Yiru Wang,

Zhuofan Xia,

Yizeng Han,

Yulin Wang,

Weihao Gan,

Zidong Wang,

Shiji Song,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pu_2023_ICCV,
  author    = {Pu, Yifan and Wang, Yiru and Xia, Zhuofan and Han, Yizeng and Wang, Yulin and Gan, Weihao and Wang, Zidong and Song, Shiji and Huang, Gao},
  title     = {Adaptive Rotated Convolution for Rotated Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6589--6600},
}
Revisit PCA-based Technique for Out-of-Distribution Detection: Xiaoyuan Guan,

Zhouwu Liu,

Wei-Shi Zheng,

Yuren Zhou,

Ruixuan Wang; [pdf] [supp]
[bibtex]
@InProceedings{Guan_2023_ICCV,
  author    = {Guan, Xiaoyuan and Liu, Zhouwu and Zheng, Wei-Shi and Zhou, Yuren and Wang, Ruixuan},
  title     = {Revisit {PCA}-based Technique for Out-of-Distribution Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19431--19439},
}
Visually-Prompted Language Model for Fine-Grained Scene Graph Generation in an Open World: Qifan Yu,

Juncheng Li,

Yu Wu,

Siliang Tang,

Wei Ji,

Yueting Zhuang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Qifan and Li, Juncheng and Wu, Yu and Tang, Siliang and Ji, Wei and Zhuang, Yueting},
  title     = {Visually-Prompted Language Model for Fine-Grained Scene Graph Generation in an Open World},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21560--21571},
}
FishNet: A Large-scale Dataset and Benchmark for Fish Recognition, Detection, and Functional Trait Prediction: Faizan Farooq Khan,

Xiang Li,

Andrew J. Temple,

Mohamed Elhoseiny; [pdf]
[bibtex]
@InProceedings{Khan_2023_ICCV,
  author    = {Khan, Faizan Farooq and Li, Xiang and Temple, Andrew J. and Elhoseiny, Mohamed},
  title     = {{FishNet}: A Large-scale Dataset and Benchmark for Fish Recognition, Detection, and Functional Trait Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20496--20506},
}
Dual Learning with Dynamic Knowledge Distillation for Partially Relevant Video Retrieval: Jianfeng Dong,

Minsong Zhang,

Zheng Zhang,

Xianke Chen,

Daizong Liu,

Xiaoye Qu,

Xun Wang,

Baolong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Jianfeng and Zhang, Minsong and Zhang, Zheng and Chen, Xianke and Liu, Daizong and Qu, Xiaoye and Wang, Xun and Liu, Baolong},
  title     = {Dual Learning with Dynamic Knowledge Distillation for Partially Relevant Video Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11302--11312},
}
UniVTG: Towards Unified Video-Language Temporal Grounding: Kevin Qinghong Lin,

Pengchuan Zhang,

Joya Chen,

Shraman Pramanick,

Difei Gao,

Alex Jinpeng Wang,

Rui Yan,

Mike Zheng Shou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Kevin Qinghong and Zhang, Pengchuan and Chen, Joya and Pramanick, Shraman and Gao, Difei and Wang, Alex Jinpeng and Yan, Rui and Shou, Mike Zheng},
  title     = {{UniVTG}: Towards Unified Video-Language Temporal Grounding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2794--2804},
}
Disposable Transfer Learning for Selective Source Task Unlearning: Seunghee Koh,

Hyounguk Shon,

Janghyeon Lee,

Hyeong Gwon Hong,

Junmo Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Koh_2023_ICCV,
  author    = {Koh, Seunghee and Shon, Hyounguk and Lee, Janghyeon and Hong, Hyeong Gwon and Kim, Junmo},
  title     = {Disposable Transfer Learning for Selective Source Task Unlearning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11752--11760},
}
Grounding 3D Object Affordance from 2D Interactions in Images: Yuhang Yang,

Wei Zhai,

Hongchen Luo,

Yang Cao,

Jiebo Luo,

Zheng-Jun Zha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yuhang and Zhai, Wei and Luo, Hongchen and Cao, Yang and Luo, Jiebo and Zha, Zheng-Jun},
  title     = {Grounding {3D} Object Affordance from {2D} Interactions in Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10905--10915},
}
Fast Globally Optimal Surface Normal Estimation from an Affine Correspondence: Levente Hajder,

Lajos Lóczi,

Daniel Barath; [pdf] [supp]
[bibtex]
@InProceedings{Hajder_2023_ICCV,
  author    = {Hajder, Levente and L{\'o}czi, Lajos and Barath, Daniel},
  title     = {Fast Globally Optimal Surface Normal Estimation from an Affine Correspondence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3390--3401},
}
Masked Spatio-Temporal Structure Prediction for Self-supervised Learning on Point Cloud Videos: Zhiqiang Shen,

Xiaoxiao Sheng,

Hehe Fan,

Longguang Wang,

Yulan Guo,

Qiong Liu,

Hao Wen,

Xi Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Zhiqiang and Sheng, Xiaoxiao and Fan, Hehe and Wang, Longguang and Guo, Yulan and Liu, Qiong and Wen, Hao and Zhou, Xi},
  title     = {Masked Spatio-Temporal Structure Prediction for Self-supervised Learning on Point Cloud Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16580--16589},
}
Frequency-aware GAN for Adversarial Manipulation Generation: Peifei Zhu,

Genki Osada,

Hirokatsu Kataoka,

Tsubasa Takahashi; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Peifei and Osada, Genki and Kataoka, Hirokatsu and Takahashi, Tsubasa},
  title     = {Frequency-aware {GAN} for Adversarial Manipulation Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4315--4324},
}
DreamPose: Fashion Video Synthesis with Stable Diffusion: Johanna Karras,

Aleksander Holynski,

Ting-Chun Wang,

Ira Kemelmacher-Shlizerman; [pdf] [supp]
[bibtex]
@InProceedings{Karras_2023_ICCV,
  author    = {Karras, Johanna and Holynski, Aleksander and Wang, Ting-Chun and Kemelmacher-Shlizerman, Ira},
  title     = {{DreamPose}: Fashion Video Synthesis with {Stable Diffusion}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22680--22690},
}
Tube-Link: A Flexible Cross Tube Framework for Universal Video Segmentation: Xiangtai Li,

Haobo Yuan,

Wenwei Zhang,

Guangliang Cheng,

Jiangmiao Pang,

Chen Change Loy; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiangtai and Yuan, Haobo and Zhang, Wenwei and Cheng, Guangliang and Pang, Jiangmiao and Loy, Chen Change},
  title     = {{Tube-Link}: A Flexible Cross Tube Framework for Universal Video Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13923--13933},
}
Hybrid Spectral Denoising Transformer with Guided Attention: Zeqiang Lai,

Chenggang Yan,

Ying Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lai_2023_ICCV,
  author    = {Lai, Zeqiang and Yan, Chenggang and Fu, Ying},
  title     = {Hybrid Spectral Denoising Transformer with Guided Attention},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13065--13075},
}
HiVLP: Hierarchical Interactive Video-Language Pre-Training: Bin Shao,

Jianzhuang Liu,

Renjing Pei,

Songcen Xu,

Peng Dai,

Juwei Lu,

Weimian Li,

Youliang Yan; [pdf] [supp]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Bin and Liu, Jianzhuang and Pei, Renjing and Xu, Songcen and Dai, Peng and Lu, Juwei and Li, Weimian and Yan, Youliang},
  title     = {{HiVLP}: Hierarchical Interactive Video-Language Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13756--13766},
}
Learning Concordant Attention via Target-aware Alignment for Visible-Infrared Person Re-identification: Jianbing Wu,

Hong Liu,

Yuxin Su,

Wei Shi,

Hao Tang; [pdf]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jianbing and Liu, Hong and Su, Yuxin and Shi, Wei and Tang, Hao},
  title     = {Learning Concordant Attention via Target-aware Alignment for Visible-Infrared Person Re-identification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11122--11131},
}
PhysDiff: Physics-Guided Human Motion Diffusion Model: Ye Yuan,

Jiaming Song,

Umar Iqbal,

Arash Vahdat,

Jan Kautz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Ye and Song, Jiaming and Iqbal, Umar and Vahdat, Arash and Kautz, Jan},
  title     = {{PhysDiff}: Physics-Guided Human Motion Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16010--16021},
}
Masked Motion Predictors are Strong 3D Action Representation Learners: Yunyao Mao,

Jiajun Deng,

Wengang Zhou,

Yao Fang,

Wanli Ouyang,

Houqiang Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Mao_2023_ICCV,
  author    = {Mao, Yunyao and Deng, Jiajun and Zhou, Wengang and Fang, Yao and Ouyang, Wanli and Li, Houqiang},
  title     = {Masked Motion Predictors are Strong {3D} Action Representation Learners},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10181--10191},
}
Template-guided Hierarchical Feature Restoration for Anomaly Detection: Hewei Guo,

Liping Ren,

Jingjing Fu,

Yuwang Wang,

Zhizheng Zhang,

Cuiling Lan,

Haoqian Wang,

Xinwen Hou; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Hewei and Ren, Liping and Fu, Jingjing and Wang, Yuwang and Zhang, Zhizheng and Lan, Cuiling and Wang, Haoqian and Hou, Xinwen},
  title     = {Template-guided Hierarchical Feature Restoration for Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6447--6458},
}
SwiftFormer: Efficient Additive Attention for Transformer-based Real-time Mobile Vision Applications: Abdelrahman Shaker,

Muhammad Maaz,

Hanoona Rasheed,

Salman Khan,

Ming-Hsuan Yang,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shaker_2023_ICCV,
  author    = {Shaker, Abdelrahman and Maaz, Muhammad and Rasheed, Hanoona and Khan, Salman and Yang, Ming-Hsuan and Khan, Fahad Shahbaz},
  title     = {{SwiftFormer}: Efficient Additive Attention for Transformer-based Real-time Mobile Vision Applications},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17425--17436},
}
UpCycling: Semi-supervised 3D Object Detection without Sharing Raw-level Unlabeled Scenes: Sunwook Hwang,

Youngseok Kim,

Seongwon Kim,

Saewoong Bahk,

Hyung-Sin Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hwang_2023_ICCV,
  author    = {Hwang, Sunwook and Kim, Youngseok and Kim, Seongwon and Bahk, Saewoong and Kim, Hyung-Sin},
  title     = {{UpCycling}: Semi-supervised {3D} Object Detection without Sharing Raw-level Unlabeled Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23351--23361},
}
RIGID: Recurrent GAN Inversion and Editing of Real Face Videos: Yangyang Xu,

Shengfeng He,

Kwan-Yee K. Wong,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yangyang and He, Shengfeng and Wong, Kwan-Yee K. and Luo, Ping},
  title     = {{RIGID}: Recurrent {GAN} Inversion and Editing of Real Face Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13691--13701},
}
PourIt!: Weakly-Supervised Liquid Perception from a Single Image for Visual Closed-Loop Robotic Pouring: Haitao Lin,

Yanwei Fu,

Xiangyang Xue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Haitao and Fu, Yanwei and Xue, Xiangyang},
  title     = {{PourIt!}: Weakly-Supervised Liquid Perception from a Single Image for Visual Closed-Loop Robotic Pouring},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {241--251},
}
CSDA: Learning Category-Scale Joint Feature for Domain Adaptive Object Detection: Changlong Gao,

Chengxu Liu,

Yujie Dun,

Xueming Qian; [pdf] [supp]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Changlong and Liu, Chengxu and Dun, Yujie and Qian, Xueming},
  title     = {{CSDA}: Learning Category-Scale Joint Feature for Domain Adaptive Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11421--11430},
}
A Latent Space of Stochastic Diffusion Models for Zero-Shot Image Editing and Guidance: Chen Henry Wu,

Fernando De la Torre; [pdf]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Chen Henry and De la Torre, Fernando},
  title     = {A Latent Space of Stochastic Diffusion Models for Zero-Shot Image Editing and Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7378--7387},
}
Single Image Defocus Deblurring via Implicit Neural Inverse Kernels: Yuhui Quan,

Xin Yao,

Hui Ji; [pdf] [supp]
[bibtex]
@InProceedings{Quan_2023_ICCV,
  author    = {Quan, Yuhui and Yao, Xin and Ji, Hui},
  title     = {Single Image Defocus Deblurring via Implicit Neural Inverse Kernels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12600--12610},
}
Open Set Video HOI detection from Action-Centric Chain-of-Look Prompting: Nan Xi,

Jingjing Meng,

Junsong Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Xi_2023_ICCV,
  author    = {Xi, Nan and Meng, Jingjing and Yuan, Junsong},
  title     = {Open Set Video {HOI} detection from Action-Centric Chain-of-Look Prompting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3079--3089},
}
Robust Mixture-of-Expert Training for Convolutional Neural Networks: Yihua Zhang,

Ruisi Cai,

Tianlong Chen,

Guanhua Zhang,

Huan Zhang,

Pin-Yu Chen,

Shiyu Chang,

Zhangyang Wang,

Sijia Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yihua and Cai, Ruisi and Chen, Tianlong and Zhang, Guanhua and Zhang, Huan and Chen, Pin-Yu and Chang, Shiyu and Wang, Zhangyang and Liu, Sijia},
  title     = {Robust Mixture-of-Expert Training for Convolutional Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {90--101},
}
AvatarCraft: Transforming Text into Neural Human Avatars with Parameterized Shape and Pose Control: Ruixiang Jiang,

Can Wang,

Jingbo Zhang,

Menglei Chai,

Mingming He,

Dongdong Chen,

Jing Liao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Ruixiang and Wang, Can and Zhang, Jingbo and Chai, Menglei and He, Mingming and Chen, Dongdong and Liao, Jing},
  title     = {{AvatarCraft}: Transforming Text into Neural Human Avatars with Parameterized Shape and Pose Control},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14371--14382},
}
σ-Adaptive Decoupled Prototype for Few-Shot Object Detection: Jinhao Du,

Shan Zhang,

Qiang Chen,

Haifeng Le,

Yanpeng Sun,

Yao Ni,

Jian Wang,

Bin He,

Jingdong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Du_2023_ICCV,
  author    = {Du, Jinhao and Zhang, Shan and Chen, Qiang and Le, Haifeng and Sun, Yanpeng and Ni, Yao and Wang, Jian and He, Bin and Wang, Jingdong},
  title     = {{$\sigma$}-Adaptive Decoupled Prototype for Few-Shot Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18950--18960},
}
Why Is Prompt Tuning for Vision-Language Models Robust to Noisy Labels?: Cheng-En Wu,

Yu Tian,

Haichao Yu,

Heng Wang,

Pedro Morgado,

Yu Hen Hu,

Linjie Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Cheng-En and Tian, Yu and Yu, Haichao and Wang, Heng and Morgado, Pedro and Hu, Yu Hen and Yang, Linjie},
  title     = {Why Is Prompt Tuning for Vision-Language Models Robust to Noisy Labels?},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15488--15497},
}
Unified Pre-Training with Pseudo Texts for Text-To-Image Person Re-Identification: Zhiyin Shao,

Xinyu Zhang,

Changxing Ding,

Jian Wang,

Jingdong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Zhiyin and Zhang, Xinyu and Ding, Changxing and Wang, Jian and Wang, Jingdong},
  title     = {Unified Pre-Training with Pseudo Texts for Text-To-Image Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11174--11184},
}
Semantics Meets Temporal Correspondence: Self-supervised Object-centric Learning in Videos: Rui Qian,

Shuangrui Ding,

Xian Liu,

Dahua Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Rui and Ding, Shuangrui and Liu, Xian and Lin, Dahua},
  title     = {Semantics Meets Temporal Correspondence: Self-supervised Object-centric Learning in Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16675--16687},
}
UniTR: A Unified and Efficient Multi-Modal Transformer for Bird's-Eye-View Representation: Haiyang Wang,

Hao Tang,

Shaoshuai Shi,

Aoxue Li,

Zhenguo Li,

Bernt Schiele,

Liwei Wang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Haiyang and Tang, Hao and Shi, Shaoshuai and Li, Aoxue and Li, Zhenguo and Schiele, Bernt and Wang, Liwei},
  title     = {{UniTR}: A Unified and Efficient Multi-Modal Transformer for Bird's-Eye-View Representation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6792--6802},
}
Traj-MAE: Masked Autoencoders for Trajectory Prediction: Hao Chen,

Jiaze Wang,

Kun Shao,

Furui Liu,

Jianye Hao,

Chenyong Guan,

Guangyong Chen,

Pheng-Ann Heng; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Hao and Wang, Jiaze and Shao, Kun and Liu, Furui and Hao, Jianye and Guan, Chenyong and Chen, Guangyong and Heng, Pheng-Ann},
  title     = {{Traj-MAE}: Masked Autoencoders for Trajectory Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8351--8362},
}
First Session Adaptation: A Strong Replay-Free Baseline for Class-Incremental Learning: Aristeidis Panos,

Yuriko Kobe,

Daniel Olmeda Reino,

Rahaf Aljundi,

Richard E. Turner; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Panos_2023_ICCV,
  author    = {Panos, Aristeidis and Kobe, Yuriko and Olmeda Reino, Daniel and Aljundi, Rahaf and Turner, Richard E.},
  title     = {First Session Adaptation: A Strong Replay-Free Baseline for Class-Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18820--18830},
}
Ada3D : Exploiting the Spatial Redundancy with Adaptive Inference for Efficient 3D Object Detection: Tianchen Zhao,

Xuefei Ning,

Ke Hong,

Zhongyuan Qiu,

Pu Lu,

Yali Zhao,

Linfeng Zhang,

Lipu Zhou,

Guohao Dai,

Huazhong Yang,

Yu Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Tianchen and Ning, Xuefei and Hong, Ke and Qiu, Zhongyuan and Lu, Pu and Zhao, Yali and Zhang, Linfeng and Zhou, Lipu and Dai, Guohao and Yang, Huazhong and Wang, Yu},
  title     = {{Ada3D} : Exploiting the Spatial Redundancy with Adaptive Inference for Efficient {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17728--17738},
}
R3D3: Dense 3D Reconstruction of Dynamic Scenes from Multiple Cameras: Aron Schmied,

Tobias Fischer,

Martin Danelljan,

Marc Pollefeys,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Schmied_2023_ICCV,
  author    = {Schmied, Aron and Fischer, Tobias and Danelljan, Martin and Pollefeys, Marc and Yu, Fisher},
  title     = {{R3D3}: Dense {3D} Reconstruction of Dynamic Scenes from Multiple Cameras},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3216--3226},
}
UniFusion: Unified Multi-View Fusion Transformer for Spatial-Temporal Representation in Bird's-Eye-View: Zequn Qin,

Jingyu Chen,

Chao Chen,

Xiaozhi Chen,

Xi Li; [pdf] [supp]
[bibtex]
@InProceedings{Qin_2023_ICCV,
  author    = {Qin, Zequn and Chen, Jingyu and Chen, Chao and Chen, Xiaozhi and Li, Xi},
  title     = {{UniFusion}: Unified Multi-View Fusion Transformer for Spatial-Temporal Representation in Bird's-Eye-View},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8690--8699},
}
Point Contrastive Prediction with Semantic Clustering for Self-Supervised Learning on Point Cloud Videos: Xiaoxiao Sheng,

Zhiqiang Shen,

Gang Xiao,

Longguang Wang,

Yulan Guo,

Hehe Fan; [pdf] [arXiv]
[bibtex]
@InProceedings{Sheng_2023_ICCV,
  author    = {Sheng, Xiaoxiao and Shen, Zhiqiang and Xiao, Gang and Wang, Longguang and Guo, Yulan and Fan, Hehe},
  title     = {Point Contrastive Prediction with Semantic Clustering for Self-Supervised Learning on Point Cloud Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16515--16524},
}
Preserving Modality Structure Improves Multi-Modal Learning: Sirnam Swetha,

Mamshad Nayeem Rizve,

Nina Shvetsova,

Hilde Kuehne,

Mubarak Shah; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Swetha_2023_ICCV,
  author    = {Swetha, Sirnam and Rizve, Mamshad Nayeem and Shvetsova, Nina and Kuehne, Hilde and Shah, Mubarak},
  title     = {Preserving Modality Structure Improves Multi-Modal Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21993--22003},
}
Focus the Discrepancy: Intra- and Inter-Correlation Learning for Image Anomaly Detection: Xincheng Yao,

Ruoqi Li,

Zefeng Qian,

Yan Luo,

Chongyang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Xincheng and Li, Ruoqi and Qian, Zefeng and Luo, Yan and Zhang, Chongyang},
  title     = {Focus the Discrepancy: Intra- and Inter-Correlation Learning for Image Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6803--6813},
}
Pre-training Vision Transformers with Very Limited Synthesized Images: Ryo Nakamura,

Hirokatsu Kataoka,

Sora Takashima,

Edgar Josafat Martinez Noriega,

Rio Yokota,

Nakamasa Inoue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nakamura_2023_ICCV,
  author    = {Nakamura, Ryo and Kataoka, Hirokatsu and Takashima, Sora and Martinez Noriega, Edgar Josafat and Yokota, Rio and Inoue, Nakamasa},
  title     = {Pre-training Vision Transformers with Very Limited Synthesized Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20360--20369},
}
Sample-adaptive Augmentation for Point Cloud Recognition Against Real-world Corruptions: Jie Wang,

Lihe Ding,

Tingfa Xu,

Shaocong Dong,

Xinli Xu,

Long Bai,

Jianan Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jie and Ding, Lihe and Xu, Tingfa and Dong, Shaocong and Xu, Xinli and Bai, Long and Li, Jianan},
  title     = {Sample-adaptive Augmentation for Point Cloud Recognition Against Real-world Corruptions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14330--14339},
}
Make Encoder Great Again in 3D GAN Inversion through Geometry and Occlusion-Aware Encoding: Ziyang Yuan,

Yiming Zhu,

Yu Li,

Hongyu Liu,

Chun Yuan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Ziyang and Zhu, Yiming and Li, Yu and Liu, Hongyu and Yuan, Chun},
  title     = {Make Encoder Great Again in {3D} {GAN} Inversion through Geometry and Occlusion-Aware Encoding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2437--2447},
}
Modality Unifying Network for Visible-Infrared Person Re-Identification: Hao Yu,

Xu Cheng,

Wei Peng,

Weihao Liu,

Guoying Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Hao and Cheng, Xu and Peng, Wei and Liu, Weihao and Zhao, Guoying},
  title     = {Modality Unifying Network for Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11185--11195},
}
DLT: Conditioned layout generation with Joint Discrete-Continuous Diffusion Layout Transformer: Elad Levi,

Eli Brosh,

Mykola Mykhailych,

Meir Perez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Levi_2023_ICCV,
  author    = {Levi, Elad and Brosh, Eli and Mykhailych, Mykola and Perez, Meir},
  title     = {{DLT}: Conditioned layout generation with Joint Discrete-Continuous Diffusion Layout Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2106--2115},
}
PADDLES: Phase-Amplitude Spectrum Disentangled Early Stopping for Learning with Noisy Labels: Huaxi Huang,

Hui Kang,

Sheng Liu,

Olivier Salvado,

Thierry Rakotoarivelo,

Dadong Wang,

Tongliang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Huaxi and Kang, Hui and Liu, Sheng and Salvado, Olivier and Rakotoarivelo, Thierry and Wang, Dadong and Liu, Tongliang},
  title     = {{PADDLES}: Phase-Amplitude Spectrum Disentangled Early Stopping for Learning with Noisy Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16719--16730},
}
Taming Contrast Maximization for Learning Sequential, Low-latency, Event-based Optical Flow: Federico Paredes-Vallés,

Kirk Y. W. Scheper,

Christophe De Wagter,

Guido C. H. E. de Croon; [pdf] [supp]
[bibtex]
@InProceedings{Paredes-Valles_2023_ICCV,
  author    = {Paredes-Vall{\'e}s, Federico and Scheper, Kirk Y. W. and De Wagter, Christophe and de Croon, Guido C. H. E.},
  title     = {Taming Contrast Maximization for Learning Sequential, Low-latency, Event-based Optical Flow},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9695--9705},
}
CLIP-Cluster: CLIP-Guided Attribute Hallucination for Face Clustering: Shuai Shen,

Wanhua Li,

Xiaobing Wang,

Dafeng Zhang,

Zhezhu Jin,

Jie Zhou,

Jiwen Lu; [pdf]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Shuai and Li, Wanhua and Wang, Xiaobing and Zhang, Dafeng and Jin, Zhezhu and Zhou, Jie and Lu, Jiwen},
  title     = {{CLIP-Cluster}: {CLIP}-Guided Attribute Hallucination for Face Clustering},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20786--20795},
}
CASSPR: Cross Attention Single Scan Place Recognition: Yan Xia,

Mariia Gladkova,

Rui Wang,

Qianyun Li,

Uwe Stilla,

João F Henriques,

Daniel Cremers; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Yan and Gladkova, Mariia and Wang, Rui and Li, Qianyun and Stilla, Uwe and Henriques, Jo{\~a}o F and Cremers, Daniel},
  title     = {{CASSPR}: Cross Attention Single Scan Place Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8461--8472},
}
DDFM: Denoising Diffusion Model for Multi-Modality Image Fusion: Zixiang Zhao,

Haowen Bai,

Yuanzhi Zhu,

Jiangshe Zhang,

Shuang Xu,

Yulun Zhang,

Kai Zhang,

Deyu Meng,

Radu Timofte,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Zixiang and Bai, Haowen and Zhu, Yuanzhi and Zhang, Jiangshe and Xu, Shuang and Zhang, Yulun and Zhang, Kai and Meng, Deyu and Timofte, Radu and Van Gool, Luc},
  title     = {{DDFM}: Denoising Diffusion Model for Multi-Modality Image Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8082--8093},
}
A Unified Continual Learning Framework with General Parameter-Efficient Tuning: Qiankun Gao,

Chen Zhao,

Yifan Sun,

Teng Xi,

Gang Zhang,

Bernard Ghanem,

Jian Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Qiankun and Zhao, Chen and Sun, Yifan and Xi, Teng and Zhang, Gang and Ghanem, Bernard and Zhang, Jian},
  title     = {A Unified Continual Learning Framework with General Parameter-Efficient Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11483--11493},
}
Hierarchical Generation of Human-Object Interactions with Diffusion Probabilistic Models: Huaijin Pi,

Sida Peng,

Minghui Yang,

Xiaowei Zhou,

Hujun Bao; [pdf]
[bibtex]
@InProceedings{Pi_2023_ICCV,
  author    = {Pi, Huaijin and Peng, Sida and Yang, Minghui and Zhou, Xiaowei and Bao, Hujun},
  title     = {Hierarchical Generation of Human-Object Interactions with Diffusion Probabilistic Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15061--15073},
}
Learning Data-Driven Vector-Quantized Degradation Model for Animation Video Super-Resolution: Zixi Tuo,

Huan Yang,

Jianlong Fu,

Yujie Dun,

Xueming Qian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tuo_2023_ICCV,
  author    = {Tuo, Zixi and Yang, Huan and Fu, Jianlong and Dun, Yujie and Qian, Xueming},
  title     = {Learning Data-Driven Vector-Quantized Degradation Model for Animation Video Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13179--13189},
}
Compositional Feature Augmentation for Unbiased Scene Graph Generation: Lin Li,

Guikun Chen,

Jun Xiao,

Yi Yang,

Chunping Wang,

Long Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Lin and Chen, Guikun and Xiao, Jun and Yang, Yi and Wang, Chunping and Chen, Long},
  title     = {Compositional Feature Augmentation for Unbiased Scene Graph Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21685--21695},
}
Foreground and Text-lines Aware Document Image Rectification: Heng Li,

Xiangping Wu,

Qingcai Chen,

Qianjin Xiang; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Heng and Wu, Xiangping and Chen, Qingcai and Xiang, Qianjin},
  title     = {Foreground and Text-lines Aware Document Image Rectification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19574--19583},
}
Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network: Cong Han,

Yujie Zhong,

Dengjie Li,

Kai Han,

Lin Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Cong and Zhong, Yujie and Li, Dengjie and Han, Kai and Ma, Lin},
  title     = {Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1086--1096},
}
INSTA-BNN: Binary Neural Network with INSTAnce-aware Threshold: Changhun Lee,

Hyungjun Kim,

Eunhyeok Park,

Jae-Joon Kim; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Changhun and Kim, Hyungjun and Park, Eunhyeok and Kim, Jae-Joon},
  title     = {{INSTA-BNN}: Binary Neural Network with {INSTAnce-aware} Threshold},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17325--17334},
}
Human-Inspired Facial Sketch Synthesis with Dynamic Adaptation: Fei Gao,

Yifan Zhu,

Chang Jiang,

Nannan Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Fei and Zhu, Yifan and Jiang, Chang and Wang, Nannan},
  title     = {Human-Inspired Facial Sketch Synthesis with Dynamic Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7237--7247},
}
When Epipolar Constraint Meets Non-Local Operators in Multi-View Stereo: Tianqi Liu,

Xinyi Ye,

Weiyue Zhao,

Zhiyu Pan,

Min Shi,

Zhiguo Cao; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Tianqi and Ye, Xinyi and Zhao, Weiyue and Pan, Zhiyu and Shi, Min and Cao, Zhiguo},
  title     = {When Epipolar Constraint Meets Non-Local Operators in Multi-View Stereo},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18088--18097},
}
LU-NeRF: Scene and Pose Estimation by Synchronizing Local Unposed NeRFs: Zezhou Cheng,

Carlos Esteves,

Varun Jampani,

Abhishek Kar,

Subhransu Maji,

Ameesh Makadia; [pdf] [supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Zezhou and Esteves, Carlos and Jampani, Varun and Kar, Abhishek and Maji, Subhransu and Makadia, Ameesh},
  title     = {{LU-NeRF}: Scene and Pose Estimation by Synchronizing Local Unposed {NeRFs}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18312--18321},
}
Calibrating Panoramic Depth Estimation for Practical Localization and Mapping: Junho Kim,

Eun Sun Lee,

Young Min Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Junho and Lee, Eun Sun and Kim, Young Min},
  title     = {Calibrating Panoramic Depth Estimation for Practical Localization and Mapping},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8830--8840},
}
DiffDis: Empowering Generative Diffusion Model with Cross-Modal Discrimination Capability: Runhui Huang,

Jianhua Han,

Guansong Lu,

Xiaodan Liang,

Yihan Zeng,

Wei Zhang,

Hang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Runhui and Han, Jianhua and Lu, Guansong and Liang, Xiaodan and Zeng, Yihan and Zhang, Wei and Xu, Hang},
  title     = {{DiffDis}: Empowering Generative Diffusion Model with Cross-Modal Discrimination Capability},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15713--15723},
}
DS-Fusion: Artistic Typography via Discriminated and Stylized Diffusion: Maham Tanveer,

Yizhi Wang,

Ali Mahdavi-Amiri,

Hao Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Tanveer_2023_ICCV,
  author    = {Tanveer, Maham and Wang, Yizhi and Mahdavi-Amiri, Ali and Zhang, Hao},
  title     = {{DS-Fusion}: Artistic Typography via Discriminated and Stylized Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {374--384},
}
Distilling DETR with Visual-Linguistic Knowledge for Open-Vocabulary Object Detection: Liangqi Li,

Jiaxu Miao,

Dahu Shi,

Wenming Tan,

Ye Ren,

Yi Yang,

Shiliang Pu; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Liangqi and Miao, Jiaxu and Shi, Dahu and Tan, Wenming and Ren, Ye and Yang, Yi and Pu, Shiliang},
  title     = {Distilling {DETR} with Visual-Linguistic Knowledge for Open-Vocabulary Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6501--6510},
}
Scale-MAE: A Scale-Aware Masked Autoencoder for Multiscale Geospatial Representation Learning: Colorado J Reed,

Ritwik Gupta,

Shufan Li,

Sarah Brockman,

Christopher Funk,

Brian Clipp,

Kurt Keutzer,

Salvatore Candido,

Matt Uyttendaele,

Trevor Darrell; [pdf] [supp]
[bibtex]
@InProceedings{Reed_2023_ICCV,
  author    = {Reed, Colorado J and Gupta, Ritwik and Li, Shufan and Brockman, Sarah and Funk, Christopher and Clipp, Brian and Keutzer, Kurt and Candido, Salvatore and Uyttendaele, Matt and Darrell, Trevor},
  title     = {{Scale-MAE}: A Scale-Aware Masked Autoencoder for Multiscale Geospatial Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4088--4099},
}
View Consistent Purification for Accurate Cross-View Localization: Shan Wang,

Yanhao Zhang,

Akhil Perincherry,

Ankit Vora,

Hongdong Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Shan and Zhang, Yanhao and Perincherry, Akhil and Vora, Ankit and Li, Hongdong},
  title     = {View Consistent Purification for Accurate Cross-View Localization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8197--8206},
}
A Unified Framework for Robustness on Diverse Sampling Errors: Myeongho Jeon,

Myungjoo Kang,

Joonseok Lee; [pdf] [supp]
[bibtex]
@InProceedings{Jeon_2023_ICCV,
  author    = {Jeon, Myeongho and Kang, Myungjoo and Lee, Joonseok},
  title     = {A Unified Framework for Robustness on Diverse Sampling Errors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1464--1472},
}
Efficient Video Action Detection with Token Dropout and Context Refinement: Lei Chen,

Zhan Tong,

Yibing Song,

Gangshan Wu,

Limin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Lei and Tong, Zhan and Song, Yibing and Wu, Gangshan and Wang, Limin},
  title     = {Efficient Video Action Detection with Token Dropout and Context Refinement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10388--10399},
}
Explicit Motion Disentangling for Efficient Optical Flow Estimation: Changxing Deng,

Ao Luo,

Haibin Huang,

Shaodan Ma,

Jiangyu Liu,

Shuaicheng Liu; [pdf]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Changxing and Luo, Ao and Huang, Haibin and Ma, Shaodan and Liu, Jiangyu and Liu, Shuaicheng},
  title     = {Explicit Motion Disentangling for Efficient Optical Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9521--9530},
}
LiDAR-Camera Panoptic Segmentation via Geometry-Consistent and Semantic-Aware Alignment: Zhiwei Zhang,

Zhizhong Zhang,

Qian Yu,

Ran Yi,

Yuan Xie,

Lizhuang Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zhiwei and Zhang, Zhizhong and Yu, Qian and Yi, Ran and Xie, Yuan and Ma, Lizhuang},
  title     = {{LiDAR}-Camera Panoptic Segmentation via Geometry-Consistent and Semantic-Aware Alignment},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3662--3671},
}
GrowCLIP: Data-Aware Automatic Model Growing for Large-scale Contrastive Language-Image Pre-Training: Xinchi Deng,

Han Shi,

Runhui Huang,

Changlin Li,

Hang Xu,

Jianhua Han,

James Kwok,

Shen Zhao,

Wei Zhang,

Xiaodan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Xinchi and Shi, Han and Huang, Runhui and Li, Changlin and Xu, Hang and Han, Jianhua and Kwok, James and Zhao, Shen and Zhang, Wei and Liang, Xiaodan},
  title     = {{GrowCLIP}: Data-Aware Automatic Model Growing for Large-scale Contrastive Language-Image Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22178--22189},
}
From Chaos Comes Order: Ordering Event Representations for Object Recognition and Detection: Nikola Zubić,

Daniel Gehrig,

Mathias Gehrig,

Davide Scaramuzza; [pdf] [supp]
[bibtex]
@InProceedings{Zubic_2023_ICCV,
  author    = {Zubi{\'c}, Nikola and Gehrig, Daniel and Gehrig, Mathias and Scaramuzza, Davide},
  title     = {From Chaos Comes Order: Ordering Event Representations for Object Recognition and Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12846--12856},
}
LA-Net: Landmark-Aware Learning for Reliable Facial Expression Recognition under Label Noise: Zhiyu Wu,

Jinshi Cui; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Zhiyu and Cui, Jinshi},
  title     = {{LA-Net}: Landmark-Aware Learning for Reliable Facial Expression Recognition under Label Noise},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20698--20707},
}
Identity-Consistent Aggregation for Video Object Detection: Chaorui Deng,

Da Chen,

Qi Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Chaorui and Chen, Da and Wu, Qi},
  title     = {Identity-Consistent Aggregation for Video Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13434--13444},
}
Scene-Aware Label Graph Learning for Multi-Label Image Classification: Xuelin Zhu,

Jian Liu,

Weijia Liu,

Jiawei Ge,

Bo Liu,

Jiuxin Cao; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Xuelin and Liu, Jian and Liu, Weijia and Ge, Jiawei and Liu, Bo and Cao, Jiuxin},
  title     = {Scene-Aware Label Graph Learning for Multi-Label Image Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1473--1482},
}
Relightify: Relightable 3D Faces from a Single Image via Diffusion Models: Foivos Paraperas Papantoniou,

Alexandros Lattas,

Stylianos Moschoglou,

Stefanos Zafeiriou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Papantoniou_2023_ICCV,
  author    = {Papantoniou, Foivos Paraperas and Lattas, Alexandros and Moschoglou, Stylianos and Zafeiriou, Stefanos},
  title     = {Relightify: Relightable {3D} Faces from a Single Image via Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8806--8817},
}
Fcaformer: Forward Cross Attention in Hybrid Vision Transformer: Haokui Zhang,

Wenze Hu,

Xiaoyu Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Haokui and Hu, Wenze and Wang, Xiaoyu},
  title     = {Fcaformer: Forward Cross Attention in Hybrid Vision Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6060--6069},
}
Progressive Spatio-Temporal Prototype Matching for Text-Video Retrieval: Pandeng Li,

Chen-Wei Xie,

Liming Zhao,

Hongtao Xie,

Jiannan Ge,

Yun Zheng,

Deli Zhao,

Yongdong Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Pandeng and Xie, Chen-Wei and Zhao, Liming and Xie, Hongtao and Ge, Jiannan and Zheng, Yun and Zhao, Deli and Zhang, Yongdong},
  title     = {Progressive Spatio-Temporal Prototype Matching for Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4100--4110},
}
Leveraging Spatio-Temporal Dependency for Skeleton-Based Action Recognition: Jungho Lee,

Minhyeok Lee,

Suhwan Cho,

Sungmin Woo,

Sungjun Jang,

Sangyoun Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jungho and Lee, Minhyeok and Cho, Suhwan and Woo, Sungmin and Jang, Sungjun and Lee, Sangyoun},
  title     = {Leveraging Spatio-Temporal Dependency for Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10255--10264},
}
Data Augmented Flatness-aware Gradient Projection for Continual Learning: Enneng Yang,

Li Shen,

Zhenyi Wang,

Shiwei Liu,

Guibing Guo,

Xingwei Wang; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Enneng and Shen, Li and Wang, Zhenyi and Liu, Shiwei and Guo, Guibing and Wang, Xingwei},
  title     = {Data Augmented Flatness-aware Gradient Projection for Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5630--5639},
}
Camera-Driven Representation Learning for Unsupervised Domain Adaptive Person Re-identification: Geon Lee,

Sanghoon Lee,

Dohyung Kim,

Younghoon Shin,

Yongsang Yoon,

Bumsub Ham; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Geon and Lee, Sanghoon and Kim, Dohyung and Shin, Younghoon and Yoon, Yongsang and Ham, Bumsub},
  title     = {Camera-Driven Representation Learning for Unsupervised Domain Adaptive Person Re-identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11453--11462},
}
Sample-wise Label Confidence Incorporation for Learning with Noisy Labels: Chanho Ahn,

Kikyung Kim,

Ji-won Baek,

Jongin Lim,

Seungju Han; [pdf] [supp]
[bibtex]
@InProceedings{Ahn_2023_ICCV,
  author    = {Ahn, Chanho and Kim, Kikyung and Baek, Ji-won and Lim, Jongin and Han, Seungju},
  title     = {Sample-wise Label Confidence Incorporation for Learning with Noisy Labels},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1823--1832},
}
CLIPTrans: Transferring Visual Knowledge with Pre-trained Models for Multimodal Machine Translation: Devaansh Gupta,

Siddhant Kharbanda,

Jiawei Zhou,

Wanhua Li,

Hanspeter Pfister,

Donglai Wei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gupta_2023_ICCV,
  author    = {Gupta, Devaansh and Kharbanda, Siddhant and Zhou, Jiawei and Li, Wanhua and Pfister, Hanspeter and Wei, Donglai},
  title     = {{CLIPTrans}: Transferring Visual Knowledge with Pre-trained Models for Multimodal Machine Translation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2875--2886},
}
SGAligner: 3D Scene Alignment with Scene Graphs: Sayan Deb Sarkar,

Ondrej Miksik,

Marc Pollefeys,

Daniel Barath,

Iro Armeni; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sarkar_2023_ICCV,
  author    = {Sarkar, Sayan Deb and Miksik, Ondrej and Pollefeys, Marc and Barath, Daniel and Armeni, Iro},
  title     = {{SGAligner}: {3D} Scene Alignment with Scene Graphs},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21927--21937},
}
Name Your Colour For the Task: Artificially Discover Colour Naming via Colour Quantisation Transformer: Shenghan Su,

Lin Gu,

Yue Yang,

Zenghui Zhang,

Tatsuya Harada; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Shenghan and Gu, Lin and Yang, Yue and Zhang, Zenghui and Harada, Tatsuya},
  title     = {Name Your Colour For the Task: Artificially Discover Colour Naming via Colour Quantisation Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12021--12031},
}
FSAR: Federated Skeleton-based Action Recognition with Adaptive Topology Structure and Knowledge Distillation: Jingwen Guo,

Hong Liu,

Shitong Sun,

Tianyu Guo,

Min Zhang,

Chenyang Si; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Jingwen and Liu, Hong and Sun, Shitong and Guo, Tianyu and Zhang, Min and Si, Chenyang},
  title     = {{FSAR}: Federated Skeleton-based Action Recognition with Adaptive Topology Structure and Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10400--10410},
}
Video Adverse-Weather-Component Suppression Network via Weather Messenger and Adversarial Backpropagation: Yijun Yang,

Angelica I. Aviles-Rivero,

Huazhu Fu,

Ye Liu,

Weiming Wang,

Lei Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yijun and Aviles-Rivero, Angelica I. and Fu, Huazhu and Liu, Ye and Wang, Weiming and Zhu, Lei},
  title     = {Video Adverse-Weather-Component Suppression Network via Weather Messenger and Adversarial Backpropagation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13200--13210},
}
Efficient Discovery and Effective Evaluation of Visual Perceptual Similarity: A Benchmark and Beyond: Oren Barkan,

Tal Reiss,

Jonathan Weill,

Ori Katz,

Roy Hirsch,

Itzik Malkiel,

Noam Koenigstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Barkan_2023_ICCV,
  author    = {Barkan, Oren and Reiss, Tal and Weill, Jonathan and Katz, Ori and Hirsch, Roy and Malkiel, Itzik and Koenigstein, Noam},
  title     = {Efficient Discovery and Effective Evaluation of Visual Perceptual Similarity: A Benchmark and Beyond},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20007--20018},
}
Ego-Only: Egocentric Action Detection without Exocentric Transferring: Huiyu Wang,

Mitesh Kumar Singh,

Lorenzo Torresani; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Huiyu and Singh, Mitesh Kumar and Torresani, Lorenzo},
  title     = {{Ego-Only}: Egocentric Action Detection without Exocentric Transferring},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5250--5261},
}
CoinSeg: Contrast Inter- and Intra- Class Representations for Incremental Segmentation: Zekang Zhang,

Guangyu Gao,

Jianbo Jiao,

Chi Harold Liu,

Yunchao Wei; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Zekang and Gao, Guangyu and Jiao, Jianbo and Liu, Chi Harold and Wei, Yunchao},
  title     = {{CoinSeg}: Contrast Inter- and Intra- Class Representations for Incremental Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {843--853},
}
Multi-View Active Fine-Grained Visual Recognition: Ruoyi Du,

Wenqing Yu,

Heqing Wang,

Ting-En Lin,

Dongliang Chang,

Zhanyu Ma; [pdf]
[bibtex]
@InProceedings{Du_2023_ICCV,
  author    = {Du, Ruoyi and Yu, Wenqing and Wang, Heqing and Lin, Ting-En and Chang, Dongliang and Ma, Zhanyu},
  title     = {Multi-View Active Fine-Grained Visual Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1568--1578},
}
Part-Aware Transformer for Generalizable Person Re-identification: Hao Ni,

Yuke Li,

Lianli Gao,

Heng Tao Shen,

Jingkuan Song; [pdf] [arXiv]
[bibtex]
@InProceedings{Ni_2023_ICCV,
  author    = {Ni, Hao and Li, Yuke and Gao, Lianli and Shen, Heng Tao and Song, Jingkuan},
  title     = {Part-Aware Transformer for Generalizable Person Re-identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11280--11289},
}
Variational Causal Inference Network for Explanatory Visual Question Answering: Dizhan Xue,

Shengsheng Qian,

Changsheng Xu; [pdf] [supp]
[bibtex]
@InProceedings{Xue_2023_ICCV,
  author    = {Xue, Dizhan and Qian, Shengsheng and Xu, Changsheng},
  title     = {Variational Causal Inference Network for Explanatory Visual Question Answering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2515--2525},
}
Improving Representation Learning for Histopathologic Images with Cluster Constraints: Weiyi Wu,

Chongyang Gao,

Joseph DiPalma,

Soroush Vosoughi,

Saeed Hassanpour; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Weiyi and Gao, Chongyang and DiPalma, Joseph and Vosoughi, Soroush and Hassanpour, Saeed},
  title     = {Improving Representation Learning for Histopathologic Images with Cluster Constraints},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21404--21414},
}
Blending-NeRF: Text-Driven Localized Editing in Neural Radiance Fields: Hyeonseop Song,

Seokhun Choi,

Hoseok Do,

Chul Lee,

Taehyeong Kim; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Hyeonseop and Choi, Seokhun and Do, Hoseok and Lee, Chul and Kim, Taehyeong},
  title     = {{Blending-NeRF}: Text-Driven Localized Editing in Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14383--14393},
}
Panoramas from Photons: Sacha Jungerman,

Atul Ingle,

Mohit Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jungerman_2023_ICCV,
  author    = {Jungerman, Sacha and Ingle, Atul and Gupta, Mohit},
  title     = {Panoramas from Photons},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10626--10636},
}
Global Adaptation Meets Local Generalization: Unsupervised Domain Adaptation for 3D Human Pose Estimation: Wenhao Chai,

Zhongyu Jiang,

Jenq-Neng Hwang,

Gaoang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chai_2023_ICCV,
  author    = {Chai, Wenhao and Jiang, Zhongyu and Hwang, Jenq-Neng and Wang, Gaoang},
  title     = {Global Adaptation Meets Local Generalization: Unsupervised Domain Adaptation for {3D} Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14655--14665},
}
Learning Neural Implicit Surfaces with Object-Aware Radiance Fields: Yiheng Zhang,

Zhaofan Qiu,

Yingwei Pan,

Ting Yao,

Tao Mei; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yiheng and Qiu, Zhaofan and Pan, Yingwei and Yao, Ting and Mei, Tao},
  title     = {Learning Neural Implicit Surfaces with Object-Aware Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17893--17902},
}
PADCLIP: Pseudo-labeling with Adaptive Debiasing in CLIP for Unsupervised Domain Adaptation: Zhengfeng Lai,

Noranart Vesdapunt,

Ning Zhou,

Jun Wu,

Cong Phuoc Huynh,

Xuelu Li,

Kah Kuen Fu,

Chen-Nee Chuah; [pdf] [supp]
[bibtex]
@InProceedings{Lai_2023_ICCV,
  author    = {Lai, Zhengfeng and Vesdapunt, Noranart and Zhou, Ning and Wu, Jun and Huynh, Cong Phuoc and Li, Xuelu and Fu, Kah Kuen and Chuah, Chen-Nee},
  title     = {{PADCLIP}: Pseudo-labeling with Adaptive Debiasing in {CLIP} for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16155--16165},
}
Causal-DFQ: Causality Guided Data-Free Network Quantization: Yuzhang Shang,

Bingxin Xu,

Gaowen Liu,

Ramana Rao Kompella,

Yan Yan; [pdf]
[bibtex]
@InProceedings{Shang_2023_ICCV,
  author    = {Shang, Yuzhang and Xu, Bingxin and Liu, Gaowen and Kompella, Ramana Rao and Yan, Yan},
  title     = {{Causal-DFQ}: Causality Guided Data-Free Network Quantization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17437--17446},
}
Enhancing Generalization of Universal Adversarial Perturbation through Gradient Aggregation: Xuannan Liu,

Yaoyao Zhong,

Yuhang Zhang,

Lixiong Qin,

Weihong Deng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xuannan and Zhong, Yaoyao and Zhang, Yuhang and Qin, Lixiong and Deng, Weihong},
  title     = {Enhancing Generalization of Universal Adversarial Perturbation through Gradient Aggregation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4435--4444},
}
CancerUniT: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of CT Scans: Jieneng Chen,

Yingda Xia,

Jiawen Yao,

Ke Yan,

Jianpeng Zhang,

Le Lu,

Fakai Wang,

Bo Zhou,

Mingyan Qiu,

Qihang Yu,

Mingze Yuan,

Wei Fang,

Yuxing Tang,

Minfeng Xu,

Jian Zhou,

Yuqian Zhao,

Qifeng Wang,

Xianghua Ye,

Xiaoli Yin,

Yu Shi,

Xin Chen,

Jingren Zhou,

Alan Yuille,

Zaiyi Liu,

Ling Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Jieneng and Xia, Yingda and Yao, Jiawen and Yan, Ke and Zhang, Jianpeng and Lu, Le and Wang, Fakai and Zhou, Bo and Qiu, Mingyan and Yu, Qihang and Yuan, Mingze and Fang, Wei and Tang, Yuxing and Xu, Minfeng and Zhou, Jian and Zhao, Yuqian and Wang, Qifeng and Ye, Xianghua and Yin, Xiaoli and Shi, Yu and Chen, Xin and Zhou, Jingren and Yuille, Alan and Liu, Zaiyi and Zhang, Ling},
  title     = {{CancerUniT}: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of {CT} Scans},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21327--21338},
}
Dual Meta-Learning with Longitudinally Consistent Regularization for One-Shot Brain Tissue Segmentation Across the Human Lifespan: Yongheng Sun,

Fan Wang,

Jun Shu,

Haifeng Wang,

Li Wang,

Deyu Meng,

Chunfeng Lian; [pdf]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Yongheng and Wang, Fan and Shu, Jun and Wang, Haifeng and Wang, Li and Meng, Deyu and Lian, Chunfeng},
  title     = {Dual Meta-Learning with Longitudinally Consistent Regularization for One-Shot Brain Tissue Segmentation Across the Human Lifespan},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21118--21128},
}
DeFormer: Integrating Transformers with Deformable Models for 3D Shape Abstraction from a Single Image: Di Liu,

Xiang Yu,

Meng Ye,

Qilong Zhangli,

Zhuowei Li,

Zhixing Zhang,

Dimitris N. Metaxas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Di and Yu, Xiang and Ye, Meng and Zhangli, Qilong and Li, Zhuowei and Zhang, Zhixing and Metaxas, Dimitris N.},
  title     = {{DeFormer}: Integrating Transformers with Deformable Models for {3D} Shape Abstraction from a Single Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14236--14246},
}
Parallel Attention Interaction Network for Few-Shot Skeleton-Based Action Recognition: Xingyu Liu,

Sanping Zhou,

Le Wang,

Gang Hua; [pdf]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xingyu and Zhou, Sanping and Wang, Le and Hua, Gang},
  title     = {Parallel Attention Interaction Network for Few-Shot Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1379--1388},
}
Cross-view Semantic Alignment for Livestreaming Product Recognition: Wenjie Yang,

Yiyi Chen,

Yan Li,

Yanhua Cheng,

Xudong Liu,

Quan Chen,

Han Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Wenjie and Chen, Yiyi and Li, Yan and Cheng, Yanhua and Liu, Xudong and Chen, Quan and Li, Han},
  title     = {Cross-view Semantic Alignment for Livestreaming Product Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13404--13413},
}
Continuously Masked Transformer for Image Inpainting: Keunsoo Ko,

Chang-Su Kim; [pdf] [supp]
[bibtex]
@InProceedings{Ko_2023_ICCV,
  author    = {Ko, Keunsoo and Kim, Chang-Su},
  title     = {Continuously Masked Transformer for Image Inpainting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13169--13178},
}
Vanishing Point Estimation in Uncalibrated Images with Prior Gravity Direction: Rémi Pautrat,

Shaohui Liu,

Petr Hruby,

Marc Pollefeys,

Daniel Barath; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pautrat_2023_ICCV,
  author    = {Pautrat, R{\'e}mi and Liu, Shaohui and Hruby, Petr and Pollefeys, Marc and Barath, Daniel},
  title     = {Vanishing Point Estimation in Uncalibrated Images with Prior Gravity Direction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14118--14127},
}
Learn TAROT with MENTOR: A Meta-Learned Self-Supervised Approach for Trajectory Prediction: Mozhgan Pourkeshavarz,

Changhe Chen,

Amir Rasouli; [pdf] [supp]
[bibtex]
@InProceedings{Pourkeshavarz_2023_ICCV,
  author    = {Pourkeshavarz, Mozhgan and Chen, Changhe and Rasouli, Amir},
  title     = {Learn {TAROT} with {MENTOR}: A Meta-Learned Self-Supervised Approach for Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8384--8393},
}
MatrixVT: Efficient Multi-Camera to BEV Transformation for 3D Perception: Hongyu Zhou,

Zheng Ge,

Zeming Li,

Xiangyu Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Hongyu and Ge, Zheng and Li, Zeming and Zhang, Xiangyu},
  title     = {{MatrixVT}: Efficient Multi-Camera to {BEV} Transformation for {3D} Perception},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8548--8557},
}
Local and Global Logit Adjustments for Long-Tailed Learning: Yingfan Tao,

Jingna Sun,

Hao Yang,

Li Chen,

Xu Wang,

Wenming Yang,

Daniel Du,

Min Zheng; [pdf]
[bibtex]
@InProceedings{Tao_2023_ICCV,
  author    = {Tao, Yingfan and Sun, Jingna and Yang, Hao and Chen, Li and Wang, Xu and Yang, Wenming and Du, Daniel and Zheng, Min},
  title     = {Local and Global Logit Adjustments for Long-Tailed Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11783--11792},
}
Active Self-Supervised Learning: A Few Low-Cost Relationships Are All You Need: Vivien Cabannes,

Leon Bottou,

Yann Lecun,

Randall Balestriero; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cabannes_2023_ICCV,
  author    = {Cabannes, Vivien and Bottou, Leon and Lecun, Yann and Balestriero, Randall},
  title     = {Active Self-Supervised Learning: A Few Low-Cost Relationships Are All You Need},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16274--16283},
}
Wasserstein Expansible Variational Autoencoder for Discriminative and Generative Continual Learning: Fei Ye,

Adrian G. Bors; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Fei and Bors, Adrian G.},
  title     = {Wasserstein Expansible Variational Autoencoder for Discriminative and Generative Continual Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18665--18675},
}
Sensitivity-Aware Visual Parameter-Efficient Fine-Tuning: Haoyu He,

Jianfei Cai,

Jing Zhang,

Dacheng Tao,

Bohan Zhuang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Haoyu and Cai, Jianfei and Zhang, Jing and Tao, Dacheng and Zhuang, Bohan},
  title     = {Sensitivity-Aware Visual Parameter-Efficient Fine-Tuning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11825--11835},
}
Label-Free Event-based Object Recognition via Joint Learning with Image Reconstruction from Events: Hoonhee Cho,

Hyeonseong Kim,

Yujeong Chae,

Kuk-Jin Yoon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2023_ICCV,
  author    = {Cho, Hoonhee and Kim, Hyeonseong and Chae, Yujeong and Yoon, Kuk-Jin},
  title     = {Label-Free Event-based Object Recognition via Joint Learning with Image Reconstruction from Events},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19866--19877},
}
Gloss-Free Sign Language Translation: Improving from Visual-Language Pretraining: Benjia Zhou,

Zhigang Chen,

Albert Clapés,

Jun Wan,

Yanyan Liang,

Sergio Escalera,

Zhen Lei,

Du Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Benjia and Chen, Zhigang and Clap{\'e}s, Albert and Wan, Jun and Liang, Yanyan and Escalera, Sergio and Lei, Zhen and Zhang, Du},
  title     = {Gloss-Free Sign Language Translation: Improving from Visual-Language Pretraining},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20871--20881},
}
Weakly-supervised 3D Pose Transfer with Keypoints: Jinnan Chen,

Chen Li,

Gim Hee Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Jinnan and Li, Chen and Lee, Gim Hee},
  title     = {Weakly-supervised {3D} Pose Transfer with Keypoints},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15156--15165},
}
Not All Features Matter: Enhancing Few-shot CLIP with Adaptive Prior Refinement: Xiangyang Zhu,

Renrui Zhang,

Bowei He,

Aojun Zhou,

Dong Wang,

Bin Zhao,

Peng Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Xiangyang and Zhang, Renrui and He, Bowei and Zhou, Aojun and Wang, Dong and Zhao, Bin and Gao, Peng},
  title     = {Not All Features Matter: Enhancing Few-shot {CLIP} with Adaptive Prior Refinement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2605--2615},
}
EgoVLPv2: Egocentric Video-Language Pre-training with Fusion in the Backbone: Shraman Pramanick,

Yale Song,

Sayan Nag,

Kevin Qinghong Lin,

Hardik Shah,

Mike Zheng Shou,

Rama Chellappa,

Pengchuan Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pramanick_2023_ICCV,
  author    = {Pramanick, Shraman and Song, Yale and Nag, Sayan and Lin, Kevin Qinghong and Shah, Hardik and Shou, Mike Zheng and Chellappa, Rama and Zhang, Pengchuan},
  title     = {{EgoVLPv2}: Egocentric Video-Language Pre-training with Fusion in the Backbone},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5285--5297},
}
On the Effectiveness of Spectral Discriminators for Perceptual Quality Improvement: Xin Luo,

Yunan Zhu,

Shunxin Xu,

Dong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Xin and Zhu, Yunan and Xu, Shunxin and Liu, Dong},
  title     = {On the Effectiveness of Spectral Discriminators for Perceptual Quality Improvement},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13243--13253},
}
Shrinking Class Space for Enhanced Certainty in Semi-Supervised Learning: Lihe Yang,

Zhen Zhao,

Lei Qi,

Yu Qiao,

Yinghuan Shi,

Hengshuang Zhao; [pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Lihe and Zhao, Zhen and Qi, Lei and Qiao, Yu and Shi, Yinghuan and Zhao, Hengshuang},
  title     = {Shrinking Class Space for Enhanced Certainty in Semi-Supervised Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16187--16196},
}
Deep Equilibrium Object Detection: Shuai Wang,

Yao Teng,

Limin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Shuai and Teng, Yao and Wang, Limin},
  title     = {Deep Equilibrium Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6296--6306},
}
Diffusion-Based 3D Human Pose Estimation with Multi-Hypothesis Aggregation: Wenkang Shan,

Zhenhua Liu,

Xinfeng Zhang,

Zhao Wang,

Kai Han,

Shanshe Wang,

Siwei Ma,

Wen Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shan_2023_ICCV,
  author    = {Shan, Wenkang and Liu, Zhenhua and Zhang, Xinfeng and Wang, Zhao and Han, Kai and Wang, Shanshe and Ma, Siwei and Gao, Wen},
  title     = {Diffusion-Based {3D} Human Pose Estimation with Multi-Hypothesis Aggregation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14761--14771},
}
RPEFlow: Multimodal Fusion of RGB-PointCloud-Event for Joint Optical Flow and Scene Flow Estimation: Zhexiong Wan,

Yuxin Mao,

Jing Zhang,

Yuchao Dai; [pdf] [supp]
[bibtex]
@InProceedings{Wan_2023_ICCV,
  author    = {Wan, Zhexiong and Mao, Yuxin and Zhang, Jing and Dai, Yuchao},
  title     = {{RPEFlow}: Multimodal Fusion of {RGB-PointCloud-Event} for Joint Optical Flow and Scene Flow Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10030--10040},
}
SMAUG: Sparse Masked Autoencoder for Efficient Video-Language Pre-Training: Yuanze Lin,

Chen Wei,

Huiyu Wang,

Alan Yuille,

Cihang Xie; [pdf] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Yuanze and Wei, Chen and Wang, Huiyu and Yuille, Alan and Xie, Cihang},
  title     = {{SMAUG}: Sparse Masked Autoencoder for Efficient Video-Language Pre-Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2459--2469},
}
eP-ALM: Efficient Perceptual Augmentation of Language Models: Mustafa Shukor,

Corentin Dancette,

Matthieu Cord; [pdf] [supp]
[bibtex]
@InProceedings{Shukor_2023_ICCV,
  author    = {Shukor, Mustafa and Dancette, Corentin and Cord, Matthieu},
  title     = {{eP-ALM}: Efficient Perceptual Augmentation of Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22056--22069},
}
Multimodal Optimal Transport-based Co-Attention Transformer with Global Structure Consistency for Survival Prediction: Yingxue Xu,

Hao Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yingxue and Chen, Hao},
  title     = {Multimodal Optimal Transport-based Co-Attention Transformer with Global Structure Consistency for Survival Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21241--21251},
}
Communication-Efficient Vertical Federated Learning with Limited Overlapping Samples: Jingwei Sun,

Ziyue Xu,

Dong Yang,

Vishwesh Nath,

Wenqi Li,

Can Zhao,

Daguang Xu,

Yiran Chen,

Holger R. Roth; [pdf] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Jingwei and Xu, Ziyue and Yang, Dong and Nath, Vishwesh and Li, Wenqi and Zhao, Can and Xu, Daguang and Chen, Yiran and Roth, Holger R.},
  title     = {Communication-Efficient Vertical Federated Learning with Limited Overlapping Samples},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5203--5212},
}
On the Audio-visual Synchronization for Lip-to-Speech Synthesis: Zhe Niu,

Brian Mak; [pdf] [arXiv]
[bibtex]
@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Zhe and Mak, Brian},
  title     = {On the Audio-visual Synchronization for Lip-to-Speech Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7843--7852},
}
Robust One-Shot Face Video Re-enactment using Hybrid Latent Spaces of StyleGAN2: Trevine Oorloff,

Yaser Yacoob; [pdf] [supp]
[bibtex]
@InProceedings{Oorloff_2023_ICCV,
  author    = {Oorloff, Trevine and Yacoob, Yaser},
  title     = {Robust One-Shot Face Video Re-enactment using Hybrid Latent Spaces of {StyleGAN2}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20947--20957},
}
BallGAN: 3D-aware Image Synthesis with a Spherical Background: Minjung Shin,

Yunji Seo,

Jeongmin Bae,

Young Sun Choi,

Hyunsu Kim,

Hyeran Byun,

Youngjung Uh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shin_2023_ICCV,
  author    = {Shin, Minjung and Seo, Yunji and Bae, Jeongmin and Choi, Young Sun and Kim, Hyunsu and Byun, Hyeran and Uh, Youngjung},
  title     = {{BallGAN}: {3D}-aware Image Synthesis with a Spherical Background},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7268--7279},
}
RPG-Palm: Realistic Pseudo-data Generation for Palmprint Recognition: Lei Shen,

Jianlong Jin,

Ruixin Zhang,

Huaen Li,

Kai Zhao,

Yingyi Zhang,

Jingyun Zhang,

Shouhong Ding,

Yang Zhao,

Wei Jia; [pdf] [supp]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Lei and Jin, Jianlong and Zhang, Ruixin and Li, Huaen and Zhao, Kai and Zhang, Yingyi and Zhang, Jingyun and Ding, Shouhong and Zhao, Yang and Jia, Wei},
  title     = {{RPG-Palm}: Realistic Pseudo-data Generation for Palmprint Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19605--19616},
}
Lecture Presentations Multimodal Dataset: Towards Understanding Multimodality in Educational Videos: Dong Won Lee,

Chaitanya Ahuja,

Paul Pu Liang,

Sanika Natu,

Louis-Philippe Morency; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Dong Won and Ahuja, Chaitanya and Liang, Paul Pu and Natu, Sanika and Morency, Louis-Philippe},
  title     = {Lecture Presentations Multimodal Dataset: Towards Understanding Multimodality in Educational Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20087--20098},
}
Window-Based Early-Exit Cascades for Uncertainty Estimation: When Deep Ensembles are More Efficient than Single Models: Guoxuan Xia,

Christos-Savvas Bouganis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Guoxuan and Bouganis, Christos-Savvas},
  title     = {Window-Based Early-Exit Cascades for Uncertainty Estimation: When Deep Ensembles are More Efficient than Single Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17368--17380},
}
AttT2M: Text-Driven Human Motion Generation with Multi-Perspective Attention Mechanism: Chongyang Zhong,

Lei Hu,

Zihao Zhang,

Shihong Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Chongyang and Hu, Lei and Zhang, Zihao and Xia, Shihong},
  title     = {{AttT2M}: Text-Driven Human Motion Generation with Multi-Perspective Attention Mechanism},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {509--519},
}
A Theory of Topological Derivatives for Inverse Rendering of Geometry: Ishit Mehta,

Manmohan Chandraker,

Ravi Ramamoorthi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mehta_2023_ICCV,
  author    = {Mehta, Ishit and Chandraker, Manmohan and Ramamoorthi, Ravi},
  title     = {A Theory of Topological Derivatives for Inverse Rendering of Geometry},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {419--429},
}
Canonical Factors for Hybrid Neural Fields: Brent Yi,

Weijia Zeng,

Sam Buchanan,

Yi Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yi_2023_ICCV,
  author    = {Yi, Brent and Zeng, Weijia and Buchanan, Sam and Ma, Yi},
  title     = {Canonical Factors for Hybrid Neural Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3414--3426},
}
XNet: Wavelet-Based Low and High Frequency Fusion Networks for Fully- and Semi-Supervised Semantic Segmentation of Biomedical Images: Yanfeng Zhou,

Jiaxing Huang,

Chenlong Wang,

Le Song,

Ge Yang; [pdf]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yanfeng and Huang, Jiaxing and Wang, Chenlong and Song, Le and Yang, Ge},
  title     = {{XNet}: Wavelet-Based Low and High Frequency Fusion Networks for Fully- and Semi-Supervised Semantic Segmentation of Biomedical Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21085--21096},
}
Betrayed by Captions: Joint Caption Grounding and Generation for Open Vocabulary Instance Segmentation: Jianzong Wu,

Xiangtai Li,

Henghui Ding,

Xia Li,

Guangliang Cheng,

Yunhai Tong,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jianzong and Li, Xiangtai and Ding, Henghui and Li, Xia and Cheng, Guangliang and Tong, Yunhai and Loy, Chen Change},
  title     = {Betrayed by Captions: Joint Caption Grounding and Generation for Open Vocabulary Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21938--21948},
}
StyleGANEX: StyleGAN-Based Manipulation Beyond Cropped Aligned Faces: Shuai Yang,

Liming Jiang,

Ziwei Liu,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Shuai and Jiang, Liming and Liu, Ziwei and Loy, Chen Change},
  title     = {{StyleGANEX}: {StyleGAN}-Based Manipulation Beyond Cropped Aligned Faces},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21000--21010},
}
HandR2N2: Iterative 3D Hand Pose Estimation Using a Residual Recurrent Neural Network: Wencan Cheng,

Jong Hwan Ko; [pdf]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Wencan and Ko, Jong Hwan},
  title     = {{HandR2N2}: Iterative {3D} Hand Pose Estimation Using a Residual Recurrent Neural Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20904--20913},
}
GET: Group Event Transformer for Event-Based Vision: Yansong Peng,

Yueyi Zhang,

Zhiwei Xiong,

Xiaoyan Sun,

Feng Wu; [pdf] [supp]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Yansong and Zhang, Yueyi and Xiong, Zhiwei and Sun, Xiaoyan and Wu, Feng},
  title     = {{GET}: Group Event Transformer for Event-Based Vision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6038--6048},
}
Unsupervised Learning of Object-Centric Embeddings for Cell Instance Segmentation in Microscopy Images: Steffen Wolf,

Manan Lalit,

Katie McDole,

Jan Funke; [pdf] [supp]
[bibtex]
@InProceedings{Wolf_2023_ICCV,
  author    = {Wolf, Steffen and Lalit, Manan and McDole, Katie and Funke, Jan},
  title     = {Unsupervised Learning of Object-Centric Embeddings for Cell Instance Segmentation in Microscopy Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21263--21272},
}
DyGait: Exploiting Dynamic Representations for High-performance Gait Recognition: Ming Wang,

Xianda Guo,

Beibei Lin,

Tian Yang,

Zheng Zhu,

Lincheng Li,

Shunli Zhang,

Xin Yu; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ming and Guo, Xianda and Lin, Beibei and Yang, Tian and Zhu, Zheng and Li, Lincheng and Zhang, Shunli and Yu, Xin},
  title     = {{DyGait}: Exploiting Dynamic Representations for High-performance Gait Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13424--13433},
}
When Do Curricula Work in Federated Learning?: Saeed Vahidian,

Sreevatsank Kadaveru,

Woonjoon Baek,

Weijia Wang,

Vyacheslav Kungurtsev,

Chen Chen,

Mubarak Shah,

Bill Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vahidian_2023_ICCV,
  author    = {Vahidian, Saeed and Kadaveru, Sreevatsank and Baek, Woonjoon and Wang, Weijia and Kungurtsev, Vyacheslav and Chen, Chen and Shah, Mubarak and Lin, Bill},
  title     = {When Do Curricula Work in Federated Learning?},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5084--5094},
}
XiNet: Efficient Neural Networks for tinyML: Alberto Ancilotto,

Francesco Paissan,

Elisabetta Farella; [pdf] [supp]
[bibtex]
@InProceedings{Ancilotto_2023_ICCV,
  author    = {Ancilotto, Alberto and Paissan, Francesco and Farella, Elisabetta},
  title     = {{XiNet}: Efficient Neural Networks for {tinyML}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16968--16977},
}
GridPull: Towards Scalability in Learning Implicit Representations from 3D Point Clouds: Chao Chen,

Yu-Shen Liu,

Zhizhong Han; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Chao and Liu, Yu-Shen and Han, Zhizhong},
  title     = {{GridPull}: Towards Scalability in Learning Implicit Representations from {3D} Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18322--18334},
}
Audio-Visual Class-Incremental Learning: Weiguo Pian,

Shentong Mo,

Yunhui Guo,

Yapeng Tian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pian_2023_ICCV,
  author    = {Pian, Weiguo and Mo, Shentong and Guo, Yunhui and Tian, Yapeng},
  title     = {Audio-Visual Class-Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7799--7811},
}
GeoMIM: Towards Better 3D Knowledge Transfer via Masked Image Modeling for Multi-view 3D Understanding: Jihao Liu,

Tai Wang,

Boxiao Liu,

Qihang Zhang,

Yu Liu,

Hongsheng Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jihao and Wang, Tai and Liu, Boxiao and Zhang, Qihang and Liu, Yu and Li, Hongsheng},
  title     = {{GeoMIM}: Towards Better {3D} Knowledge Transfer via Masked Image Modeling for Multi-view {3D} Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17839--17849},
}
Towards Viewpoint-Invariant Visual Recognition via Adversarial Training: Shouwei Ruan,

Yinpeng Dong,

Hang Su,

Jianteng Peng,

Ning Chen,

Xingxing Wei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ruan_2023_ICCV,
  author    = {Ruan, Shouwei and Dong, Yinpeng and Su, Hang and Peng, Jianteng and Chen, Ning and Wei, Xingxing},
  title     = {Towards Viewpoint-Invariant Visual Recognition via Adversarial Training},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4709--4719},
}
Helping Hands: An Object-Aware Ego-Centric Video Recognition Model: Chuhan Zhang,

Ankush Gupta,

Andrew Zisserman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Chuhan and Gupta, Ankush and Zisserman, Andrew},
  title     = {Helping Hands: An Object-Aware Ego-Centric Video Recognition Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13901--13912},
}
RenderIH: A Large-Scale Synthetic Dataset for 3D Interacting Hand Pose Estimation: Lijun Li,

Linrui Tian,

Xindi Zhang,

Qi Wang,

Bang Zhang,

Liefeng Bo,

Mengyuan Liu,

Chen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Lijun and Tian, Linrui and Zhang, Xindi and Wang, Qi and Zhang, Bang and Bo, Liefeng and Liu, Mengyuan and Chen, Chen},
  title     = {{RenderIH}: A Large-Scale Synthetic Dataset for {3D} Interacting Hand Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20395--20405},
}
Multi-Metrics Adaptively Identifies Backdoors in Federated Learning: Siquan Huang,

Yijiang Li,

Chong Chen,

Leyu Shi,

Ying Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Siquan and Li, Yijiang and Chen, Chong and Shi, Leyu and Gao, Ying},
  title     = {Multi-Metrics Adaptively Identifies Backdoors in Federated Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4652--4662},
}
SpinCam: High-Speed Imaging via a Rotating Point-Spread Function: Dorian Chan,

Mark Sheinin,

Matthew O'Toole; [pdf] [supp]
[bibtex]
@InProceedings{Chan_2023_ICCV,
  author    = {Chan, Dorian and Sheinin, Mark and O'Toole, Matthew},
  title     = {{SpinCam}: High-Speed Imaging via a Rotating Point-Spread Function},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10789--10799},
}
FPR: False Positive Rectification for Weakly Supervised Semantic Segmentation: Liyi Chen,

Chenyang Lei,

Ruihuang Li,

Shuai Li,

Zhaoxiang Zhang,

Lei Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Liyi and Lei, Chenyang and Li, Ruihuang and Li, Shuai and Zhang, Zhaoxiang and Zhang, Lei},
  title     = {{FPR}: False Positive Rectification for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1108--1118},
}
Cross-modal Scalable Hyperbolic Hierarchical Clustering: Teng Long,

Nanne van Noord; [pdf]
[bibtex]
@InProceedings{Long_2023_ICCV,
  author    = {Long, Teng and van Noord, Nanne},
  title     = {Cross-modal Scalable Hyperbolic Hierarchical Clustering},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16655--16664},
}
DETRDistill: A Universal Knowledge Distillation Framework for DETR-families: Jiahao Chang,

Shuo Wang,

Hai-Ming Xu,

Zehui Chen,

Chenhongyi Yang,

Feng Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chang_2023_ICCV,
  author    = {Chang, Jiahao and Wang, Shuo and Xu, Hai-Ming and Chen, Zehui and Yang, Chenhongyi and Zhao, Feng},
  title     = {{DETRDistill}: A Universal Knowledge Distillation Framework for {DETR}-families},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6898--6908},
}
F&F Attack: Adversarial Attack against Multiple Object Trackers by Inducing False Negatives and False Positives: Tao Zhou,

Qi Ye,

Wenhan Luo,

Kaihao Zhang,

Zhiguo Shi,

Jiming Chen; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Tao and Ye, Qi and Luo, Wenhan and Zhang, Kaihao and Shi, Zhiguo and Chen, Jiming},
  title     = {{F\&F} Attack: Adversarial Attack against Multiple Object Trackers by Inducing False Negatives and False Positives},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4573--4583},
}
Transferable Decoding with Visual Entities for Zero-Shot Image Captioning: Junjie Fei,

Teng Wang,

Jinrui Zhang,

Zhenyu He,

Chengjie Wang,

Feng Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fei_2023_ICCV,
  author    = {Fei, Junjie and Wang, Teng and Zhang, Jinrui and He, Zhenyu and Wang, Chengjie and Zheng, Feng},
  title     = {Transferable Decoding with Visual Entities for Zero-Shot Image Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3136--3146},
}
ReMoDiffuse: Retrieval-Augmented Motion Diffusion Model: Mingyuan Zhang,

Xinying Guo,

Liang Pan,

Zhongang Cai,

Fangzhou Hong,

Huirong Li,

Lei Yang,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Mingyuan and Guo, Xinying and Pan, Liang and Cai, Zhongang and Hong, Fangzhou and Li, Huirong and Yang, Lei and Liu, Ziwei},
  title     = {{ReMoDiffuse}: Retrieval-Augmented Motion Diffusion Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {364--373},
}
GlueStick: Robust Image Matching by Sticking Points and Lines Together: Rémi Pautrat,

Iago Suárez,

Yifan Yu,

Marc Pollefeys,

Viktor Larsson; [pdf] [supp]
[bibtex]
@InProceedings{Pautrat_2023_ICCV,
  author    = {Pautrat, R{\'e}mi and Su{\'a}rez, Iago and Yu, Yifan and Pollefeys, Marc and Larsson, Viktor},
  title     = {{GlueStick}: Robust Image Matching by Sticking Points and Lines Together},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9706--9716},
}
Computational 3D Imaging with Position Sensors: Jeremy Klotz,

Mohit Gupta,

Aswin C. Sankaranarayanan; [pdf] [supp]
[bibtex]
@InProceedings{Klotz_2023_ICCV,
  author    = {Klotz, Jeremy and Gupta, Mohit and Sankaranarayanan, Aswin C.},
  title     = {Computational {3D} Imaging with Position Sensors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8125--8134},
}
PointMBF: A Multi-scale Bidirectional Fusion Network for Unsupervised RGB-D Point Cloud Registration: Mingzhi Yuan,

Kexue Fu,

Zhihao Li,

Yucong Meng,

Manning Wang; [pdf] [supp]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Mingzhi and Fu, Kexue and Li, Zhihao and Meng, Yucong and Wang, Manning},
  title     = {{PointMBF}: A Multi-scale Bidirectional Fusion Network for Unsupervised {RGB-D} Point Cloud Registration},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17694--17705},
}
Towards Multi-Layered 3D Garments Animation: Yidi Shao,

Chen Change Loy,

Bo Dai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Yidi and Loy, Chen Change and Dai, Bo},
  title     = {Towards Multi-Layered {3D} Garments Animation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14361--14370},
}
LiveHand: Real-time and Photorealistic Neural Hand Rendering: Akshay Mundra,

Mallikarjun B R,

Jiayi Wang,

Marc Habermann,

Christian Theobalt,

Mohamed Elgharib; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mundra_2023_ICCV,
  author    = {Mundra, Akshay and R, Mallikarjun B and Wang, Jiayi and Habermann, Marc and Theobalt, Christian and Elgharib, Mohamed},
  title     = {{LiveHand}: Real-time and Photorealistic Neural Hand Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18035--18045},
}
Advancing Referring Expression Segmentation Beyond Single Image: Yixuan Wu,

Zhao Zhang,

Chi Xie,

Feng Zhu,

Rui Zhao; [pdf] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yixuan and Zhang, Zhao and Xie, Chi and Zhu, Feng and Zhao, Rui},
  title     = {Advancing Referring Expression Segmentation Beyond Single Image},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2628--2638},
}
Learning Image Harmonization in the Linear Color Space: Ke Xu,

Gerhard Petrus Hancke,

Rynson W.H. Lau; [pdf]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Ke and Hancke, Gerhard Petrus and Lau, Rynson W. H.},
  title     = {Learning Image Harmonization in the Linear Color Space},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12570--12579},
}
Chasing Clouds: Differentiable Volumetric Rasterisation of Point Clouds as a Highly Efficient and Accurate Loss for Large-Scale Deformable 3D Registration: Mattias P. Heinrich,

Alexander Bigalke,

Christoph Großbröhmer,

Lasse Hansen; [pdf] [supp]
[bibtex]
@InProceedings{Heinrich_2023_ICCV,
  author    = {Heinrich, Mattias P. and Bigalke, Alexander and Gro{\ss}br{\"o}hmer, Christoph and Hansen, Lasse},
  title     = {Chasing Clouds: Differentiable Volumetric Rasterisation of Point Clouds as a Highly Efficient and Accurate Loss for Large-Scale Deformable {3D} Registration},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8026--8036},
}
TripLe: Revisiting Pretrained Model Reuse and Progressive Learning for Efficient Vision Transformer Scaling and Searching: Cheng Fu,

Hanxian Huang,

Zixuan Jiang,

Yun Ni,

Lifeng Nai,

Gang Wu,

Liqun Cheng,

Yanqi Zhou,

Sheng Li,

Andrew Li,

Jishen Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Fu_2023_ICCV,
  author    = {Fu, Cheng and Huang, Hanxian and Jiang, Zixuan and Ni, Yun and Nai, Lifeng and Wu, Gang and Cheng, Liqun and Zhou, Yanqi and Li, Sheng and Li, Andrew and Zhao, Jishen},
  title     = {{TripLe}: Revisiting Pretrained Model Reuse and Progressive Learning for Efficient Vision Transformer Scaling and Searching},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17153--17163},
}
LogicSeg: Parsing Visual Semantics with Neural Logic Learning and Reasoning: Liulei Li,

Wenguan Wang,

Yi Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Liulei and Wang, Wenguan and Yang, Yi},
  title     = {{LogicSeg}: Parsing Visual Semantics with Neural Logic Learning and Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4122--4133},
}
The Devil is in the Upsampling: Architectural Decisions Made Simpler for Denoising with Deep Image Prior: Yilin Liu,

Jiang Li,

Yunkui Pang,

Dong Nie,

Pew-Thian Yap; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yilin and Li, Jiang and Pang, Yunkui and Nie, Dong and Yap, Pew-Thian},
  title     = {The Devil is in the Upsampling: Architectural Decisions Made Simpler for Denoising with Deep Image Prior},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12408--12417},
}
Video Object Segmentation-aware Video Frame Interpolation: Jun-Sang Yoo,

Hongjae Lee,

Seung-Won Jung; [pdf] [supp]
[bibtex]
@InProceedings{Yoo_2023_ICCV,
  author    = {Yoo, Jun-Sang and Lee, Hongjae and Jung, Seung-Won},
  title     = {Video Object Segmentation-aware Video Frame Interpolation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12322--12333},
}
Coherent Event Guided Low-Light Video Enhancement: Jinxiu Liang,

Yixin Yang,

Boyu Li,

Peiqi Duan,

Yong Xu,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Jinxiu and Yang, Yixin and Li, Boyu and Duan, Peiqi and Xu, Yong and Shi, Boxin},
  title     = {Coherent Event Guided Low-Light Video Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10615--10625},
}
Texture Learning Domain Randomization for Domain Generalized Segmentation: Sunghwan Kim,

Dae-hwan Kim,

Hoseong Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Sunghwan and Kim, Dae-hwan and Kim, Hoseong},
  title     = {Texture Learning Domain Randomization for Domain Generalized Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {677--687},
}
FCCNs: Fully Complex-valued Convolutional Networks using Complex-valued Color Model and Loss Function: Saurabh Yadav,

Koteswar Rao Jerripothula; [pdf] [supp]
[bibtex]
@InProceedings{Yadav_2023_ICCV,
  author    = {Yadav, Saurabh and Jerripothula, Koteswar Rao},
  title     = {{FCCNs}: Fully Complex-valued Convolutional Networks using Complex-valued Color Model and Loss Function},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10689--10698},
}
Learning Concise and Descriptive Attributes for Visual Recognition: An Yan,

Yu Wang,

Yiwu Zhong,

Chengyu Dong,

Zexue He,

Yujie Lu,

William Yang Wang,

Jingbo Shang,

Julian McAuley; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, An and Wang, Yu and Zhong, Yiwu and Dong, Chengyu and He, Zexue and Lu, Yujie and Wang, William Yang and Shang, Jingbo and McAuley, Julian},
  title     = {Learning Concise and Descriptive Attributes for Visual Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3090--3100},
}
Learning Unified Decompositional and Compositional NeRF for Editable Novel View Synthesis: Yuxin Wang,

Wayne Wu,

Dan Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yuxin and Wu, Wayne and Xu, Dan},
  title     = {Learning Unified Decompositional and Compositional {NeRF} for Editable Novel View Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18247--18256},
}
Label-Noise Learning with Intrinsically Long-Tailed Data: Yang Lu,

Yiliang Zhang,

Bo Han,

Yiu-ming Cheung,

Hanzi Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Yang and Zhang, Yiliang and Han, Bo and Cheung, Yiu-ming and Wang, Hanzi},
  title     = {Label-Noise Learning with Intrinsically Long-Tailed Data},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1369--1378},
}
SeeABLE: Soft Discrepancies and Bounded Contrastive Learning for Exposing Deepfakes: Nicolas Larue,

Ngoc-Son Vu,

Vitomir Struc,

Peter Peer,

Vassilis Christophides; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Larue_2023_ICCV,
  author    = {Larue, Nicolas and Vu, Ngoc-Son and Struc, Vitomir and Peer, Peter and Christophides, Vassilis},
  title     = {{SeeABLE}: Soft Discrepancies and Bounded Contrastive Learning for Exposing Deepfakes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21011--21021},
}
Semi-Supervised Learning via Weight-Aware Distillation under Class Distribution Mismatch: Pan Du,

Suyun Zhao,

Zisen Sheng,

Cuiping Li,

Hong Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Du_2023_ICCV,
  author    = {Du, Pan and Zhao, Suyun and Sheng, Zisen and Li, Cuiping and Chen, Hong},
  title     = {Semi-Supervised Learning via Weight-Aware Distillation under Class Distribution Mismatch},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16410--16420},
}
ELFNet: Evidential Local-global Fusion for Stereo Matching: Jieming Lou,

Weide Liu,

Zhuo Chen,

Fayao Liu,

Jun Cheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Lou_2023_ICCV,
  author    = {Lou, Jieming and Liu, Weide and Chen, Zhuo and Liu, Fayao and Cheng, Jun},
  title     = {{ELFNet}: Evidential Local-global Fusion for Stereo Matching},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17784--17793},
}
SimpleClick: Interactive Image Segmentation with Simple Vision Transformers: Qin Liu,

Zhenlin Xu,

Gedas Bertasius,

Marc Niethammer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Qin and Xu, Zhenlin and Bertasius, Gedas and Niethammer, Marc},
  title     = {{SimpleClick}: Interactive Image Segmentation with Simple Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22290--22300},
}
Towards Content-based Pixel Retrieval in Revisited Oxford and Paris: Guoyuan An,

Woo Jae Kim,

Saelyne Yang,

Rong Li,

Yuchi Huo,

Sun-Eui Yoon; [pdf] [arXiv]
[bibtex]
@InProceedings{An_2023_ICCV,
  author    = {An, Guoyuan and Kim, Woo Jae and Yang, Saelyne and Li, Rong and Huo, Yuchi and Yoon, Sun-Eui},
  title     = {Towards Content-based Pixel Retrieval in Revisited {Oxford} and {Paris}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20507--20518},
}
S-TREK: Sequential Translation and Rotation Equivariant Keypoints for Local Feature Extraction: Emanuele Santellani,

Christian Sormann,

Mattia Rossi,

Andreas Kuhn,

Friedrich Fraundorfer; [pdf] [supp]
[bibtex]
@InProceedings{Santellani_2023_ICCV,
  author    = {Santellani, Emanuele and Sormann, Christian and Rossi, Mattia and Kuhn, Andreas and Fraundorfer, Friedrich},
  title     = {{S-TREK}: Sequential Translation and Rotation Equivariant Keypoints for Local Feature Extraction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9728--9737},
}
Retro-FPN: Retrospective Feature Pyramid Network for Point Cloud Semantic Segmentation: Peng Xiang,

Xin Wen,

Yu-Shen Liu,

Hui Zhang,

Yi Fang,

Zhizhong Han; [pdf] [supp]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Peng and Wen, Xin and Liu, Yu-Shen and Zhang, Hui and Fang, Yi and Han, Zhizhong},
  title     = {{Retro-FPN}: Retrospective Feature Pyramid Network for Point Cloud Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17826--17838}
}
Rethinking Range View Representation for LiDAR Segmentation: Lingdong Kong,

Youquan Liu,

Runnan Chen,

Yuexin Ma,

Xinge Zhu,

Yikang Li,

Yuenan Hou,

Yu Qiao,

Ziwei Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Kong_2023_ICCV,
  author    = {Kong, Lingdong and Liu, Youquan and Chen, Runnan and Ma, Yuexin and Zhu, Xinge and Li, Yikang and Hou, Yuenan and Qiao, Yu and Liu, Ziwei},
  title     = {Rethinking Range View Representation for {LiDAR} Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {228--240}
}
Divide and Conquer: 3D Point Cloud Instance Segmentation With Point-Wise Binarization: Weiguang Zhao,

Yuyao Yan,

Chaolong Yang,

Jianan Ye,

Xi Yang,

Kaizhu Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Weiguang and Yan, Yuyao and Yang, Chaolong and Ye, Jianan and Yang, Xi and Huang, Kaizhu},
  title     = {Divide and Conquer: {3D} Point Cloud Instance Segmentation With Point-Wise Binarization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {562--571}
}
BANSAC: A Dynamic BAyesian Network for Adaptive SAmple Consensus: Valter Piedade,

Pedro Miraldo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Piedade_2023_ICCV,
  author    = {Piedade, Valter and Miraldo, Pedro},
  title     = {{BANSAC}: A Dynamic {BAyesian} Network for Adaptive {SAmple} Consensus},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3738--3747}
}
ShapeScaffolder: Structure-Aware 3D Shape Generation from Text: Xi Tian,

Yong-Liang Yang,

Qi Wu; [pdf] [supp]
[bibtex]
@InProceedings{Tian_2023_ICCV,
  author    = {Tian, Xi and Yang, Yong-Liang and Wu, Qi},
  title     = {{ShapeScaffolder}: Structure-Aware {3D} Shape Generation from Text},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2715--2724}
}
Read-only Prompt Optimization for Vision-Language Few-shot Learning: Dongjun Lee,

Seokwon Song,

Jihee Suh,

Joonmyeong Choi,

Sanghyeok Lee,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Dongjun and Song, Seokwon and Suh, Jihee and Choi, Joonmyeong and Lee, Sanghyeok and Kim, Hyunwoo J.},
  title     = {Read-only Prompt Optimization for Vision-Language Few-shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1401--1411}
}
COCO-O: A Benchmark for Object Detectors under Natural Distribution Shifts: Xiaofeng Mao,

Yuefeng Chen,

Yao Zhu,

Da Chen,

Hang Su,

Rong Zhang,

Hui Xue; [pdf] [supp]
[bibtex]
@InProceedings{Mao_2023_ICCV,
  author    = {Mao, Xiaofeng and Chen, Yuefeng and Zhu, Yao and Chen, Da and Su, Hang and Zhang, Rong and Xue, Hui},
  title     = {{COCO-O}: A Benchmark for Object Detectors under Natural Distribution Shifts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6339--6350}
}
E2NeRF: Event Enhanced Neural Radiance Fields from Blurry Images: Yunshan Qi,

Lin Zhu,

Yu Zhang,

Jia Li; [pdf] [supp]
[bibtex]
@InProceedings{Qi_2023_ICCV,
  author    = {Qi, Yunshan and Zhu, Lin and Zhang, Yu and Li, Jia},
  title     = {{E2NeRF}: Event Enhanced Neural Radiance Fields from Blurry Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13254--13264}
}
EgoTV: Egocentric Task Verification from Natural Language Task Descriptions: Rishi Hazra,

Brian Chen,

Akshara Rai,

Nitin Kamra,

Ruta Desai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hazra_2023_ICCV,
  author    = {Hazra, Rishi and Chen, Brian and Rai, Akshara and Kamra, Nitin and Desai, Ruta},
  title     = {{EgoTV}: Egocentric Task Verification from Natural Language Task Descriptions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15417--15429}
}
Benchmarking Low-Shot Robustness to Natural Distribution Shifts: Aaditya Singh,

Kartik Sarangmath,

Prithvijit Chattopadhyay,

Judy Hoffman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Singh_2023_ICCV,
  author    = {Singh, Aaditya and Sarangmath, Kartik and Chattopadhyay, Prithvijit and Hoffman, Judy},
  title     = {Benchmarking Low-Shot Robustness to Natural Distribution Shifts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16232--16242}
}
StageInteractor: Query-based Object Detector with Cross-stage Interaction: Yao Teng,

Haisong Liu,

Sheng Guo,

Limin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Teng_2023_ICCV,
  author    = {Teng, Yao and Liu, Haisong and Guo, Sheng and Wang, Limin},
  title     = {{StageInteractor}: Query-based Object Detector with Cross-stage Interaction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6577--6588}
}
DeLiRa: Self-Supervised Depth, Light, and Radiance Fields: Vitor Guizilini,

Igor Vasiljevic,

Jiading Fang,

Rares Ambrus,

Sergey Zakharov,

Vincent Sitzmann,

Adrien Gaidon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guizilini_2023_ICCV,
  author    = {Guizilini, Vitor and Vasiljevic, Igor and Fang, Jiading and Ambrus, Rares and Zakharov, Sergey and Sitzmann, Vincent and Gaidon, Adrien},
  title     = {{DeLiRa}: Self-Supervised Depth, Light, and Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17935--17945}
}
Moment Detection in Long Tutorial Videos: Ioana Croitoru,

Simion-Vlad Bogolin,

Samuel Albanie,

Yang Liu,

Zhaowen Wang,

Seunghyun Yoon,

Franck Dernoncourt,

Hailin Jin,

Trung Bui; [pdf] [supp]
[bibtex]
@InProceedings{Croitoru_2023_ICCV,
  author    = {Croitoru, Ioana and Bogolin, Simion-Vlad and Albanie, Samuel and Liu, Yang and Wang, Zhaowen and Yoon, Seunghyun and Dernoncourt, Franck and Jin, Hailin and Bui, Trung},
  title     = {Moment Detection in Long Tutorial Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2594--2604}
}
Stable Cluster Discrimination for Deep Clustering: Qi Qian; [pdf] [supp]
[bibtex]
@InProceedings{Qian_2023_ICCV,
  author    = {Qian, Qi},
  title     = {Stable Cluster Discrimination for Deep Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16645--16654}
}
Pix2Video: Video Editing using Image Diffusion: Duygu Ceylan,

Chun-Hao P. Huang,

Niloy J. Mitra; [pdf] [arXiv]
[bibtex]
@InProceedings{Ceylan_2023_ICCV,
  author    = {Ceylan, Duygu and Huang, Chun-Hao P. and Mitra, Niloy J.},
  title     = {{Pix2Video}: Video Editing using Image Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23206--23217}
}
DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting: Hongyang Li,

Hao Zhang,

Zhaoyang Zeng,

Shilong Liu,

Feng Li,

Tianhe Ren,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Hongyang and Zhang, Hao and Zeng, Zhaoyang and Liu, Shilong and Li, Feng and Ren, Tianhe and Zhang, Lei},
  title     = {{DFA3D}: {3D} Deformable Attention For {2D-to-3D} Feature Lifting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6684--6693}
}
Holistic Geometric Feature Learning for Structured Reconstruction: Ziqiong Lu,

Linxi Huan,

Qiyuan Ma,

Xianwei Zheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Lu_2023_ICCV,
  author    = {Lu, Ziqiong and Huan, Linxi and Ma, Qiyuan and Zheng, Xianwei},
  title     = {Holistic Geometric Feature Learning for Structured Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21807--21817}
}
FateZero: Fusing Attentions for Zero-shot Text-based Video Editing: Chenyang QI,

Xiaodong Cun,

Yong Zhang,

Chenyang Lei,

Xintao Wang,

Ying Shan,

Qifeng Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{QI_2023_ICCV,
  author    = {QI, Chenyang and Cun, Xiaodong and Zhang, Yong and Lei, Chenyang and Wang, Xintao and Shan, Ying and Chen, Qifeng},
  title     = {{FateZero}: Fusing Attentions for Zero-shot Text-based Video Editing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15932--15942}
}
Uncertainty-guided Learning for Improving Image Manipulation Detection: Kaixiang Ji,

Feng Chen,

Xin Guo,

Yadong Xu,

Jian Wang,

Jingdong Chen; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2023_ICCV,
  author    = {Ji, Kaixiang and Chen, Feng and Guo, Xin and Xu, Yadong and Wang, Jian and Chen, Jingdong},
  title     = {Uncertainty-guided Learning for Improving Image Manipulation Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22456--22465}
}
LMR: A Large-Scale Multi-Reference Dataset for Reference-Based Super-Resolution: Lin Zhang,

Xin Li,

Dongliang He,

Fu Li,

Errui Ding,

Zhaoxiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Lin and Li, Xin and He, Dongliang and Li, Fu and Ding, Errui and Zhang, Zhaoxiang},
  title     = {{LMR}: A Large-Scale Multi-Reference Dataset for Reference-Based Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13118--13127}
}
Neural Implicit Surface Evolution: Tiago Novello,

Vinicius da Silva,

Guilherme Schardong,

Luiz Schirmer,

Helio Lopes,

Luiz Velho; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Novello_2023_ICCV,
  author    = {Novello, Tiago and da Silva, Vinicius and Schardong, Guilherme and Schirmer, Luiz and Lopes, Helio and Velho, Luiz},
  title     = {Neural Implicit Surface Evolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14279--14289}
}
Distribution-Aligned Diffusion for Human Mesh Recovery: Lin Geng Foo,

Jia Gong,

Hossein Rahmani,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Foo_2023_ICCV,
  author    = {Foo, Lin Geng and Gong, Jia and Rahmani, Hossein and Liu, Jun},
  title     = {Distribution-Aligned Diffusion for Human Mesh Recovery},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9221--9232}
}
Rosetta Neurons: Mining the Common Units in a Model Zoo: Amil Dravid,

Yossi Gandelsman,

Alexei A. Efros,

Assaf Shocher; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dravid_2023_ICCV,
  author    = {Dravid, Amil and Gandelsman, Yossi and Efros, Alexei A. and Shocher, Assaf},
  title     = {Rosetta Neurons: Mining the Common Units in a Model Zoo},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1934--1943}
}
Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups: Peixia Li,

Pulak Purkait,

Thalaiyasingam Ajanthan,

Majid Abdolshah,

Ravi Garg,

Hisham Husain,

Chenchen Xu,

Stephen Gould,

Wanli Ouyang,

Anton van den Hengel; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Peixia and Purkait, Pulak and Ajanthan, Thalaiyasingam and Abdolshah, Majid and Garg, Ravi and Husain, Hisham and Xu, Chenchen and Gould, Stephen and Ouyang, Wanli and van den Hengel, Anton},
  title     = {Semi-Supervised Semantic Segmentation under Label Noise via Diverse Learning Groups},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1229--1238}
}
AdaMV-MoE: Adaptive Multi-Task Vision Mixture-of-Experts: Tianlong Chen,

Xuxi Chen,

Xianzhi Du,

Abdullah Rashwan,

Fan Yang,

Huizhong Chen,

Zhangyang Wang,

Yeqing Li; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Tianlong and Chen, Xuxi and Du, Xianzhi and Rashwan, Abdullah and Yang, Fan and Chen, Huizhong and Wang, Zhangyang and Li, Yeqing},
  title     = {{AdaMV-MoE}: Adaptive Multi-Task Vision Mixture-of-Experts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17346--17357}
}
Hierarchical Visual Categories Modeling: A Joint Representation Learning and Density Estimation Framework for Out-of-Distribution Detection: Jinglun Li,

Xinyu Zhou,

Pinxue Guo,

Yixuan Sun,

Yiwen Huang,

Weifeng Ge,

Wenqiang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Jinglun and Zhou, Xinyu and Guo, Pinxue and Sun, Yixuan and Huang, Yiwen and Ge, Weifeng and Zhang, Wenqiang},
  title     = {Hierarchical Visual Categories Modeling: A Joint Representation Learning and Density Estimation Framework for Out-of-Distribution Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23425--23435}
}
Diffuse3D: Wide-Angle 3D Photography via Bilateral Diffusion: Yutao Jiang,

Yang Zhou,

Yuan Liang,

Wenxi Liu,

Jianbo Jiao,

Yuhui Quan,

Shengfeng He; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Yutao and Zhou, Yang and Liang, Yuan and Liu, Wenxi and Jiao, Jianbo and Quan, Yuhui and He, Shengfeng},
  title     = {{Diffuse3D}: Wide-Angle {3D} Photography via Bilateral Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8998--9008}
}
ReNeRF: Relightable Neural Radiance Fields with Nearfield Lighting: Yingyan Xu,

Gaspard Zoss,

Prashanth Chandran,

Markus Gross,

Derek Bradley,

Paulo Gotardo; [pdf] [supp]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Yingyan and Zoss, Gaspard and Chandran, Prashanth and Gross, Markus and Bradley, Derek and Gotardo, Paulo},
  title     = {{ReNeRF}: Relightable Neural Radiance Fields with Nearfield Lighting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22581--22591}
}
Segment Anything: Alexander Kirillov,

Eric Mintun,

Nikhila Ravi,

Hanzi Mao,

Chloe Rolland,

Laura Gustafson,

Tete Xiao,

Spencer Whitehead,

Alexander C. Berg,

Wan-Yen Lo,

Piotr Dollar,

Ross Girshick; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kirillov_2023_ICCV,
  author    = {Kirillov, Alexander and Mintun, Eric and Ravi, Nikhila and Mao, Hanzi and Rolland, Chloe and Gustafson, Laura and Xiao, Tete and Whitehead, Spencer and Berg, Alexander C. and Lo, Wan-Yen and Dollar, Piotr and Girshick, Ross},
  title     = {Segment Anything},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4015--4026}
}
Unsupervised Prompt Tuning for Text-Driven Object Detection: Weizhen He,

Weijie Chen,

Binbin Chen,

Shicai Yang,

Di Xie,

Luojun Lin,

Donglian Qi,

Yueting Zhuang; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Weizhen and Chen, Weijie and Chen, Binbin and Yang, Shicai and Xie, Di and Lin, Luojun and Qi, Donglian and Zhuang, Yueting},
  title     = {Unsupervised Prompt Tuning for Text-Driven Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2651--2661}
}
Tubelet-Contrastive Self-Supervision for Video-Efficient Generalization: Fida Mohammad Thoker,

Hazel Doughty,

Cees G. M. Snoek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Thoker_2023_ICCV,
  author    = {Thoker, Fida Mohammad and Doughty, Hazel and Snoek, Cees G. M.},
  title     = {Tubelet-Contrastive Self-Supervision for Video-Efficient Generalization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13812--13823}
}
Re-ReND: Real-Time Rendering of NeRFs across Devices: Sara Rojas,

Jesus Zarzar,

Juan C. Pérez,

Artsiom Sanakoyeu,

Ali Thabet,

Albert Pumarola,

Bernard Ghanem; [pdf] [supp]
[bibtex]
@InProceedings{Rojas_2023_ICCV,
  author    = {Rojas, Sara and Zarzar, Jesus and P{\'e}rez, Juan C. and Sanakoyeu, Artsiom and Thabet, Ali and Pumarola, Albert and Ghanem, Bernard},
  title     = {{Re-ReND}: Real-Time Rendering of {NeRFs} across Devices},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3632--3641}
}
360VOT: A New Benchmark Dataset for Omnidirectional Visual Object Tracking: Huajian Huang,

Yinzhe Xu,

Yingshu Chen,

Sai-Kit Yeung; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Huajian and Xu, Yinzhe and Chen, Yingshu and Yeung, Sai-Kit},
  title     = {{360VOT}: A New Benchmark Dataset for Omnidirectional Visual Object Tracking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20566--20576}
}
Is Imitation All You Need? Generalized Decision-Making with Dual-Phase Training: Yao Wei,

Yanchao Sun,

Ruijie Zheng,

Sai Vemprala,

Rogerio Bonatti,

Shuhang Chen,

Ratnesh Madaan,

Zhongjie Ba,

Ashish Kapoor,

Shuang Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yao and Sun, Yanchao and Zheng, Ruijie and Vemprala, Sai and Bonatti, Rogerio and Chen, Shuhang and Madaan, Ratnesh and Ba, Zhongjie and Kapoor, Ashish and Ma, Shuang},
  title     = {Is Imitation All You Need? Generalized Decision-Making with Dual-Phase Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16221--16231}
}
Generalizing Event-Based Motion Deblurring in Real-World Scenarios: Xiang Zhang,

Lei Yu,

Wen Yang,

Jianzhuang Liu,

Gui-Song Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xiang and Yu, Lei and Yang, Wen and Liu, Jianzhuang and Xia, Gui-Song},
  title     = {Generalizing Event-Based Motion Deblurring in Real-World Scenarios},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10734--10744}
}
Handwritten and Printed Text Segmentation: A Signature Case Study: Sina Gholamian,

Ali Vahdat; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gholamian_2023_ICCV,
  author    = {Gholamian, Sina and Vahdat, Ali},
  title     = {Handwritten and Printed Text Segmentation: A Signature Case Study},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {582--592}
}
LERF: Language Embedded Radiance Fields: Justin Kerr,

Chung Min Kim,

Ken Goldberg,

Angjoo Kanazawa,

Matthew Tancik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kerr_2023_ICCV,
  author    = {Kerr, Justin and Kim, Chung Min and Goldberg, Ken and Kanazawa, Angjoo and Tancik, Matthew},
  title     = {{LERF}: Language Embedded Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19729--19739}
}
DomainAdaptor: A Novel Approach to Test-time Adaptation: Jian Zhang,

Lei Qi,

Yinghuan Shi,

Yang Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jian and Qi, Lei and Shi, Yinghuan and Gao, Yang},
  title     = {{DomainAdaptor}: A Novel Approach to Test-time Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18971--18981}
}
RCA-NOC: Relative Contrastive Alignment for Novel Object Captioning: Jiashuo Fan,

Yaoyuan Liang,

Leyao Liu,

Shaolun Huang,

Lei Zhang; [pdf]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Jiashuo and Liang, Yaoyuan and Liu, Leyao and Huang, Shaolun and Zhang, Lei},
  title     = {{RCA-NOC}: Relative Contrastive Alignment for Novel Object Captioning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15510--15520}
}
Mitigating and Evaluating Static Bias of Action Representations in the Background and the Foreground: Haoxin Li,

Yuan Liu,

Hanwang Zhang,

Boyang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Haoxin and Liu, Yuan and Zhang, Hanwang and Li, Boyang},
  title     = {Mitigating and Evaluating Static Bias of Action Representations in the Background and the Foreground},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19911--19923}
}
RbA: Segmenting Unknown Regions Rejected by All: Nazir Nayal,

Misra Yavuz,

João F. Henriques,

Fatma Güney; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nayal_2023_ICCV,
  author    = {Nayal, Nazir and Yavuz, Misra and Henriques, Jo{\~a}o F. and G{\"u}ney, Fatma},
  title     = {{RbA}: Segmenting Unknown Regions Rejected by All},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {711--722}
}
CuNeRF: Cube-Based Neural Radiance Field for Zero-Shot Medical Image Arbitrary-Scale Super Resolution: Zixuan Chen,

Lingxiao Yang,

Jian-Huang Lai,

Xiaohua Xie; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zixuan and Yang, Lingxiao and Lai, Jian-Huang and Xie, Xiaohua},
  title     = {{CuNeRF}: Cube-Based Neural Radiance Field for Zero-Shot Medical Image Arbitrary-Scale Super Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21185--21195}
}
Beyond Object Recognition: A New Benchmark towards Object Concept Learning: Yong-Lu Li,

Yue Xu,

Xinyu Xu,

Xiaohan Mao,

Yuan Yao,

Siqi Liu,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yong-Lu and Xu, Yue and Xu, Xinyu and Mao, Xiaohan and Yao, Yuan and Liu, Siqi and Lu, Cewu},
  title     = {Beyond Object Recognition: A New Benchmark towards Object Concept Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20029--20040}
}
Towards Open-Vocabulary Video Instance Segmentation: Haochen Wang,

Cilin Yan,

Shuai Wang,

Xiaolong Jiang,

Xu Tang,

Yao Hu,

Weidi Xie,

Efstratios Gavves; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Haochen and Yan, Cilin and Wang, Shuai and Jiang, Xiaolong and Tang, Xu and Hu, Yao and Xie, Weidi and Gavves, Efstratios},
  title     = {Towards Open-Vocabulary Video Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4057--4066}
}
Unleashing the Power of Gradient Signal-to-Noise Ratio for Zero-Shot NAS: Zihao Sun,

Yu Sun,

Longxing Yang,

Shun Lu,

Jilin Mei,

Wenxiao Zhao,

Yu Hu; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Zihao and Sun, Yu and Yang, Longxing and Lu, Shun and Mei, Jilin and Zhao, Wenxiao and Hu, Yu},
  title     = {Unleashing the Power of Gradient Signal-to-Noise Ratio for Zero-Shot {NAS}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5763--5773}
}
EgoObjects: A Large-Scale Egocentric Dataset for Fine-Grained Object Understanding: Chenchen Zhu,

Fanyi Xiao,

Andres Alvarado,

Yasmine Babaei,

Jiabo Hu,

Hichem El-Mohri,

Sean Culatana,

Roshan Sumbaly,

Zhicheng Yan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Chenchen and Xiao, Fanyi and Alvarado, Andres and Babaei, Yasmine and Hu, Jiabo and El-Mohri, Hichem and Culatana, Sean and Sumbaly, Roshan and Yan, Zhicheng},
  title     = {{EgoObjects}: A Large-Scale Egocentric Dataset for Fine-Grained Object Understanding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20110--20120}
}
What Can Simple Arithmetic Operations Do for Temporal Modeling?: Wenhao Wu,

Yuxin Song,

Zhun Sun,

Jingdong Wang,

Chang Xu,

Wanli Ouyang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Wenhao and Song, Yuxin and Sun, Zhun and Wang, Jingdong and Xu, Chang and Ouyang, Wanli},
  title     = {What Can Simple Arithmetic Operations Do for Temporal Modeling?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13712--13722}
}
Pixel Adaptive Deep Unfolding Transformer for Hyperspectral Image Reconstruction: Miaoyu Li,

Ying Fu,

Ji Liu,

Yulun Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Miaoyu and Fu, Ying and Liu, Ji and Zhang, Yulun},
  title     = {Pixel Adaptive Deep Unfolding Transformer for Hyperspectral Image Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12959--12968}
}
BiViT: Extremely Compressed Binary Vision Transformers: Yefei He,

Zhenyu Lou,

Luoming Zhang,

Jing Liu,

Weijia Wu,

Hong Zhou,

Bohan Zhuang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Yefei and Lou, Zhenyu and Zhang, Luoming and Liu, Jing and Wu, Weijia and Zhou, Hong and Zhuang, Bohan},
  title     = {{BiViT}: Extremely Compressed Binary Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5651--5663}
}
Dynamic PlenOctree for Adaptive Sampling Refinement in Explicit NeRF: Haotian Bai,

Yiqi Lin,

Yize Chen,

Lin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bai_2023_ICCV,
  author    = {Bai, Haotian and Lin, Yiqi and Chen, Yize and Wang, Lin},
  title     = {Dynamic {PlenOctree} for Adaptive Sampling Refinement in Explicit {NeRF}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8785--8795}
}
Scene Matters: Model-based Deep Video Compression: Lv Tang,

Xinfeng Zhang,

Gai Zhang,

Xiaoqi Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Lv and Zhang, Xinfeng and Zhang, Gai and Ma, Xiaoqi},
  title     = {Scene Matters: Model-based Deep Video Compression},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12481--12491}
}
Tree-Structured Shading Decomposition: Chen Geng,

Hong-Xing Yu,

Sharon Zhang,

Maneesh Agrawala,

Jiajun Wu; [pdf] [arXiv]
[bibtex]
@InProceedings{Geng_2023_ICCV,
  author    = {Geng, Chen and Yu, Hong-Xing and Zhang, Sharon and Agrawala, Maneesh and Wu, Jiajun},
  title     = {Tree-Structured Shading Decomposition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {488--498}
}
EfficientTrain: Exploring Generalized Curriculum Learning for Training Visual Backbones: Yulin Wang,

Yang Yue,

Rui Lu,

Tianjiao Liu,

Zhao Zhong,

Shiji Song,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yulin and Yue, Yang and Lu, Rui and Liu, Tianjiao and Zhong, Zhao and Song, Shiji and Huang, Gao},
  title     = {{EfficientTrain}: Exploring Generalized Curriculum Learning for Training Visual Backbones},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5852--5864}
}
Simulating Fluids in Real-World Still Images: Siming Fan,

Jingtan Piao,

Chen Qian,

Hongsheng Li,

Kwan-Yee Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fan_2023_ICCV,
  author    = {Fan, Siming and Piao, Jingtan and Qian, Chen and Li, Hongsheng and Lin, Kwan-Yee},
  title     = {Simulating Fluids in Real-World Still Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15922--15931}
}
SC3K: Self-supervised and Coherent 3D Keypoints Estimation from Rotated, Noisy, and Decimated Point Cloud Data: Mohammad Zohaib,

Alessio Del Bue; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zohaib_2023_ICCV,
  author    = {Zohaib, Mohammad and Del Bue, Alessio},
  title     = {{SC3K}: Self-supervised and Coherent {3D} Keypoints Estimation from Rotated, Noisy, and Decimated Point Cloud Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22509--22519}
}
IntrinsicNeRF: Learning Intrinsic Neural Radiance Fields for Editable Novel View Synthesis: Weicai Ye,

Shuo Chen,

Chong Bao,

Hujun Bao,

Marc Pollefeys,

Zhaopeng Cui,

Guofeng Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Weicai and Chen, Shuo and Bao, Chong and Bao, Hujun and Pollefeys, Marc and Cui, Zhaopeng and Zhang, Guofeng},
  title     = {{IntrinsicNeRF}: Learning Intrinsic Neural Radiance Fields for Editable Novel View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {339--351}
}
Segmenting Known Objects and Unseen Unknowns without Prior Knowledge: Stefano Gasperini,

Alvaro Marcos-Ramiro,

Michael Schmidt,

Nassir Navab,

Benjamin Busam,

Federico Tombari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gasperini_2023_ICCV,
  author    = {Gasperini, Stefano and Marcos-Ramiro, Alvaro and Schmidt, Michael and Navab, Nassir and Busam, Benjamin and Tombari, Federico},
  title     = {Segmenting Known Objects and Unseen Unknowns without Prior Knowledge},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19321--19332}
}
A Good Student is Cooperative and Reliable: CNN-Transformer Collaborative Learning for Semantic Segmentation: Jinjing Zhu,

Yunhao Luo,

Xu Zheng,

Hao Wang,

Lin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Jinjing and Luo, Yunhao and Zheng, Xu and Wang, Hao and Wang, Lin},
  title     = {A Good Student is Cooperative and Reliable: {CNN}-Transformer Collaborative Learning for Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11720--11730}
}
CMDA: Cross-Modality Domain Adaptation for Nighttime Semantic Segmentation: Ruihao Xia,

Chaoqiang Zhao,

Meng Zheng,

Ziyan Wu,

Qiyu Sun,

Yang Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Ruihao and Zhao, Chaoqiang and Zheng, Meng and Wu, Ziyan and Sun, Qiyu and Tang, Yang},
  title     = {{CMDA}: Cross-Modality Domain Adaptation for Nighttime Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21572--21581}
}
Learning with Diversity: Self-Expanded Equalization for Better Generalized Deep Metric Learning: Jiexi Yan,

Zhihui Yin,

Erkun Yang,

Yanhua Yang,

Heng Huang; [pdf]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Jiexi and Yin, Zhihui and Yang, Erkun and Yang, Yanhua and Huang, Heng},
  title     = {Learning with Diversity: Self-Expanded Equalization for Better Generalized Deep Metric Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19365--19374},
}
Fan-Beam Binarization Difference Projection (FB-BDP): A Novel Local Object Descriptor for Fine-Grained Leaf Image Retrieval: Xin Chen,

Bin Wang,

Yongsheng Gao; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xin and Wang, Bin and Gao, Yongsheng},
  title     = {Fan-Beam Binarization Difference Projection ({FB-BDP}): A Novel Local Object Descriptor for Fine-Grained Leaf Image Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11102--11111},
}
Dynamic Residual Classifier for Class Incremental Learning: Xiuwei Chen,

Xiaobin Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xiuwei and Chang, Xiaobin},
  title     = {Dynamic Residual Classifier for Class Incremental Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18743--18752},
}
Optimizing the Placement of Roadside LiDARs for Autonomous Driving: Wentao Jiang,

Hao Xiang,

Xinyu Cai,

Runsheng Xu,

Jiaqi Ma,

Yikang Li,

Gim Hee Lee,

Si Liu; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Wentao and Xiang, Hao and Cai, Xinyu and Xu, Runsheng and Ma, Jiaqi and Li, Yikang and Lee, Gim Hee and Liu, Si},
  title     = {Optimizing the Placement of Roadside {LiDARs} for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18381--18390},
}
Diverse Inpainting and Editing with GAN Inversion: Ahmet Burak Yildirim,

Hamza Pehlivan,

Bahri Batuhan Bilecen,

Aysegul Dundar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yildirim_2023_ICCV,
  author    = {Yildirim, Ahmet Burak and Pehlivan, Hamza and Bilecen, Bahri Batuhan and Dundar, Aysegul},
  title     = {Diverse Inpainting and Editing with {GAN} Inversion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23120--23130},
}
InterDiff: Generating 3D Human-Object Interactions with Physics-Informed Diffusion: Sirui Xu,

Zhengyuan Li,

Yu-Xiong Wang,

Liang-Yan Gui; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Sirui and Li, Zhengyuan and Wang, Yu-Xiong and Gui, Liang-Yan},
  title     = {{InterDiff}: Generating {3D} Human-Object Interactions with Physics-Informed Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14928--14940},
}
DiFaReli: Diffusion Face Relighting: Puntawat Ponglertnapakorn,

Nontawat Tritrong,

Supasorn Suwajanakorn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ponglertnapakorn_2023_ICCV,
  author    = {Ponglertnapakorn, Puntawat and Tritrong, Nontawat and Suwajanakorn, Supasorn},
  title     = {{DiFaReli}: Diffusion Face Relighting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22646--22657},
}
IST-Net: Prior-Free Category-Level Pose Estimation with Implicit Space Transformation: Jianhui Liu,

Yukang Chen,

Xiaoqing Ye,

Xiaojuan Qi; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jianhui and Chen, Yukang and Ye, Xiaoqing and Qi, Xiaojuan},
  title     = {{IST-Net}: Prior-Free Category-Level Pose Estimation with Implicit Space Transformation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13978--13988},
}
Building3D: A Urban-Scale Dataset and Benchmarks for Learning Roof Structures from Point Clouds: Ruisheng Wang,

Shangfeng Huang,

Hongxin Yang; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ruisheng and Huang, Shangfeng and Yang, Hongxin},
  title     = {{Building3D}: A Urban-Scale Dataset and Benchmarks for Learning Roof Structures from Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20076--20086},
}
Multi-Object Discovery by Low-Dimensional Object Motion: Sadra Safadoust,

Fatma Güney; [pdf] [supp]
[bibtex]
@InProceedings{Safadoust_2023_ICCV,
  author    = {Safadoust, Sadra and G{\"u}ney, Fatma},
  title     = {Multi-Object Discovery by Low-Dimensional Object Motion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {734--744},
}
Localizing Object-Level Shape Variations with Text-to-Image Diffusion Models: Or Patashnik,

Daniel Garibi,

Idan Azuri,

Hadar Averbuch-Elor,

Daniel Cohen-Or; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Patashnik_2023_ICCV,
  author    = {Patashnik, Or and Garibi, Daniel and Azuri, Idan and Averbuch-Elor, Hadar and Cohen-Or, Daniel},
  title     = {Localizing Object-Level Shape Variations with Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23051--23061},
}
CoSign: Exploring Co-occurrence Signals in Skeleton-based Continuous Sign Language Recognition: Peiqi Jiao,

Yuecong Min,

Yanan Li,

Xiaotao Wang,

Lei Lei,

Xilin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Jiao_2023_ICCV,
  author    = {Jiao, Peiqi and Min, Yuecong and Li, Yanan and Wang, Xiaotao and Lei, Lei and Chen, Xilin},
  title     = {{CoSign}: Exploring Co-occurrence Signals in Skeleton-based Continuous Sign Language Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20676--20686},
}
GACE: Geometry Aware Confidence Enhancement for Black-Box 3D Object Detectors on LiDAR-Data: David Schinagl,

Georg Krispel,

Christian Fruhwirth-Reisinger,

Horst Possegger,

Horst Bischof; [pdf] [supp]
[bibtex]
@InProceedings{Schinagl_2023_ICCV,
  author    = {Schinagl, David and Krispel, Georg and Fruhwirth-Reisinger, Christian and Possegger, Horst and Bischof, Horst},
  title     = {{GACE}: Geometry Aware Confidence Enhancement for Black-Box {3D} Object Detectors on {LiDAR}-Data},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6566--6576},
}
Curvature-Aware Training for Coordinate Networks: Hemanth Saratchandran,

Shin-Fang Chng,

Sameera Ramasinghe,

Lachlan MacDonald,

Simon Lucey; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saratchandran_2023_ICCV,
  author    = {Saratchandran, Hemanth and Chng, Shin-Fang and Ramasinghe, Sameera and MacDonald, Lachlan and Lucey, Simon},
  title     = {Curvature-Aware Training for Coordinate Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13328--13338},
}
Disentangle then Parse: Night-time Semantic Segmentation with Illumination Disentanglement: Zhixiang Wei,

Lin Chen,

Tao Tu,

Pengyang Ling,

Huaian Chen,

Yi Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Zhixiang and Chen, Lin and Tu, Tao and Ling, Pengyang and Chen, Huaian and Jin, Yi},
  title     = {Disentangle then Parse: Night-time Semantic Segmentation with Illumination Disentanglement},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21593--21603},
}
Large-Scale Land Cover Mapping with Fine-Grained Classes via Class-Aware Semi-Supervised Semantic Segmentation: Runmin Dong,

Lichao Mou,

Mengxuan Chen,

Weijia Li,

Xin-Yi Tong,

Shuai Yuan,

Lixian Zhang,

Juepeng Zheng,

Xiaoxiang Zhu,

Haohuan Fu; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Runmin and Mou, Lichao and Chen, Mengxuan and Li, Weijia and Tong, Xin-Yi and Yuan, Shuai and Zhang, Lixian and Zheng, Juepeng and Zhu, Xiaoxiang and Fu, Haohuan},
  title     = {Large-Scale Land Cover Mapping with Fine-Grained Classes via Class-Aware Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16783--16793},
}
ToonTalker: Cross-Domain Face Reenactment: Yuan Gong,

Yong Zhang,

Xiaodong Cun,

Fei Yin,

Yanbo Fan,

Xuan Wang,

Baoyuan Wu,

Yujiu Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gong_2023_ICCV,
  author    = {Gong, Yuan and Zhang, Yong and Cun, Xiaodong and Yin, Fei and Fan, Yanbo and Wang, Xuan and Wu, Baoyuan and Yang, Yujiu},
  title     = {{ToonTalker}: Cross-Domain Face Reenactment},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7690--7700},
}
LISTER: Neighbor Decoding for Length-Insensitive Scene Text Recognition: Changxu Cheng,

Peng Wang,

Cheng Da,

Qi Zheng,

Cong Yao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Changxu and Wang, Peng and Da, Cheng and Zheng, Qi and Yao, Cong},
  title     = {{LISTER}: Neighbor Decoding for Length-Insensitive Scene Text Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19541--19551},
}
Proxy Anchor-based Unsupervised Learning for Continuous Generalized Category Discovery: Hyungmin Kim,

Sungho Suh,

Daehwan Kim,

Daun Jeong,

Hansang Cho,

Junmo Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hyungmin and Suh, Sungho and Kim, Daehwan and Jeong, Daun and Cho, Hansang and Kim, Junmo},
  title     = {Proxy Anchor-based Unsupervised Learning for Continuous Generalized Category Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16688--16697},
}
Distribution-Aware Prompt Tuning for Vision-Language Models: Eulrang Cho,

Jooyeon Kim,

Hyunwoo J Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2023_ICCV,
  author    = {Cho, Eulrang and Kim, Jooyeon and Kim, Hyunwoo J.},
  title     = {Distribution-Aware Prompt Tuning for Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22004--22013},
}
Learning Rain Location Prior for Nighttime Deraining: Fan Zhang,

Shaodi You,

Yu Li,

Ying Fu; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Fan and You, Shaodi and Li, Yu and Fu, Ying},
  title     = {Learning Rain Location Prior for Nighttime Deraining},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13148--13157},
}
FBLNet: FeedBack Loop Network for Driver Attention Prediction: Yilong Chen,

Zhixiong Nan,

Tao Xiang; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yilong and Nan, Zhixiong and Xiang, Tao},
  title     = {{FBLNet}: {FeedBack} Loop Network for Driver Attention Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13371--13380},
}
Source-free Domain Adaptive Human Pose Estimation: Qucheng Peng,

Ce Zheng,

Chen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Qucheng and Zheng, Ce and Chen, Chen},
  title     = {Source-free Domain Adaptive Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4826--4836},
}
Video Anomaly Detection via Sequentially Learning Multiple Pretext Tasks: Chenrui Shi,

Che Sun,

Yuwei Wu,

Yunde Jia; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Chenrui and Sun, Che and Wu, Yuwei and Jia, Yunde},
  title     = {Video Anomaly Detection via Sequentially Learning Multiple Pretext Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10330--10340},
}
SlaBins: Fisheye Depth Estimation using Slanted Bins on Road Environments: Jongsung Lee,

Gyeongsu Cho,

Jeongin Park,

Kyongjun Kim,

Seongoh Lee,

Jung-Hee Kim,

Seong-Gyun Jeong,

Kyungdon Joo; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Jongsung and Cho, Gyeongsu and Park, Jeongin and Kim, Kyongjun and Lee, Seongoh and Kim, Jung-Hee and Jeong, Seong-Gyun and Joo, Kyungdon},
  title     = {{SlaBins}: Fisheye Depth Estimation using Slanted Bins on Road Environments},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8765--8774},
}
DOT: A Distillation-Oriented Trainer: Borui Zhao,

Quan Cui,

Renjie Song,

Jiajun Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Borui and Cui, Quan and Song, Renjie and Liang, Jiajun},
  title     = {{DOT}: A Distillation-Oriented Trainer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6189--6198},
}
Neural Collage Transfer: Artistic Reconstruction via Material Manipulation: Ganghun Lee,

Minji Kim,

Yunsu Lee,

Minsu Lee,

Byoung-Tak Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Ganghun and Kim, Minji and Lee, Yunsu and Lee, Minsu and Zhang, Byoung-Tak},
  title     = {Neural Collage Transfer: Artistic Reconstruction via Material Manipulation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2394--2405},
}
Fantasia3D: Disentangling Geometry and Appearance for High-quality Text-to-3D Content Creation: Rui Chen,

Yongwei Chen,

Ningxin Jiao,

Kui Jia; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Rui and Chen, Yongwei and Jiao, Ningxin and Jia, Kui},
  title     = {{Fantasia3D}: Disentangling Geometry and Appearance for High-quality Text-to-{3D} Content Creation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22246--22256},
}
MagicFusion: Boosting Text-to-Image Generation Performance by Fusing Diffusion Models: Jing Zhao,

Heliang Zheng,

Chaoyue Wang,

Long Lan,

Wenjing Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Jing and Zheng, Heliang and Wang, Chaoyue and Lan, Long and Yang, Wenjing},
  title     = {{MagicFusion}: Boosting Text-to-Image Generation Performance by Fusing Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22592--22602},
}
UCF: Uncovering Common Features for Generalizable Deepfake Detection: Zhiyuan Yan,

Yong Zhang,

Yanbo Fan,

Baoyuan Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Zhiyuan and Zhang, Yong and Fan, Yanbo and Wu, Baoyuan},
  title     = {{UCF}: Uncovering Common Features for Generalizable Deepfake Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22412--22423},
}
March in Chat: Interactive Prompting for Remote Embodied Referring Expression: Yanyuan Qiao,

Yuankai Qi,

Zheng Yu,

Jing Liu,

Qi Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qiao_2023_ICCV,
  author    = {Qiao, Yanyuan and Qi, Yuankai and Yu, Zheng and Liu, Jing and Wu, Qi},
  title     = {March in Chat: Interactive Prompting for Remote Embodied Referring Expression},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15758--15767},
}
Sample4Geo: Hard Negative Sampling For Cross-View Geo-Localisation: Fabian Deuser,

Konrad Habel,

Norbert Oswald; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deuser_2023_ICCV,
  author    = {Deuser, Fabian and Habel, Konrad and Oswald, Norbert},
  title     = {{Sample4Geo}: Hard Negative Sampling For Cross-View Geo-Localisation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16847--16856},
}
Novel Scenes & Classes: Towards Adaptive Open-set Object Detection: Wuyang Li,

Xiaoqing Guo,

Yixuan Yuan; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Wuyang and Guo, Xiaoqing and Yuan, Yixuan},
  title     = {Novel Scenes \& Classes: Towards Adaptive Open-set Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15780--15790},
}
LIMITR: Leveraging Local Information for Medical Image-Text Representation: Gefen Dawidowicz,

Elad Hirsch,

Ayellet Tal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dawidowicz_2023_ICCV,
  author    = {Dawidowicz, Gefen and Hirsch, Elad and Tal, Ayellet},
  title     = {{LIMITR}: Leveraging Local Information for Medical Image-Text Representation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21165--21173},
}
Multi-task View Synthesis with Neural Radiance Fields: Shuhong Zheng,

Zhipeng Bao,

Martial Hebert,

Yu-Xiong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Shuhong and Bao, Zhipeng and Hebert, Martial and Wang, Yu-Xiong},
  title     = {Multi-task View Synthesis with Neural Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21538--21549},
}
Informative Data Mining for One-Shot Cross-Domain Semantic Segmentation: Yuxi Wang,

Jian Liang,

Jun Xiao,

Shuqi Mei,

Yuran Yang,

Zhaoxiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yuxi and Liang, Jian and Xiao, Jun and Mei, Shuqi and Yang, Yuran and Zhang, Zhaoxiang},
  title     = {Informative Data Mining for One-Shot Cross-Domain Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1064--1074},
}
Efficient Unified Demosaicing for Bayer and Non-Bayer Patterned Image Sensors: Haechang Lee,

Dongwon Park,

Wongi Jeong,

Kijeong Kim,

Hyunwoo Je,

Dongil Ryu,

Se Young Chun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Haechang and Park, Dongwon and Jeong, Wongi and Kim, Kijeong and Je, Hyunwoo and Ryu, Dongil and Chun, Se Young},
  title     = {Efficient Unified Demosaicing for {Bayer} and Non-{Bayer} Patterned Image Sensors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12750--12759},
}
Visual Traffic Knowledge Graph Generation from Scene Images: Yunfei Guo,

Fei Yin,

Xiao-hui Li,

Xudong Yan,

Tao Xue,

Shuqi Mei,

Cheng-Lin Liu; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yunfei and Yin, Fei and Li, Xiao-hui and Yan, Xudong and Xue, Tao and Mei, Shuqi and Liu, Cheng-Lin},
  title     = {Visual Traffic Knowledge Graph Generation from Scene Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21604--21613},
}
Householder Projector for Unsupervised Latent Semantics Discovery: Yue Song,

Jichao Zhang,

Nicu Sebe,

Wei Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Yue and Zhang, Jichao and Sebe, Nicu and Wang, Wei},
  title     = {{Householder} Projector for Unsupervised Latent Semantics Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7712--7722},
}
Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution: Long Sun,

Jiangxin Dong,

Jinhui Tang,

Jinshan Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV,
  author    = {Sun, Long and Dong, Jiangxin and Tang, Jinhui and Pan, Jinshan},
  title     = {Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13190--13199},
}
Unsupervised Image Denoising in Real-World Scenarios via Self-Collaboration Parallel Generative Adversarial Branches: Xin Lin,

Chao Ren,

Xiao Liu,

Jie Huang,

Yinjie Lei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Xin and Ren, Chao and Liu, Xiao and Huang, Jie and Lei, Yinjie},
  title     = {Unsupervised Image Denoising in Real-World Scenarios via Self-Collaboration Parallel Generative Adversarial Branches},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12642--12652},
}
Bayesian Optimization Meets Self-Distillation: HyunJae Lee,

Heon Song,

Hyeonsoo Lee,

Gi-hyeon Lee,

Suyeong Park,

Donggeun Yoo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, HyunJae and Song, Heon and Lee, Hyeonsoo and Lee, Gi-hyeon and Park, Suyeong and Yoo, Donggeun},
  title     = {{Bayesian} Optimization Meets Self-Distillation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1696--1705},
}
No Fear of Classifier Biases: Neural Collapse Inspired Federated Learning with Synthetic and Fixed Classifier: Zexi Li,

Xinyi Shang,

Rui He,

Tao Lin,

Chao Wu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zexi and Shang, Xinyi and He, Rui and Lin, Tao and Wu, Chao},
  title     = {No Fear of Classifier Biases: Neural Collapse Inspired Federated Learning with Synthetic and Fixed Classifier},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5319--5329},
}
MemorySeg: Online LiDAR Semantic Segmentation with a Latent Memory: Enxu Li,

Sergio Casas,

Raquel Urtasun; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Enxu and Casas, Sergio and Urtasun, Raquel},
  title     = {{MemorySeg}: Online {LiDAR} Semantic Segmentation with a Latent Memory},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {745--754},
}
Hashing Neural Video Decomposition with Multiplicative Residuals in Space-Time: Cheng-Hung Chan,

Cheng-Yang Yuan,

Cheng Sun,

Hwann-Tzong Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chan_2023_ICCV,
  author    = {Chan, Cheng-Hung and Yuan, Cheng-Yang and Sun, Cheng and Chen, Hwann-Tzong},
  title     = {Hashing Neural Video Decomposition with Multiplicative Residuals in Space-Time},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7743--7753},
}
Multimodal Variational Auto-encoder based Audio-Visual Segmentation: Yuxin Mao,

Jing Zhang,

Mochu Xiang,

Yiran Zhong,

Yuchao Dai; [pdf] [supp]
[bibtex]
@InProceedings{Mao_2023_ICCV,
  author    = {Mao, Yuxin and Zhang, Jing and Xiang, Mochu and Zhong, Yiran and Dai, Yuchao},
  title     = {Multimodal Variational Auto-encoder based Audio-Visual Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {954--965},
}
DynaMITe: Dynamic Query Bootstrapping for Multi-object Interactive Segmentation Transformer: Amit Kumar Rana,

Sabarinath Mahadevan,

Alexander Hermans,

Bastian Leibe; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rana_2023_ICCV,
  author    = {Rana, Amit Kumar and Mahadevan, Sabarinath and Hermans, Alexander and Leibe, Bastian},
  title     = {{DynaMITe}: Dynamic Query Bootstrapping for Multi-object Interactive Segmentation Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1043--1052},
}
FRAug: Tackling Federated Learning with Non-IID Features via Representation Augmentation: Haokun Chen,

Ahmed Frikha,

Denis Krompass,

Jindong Gu,

Volker Tresp; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Haokun and Frikha, Ahmed and Krompass, Denis and Gu, Jindong and Tresp, Volker},
  title     = {{FRAug}: Tackling Federated Learning with Non-{IID} Features via Representation Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4849--4859},
}
Homography Guided Temporal Fusion for Road Line and Marking Segmentation: Shan Wang,

Chuong Nguyen,

Jiawei Liu,

Kaihao Zhang,

Wenhan Luo,

Yanhao Zhang,

Sundaram Muthu,

Fahira Afzal Maken,

Hongdong Li; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Shan and Nguyen, Chuong and Liu, Jiawei and Zhang, Kaihao and Luo, Wenhan and Zhang, Yanhao and Muthu, Sundaram and Maken, Fahira Afzal and Li, Hongdong},
  title     = {Homography Guided Temporal Fusion for Road Line and Marking Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1075--1085},
}
NeuRBF: A Neural Fields Representation with Adaptive Radial Basis Functions: Zhang Chen,

Zhong Li,

Liangchen Song,

Lele Chen,

Jingyi Yu,

Junsong Yuan,

Yi Xu; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhang and Li, Zhong and Song, Liangchen and Chen, Lele and Yu, Jingyi and Yuan, Junsong and Xu, Yi},
  title     = {{NeuRBF}: A Neural Fields Representation with Adaptive Radial Basis Functions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4182--4194},
}
OmnimatteRF: Robust Omnimatte with 3D Background Modeling: Geng Lin,

Chen Gao,

Jia-Bin Huang,

Changil Kim,

Yipeng Wang,

Matthias Zwicker,

Ayush Saraf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Geng and Gao, Chen and Huang, Jia-Bin and Kim, Changil and Wang, Yipeng and Zwicker, Matthias and Saraf, Ayush},
  title     = {{OmnimatteRF}: Robust Omnimatte with {3D} Background Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23471--23480},
}
Self-supervised Image Denoising with Downsampled Invariance Loss and Conditional Blind-Spot Network: Yeong Il Jang,

Keuntek Lee,

Gu Yong Park,

Seyun Kim,

Nam Ik Cho; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jang_2023_ICCV,
  author    = {Jang, Yeong Il and Lee, Keuntek and Park, Gu Yong and Kim, Seyun and Cho, Nam Ik},
  title     = {Self-supervised Image Denoising with Downsampled Invariance Loss and Conditional Blind-Spot Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12196--12205},
}
Multi-granularity Interaction Simulation for Unsupervised Interactive Segmentation: Kehan Li,

Yian Zhao,

Zhennan Wang,

Zesen Cheng,

Peng Jin,

Xiangyang Ji,

Li Yuan,

Chang Liu,

Jie Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Kehan and Zhao, Yian and Wang, Zhennan and Cheng, Zesen and Jin, Peng and Ji, Xiangyang and Yuan, Li and Liu, Chang and Chen, Jie},
  title     = {Multi-granularity Interaction Simulation for Unsupervised Interactive Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {666--676},
}
RecursiveDet: End-to-End Region-Based Recursive Object Detection: Jing Zhao,

Li Sun,

Qingli Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Jing and Sun, Li and Li, Qingli},
  title     = {{RecursiveDet}: End-to-End Region-Based Recursive Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6307--6316},
}
Bold but Cautious: Unlocking the Potential of Personalized Federated Learning through Cautiously Aggressive Collaboration: Xinghao Wu,

Xuefeng Liu,

Jianwei Niu,

Guogang Zhu,

Shaojie Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Xinghao and Liu, Xuefeng and Niu, Jianwei and Zhu, Guogang and Tang, Shaojie},
  title     = {Bold but Cautious: Unlocking the Potential of Personalized Federated Learning through Cautiously Aggressive Collaboration},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19375--19384},
}
ESSAformer: Efficient Transformer for Hyperspectral Image Super-resolution: Mingjin Zhang,

Chi Zhang,

Qiming Zhang,

Jie Guo,

Xinbo Gao,

Jing Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Mingjin and Zhang, Chi and Zhang, Qiming and Guo, Jie and Gao, Xinbo and Zhang, Jing},
  title     = {{ESSAformer}: Efficient Transformer for Hyperspectral Image Super-resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23073--23084},
}
Generative Action Description Prompts for Skeleton-based Action Recognition: Wangmeng Xiang,

Chao Li,

Yuxuan Zhou,

Biao Wang,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Wangmeng and Li, Chao and Zhou, Yuxuan and Wang, Biao and Zhang, Lei},
  title     = {Generative Action Description Prompts for Skeleton-based Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10276--10285},
}
Structure Invariant Transformation for better Adversarial Transferability: Xiaosen Wang,

Zeliang Zhang,

Jianping Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiaosen and Zhang, Zeliang and Zhang, Jianping},
  title     = {Structure Invariant Transformation for better Adversarial Transferability},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4607--4619},
}
Thinking Image Color Aesthetics Assessment: Models, Datasets and Benchmarks: Shuai He,

Anlong Ming,

Yaqi Li,

Jinyuan Sun,

ShunTian Zheng,

Huadong Ma; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Shuai and Ming, Anlong and Li, Yaqi and Sun, Jinyuan and Zheng, ShunTian and Ma, Huadong},
  title     = {Thinking Image Color Aesthetics Assessment: Models, Datasets and Benchmarks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21838--21847},
}
Multi-body Depth and Camera Pose Estimation from Multiple Views: Andrea Porfiri Dal Cin,

Giacomo Boracchi,

Luca Magri; [pdf] [supp]
[bibtex]
@InProceedings{Cin_2023_ICCV,
  author    = {Porfiri Dal Cin, Andrea and Boracchi, Giacomo and Magri, Luca},
  title     = {Multi-body Depth and Camera Pose Estimation from Multiple Views},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17804--17814},
}
DISeR: Designing Imaging Systems with Reinforcement Learning: Tzofi Klinghoffer,

Kushagra Tiwary,

Nikhil Behari,

Bhavya Agrawalla,

Ramesh Raskar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Klinghoffer_2023_ICCV, author = {Klinghoffer, Tzofi and Tiwary, Kushagra and Behari, Nikhil and Agrawalla, Bhavya and Raskar, Ramesh}, title = {DISeR: Designing Imaging Systems with Reinforcement Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {23632-23642} }
The Euclidean Space is Evil: Hyperbolic Attribute Editing for Few-shot Image Generation: Lingxiao Li,

Yi Zhang,

Shuhui Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Lingxiao and Zhang, Yi and Wang, Shuhui}, title = {The Euclidean Space is Evil: Hyperbolic Attribute Editing for Few-shot Image Generation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22714-22724} }
FULLER: Unified Multi-modality Multi-task 3D Perception via Multi-level Gradient Calibration: Zhijian Huang,

Sihao Lin,

Guiyu Liu,

Mukun Luo,

Chaoqiang Ye,

Hang Xu,

Xiaojun Chang,

Xiaodan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Zhijian and Lin, Sihao and Liu, Guiyu and Luo, Mukun and Ye, Chaoqiang and Xu, Hang and Chang, Xiaojun and Liang, Xiaodan}, title = {FULLER: Unified Multi-modality Multi-task 3D Perception via Multi-level Gradient Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3502-3511} }
Transparent Shape from a Single View Polarization Image: Mingqi Shao,

Chongkun Xia,

Zhendong Yang,

Junnan Huang,

Xueqian Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV, author = {Shao, Mingqi and Xia, Chongkun and Yang, Zhendong and Huang, Junnan and Wang, Xueqian}, title = {Transparent Shape from a Single View Polarization Image}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9277-9286} }
Invariant Feature Regularization for Fair Face Recognition: Jiali Ma,

Zhongqi Yue,

Kagaya Tomoyuki,

Suzuki Tomoki,

Karlekar Jayashree,

Sugiri Pranata,

Hanwang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV, author = {Ma, Jiali and Yue, Zhongqi and Kagaya, Tomoyuki and Suzuki, Tomoki and Karlekar, Jayashree and Pranata, Sugiri and Zhang, Hanwang}, title = {Invariant Feature Regularization for Fair Face Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20861-20870} }
Cross-Domain Product Representation Learning for Rich-Content E-Commerce: Xuehan Bai,

Yan Li,

Yanhua Cheng,

Wenjie Yang,

Quan Chen,

Han Li; [pdf] [supp]
[bibtex]
@InProceedings{Bai_2023_ICCV, author = {Bai, Xuehan and Li, Yan and Cheng, Yanhua and Yang, Wenjie and Chen, Quan and Li, Han}, title = {Cross-Domain Product Representation Learning for Rich-Content E-Commerce}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {5697-5706} }
DriveAdapter: Breaking the Coupling Barrier of Perception and Planning in End-to-End Autonomous Driving: Xiaosong Jia,

Yulu Gao,

Li Chen,

Junchi Yan,

Patrick Langechuan Liu,

Hongyang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jia_2023_ICCV, author = {Jia, Xiaosong and Gao, Yulu and Chen, Li and Yan, Junchi and Liu, Patrick Langechuan and Li, Hongyang}, title = {DriveAdapter: Breaking the Coupling Barrier of Perception and Planning in End-to-End Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7953-7963} }
General Planar Motion from a Pair of 3D Correspondences: Juan Carlos Dibene,

Zhixiang Min,

Enrique Dunn; [pdf] [supp]
[bibtex]
@InProceedings{Dibene_2023_ICCV, author = {Dibene, Juan Carlos and Min, Zhixiang and Dunn, Enrique}, title = {General Planar Motion from a Pair of 3D Correspondences}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8060-8070} }
Single Depth-image 3D Reflection Symmetry and Shape Prediction: Zhaoxuan Zhang,

Bo Dong,

Tong Li,

Felix Heide,

Pieter Peers,

Baocai Yin,

Xin Yang; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Zhaoxuan and Dong, Bo and Li, Tong and Heide, Felix and Peers, Pieter and Yin, Baocai and Yang, Xin}, title = {Single Depth-image 3D Reflection Symmetry and Shape Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8896-8906} }
Local Context-Aware Active Domain Adaptation: Tao Sun,

Cheng Lu,

Haibin Ling; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV, author = {Sun, Tao and Lu, Cheng and Ling, Haibin}, title = {Local Context-Aware Active Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18634-18643} }
Deep Incubation: Training Large Models by Divide-and-Conquering: Zanlin Ni,

Yulin Wang,

Jiangwei Yu,

Haojun Jiang,

Yue Cao,

Gao Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ni_2023_ICCV, author = {Ni, Zanlin and Wang, Yulin and Yu, Jiangwei and Jiang, Haojun and Cao, Yue and Huang, Gao}, title = {Deep Incubation: Training Large Models by Divide-and-Conquering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {17335-17345} }
Downscaled Representation Matters: Improving Image Rescaling with Collaborative Downscaled Images: Bingna Xu,

Yong Guo,

Luoqian Jiang,

Mianjie Yu,

Jian Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV, author = {Xu, Bingna and Guo, Yong and Jiang, Luoqian and Yu, Mianjie and Chen, Jian}, title = {Downscaled Representation Matters: Improving Image Rescaling with Collaborative Downscaled Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12237-12247} }
Detection Transformer with Stable Matching: Shilong Liu,

Tianhe Ren,

Jiayu Chen,

Zhaoyang Zeng,

Hao Zhang,

Feng Li,

Hongyang Li,

Jun Huang,

Hang Su,

Jun Zhu,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Shilong and Ren, Tianhe and Chen, Jiayu and Zeng, Zhaoyang and Zhang, Hao and Li, Feng and Li, Hongyang and Huang, Jun and Su, Hang and Zhu, Jun and Zhang, Lei}, title = {Detection Transformer with Stable Matching}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6491-6500} }
Be Everywhere - Hear Everything (BEE): Audio Scene Reconstruction by Sparse Audio-Visual Samples: Mingfei Chen,

Kun Su,

Eli Shlizerman; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Mingfei and Su, Kun and Shlizerman, Eli}, title = {Be Everywhere - Hear Everything (BEE): Audio Scene Reconstruction by Sparse Audio-Visual Samples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7853-7862} }
iVS-Net: Learning Human View Synthesis from Internet Videos: Junting Dong,

Qi Fang,

Tianshuo Yang,

Qing Shuai,

Chengyu Qiao,

Sida Peng; [pdf] [supp]
[bibtex]
@InProceedings{Dong_2023_ICCV, author = {Dong, Junting and Fang, Qi and Yang, Tianshuo and Shuai, Qing and Qiao, Chengyu and Peng, Sida}, title = {iVS-Net: Learning Human View Synthesis from Internet Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22942-22951} }
Story Visualization by Online Text Augmentation with Context Memory: Daechul Ahn,

Daneul Kim,

Gwangmo Song,

Seung Hwan Kim,

Honglak Lee,

Dongyeop Kang,

Jonghyun Choi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ahn_2023_ICCV, author = {Ahn, Daechul and Kim, Daneul and Song, Gwangmo and Kim, Seung Hwan and Lee, Honglak and Kang, Dongyeop and Choi, Jonghyun}, title = {Story Visualization by Online Text Augmentation with Context Memory}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3125-3135} }
Attention Discriminant Sampling for Point Clouds: Cheng-Yao Hong,

Yu-Ying Chou,

Tyng-Luh Liu; [pdf] [supp]
[bibtex]
@InProceedings{Hong_2023_ICCV, author = {Hong, Cheng-Yao and Chou, Yu-Ying and Liu, Tyng-Luh}, title = {Attention Discriminant Sampling for Point Clouds}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14429-14440} }
Global Balanced Experts for Federated Long-Tailed Learning: Yaopei Zeng,

Lei Liu,

Li Liu,

Li Shen,

Shaoguo Liu,

Baoyuan Wu; [pdf] [supp]
[bibtex]
@InProceedings{Zeng_2023_ICCV, author = {Zeng, Yaopei and Liu, Lei and Liu, Li and Shen, Li and Liu, Shaoguo and Wu, Baoyuan}, title = {Global Balanced Experts for Federated Long-Tailed Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4815-4825} }
All4One: Symbiotic Neighbour Contrastive Learning via Self-Attention and Redundancy Reduction: Imanol G. Estepa,

Ignacio Sarasua,

Bhalaji Nagarajan,

Petia Radeva; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Estepa_2023_ICCV, author = {Estepa, Imanol G. and Sarasua, Ignacio and Nagarajan, Bhalaji and Radeva, Petia}, title = {All4One: Symbiotic Neighbour Contrastive Learning via Self-Attention and Redundancy Reduction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16243-16253} }
Contrastive Pseudo Learning for Open-World DeepFake Attribution: Zhimin Sun,

Shen Chen,

Taiping Yao,

Bangjie Yin,

Ran Yi,

Shouhong Ding,

Lizhuang Ma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2023_ICCV, author = {Sun, Zhimin and Chen, Shen and Yao, Taiping and Yin, Bangjie and Yi, Ran and Ding, Shouhong and Ma, Lizhuang}, title = {Contrastive Pseudo Learning for Open-World DeepFake Attribution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20882-20892} }
ICL-D3IE: In-Context Learning with Diverse Demonstrations Updating for Document Information Extraction: Jiabang He,

Lei Wang,

Yi Hu,

Ning Liu,

Hui Liu,

Xing Xu,

Heng Tao Shen; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV, author = {He, Jiabang and Wang, Lei and Hu, Yi and Liu, Ning and Liu, Hui and Xu, Xing and Shen, Heng Tao}, title = {ICL-D3IE: In-Context Learning with Diverse Demonstrations Updating for Document Information Extraction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19485-19494} }
IHNet: Iterative Hierarchical Network Guided by High-Resolution Estimated Information for Scene Flow Estimation: Yun Wang,

Cheng Chi,

Min Lin,

Xin Yang; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Yun and Chi, Cheng and Lin, Min and Yang, Xin}, title = {IHNet: Iterative Hierarchical Network Guided by High-Resolution Estimated Information for Scene Flow Estimation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10073-10082} }
SimNP: Learning Self-Similarity Priors Between Neural Points: Christopher Wewer,

Eddy Ilg,

Bernt Schiele,

Jan Eric Lenssen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wewer_2023_ICCV, author = {Wewer, Christopher and Ilg, Eddy and Schiele, Bernt and Lenssen, Jan Eric}, title = {SimNP: Learning Self-Similarity Priors Between Neural Points}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8841-8852} }
Beyond the Limitation of Monocular 3D Detector via Knowledge Distillation: Yiran Yang,

Dongshuo Yin,

Xuee Rong,

Xian Sun,

Wenhui Diao,

Xinming Li; [pdf]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Yiran and Yin, Dongshuo and Rong, Xuee and Sun, Xian and Diao, Wenhui and Li, Xinming}, title = {Beyond the Limitation of Monocular 3D Detector via Knowledge Distillation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9077-9086} }
Cascade-DETR: Delving into High-Quality Universal Object Detection: Mingqiao Ye,

Lei Ke,

Siyuan Li,

Yu-Wing Tai,

Chi-Keung Tang,

Martin Danelljan,

Fisher Yu; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_ICCV, author = {Ye, Mingqiao and Ke, Lei and Li, Siyuan and Tai, Yu-Wing and Tang, Chi-Keung and Danelljan, Martin and Yu, Fisher}, title = {Cascade-DETR: Delving into High-Quality Universal Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6704-6714} }
ACLS: Adaptive and Conditional Label Smoothing for Network Calibration: Hyekang Park,

Jongyoun Noh,

Youngmin Oh,

Donghyeon Baek,

Bumsub Ham; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV, author = {Park, Hyekang and Noh, Jongyoun and Oh, Youngmin and Baek, Donghyeon and Ham, Bumsub}, title = {ACLS: Adaptive and Conditional Label Smoothing for Network Calibration}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3936-3945} }
EMR-MSF: Self-Supervised Recurrent Monocular Scene Flow Exploiting Ego-Motion Rigidity: Zijie Jiang,

Masatoshi Okutomi; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Zijie and Okutomi, Masatoshi}, title = {EMR-MSF: Self-Supervised Recurrent Monocular Scene Flow Exploiting Ego-Motion Rigidity}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {69-78} }
Evaluation and Improvement of Interpretability for Self-Explainable Part-Prototype Networks: Qihan Huang,

Mengqi Xue,

Wenqi Huang,

Haofei Zhang,

Jie Song,

Yongcheng Jing,

Mingli Song; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Qihan and Xue, Mengqi and Huang, Wenqi and Zhang, Haofei and Song, Jie and Jing, Yongcheng and Song, Mingli}, title = {Evaluation and Improvement of Interpretability for Self-Explainable Part-Prototype Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {2011-2020} }
Temporal-Coded Spiking Neural Networks with Dynamic Firing Threshold: Learning with Event-Driven Backpropagation: Wenjie Wei,

Malu Zhang,

Hong Qu,

Ammar Belatreche,

Jian Zhang,

Hong Chen; [pdf]
[bibtex]
@InProceedings{Wei_2023_ICCV, author = {Wei, Wenjie and Zhang, Malu and Qu, Hong and Belatreche, Ammar and Zhang, Jian and Chen, Hong}, title = {Temporal-Coded Spiking Neural Networks with Dynamic Firing Threshold: Learning with Event-Driven Backpropagation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10552-10562} }
Mitigating Adversarial Vulnerability through Causal Parameter Estimation by Adversarial Double Machine Learning: Byung-Kwan Lee,

Junho Kim,

Yong Man Ro; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV, author = {Lee, Byung-Kwan and Kim, Junho and Ro, Yong Man}, title = {Mitigating Adversarial Vulnerability through Causal Parameter Estimation by Adversarial Double Machine Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4499-4509} }
Dynamic Token Pruning in Plain Vision Transformers for Semantic Segmentation: Quan Tang,

Bowen Zhang,

Jiajun Liu,

Fagui Liu,

Yifan Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV, author = {Tang, Quan and Zhang, Bowen and Liu, Jiajun and Liu, Fagui and Liu, Yifan}, title = {Dynamic Token Pruning in Plain Vision Transformers for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {777-786} }
Shape Anchor Guided Holistic Indoor Scene Understanding: Mingyue Dong,

Linxi Huan,

Hanjiang Xiong,

Shuhan Shen,

Xianwei Zheng; [pdf] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV, author = {Dong, Mingyue and Huan, Linxi and Xiong, Hanjiang and Shen, Shuhan and Zheng, Xianwei}, title = {Shape Anchor Guided Holistic Indoor Scene Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {21916-21926} }
Knowledge-Aware Federated Active Learning with Non-IID Data: Yu-Tong Cao,

Ye Shi,

Baosheng Yu,

Jingya Wang,

Dacheng Tao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV, author = {Cao, Yu-Tong and Shi, Ye and Yu, Baosheng and Wang, Jingya and Tao, Dacheng}, title = {Knowledge-Aware Federated Active Learning with Non-IID Data}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22279-22289} }
PlankAssembly: Robust 3D Reconstruction from Three Orthographic Views with Learnt Shape Programs: Wentao Hu,

Jia Zheng,

Zixin Zhang,

Xiaojun Yuan,

Jian Yin,

Zihan Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV, author = {Hu, Wentao and Zheng, Jia and Zhang, Zixin and Yuan, Xiaojun and Yin, Jian and Zhou, Zihan}, title = {PlankAssembly: Robust 3D Reconstruction from Three Orthographic Views with Learnt Shape Programs}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {18495-18505} }
PODIA-3D: Domain Adaptation of 3D Generative Model Across Large Domain Gap Using Pose-Preserved Text-to-Image Diffusion: Gwanghyun Kim,

Ji Ha Jang,

Se Young Chun; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_ICCV, author = {Kim, Gwanghyun and Jang, Ji Ha and Chun, Se Young}, title = {PODIA-3D: Domain Adaptation of 3D Generative Model Across Large Domain Gap Using Pose-Preserved Text-to-Image Diffusion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {22603-22612} }
Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis: Nithin Gopalakrishnan Nair,

Anoop Cherian,

Suhas Lohit,

Ye Wang,

Toshiaki Koike-Akino,

Vishal M. Patel,

Tim K. Marks; [pdf] [supp]
[bibtex]
@InProceedings{Nair_2023_ICCV, author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.}, title = {Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {20850-20860} }
DiffFit: Unlocking Transferability of Large Diffusion Models via Simple Parameter-efficient Fine-Tuning: Enze Xie,

Lewei Yao,

Han Shi,

Zhili Liu,

Daquan Zhou,

Zhaoqiang Liu,

Jiawei Li,

Zhenguo Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV, author = {Xie, Enze and Yao, Lewei and Shi, Han and Liu, Zhili and Zhou, Daquan and Liu, Zhaoqiang and Li, Jiawei and Li, Zhenguo}, title = {DiffFit: Unlocking Transferability of Large Diffusion Models via Simple Parameter-efficient Fine-Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4230-4239} }
NeO 360: Neural Fields for Sparse View Synthesis of Outdoor Scenes: Muhammad Zubair Irshad,

Sergey Zakharov,

Katherine Liu,

Vitor Guizilini,

Thomas Kollar,

Adrien Gaidon,

Zsolt Kira,

Rares Ambrus; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Irshad_2023_ICCV, author = {Irshad, Muhammad Zubair and Zakharov, Sergey and Liu, Katherine and Guizilini, Vitor and Kollar, Thomas and Gaidon, Adrien and Kira, Zsolt and Ambrus, Rares}, title = {NeO 360: Neural Fields for Sparse View Synthesis of Outdoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9187-9198} }
UnLoc: A Unified Framework for Video Localization Tasks: Shen Yan,

Xuehan Xiong,

Arsha Nagrani,

Anurag Arnab,

Zhonghao Wang,

Weina Ge,

David Ross,

Cordelia Schmid; [pdf] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV, author = {Yan, Shen and Xiong, Xuehan and Nagrani, Arsha and Arnab, Anurag and Wang, Zhonghao and Ge, Weina and Ross, David and Schmid, Cordelia}, title = {UnLoc: A Unified Framework for Video Localization Tasks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13623-13633} }
QD-BEV : Quantization-aware View-guided Distillation for Multi-view 3D Object Detection: Yifan Zhang,

Zhen Dong,

Huanrui Yang,

Ming Lu,

Cheng-Ching Tseng,

Yuan Du,

Kurt Keutzer,

Li Du,

Shanghang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yifan and Dong, Zhen and Yang, Huanrui and Lu, Ming and Tseng, Cheng-Ching and Du, Yuan and Keutzer, Kurt and Du, Li and Zhang, Shanghang}, title = {QD-BEV : Quantization-aware View-guided Distillation for Multi-view 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3825-3835} }
Fast Inference and Update of Probabilistic Density Estimation on Trajectory Prediction: Takahiro Maeda,

Norimichi Ukita; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Maeda_2023_ICCV, author = {Maeda, Takahiro and Ukita, Norimichi}, title = {Fast Inference and Update of Probabilistic Density Estimation on Trajectory Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9795-9805} }
CLIPascene: Scene Sketching with Different Types and Levels of Abstraction: Yael Vinker,

Yuval Alaluf,

Daniel Cohen-Or,

Ariel Shamir; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vinker_2023_ICCV, author = {Vinker, Yael and Alaluf, Yuval and Cohen-Or, Daniel and Shamir, Ariel}, title = {CLIPascene: Scene Sketching with Different Types and Levels of Abstraction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {4146-4156} }
Vision Grid Transformer for Document Layout Analysis: Cheng Da,

Chuwei Luo,

Qi Zheng,

Cong Yao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Da_2023_ICCV, author = {Da, Cheng and Luo, Chuwei and Zheng, Qi and Yao, Cong}, title = {Vision Grid Transformer for Document Layout Analysis}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19462-19472} }
Multi-Directional Subspace Editing in Style-Space: Chen Naveh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Naveh_2023_ICCV, author = {Naveh, Chen}, title = {Multi-Directional Subspace Editing in Style-Space}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {7138-7148} }
Adaptive Superpixel for Active Learning in Semantic Segmentation: Hoyoung Kim,

Minhyeon Oh,

Sehyun Hwang,

Suha Kwak,

Jungseul Ok; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV, author = {Kim, Hoyoung and Oh, Minhyeon and Hwang, Sehyun and Kwak, Suha and Ok, Jungseul}, title = {Adaptive Superpixel for Active Learning in Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {943-953} }
Adaptive Spiral Layers for Efficient 3D Representation Learning on Meshes: Francesca Babiloni,

Matteo Maggioni,

Thomas Tanay,

Jiankang Deng,

Ales Leonardis,

Stefanos Zafeiriou; [pdf] [supp]
[bibtex]
@InProceedings{Babiloni_2023_ICCV, author = {Babiloni, Francesca and Maggioni, Matteo and Tanay, Thomas and Deng, Jiankang and Leonardis, Ales and Zafeiriou, Stefanos}, title = {Adaptive Spiral Layers for Efficient 3D Representation Learning on Meshes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {14620-14631} }
Parametric Information Maximization for Generalized Category Discovery: Florent Chiaroni,

Jose Dolz,

Ziko Imtiaz Masud,

Amar Mitiche,

Ismail Ben Ayed; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chiaroni_2023_ICCV, author = {Chiaroni, Florent and Dolz, Jose and Ziko, Imtiaz Masud and Mitiche, Amar and Ben Ayed, Ismail}, title = {Parametric Information Maximization for Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {1729-1739} }
Convex Decomposition of Indoor Scenes: Vaibhav Vavilala,

David Forsyth; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vavilala_2023_ICCV, author = {Vavilala, Vaibhav and Forsyth, David}, title = {Convex Decomposition of Indoor Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {9176-9186} }
Toward Unsupervised Realistic Visual Question Answering: Yuwei Zhang,

Chih-Hui Ho,

Nuno Vasconcelos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Yuwei and Ho, Chih-Hui and Vasconcelos, Nuno}, title = {Toward Unsupervised Realistic Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {15613-15624} }
A Generalist Framework for Panoptic Segmentation of Images and Videos: Ting Chen,

Lala Li,

Saurabh Saxena,

Geoffrey Hinton,

David J. Fleet; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Ting and Li, Lala and Saxena, Saurabh and Hinton, Geoffrey and Fleet, David J.}, title = {A Generalist Framework for Panoptic Segmentation of Images and Videos}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {909-919} }
DALL-Eval: Probing the Reasoning Skills and Social Biases of Text-to-Image Generation Models: Jaemin Cho,

Abhay Zala,

Mohit Bansal; [pdf] [supp]
[bibtex]
@InProceedings{Cho_2023_ICCV, author = {Cho, Jaemin and Zala, Abhay and Bansal, Mohit}, title = {DALL-Eval: Probing the Reasoning Skills and Social Biases of Text-to-Image Generation Models}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {3043-3054} }
Video OWL-ViT: Temporally-consistent Open-world Localization in Video: Georg Heigold,

Matthias Minderer,

Alexey Gritsenko,

Alex Bewley,

Daniel Keysers,

Mario Lučić,

Fisher Yu,

Thomas Kipf; [pdf] [supp]
[bibtex]
@InProceedings{Heigold_2023_ICCV, author = {Heigold, Georg and Minderer, Matthias and Gritsenko, Alexey and Bewley, Alex and Keysers, Daniel and Lu{\v{c}}i{\'c}, Mario and Yu, Fisher and Kipf, Thomas}, title = {Video OWL-ViT: Temporally-consistent Open-world Localization in Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {13802-13811} }
Few Shot Font Generation Via Transferring Similarity Guided Global Style and Quantization Local Style: Wei Pan,

Anna Zhu,

Xinyu Zhou,

Brian Kenji Iwana,

Shilin Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV, author = {Pan, Wei and Zhu, Anna and Zhou, Xinyu and Iwana, Brian Kenji and Li, Shilin}, title = {Few Shot Font Generation Via Transferring Similarity Guided Global Style and Quantization Local Style}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {19506-19516} }
Differentiable Transportation Pruning: Yunqiang Li,

Jan C. van Gemert,

Torsten Hoefler,

Bert Moons,

Evangelos Eleftheriou,

Bram-Ernst Verhoef; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Yunqiang and van Gemert, Jan C. and Hoefler, Torsten and Moons, Bert and Eleftheriou, Evangelos and Verhoef, Bram-Ernst}, title = {Differentiable Transportation Pruning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {16957-16967} }
Physics-Driven Turbulence Image Restoration with Stochastic Refinement: Ajay Jaiswal,

Xingguang Zhang,

Stanley H. Chan,

Zhangyang Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Jaiswal_2023_ICCV, author = {Jaiswal, Ajay and Zhang, Xingguang and Chan, Stanley H. and Wang, Zhangyang}, title = {Physics-Driven Turbulence Image Restoration with Stochastic Refinement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {12170-12181} }
Enhancing Non-line-of-sight Imaging via Learnable Inverse Kernel and Attention Mechanisms: Yanhua Yu,

Siyuan Shen,

Zi Wang,

Binbin Huang,

Yuehan Wang,

Xingyue Peng,

Suan Xia,

Ping Liu,

Ruiqian Li,

Shiying Li; [pdf]
[bibtex]
@InProceedings{Yu_2023_ICCV, author = {Yu, Yanhua and Shen, Siyuan and Wang, Zi and Huang, Binbin and Wang, Yuehan and Peng, Xingyue and Xia, Suan and Liu, Ping and Li, Ruiqian and Li, Shiying}, title = {Enhancing Non-line-of-sight Imaging via Learnable Inverse Kernel and Attention Mechanisms}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {10563-10573} }
DECO: Dense Estimation of 3D Human-Scene Contact In The Wild: Shashank Tripathi,

Agniv Chatterjee,

Jean-Claude Passy,

Hongwei Yi,

Dimitrios Tzionas,

Michael J. Black; [pdf] [supp]
[bibtex]
@InProceedings{Tripathi_2023_ICCV, author = {Tripathi, Shashank and Chatterjee, Agniv and Passy, Jean-Claude and Yi, Hongwei and Tzionas, Dimitrios and Black, Michael J.}, title = {DECO: Dense Estimation of 3D Human-Scene Contact In The Wild}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {8001-8013} }
Scale-Aware Modulation Meet Transformer: Weifeng Lin,

Ziheng Wu,

Jiayu Chen,

Jun Huang,

Lianwen Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV, author = {Lin, Weifeng and Wu, Ziheng and Chen, Jiayu and Huang, Jun and Jin, Lianwen}, title = {Scale-Aware Modulation Meet Transformer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = {October}, year = {2023}, pages = {6015-6026} }
Large Selective Kernel Network for Remote Sensing Object Detection: Yuxuan Li,

Qibin Hou,

Zhaohui Zheng,

Ming-Ming Cheng,

Jian Yang,

Xiang Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yuxuan and Hou, Qibin and Zheng, Zhaohui and Cheng, Ming-Ming and Yang, Jian and Li, Xiang},
  title     = {Large Selective Kernel Network for Remote Sensing Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16794--16805}
}
PlaneRecTR: Unified Query Learning for 3D Plane Recovery from a Single View: Jingjia Shi,

Shuaifeng Zhi,

Kai Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Jingjia and Zhi, Shuaifeng and Xu, Kai},
  title     = {{PlaneRecTR}: Unified Query Learning for {3D} Plane Recovery from a Single View},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9377--9386}
}
EigenTrajectory: Low-Rank Descriptors for Multi-Modal Trajectory Forecasting: Inhwan Bae,

Jean Oh,

Hae-Gon Jeon; [pdf] [arXiv]
[bibtex]
@InProceedings{Bae_2023_ICCV,
  author    = {Bae, Inhwan and Oh, Jean and Jeon, Hae-Gon},
  title     = {{EigenTrajectory}: Low-Rank Descriptors for Multi-Modal Trajectory Forecasting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10017--10029}
}
I-ViT: Integer-only Quantization for Efficient Vision Transformer Inference: Zhikai Li,

Qingyi Gu; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zhikai and Gu, Qingyi},
  title     = {{I-ViT}: Integer-only Quantization for Efficient Vision Transformer Inference},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17065--17075}
}
SUMMIT: Source-Free Adaptation of Uni-Modal Models to Multi-Modal Targets: Cody Simons,

Dripta S. Raychaudhuri,

Sk Miraj Ahmed,

Suya You,

Konstantinos Karydis,

Amit K. Roy-Chowdhury; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Simons_2023_ICCV,
  author    = {Simons, Cody and Raychaudhuri, Dripta S. and Ahmed, Sk Miraj and You, Suya and Karydis, Konstantinos and Roy-Chowdhury, Amit K.},
  title     = {{SUMMIT}: Source-Free Adaptation of Uni-Modal Models to Multi-Modal Targets},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1239--1249}
}
Learning a More Continuous Zero Level Set in Unsigned Distance Fields through Level Set Projection: Junsheng Zhou,

Baorui Ma,

Shujuan Li,

Yu-Shen Liu,

Zhizhong Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Junsheng and Ma, Baorui and Li, Shujuan and Liu, Yu-Shen and Han, Zhizhong},
  title     = {Learning a More Continuous Zero Level Set in Unsigned Distance Fields through Level Set Projection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3181--3192}
}
Video-FocalNets: Spatio-Temporal Focal Modulation for Video Action Recognition: Syed Talal Wasim,

Muhammad Uzair Khattak,

Muzammal Naseer,

Salman Khan,

Mubarak Shah,

Fahad Shahbaz Khan; [pdf]
[bibtex]
@InProceedings{Wasim_2023_ICCV,
  author    = {Wasim, Syed Talal and Khattak, Muhammad Uzair and Naseer, Muzammal and Khan, Salman and Shah, Mubarak and Khan, Fahad Shahbaz},
  title     = {{Video-FocalNets}: Spatio-Temporal Focal Modulation for Video Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13778--13789}
}
To Adapt or Not to Adapt? Real-Time Adaptation for Semantic Segmentation: Marc Botet Colomer,

Pier Luigi Dovesi,

Theodoros Panagiotakopoulos,

Joao Frederico Carvalho,

Linus Härenstam-Nielsen,

Hossein Azizpour,

Hedvig Kjellström,

Daniel Cremers,

Matteo Poggi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Colomer_2023_ICCV,
  author    = {Colomer, Marc Botet and Dovesi, Pier Luigi and Panagiotakopoulos, Theodoros and Carvalho, Joao Frederico and H{\"a}renstam-Nielsen, Linus and Azizpour, Hossein and Kjellstr{\"o}m, Hedvig and Cremers, Daniel and Poggi, Matteo},
  title     = {To Adapt or Not to Adapt? Real-Time Adaptation for Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16548--16559}
}
Hidden Biases of End-to-End Driving Models: Bernhard Jaeger,

Kashyap Chitta,

Andreas Geiger; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jaeger_2023_ICCV,
  author    = {Jaeger, Bernhard and Chitta, Kashyap and Geiger, Andreas},
  title     = {Hidden Biases of End-to-End Driving Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8240--8249}
}
HairNeRF: Geometry-Aware Image Synthesis for Hairstyle Transfer: Seunggyu Chang,

Gihoon Kim,

Hayeon Kim; [pdf]
[bibtex]
@InProceedings{Chang_2023_ICCV,
  author    = {Chang, Seunggyu and Kim, Gihoon and Kim, Hayeon},
  title     = {{HairNeRF}: Geometry-Aware Image Synthesis for Hairstyle Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2448--2458}
}
Strivec: Sparse Tri-Vector Radiance Fields: Quankai Gao,

Qiangeng Xu,

Hao Su,

Ulrich Neumann,

Zexiang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Quankai and Xu, Qiangeng and Su, Hao and Neumann, Ulrich and Xu, Zexiang},
  title     = {Strivec: Sparse Tri-Vector Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17569--17579}
}
Multiscale Representation for Real-Time Anti-Aliasing Neural Rendering: Dongting Hu,

Zhenkai Zhang,

Tingbo Hou,

Tongliang Liu,

Huan Fu,

Mingming Gong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Dongting and Zhang, Zhenkai and Hou, Tingbo and Liu, Tongliang and Fu, Huan and Gong, Mingming},
  title     = {Multiscale Representation for Real-Time Anti-Aliasing Neural Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17772--17783}
}
Borrowing Knowledge From Pre-trained Language Model: A New Data-efficient Visual Learning Paradigm: Wenxuan Ma,

Shuang Li,

JinMing Zhang,

Chi Harold Liu,

Jingxuan Kang,

Yulin Wang,

Gao Huang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Wenxuan and Li, Shuang and Zhang, JinMing and Liu, Chi Harold and Kang, Jingxuan and Wang, Yulin and Huang, Gao},
  title     = {Borrowing Knowledge From Pre-trained Language Model: A New Data-efficient Visual Learning Paradigm},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18786--18797}
}
GETAvatar: Generative Textured Meshes for Animatable Human Avatars: Xuanmeng Zhang,

Jianfeng Zhang,

Rohan Chacko,

Hongyi Xu,

Guoxian Song,

Yi Yang,

Jiashi Feng; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xuanmeng and Zhang, Jianfeng and Chacko, Rohan and Xu, Hongyi and Song, Guoxian and Yang, Yi and Feng, Jiashi},
  title     = {{GETAvatar}: Generative Textured Meshes for Animatable Human Avatars},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2273--2282}
}
Tracking without Label: Unsupervised Multiple Object Tracking via Contrastive Similarity Learning: Sha Meng,

Dian Shao,

Jiacheng Guo,

Shan Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Meng_2023_ICCV,
  author    = {Meng, Sha and Shao, Dian and Guo, Jiacheng and Gao, Shan},
  title     = {Tracking without Label: Unsupervised Multiple Object Tracking via Contrastive Similarity Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16264--16273}
}
PIDRo: Parallel Isomeric Attention with Dynamic Routing for Text-Video Retrieval: Peiyan Guan,

Renjing Pei,

Bin Shao,

Jianzhuang Liu,

Weimian Li,

Jiaxi Gu,

Hang Xu,

Songcen Xu,

Youliang Yan,

Edmund Y. Lam; [pdf] [supp]
[bibtex]
@InProceedings{Guan_2023_ICCV,
  author    = {Guan, Peiyan and Pei, Renjing and Shao, Bin and Liu, Jianzhuang and Li, Weimian and Gu, Jiaxi and Xu, Hang and Xu, Songcen and Yan, Youliang and Lam, Edmund Y.},
  title     = {{PIDRo}: Parallel Isomeric Attention with Dynamic Routing for Text-Video Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11164--11173}
}
Re-mine, Learn and Reason: Exploring the Cross-modal Semantic Correlations for Language-guided HOI detection: Yichao Cao,

Qingfei Tang,

Feng Yang,

Xiu Su,

Shan You,

Xiaobo Lu,

Chang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Yichao and Tang, Qingfei and Yang, Feng and Su, Xiu and You, Shan and Lu, Xiaobo and Xu, Chang},
  title     = {Re-mine, Learn and Reason: Exploring the Cross-modal Semantic Correlations for Language-guided {HOI} detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23492--23503}
}
Strata-NeRF : Neural Radiance Fields for Stratified Scenes: Ankit Dhiman,

R Srinath,

Harsh Rangwani,

Rishubh Parihar,

Lokesh R Boregowda,

Srinath Sridhar,

R Venkatesh Babu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dhiman_2023_ICCV,
  author    = {Dhiman, Ankit and Srinath, R and Rangwani, Harsh and Parihar, Rishubh and Boregowda, Lokesh R and Sridhar, Srinath and Babu, R Venkatesh},
  title     = {{Strata-NeRF} : Neural Radiance Fields for Stratified Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17603--17614}
}
StylerDALLE: Language-Guided Style Transfer Using a Vector-Quantized Tokenizer of a Large-Scale Generative Model: Zipeng Xu,

Enver Sangineto,

Nicu Sebe; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Zipeng and Sangineto, Enver and Sebe, Nicu},
  title     = {{StylerDALLE}: Language-Guided Style Transfer Using a Vector-Quantized Tokenizer of a Large-Scale Generative Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7601--7611}
}
3D-aware Blending with Generative NeRFs: Hyunsu Kim,

Gayoung Lee,

Yunjey Choi,

Jin-Hwa Kim,

Jun-Yan Zhu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Hyunsu and Lee, Gayoung and Choi, Yunjey and Kim, Jin-Hwa and Zhu, Jun-Yan},
  title     = {{3D}-aware Blending with Generative {NeRFs}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22906--22918}
}
Multi-Modal Gated Mixture of Local-to-Global Experts for Dynamic Image Fusion: Bing Cao,

Yiming Sun,

Pengfei Zhu,

Qinghua Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Bing and Sun, Yiming and Zhu, Pengfei and Hu, Qinghua},
  title     = {Multi-Modal Gated Mixture of Local-to-Global Experts for Dynamic Image Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23555--23564}
}
Deep Image Harmonization with Learnable Augmentation: Li Niu,

Junyan Cao,

Wenyan Cong,

Liqing Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Li and Cao, Junyan and Cong, Wenyan and Zhang, Liqing},
  title     = {Deep Image Harmonization with Learnable Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7482--7491}
}
DELFlow: Dense Efficient Learning of Scene Flow for Large-Scale Point Clouds: Chensheng Peng,

Guangming Wang,

Xian Wan Lo,

Xinrui Wu,

Chenfeng Xu,

Masayoshi Tomizuka,

Wei Zhan,

Hesheng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Chensheng and Wang, Guangming and Lo, Xian Wan and Wu, Xinrui and Xu, Chenfeng and Tomizuka, Masayoshi and Zhan, Wei and Wang, Hesheng},
  title     = {{DELFlow}: Dense Efficient Learning of Scene Flow for Large-Scale Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16901--16910}
}
RFD-ECNet: Extreme Underwater Image Compression with Reference to Feature Dictionary: Mengyao Li,

Liquan Shen,

Peng Ye,

Guorui Feng,

Zheyin Wang; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Mengyao and Shen, Liquan and Ye, Peng and Feng, Guorui and Wang, Zheyin},
  title     = {{RFD-ECNet}: Extreme Underwater Image Compression with Reference to Feature Dictionary},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12980--12989}
}
E^2VPT: An Effective and Efficient Approach for Visual Prompt Tuning: Cheng Han,

Qifan Wang,

Yiming Cui,

Zhiwen Cao,

Wenguan Wang,

Siyuan Qi,

Dongfang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Cheng and Wang, Qifan and Cui, Yiming and Cao, Zhiwen and Wang, Wenguan and Qi, Siyuan and Liu, Dongfang},
  title     = {{E$^{2}$VPT}: An Effective and Efficient Approach for Visual Prompt Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17491--17502}
}
High-Resolution Document Shadow Removal via A Large-Scale Real-World Dataset and A Frequency-Aware Shadow Erasing Net: Zinuo Li,

Xuhang Chen,

Chi-Man Pun,

Xiaodong Cun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zinuo and Chen, Xuhang and Pun, Chi-Man and Cun, Xiaodong},
  title     = {High-Resolution Document Shadow Removal via A Large-Scale Real-World Dataset and A Frequency-Aware Shadow Erasing Net},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12449--12458}
}
Scalable Diffusion Models with Transformers: William Peebles,

Saining Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peebles_2023_ICCV,
  author    = {Peebles, William and Xie, Saining},
  title     = {Scalable Diffusion Models with Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4195--4205}
}
MMST-ViT: Climate Change-aware Crop Yield Prediction via Multi-Modal Spatial-Temporal Vision Transformer: Fudong Lin,

Summer Crawford,

Kaleb Guillot,

Yihe Zhang,

Yan Chen,

Xu Yuan,

Li Chen,

Shelby Williams,

Robert Minvielle,

Xiangming Xiao,

Drew Gholson,

Nicolas Ashwell,

Tri Setiyono,

Brenda Tubana,

Lu Peng,

Magdy Bayoumi,

Nian-Feng Tzeng; [pdf]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Fudong and Crawford, Summer and Guillot, Kaleb and Zhang, Yihe and Chen, Yan and Yuan, Xu and Chen, Li and Williams, Shelby and Minvielle, Robert and Xiao, Xiangming and Gholson, Drew and Ashwell, Nicolas and Setiyono, Tri and Tubana, Brenda and Peng, Lu and Bayoumi, Magdy and Tzeng, Nian-Feng},
  title     = {{MMST-ViT}: Climate Change-aware Crop Yield Prediction via Multi-Modal Spatial-Temporal Vision Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5774--5784}
}
From Knowledge Distillation to Self-Knowledge Distillation: A Unified Approach with Normalized Loss and Customized Soft Labels: Zhendong Yang,

Ailing Zeng,

Zhe Li,

Tianke Zhang,

Chun Yuan,

Yu Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Zhendong and Zeng, Ailing and Li, Zhe and Zhang, Tianke and Yuan, Chun and Li, Yu},
  title     = {From Knowledge Distillation to Self-Knowledge Distillation: A Unified Approach with Normalized Loss and Customized Soft Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17185--17194}
}
SILT: Shadow-Aware Iterative Label Tuning for Learning to Detect Shadows from Noisy Labels: Han Yang,

Tianyu Wang,

Xiaowei Hu,

Chi-Wing Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Han and Wang, Tianyu and Hu, Xiaowei and Fu, Chi-Wing},
  title     = {{SILT}: Shadow-Aware Iterative Label Tuning for Learning to Detect Shadows from Noisy Labels},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12687--12698}
}
Implicit Autoencoder for Point-Cloud Self-Supervised Representation Learning: Siming Yan,

Zhenpei Yang,

Haoxiang Li,

Chen Song,

Li Guan,

Hao Kang,

Gang Hua,

Qixing Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Siming and Yang, Zhenpei and Li, Haoxiang and Song, Chen and Guan, Li and Kang, Hao and Hua, Gang and Huang, Qixing},
  title     = {Implicit Autoencoder for Point-Cloud Self-Supervised Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14530--14542}
}
Grounded Image Text Matching with Mismatched Relation Reasoning: Yu Wu,

Yana Wei,

Haozhe Wang,

Yongfei Liu,

Sibei Yang,

Xuming He; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yu and Wei, Yana and Wang, Haozhe and Liu, Yongfei and Yang, Sibei and He, Xuming},
  title     = {Grounded Image Text Matching with Mismatched Relation Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2976--2987}
}
UniKD: Universal Knowledge Distillation for Mimicking Homogeneous or Heterogeneous Object Detectors: Shanshan Lao,

Guanglu Song,

Boxiao Liu,

Yu Liu,

Yujiu Yang; [pdf] [supp]
[bibtex]
@InProceedings{Lao_2023_ICCV,
  author    = {Lao, Shanshan and Song, Guanglu and Liu, Boxiao and Liu, Yu and Yang, Yujiu},
  title     = {{UniKD}: Universal Knowledge Distillation for Mimicking Homogeneous or Heterogeneous Object Detectors},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6362--6372}
}
Speech4Mesh: Speech-Assisted Monocular 3D Facial Reconstruction for Speech-Driven 3D Facial Animation: Shan He,

Haonan He,

Shuo Yang,

Xiaoyan Wu,

Pengcheng Xia,

Bing Yin,

Cong Liu,

Lirong Dai,

Chang Xu; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Shan and He, Haonan and Yang, Shuo and Wu, Xiaoyan and Xia, Pengcheng and Yin, Bing and Liu, Cong and Dai, Lirong and Xu, Chang},
  title     = {{Speech4Mesh}: Speech-Assisted Monocular {3D} Facial Reconstruction for Speech-Driven {3D} Facial Animation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14192--14202}
}
BoxDiff: Text-to-Image Synthesis with Training-Free Box-Constrained Diffusion: Jinheng Xie,

Yuexiang Li,

Yawen Huang,

Haozhe Liu,

Wentian Zhang,

Yefeng Zheng,

Mike Zheng Shou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Jinheng and Li, Yuexiang and Huang, Yawen and Liu, Haozhe and Zhang, Wentian and Zheng, Yefeng and Shou, Mike Zheng},
  title     = {{BoxDiff}: Text-to-Image Synthesis with Training-Free Box-Constrained Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7452--7461}
}
Generalizing Neural Human Fitting to Unseen Poses With Articulated SE(3) Equivariance: Haiwen Feng,

Peter Kulits,

Shichen Liu,

Michael J. Black,

Victoria Fernandez Abrevaya; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Haiwen and Kulits, Peter and Liu, Shichen and Black, Michael J. and Abrevaya, Victoria Fernandez},
  title     = {Generalizing Neural Human Fitting to Unseen Poses With Articulated {SE(3)} Equivariance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7977--7988}
}
Rapid Network Adaptation: Learning to Adapt Neural Networks Using Test-Time Feedback: Teresa Yeo,

Oğuzhan Fatih Kar,

Zahra Sodagar,

Amir Zamir; [pdf]
[bibtex]
@InProceedings{Yeo_2023_ICCV,
  author    = {Yeo, Teresa and Kar, O{\u{g}}uzhan Fatih and Sodagar, Zahra and Zamir, Amir},
  title     = {Rapid Network Adaptation: Learning to Adapt Neural Networks Using Test-Time Feedback},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4674--4687}
}
Theoretical and Numerical Analysis of 3D Reconstruction Using Point and Line Incidences: Felix Rydell,

Elima Shehu,

Angélica Torres; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rydell_2023_ICCV,
  author    = {Rydell, Felix and Shehu, Elima and Torres, Ang{\'e}lica},
  title     = {Theoretical and Numerical Analysis of {3D} Reconstruction Using Point and Line Incidences},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3748--3757}
}
Explaining Adversarial Robustness of Neural Networks from Clustering Effect Perspective: Yulin Jin,

Xiaoyu Zhang,

Jian Lou,

Xu Ma,

Zilong Wang,

Xiaofeng Chen; [pdf]
[bibtex]
@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Yulin and Zhang, Xiaoyu and Lou, Jian and Ma, Xu and Wang, Zilong and Chen, Xiaofeng},
  title     = {Explaining Adversarial Robustness of Neural Networks from Clustering Effect Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4522--4531}
}
Leaping Into Memories: Space-Time Deep Feature Synthesis: Alexandros Stergiou,

Nikos Deligiannis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Stergiou_2023_ICCV,
  author    = {Stergiou, Alexandros and Deligiannis, Nikos},
  title     = {Leaping Into Memories: Space-Time Deep Feature Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1966--1976}
}
Improving Generalization in Visual Reinforcement Learning via Conflict-aware Gradient Agreement Augmentation: Siao Liu,

Zhaoyu Chen,

Yang Liu,

Yuzheng Wang,

Dingkang Yang,

Zhile Zhao,

Ziqing Zhou,

Xie Yi,

Wei Li,

Wenqiang Zhang,

Zhongxue Gan; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Siao and Chen, Zhaoyu and Liu, Yang and Wang, Yuzheng and Yang, Dingkang and Zhao, Zhile and Zhou, Ziqing and Yi, Xie and Li, Wei and Zhang, Wenqiang and Gan, Zhongxue},
  title     = {Improving Generalization in Visual Reinforcement Learning via Conflict-aware Gradient Agreement Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23436--23446}
}
Graph Matching with Bi-level Noisy Correspondence: Yijie Lin,

Mouxing Yang,

Jun Yu,

Peng Hu,

Changqing Zhang,

Xi Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Yijie and Yang, Mouxing and Yu, Jun and Hu, Peng and Zhang, Changqing and Peng, Xi},
  title     = {Graph Matching with Bi-level Noisy Correspondence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23362--23371}
}
Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action Localization: Kun Xia,

Le Wang,

Sanping Zhou,

Gang Hua,

Wei Tang; [pdf] [supp]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Kun and Wang, Le and Zhou, Sanping and Hua, Gang and Tang, Wei},
  title     = {Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action Localization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10160--10169}
}
InfiniCity: Infinite-Scale City Synthesis: Chieh Hubert Lin,

Hsin-Ying Lee,

Willi Menapace,

Menglei Chai,

Aliaksandr Siarohin,

Ming-Hsuan Yang,

Sergey Tulyakov; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Chieh Hubert and Lee, Hsin-Ying and Menapace, Willi and Chai, Menglei and Siarohin, Aliaksandr and Yang, Ming-Hsuan and Tulyakov, Sergey},
  title     = {{InfiniCity}: Infinite-Scale City Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22808--22818}
}
OpenOccupancy: A Large Scale Benchmark for Surrounding Semantic Occupancy Perception: Xiaofeng Wang,

Zheng Zhu,

Wenbo Xu,

Yunpeng Zhang,

Yi Wei,

Xu Chi,

Yun Ye,

Dalong Du,

Jiwen Lu,

Xingang Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xiaofeng and Zhu, Zheng and Xu, Wenbo and Zhang, Yunpeng and Wei, Yi and Chi, Xu and Ye, Yun and Du, Dalong and Lu, Jiwen and Wang, Xingang},
  title     = {{OpenOccupancy}: A Large Scale Benchmark for Surrounding Semantic Occupancy Perception},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17850--17859}
}
Weakly-Supervised Text-Driven Contrastive Learning for Facial Behavior Understanding: Xiang Zhang,

Taoyue Wang,

Xiaotian Li,

Huiyuan Yang,

Lijun Yin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xiang and Wang, Taoyue and Li, Xiaotian and Yang, Huiyuan and Yin, Lijun},
  title     = {Weakly-Supervised Text-Driven Contrastive Learning for Facial Behavior Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20751--20762}
}
Box-based Refinement for Weakly Supervised and Unsupervised Localization Tasks: Eyal Gomel,

Tal Shaharbany,

Lior Wolf; [pdf] [supp]
[bibtex]
@InProceedings{Gomel_2023_ICCV,
  author    = {Gomel, Eyal and Shaharbany, Tal and Wolf, Lior},
  title     = {Box-based Refinement for Weakly Supervised and Unsupervised Localization Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16044--16054}
}
Activate and Reject: Towards Safe Domain Generalization under Category Shift: Chaoqi Chen,

Luyao Tang,

Leitian Tao,

Hong-Yu Zhou,

Yue Huang,

Xiaoguang Han,

Yizhou Yu; [pdf]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Chaoqi and Tang, Luyao and Tao, Leitian and Zhou, Hong-Yu and Huang, Yue and Han, Xiaoguang and Yu, Yizhou},
  title     = {Activate and Reject: Towards Safe Domain Generalization under Category Shift},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11552--11563}
}
PRIOR: Prototype Representation Joint Learning from Medical Images and Reports: Pujin Cheng,

Li Lin,

Junyan Lyu,

Yijin Huang,

Wenhan Luo,

Xiaoying Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Pujin and Lin, Li and Lyu, Junyan and Huang, Yijin and Luo, Wenhan and Tang, Xiaoying},
  title     = {{PRIOR}: Prototype Representation Joint Learning from Medical Images and Reports},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21361--21371}
}
Dynamic Mesh Recovery from Partial Point Cloud Sequence: Hojun Jang,

Minkwan Kim,

Jinseok Bae,

Young Min Kim; [pdf] [supp]
[bibtex]
@InProceedings{Jang_2023_ICCV,
  author    = {Jang, Hojun and Kim, Minkwan and Bae, Jinseok and Kim, Young Min},
  title     = {Dynamic Mesh Recovery from Partial Point Cloud Sequence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15074--15084}
}
WDiscOOD: Out-of-Distribution Detection via Whitened Linear Discriminant Analysis: Yiye Chen,

Yunzhi Lin,

Ruinian Xu,

Patricio A. Vela; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yiye and Lin, Yunzhi and Xu, Ruinian and Vela, Patricio A.},
  title     = {{WDiscOOD}: Out-of-Distribution Detection via Whitened Linear Discriminant Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5298--5307}
}
Boosting Few-shot Action Recognition with Graph-guided Hybrid Matching: Jiazheng Xing,

Mengmeng Wang,

Yudi Ruan,

Bofan Chen,

Yaowei Guo,

Boyu Mu,

Guang Dai,

Jingdong Wang,

Yong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xing_2023_ICCV,
  author    = {Xing, Jiazheng and Wang, Mengmeng and Ruan, Yudi and Chen, Bofan and Guo, Yaowei and Mu, Boyu and Dai, Guang and Wang, Jingdong and Liu, Yong},
  title     = {Boosting Few-shot Action Recognition with Graph-guided Hybrid Matching},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1740--1750}
}
Neural Deformable Models for 3D Bi-Ventricular Heart Shape Reconstruction and Modeling from 2D Sparse Cardiac Magnetic Resonance Imaging: Meng Ye,

Dong Yang,

Mikael Kanski,

Leon Axel,

Dimitris Metaxas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Meng and Yang, Dong and Kanski, Mikael and Axel, Leon and Metaxas, Dimitris},
  title     = {Neural Deformable Models for {3D} Bi-Ventricular Heart Shape Reconstruction and Modeling from {2D} Sparse Cardiac Magnetic Resonance Imaging},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14247--14256}
}
Vision HGNN: An Image is More than a Graph of Nodes: Yan Han,

Peihao Wang,

Souvik Kundu,

Ying Ding,

Zhangyang Wang; [pdf]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Yan and Wang, Peihao and Kundu, Souvik and Ding, Ying and Wang, Zhangyang},
  title     = {Vision {HGNN}: An Image is More than a Graph of Nodes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19878--19888}
}
Nonrigid Object Contact Estimation With Regional Unwrapping Transformer: Wei Xie,

Zimeng Zhao,

Shiying Li,

Binghui Zuo,

Yangang Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Wei and Zhao, Zimeng and Li, Shiying and Zuo, Binghui and Wang, Yangang},
  title     = {Nonrigid Object Contact Estimation With Regional Unwrapping Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9342--9351}
}
Diffusion in Style: Martin Nicolas Everaert,

Marco Bocchio,

Sami Arpa,

Sabine Süsstrunk,

Radhakrishna Achanta; [pdf] [supp]
[bibtex]
@InProceedings{Everaert_2023_ICCV,
  author    = {Everaert, Martin Nicolas and Bocchio, Marco and Arpa, Sami and S{\"u}sstrunk, Sabine and Achanta, Radhakrishna},
  title     = {Diffusion in Style},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2251--2261}
}
FunnyBirds: A Synthetic Vision Dataset for a Part-Based Analysis of Explainable AI Methods: Robin Hesse,

Simone Schaub-Meyer,

Stefan Roth; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hesse_2023_ICCV,
  author    = {Hesse, Robin and Schaub-Meyer, Simone and Roth, Stefan},
  title     = {{FunnyBirds}: A Synthetic Vision Dataset for a Part-Based Analysis of Explainable {AI} Methods},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3981--3991}
}
Deformable Neural Radiance Fields using RGB and Event Cameras: Qi Ma,

Danda Pani Paudel,

Ajad Chhatkuli,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Qi and Paudel, Danda Pani and Chhatkuli, Ajad and Van Gool, Luc},
  title     = {Deformable Neural Radiance Fields using {RGB} and Event Cameras},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3590--3600},
}
BeLFusion: Latent Diffusion for Behavior-Driven Human Motion Prediction: German Barquero,

Sergio Escalera,

Cristina Palmero; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Barquero_2023_ICCV,
  author    = {Barquero, German and Escalera, Sergio and Palmero, Cristina},
  title     = {{BeLFusion}: Latent Diffusion for Behavior-Driven Human Motion Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2317--2327},
}
Semi-supervised Semantics-guided Adversarial Training for Robust Trajectory Prediction: Ruochen Jiao,

Xiangguo Liu,

Takami Sato,

Qi Alfred Chen,

Qi Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Jiao_2023_ICCV,
  author    = {Jiao, Ruochen and Liu, Xiangguo and Sato, Takami and Chen, Qi Alfred and Zhu, Qi},
  title     = {Semi-supervised Semantics-guided Adversarial Training for Robust Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8207--8217},
}
Linear-Covariance Loss for End-to-End Learning of 6D Pose Estimation: Fulin Liu,

Yinlin Hu,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Fulin and Hu, Yinlin and Salzmann, Mathieu},
  title     = {Linear-Covariance Loss for End-to-End Learning of {6D} Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14107--14117},
}
RLSAC: Reinforcement Learning Enhanced Sample Consensus for End-to-End Robust Estimation: Chang Nie,

Guangming Wang,

Zhe Liu,

Luca Cavalli,

Marc Pollefeys,

Hesheng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nie_2023_ICCV,
  author    = {Nie, Chang and Wang, Guangming and Liu, Zhe and Cavalli, Luca and Pollefeys, Marc and Wang, Hesheng},
  title     = {{RLSAC}: Reinforcement Learning Enhanced Sample Consensus for End-to-End Robust Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9891--9900},
}
CleanCLIP: Mitigating Data Poisoning Attacks in Multimodal Contrastive Learning: Hritik Bansal,

Nishad Singhi,

Yu Yang,

Fan Yin,

Aditya Grover,

Kai-Wei Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bansal_2023_ICCV,
  author    = {Bansal, Hritik and Singhi, Nishad and Yang, Yu and Yin, Fan and Grover, Aditya and Chang, Kai-Wei},
  title     = {{CleanCLIP}: Mitigating Data Poisoning Attacks in Multimodal Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {112--123},
}
Multi-Frequency Representation Enhancement with Privilege Information for Video Super-Resolution: Fei Li,

Linfeng Zhang,

Zikun Liu,

Juan Lei,

Zhenbo Li; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Fei and Zhang, Linfeng and Liu, Zikun and Lei, Juan and Li, Zhenbo},
  title     = {Multi-Frequency Representation Enhancement with Privilege Information for Video Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12814--12825},
}
Self-supervised Pre-training for Mirror Detection: Jiaying Lin,

Rynson W.H. Lau; [pdf]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Jiaying and Lau, Rynson W. H.},
  title     = {Self-supervised Pre-training for Mirror Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12227--12236},
}
GlowGAN: Unsupervised Learning of HDR Images from LDR Images in the Wild: Chao Wang,

Ana Serrano,

Xingang Pan,

Bin Chen,

Karol Myszkowski,

Hans-Peter Seidel,

Christian Theobalt,

Thomas Leimkühler; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Chao and Serrano, Ana and Pan, Xingang and Chen, Bin and Myszkowski, Karol and Seidel, Hans-Peter and Theobalt, Christian and Leimk{\"u}hler, Thomas},
  title     = {{GlowGAN}: Unsupervised Learning of {HDR} Images from {LDR} Images in the Wild},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10509--10519},
}
Cumulative Spatial Knowledge Distillation for Vision Transformers: Borui Zhao,

Renjie Song,

Jiajun Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Borui and Song, Renjie and Liang, Jiajun},
  title     = {Cumulative Spatial Knowledge Distillation for Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6146--6155},
}
Dual Pseudo-Labels Interactive Self-Training for Semi-Supervised Visible-Infrared Person Re-Identification: Jiangming Shi,

Yachao Zhang,

Xiangbo Yin,

Yuan Xie,

Zhizhong Zhang,

Jianping Fan,

Zhongchao Shi,

Yanyun Qu; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Jiangming and Zhang, Yachao and Yin, Xiangbo and Xie, Yuan and Zhang, Zhizhong and Fan, Jianping and Shi, Zhongchao and Qu, Yanyun},
  title     = {Dual Pseudo-Labels Interactive Self-Training for Semi-Supervised Visible-Infrared Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11218--11228},
}
Less is More: Focus Attention for Efficient DETR: Dehua Zheng,

Wenhui Dong,

Hailin Hu,

Xinghao Chen,

Yunhe Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Dehua and Dong, Wenhui and Hu, Hailin and Chen, Xinghao and Wang, Yunhe},
  title     = {Less is More: Focus Attention for Efficient {DETR}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6674--6683},
}
Efficient Controllable Multi-Task Architectures: Abhishek Aich,

Samuel Schulter,

Amit K. Roy-Chowdhury,

Manmohan Chandraker,

Yumin Suh; [pdf] [arXiv]
[bibtex]
@InProceedings{Aich_2023_ICCV,
  author    = {Aich, Abhishek and Schulter, Samuel and Roy-Chowdhury, Amit K. and Chandraker, Manmohan and Suh, Yumin},
  title     = {Efficient Controllable Multi-Task Architectures},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5740--5751},
}
HumanSD: A Native Skeleton-Guided Diffusion Model for Human Image Generation: Xuan Ju,

Ailing Zeng,

Chenchen Zhao,

Jianan Wang,

Lei Zhang,

Qiang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ju_2023_ICCV,
  author    = {Ju, Xuan and Zeng, Ailing and Zhao, Chenchen and Wang, Jianan and Zhang, Lei and Xu, Qiang},
  title     = {{HumanSD}: A Native Skeleton-Guided Diffusion Model for Human Image Generation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15988--15998},
}
Lens Parameter Estimation for Realistic Depth of Field Modeling: Dominique Piché-Meunier,

Yannick Hold-Geoffroy,

Jianming Zhang,

Jean-François Lalonde; [pdf] [supp]
[bibtex]
@InProceedings{Piche-Meunier_2023_ICCV,
  author    = {Pich{\'e}-Meunier, Dominique and Hold-Geoffroy, Yannick and Zhang, Jianming and Lalonde, Jean-Fran{\c{c}}ois},
  title     = {Lens Parameter Estimation for Realistic Depth of Field Modeling},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {499--508},
}
Learned Compressive Representations for Single-Photon 3D Imaging: Felipe Gutierrez-Barragan,

Fangzhou Mu,

Andrei Ardelean,

Atul Ingle,

Claudio Bruschini,

Edoardo Charbon,

Yin Li,

Mohit Gupta,

Andreas Velten; [pdf] [supp]
[bibtex]
@InProceedings{Gutierrez-Barragan_2023_ICCV,
  author    = {Gutierrez-Barragan, Felipe and Mu, Fangzhou and Ardelean, Andrei and Ingle, Atul and Bruschini, Claudio and Charbon, Edoardo and Li, Yin and Gupta, Mohit and Velten, Andreas},
  title     = {Learned Compressive Representations for Single-Photon {3D} Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10756--10766},
}
Alignment-free HDR Deghosting with Semantics Consistent Transformer: Steven Tel,

Zongwei Wu,

Yulun Zhang,

Barthélémy Heyrman,

Cédric Demonceaux,

Radu Timofte,

Dominique Ginhac; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tel_2023_ICCV,
  author    = {Tel, Steven and Wu, Zongwei and Zhang, Yulun and Heyrman, Barth{\'e}l{\'e}my and Demonceaux, C{\'e}dric and Timofte, Radu and Ginhac, Dominique},
  title     = {Alignment-free {HDR} Deghosting with Semantics Consistent Transformer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12836--12845},
}
Semantic-Aware Implicit Template Learning via Part Deformation Consistency: Sihyeon Kim,

Minseok Joo,

Jaewon Lee,

Juyeon Ko,

Juhan Cha,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Sihyeon and Joo, Minseok and Lee, Jaewon and Ko, Juyeon and Cha, Juhan and Kim, Hyunwoo J.},
  title     = {Semantic-Aware Implicit Template Learning via Part Deformation Consistency},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {593--603},
}
HRS-Bench: Holistic, Reliable and Scalable Benchmark for Text-to-Image Models: Eslam Mohamed Bakr,

Pengzhan Sun,

Xiaoqian Shen,

Faizan Farooq Khan,

Li Erran Li,

Mohamed Elhoseiny; [pdf] [supp]
[bibtex]
@InProceedings{Bakr_2023_ICCV,
  author    = {Bakr, Eslam Mohamed and Sun, Pengzhan and Shen, Xiaoqian and Khan, Faizan Farooq and Li, Li Erran and Elhoseiny, Mohamed},
  title     = {{HRS-Bench}: Holistic, Reliable and Scalable Benchmark for Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20041--20053},
}
Multi3DRefer: Grounding Text Description to Multiple 3D Objects: Yiming Zhang,

ZeMing Gong,

Angel X. Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yiming and Gong, ZeMing and Chang, Angel X.},
  title     = {{Multi3DRefer}: Grounding Text Description to Multiple {3D} Objects},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15225--15236},
}
Examining Autoexposure for Challenging Scenes: SaiKiran Tedla,

Beixuan Yang,

Michael S. Brown; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tedla_2023_ICCV,
  author    = {Tedla, SaiKiran and Yang, Beixuan and Brown, Michael S.},
  title     = {Examining Autoexposure for Challenging Scenes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13076--13085},
}
DiffCloth: Diffusion Based Garment Synthesis and Manipulation via Structural Cross-modal Semantic Alignment: Xujie Zhang,

Binbin Yang,

Michael C. Kampffmeyer,

Wenqing Zhang,

Shiyue Zhang,

Guansong Lu,

Liang Lin,

Hang Xu,

Xiaodan Liang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xujie and Yang, Binbin and Kampffmeyer, Michael C. and Zhang, Wenqing and Zhang, Shiyue and Lu, Guansong and Lin, Liang and Xu, Hang and Liang, Xiaodan},
  title     = {{DiffCloth}: Diffusion Based Garment Synthesis and Manipulation via Structural Cross-modal Semantic Alignment},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23154--23163},
}
Improved Visual Fine-tuning with Natural Language Supervision: Junyang Wang,

Yuanhong Xu,

Juhua Hu,

Ming Yan,

Jitao Sang,

Qi Qian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Junyang and Xu, Yuanhong and Hu, Juhua and Yan, Ming and Sang, Jitao and Qian, Qi},
  title     = {Improved Visual Fine-tuning with Natural Language Supervision},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11899--11909},
}
Person Re-Identification without Identification via Event anonymization: Shafiq Ahmad,

Pietro Morerio,

Alessio Del Bue; [pdf] [arXiv]
[bibtex]
@InProceedings{Ahmad_2023_ICCV,
  author    = {Ahmad, Shafiq and Morerio, Pietro and Del Bue, Alessio},
  title     = {Person Re-Identification without Identification via Event anonymization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11132--11141},
}
GRAM-HD: 3D-Consistent Image Generation at High Resolution with Generative Radiance Manifolds: Jianfeng Xiang,

Jiaolong Yang,

Yu Deng,

Xin Tong; [pdf] [supp]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Jianfeng and Yang, Jiaolong and Deng, Yu and Tong, Xin},
  title     = {{GRAM-HD}: {3D-Consistent} Image Generation at High Resolution with Generative Radiance Manifolds},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2195--2205},
}
Small Object Detection via Coarse-to-fine Proposal Generation and Imitation Learning: Xiang Yuan,

Gong Cheng,

Kebing Yan,

Qinghua Zeng,

Junwei Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Xiang and Cheng, Gong and Yan, Kebing and Zeng, Qinghua and Han, Junwei},
  title     = {Small Object Detection via Coarse-to-fine Proposal Generation and Imitation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6317--6327},
}
Anomaly Detection Under Distribution Shift: Tri Cao,

Jiawen Zhu,

Guansong Pang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Tri and Zhu, Jiawen and Pang, Guansong},
  title     = {Anomaly Detection Under Distribution Shift},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6511--6523},
}
Class Prior-Free Positive-Unlabeled Learning with Taylor Variational Loss for Hyperspectral Remote Sensing Imagery: Hengwei Zhao,

Xinyu Wang,

Jingtao Li,

Yanfei Zhong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Hengwei and Wang, Xinyu and Li, Jingtao and Zhong, Yanfei},
  title     = {Class Prior-Free Positive-Unlabeled Learning with {Taylor} Variational Loss for Hyperspectral Remote Sensing Imagery},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16827--16836},
}
HoloAssist: an Egocentric Human Interaction Dataset for Interactive AI Assistants in the Real World: Xin Wang,

Taein Kwon,

Mahdi Rad,

Bowen Pan,

Ishani Chakraborty,

Sean Andrist,

Dan Bohus,

Ashley Feniello,

Bugra Tekin,

Felipe Vieira Frujeri,

Neel Joshi,

Marc Pollefeys; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xin and Kwon, Taein and Rad, Mahdi and Pan, Bowen and Chakraborty, Ishani and Andrist, Sean and Bohus, Dan and Feniello, Ashley and Tekin, Bugra and Frujeri, Felipe Vieira and Joshi, Neel and Pollefeys, Marc},
  title     = {{HoloAssist}: an Egocentric Human Interaction Dataset for Interactive {AI} Assistants in the Real World},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20270--20281},
}
Self-Feedback DETR for Temporal Action Detection: Jihwan Kim,

Miso Lee,

Jae-Pil Heo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Jihwan and Lee, Miso and Heo, Jae-Pil},
  title     = {Self-Feedback {DETR} for Temporal Action Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10286--10296},
}
StableVideo: Text-driven Consistency-aware Diffusion Video Editing: Wenhao Chai,

Xun Guo,

Gaoang Wang,

Yan Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chai_2023_ICCV,
  author    = {Chai, Wenhao and Guo, Xun and Wang, Gaoang and Lu, Yan},
  title     = {{StableVideo}: Text-driven Consistency-aware Diffusion Video Editing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23040--23050},
}
PIRNet: Privacy-Preserving Image Restoration Network via Wavelet Lifting: Xin Deng,

Chao Gao,

Mai Xu; [pdf]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Xin and Gao, Chao and Xu, Mai},
  title     = {{PIRNet}: Privacy-Preserving Image Restoration Network via Wavelet Lifting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22368--22377},
}
LAW-Diffusion: Complex Scene Generation by Diffusion with Layouts: Binbin Yang,

Yi Luo,

Ziliang Chen,

Guangrun Wang,

Xiaodan Liang,

Liang Lin; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Binbin and Luo, Yi and Chen, Ziliang and Wang, Guangrun and Liang, Xiaodan and Lin, Liang},
  title     = {{LAW-Diffusion}: Complex Scene Generation by Diffusion with Layouts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22669--22679},
}
Multi-Label Knowledge Distillation: Penghui Yang,

Ming-Kun Xie,

Chen-Chen Zong,

Lei Feng,

Gang Niu,

Masashi Sugiyama,

Sheng-Jun Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Penghui and Xie, Ming-Kun and Zong, Chen-Chen and Feng, Lei and Niu, Gang and Sugiyama, Masashi and Huang, Sheng-Jun},
  title     = {Multi-Label Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17271--17280},
}
Towards Geospatial Foundation Models via Continual Pretraining: Matías Mendieta,

Boran Han,

Xingjian Shi,

Yi Zhu,

Chen Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mendieta_2023_ICCV,
  author    = {Mendieta, Mat{\'\i}as and Han, Boran and Shi, Xingjian and Zhu, Yi and Chen, Chen},
  title     = {Towards Geospatial Foundation Models via Continual Pretraining},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16806--16816},
}
ConSlide: Asynchronous Hierarchical Interaction Transformer with Breakup-Reorganize Rehearsal for Continual Whole Slide Image Analysis: Yanyan Huang,

Weiqin Zhao,

Shujun Wang,

Yu Fu,

Yuming Jiang,

Lequan Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Yanyan and Zhao, Weiqin and Wang, Shujun and Fu, Yu and Jiang, Yuming and Yu, Lequan},
  title     = {{ConSlide}: Asynchronous Hierarchical Interaction Transformer with Breakup-Reorganize Rehearsal for Continual Whole Slide Image Analysis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21349--21360},
}
RepQ-ViT: Scale Reparameterization for Post-Training Quantization of Vision Transformers: Zhikai Li,

Junrui Xiao,

Lianwei Yang,

Qingyi Gu; [pdf]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zhikai and Xiao, Junrui and Yang, Lianwei and Gu, Qingyi},
  title     = {{RepQ-ViT}: Scale Reparameterization for Post-Training Quantization of Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17227--17236},
}
Enhancing Privacy Preservation in Federated Learning via Learning Rate Perturbation: Guangnian Wan,

Haitao Du,

Xuejing Yuan,

Jun Yang,

Meiling Chen,

Jie Xu; [pdf] [supp]
[bibtex]
@InProceedings{Wan_2023_ICCV,
  author    = {Wan, Guangnian and Du, Haitao and Yuan, Xuejing and Yang, Jun and Chen, Meiling and Xu, Jie},
  title     = {Enhancing Privacy Preservation in Federated Learning via Learning Rate Perturbation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4772--4781},
}
UMC: A Unified Bandwidth-efficient and Multi-resolution based Collaborative Perception Framework: Tianhang Wang,

Guang Chen,

Kai Chen,

Zhengfa Liu,

Bo Zhang,

Alois Knoll,

Changjun Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Tianhang and Chen, Guang and Chen, Kai and Liu, Zhengfa and Zhang, Bo and Knoll, Alois and Jiang, Changjun},
  title     = {{UMC}: A Unified Bandwidth-efficient and Multi-resolution based Collaborative Perception Framework},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8187--8196},
}
Viewing Graph Solvability in Practice: Federica Arrigoni,

Tomas Pajdla,

Andrea Fusiello; [pdf]
[bibtex]
@InProceedings{Arrigoni_2023_ICCV,
  author    = {Arrigoni, Federica and Pajdla, Tomas and Fusiello, Andrea},
  title     = {Viewing Graph Solvability in Practice},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8147--8155},
}
SATR: Zero-Shot Semantic Segmentation of 3D Shapes: Ahmed Abdelreheem,

Ivan Skorokhodov,

Maks Ovsjanikov,

Peter Wonka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Abdelreheem_2023_ICCV,
  author    = {Abdelreheem, Ahmed and Skorokhodov, Ivan and Ovsjanikov, Maks and Wonka, Peter},
  title     = {{SATR}: Zero-Shot Semantic Segmentation of {3D} Shapes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15166--15179},
}
ReactioNet: Learning High-Order Facial Behavior from Universal Stimulus-Reaction by Dyadic Relation Reasoning: Xiaotian Li,

Taoyue Wang,

Geran Zhao,

Xiang Zhang,

Xi Kang,

Lijun Yin; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiaotian and Wang, Taoyue and Zhao, Geran and Zhang, Xiang and Kang, Xi and Yin, Lijun},
  title     = {{ReactioNet}: Learning High-Order Facial Behavior from Universal Stimulus-Reaction by Dyadic Relation Reasoning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20774--20785},
}
Pseudo Flow Consistency for Self-Supervised 6D Object Pose Estimation: Yang Hai,

Rui Song,

Jiaojiao Li,

David Ferstl,

Yinlin Hu; [pdf] [arXiv]
[bibtex]
@InProceedings{Hai_2023_ICCV,
  author    = {Hai, Yang and Song, Rui and Li, Jiaojiao and Ferstl, David and Hu, Yinlin},
  title     = {Pseudo Flow Consistency for Self-Supervised {6D} Object Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14075--14085},
}
Emotional Listener Portrait: Neural Listener Head Generation with Emotion: Luchuan Song,

Guojun Yin,

Zhenchao Jin,

Xiaoyi Dong,

Chenliang Xu; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Luchuan and Yin, Guojun and Jin, Zhenchao and Dong, Xiaoyi and Xu, Chenliang},
  title     = {Emotional Listener Portrait: Neural Listener Head Generation with Emotion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20839--20849},
}
Unsupervised Domain Adaptation for Training Event-Based Networks Using Contrastive Learning and Uncorrelated Conditioning: Dayuan Jian,

Mohammad Rostami; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jian_2023_ICCV,
  author    = {Jian, Dayuan and Rostami, Mohammad},
  title     = {Unsupervised Domain Adaptation for Training Event-Based Networks Using Contrastive Learning and Uncorrelated Conditioning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18721--18731},
}
Probabilistic Human Mesh Recovery in 3D Scenes from Egocentric Views: Siwei Zhang,

Qianli Ma,

Yan Zhang,

Sadegh Aliakbarian,

Darren Cosker,

Siyu Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Siwei and Ma, Qianli and Zhang, Yan and Aliakbarian, Sadegh and Cosker, Darren and Tang, Siyu},
  title     = {Probabilistic Human Mesh Recovery in {3D} Scenes from Egocentric Views},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7989--8000},
}
ImGeoNet: Image-induced Geometry-aware Voxel Representation for Multi-view 3D Object Detection: Tao Tu,

Shun-Po Chuang,

Yu-Lun Liu,

Cheng Sun,

Ke Zhang,

Donna Roy,

Cheng-Hao Kuo,

Min Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tu_2023_ICCV,
  author    = {Tu, Tao and Chuang, Shun-Po and Liu, Yu-Lun and Sun, Cheng and Zhang, Ke and Roy, Donna and Kuo, Cheng-Hao and Sun, Min},
  title     = {{ImGeoNet}: Image-induced Geometry-aware Voxel Representation for Multi-view {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6996--7007},
}
DRAW: Defending Camera-shooted RAW Against Image Manipulation: Xiaoxiao Hu,

Qichao Ying,

Zhenxing Qian,

Sheng Li,

Xinpeng Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Xiaoxiao and Ying, Qichao and Qian, Zhenxing and Li, Sheng and Zhang, Xinpeng},
  title     = {{DRAW}: Defending Camera-shooted {RAW} Against Image Manipulation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22434--22444},
}
Controllable Person Image Synthesis with Pose-Constrained Latent Diffusion: Xiao Han,

Xiatian Zhu,

Jiankang Deng,

Yi-Zhe Song,

Tao Xiang; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Xiao and Zhu, Xiatian and Deng, Jiankang and Song, Yi-Zhe and Xiang, Tao},
  title     = {Controllable Person Image Synthesis with Pose-Constrained Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22768--22777},
}
Diffusion-based Image Translation with Label Guidance for Domain Adaptive Semantic Segmentation: Duo Peng,

Ping Hu,

Qiuhong Ke,

Jun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Peng_2023_ICCV,
  author    = {Peng, Duo and Hu, Ping and Ke, Qiuhong and Liu, Jun},
  title     = {Diffusion-based Image Translation with Label Guidance for Domain Adaptive Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {808--820},
}
TopoSeg: Topology-Aware Nuclear Instance Segmentation: Hongliang He,

Jun Wang,

Pengxu Wei,

Fan Xu,

Xiangyang Ji,

Chang Liu,

Jie Chen; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Hongliang and Wang, Jun and Wei, Pengxu and Xu, Fan and Ji, Xiangyang and Liu, Chang and Chen, Jie},
  title     = {{TopoSeg}: Topology-Aware Nuclear Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21307--21316},
}
SceneRF: Self-Supervised Monocular 3D Scene Reconstruction with Radiance Fields: Anh-Quan Cao,

Raoul de Charette; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Anh-Quan and de Charette, Raoul},
  title     = {{SceneRF}: Self-Supervised Monocular {3D} Scene Reconstruction with Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9387--9398},
}
Isomer: Isomerous Transformer for Zero-shot Video Object Segmentation: Yichen Yuan,

Yifan Wang,

Lijun Wang,

Xiaoqi Zhao,

Huchuan Lu,

Yu Wang,

Weibo Su,

Lei Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Yichen and Wang, Yifan and Wang, Lijun and Zhao, Xiaoqi and Lu, Huchuan and Wang, Yu and Su, Weibo and Zhang, Lei},
  title     = {Isomer: Isomerous Transformer for Zero-shot Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {966--976},
}
CPCM: Contextual Point Cloud Modeling for Weakly-supervised Point Cloud Semantic Segmentation: Lizhao Liu,

Zhuangwei Zhuang,

Shangxin Huang,

Xunlong Xiao,

Tianhang Xiang,

Cen Chen,

Jingdong Wang,

Mingkui Tan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Lizhao and Zhuang, Zhuangwei and Huang, Shangxin and Xiao, Xunlong and Xiang, Tianhang and Chen, Cen and Wang, Jingdong and Tan, Mingkui},
  title     = {{CPCM}: Contextual Point Cloud Modeling for Weakly-supervised Point Cloud Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18413--18422},
}
PATMAT: Person Aware Tuning of Mask-Aware Transformer for Face Inpainting: Saman Motamed,

Jianjin Xu,

Chen Henry Wu,

Christian Häne,

Jean-Charles Bazin,

Fernando De la Torre; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Motamed_2023_ICCV,
  author    = {Motamed, Saman and Xu, Jianjin and Wu, Chen Henry and H{\"a}ne, Christian and Bazin, Jean-Charles and De la Torre, Fernando},
  title     = {{PATMAT}: Person Aware Tuning of Mask-Aware Transformer for Face Inpainting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22778--22787},
}
Adaptive Nonlinear Latent Transformation for Conditional Face Editing: Zhizhong Huang,

Siteng Ma,

Junping Zhang,

Hongming Shan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhizhong and Ma, Siteng and Zhang, Junping and Shan, Hongming},
  title     = {Adaptive Nonlinear Latent Transformation for Conditional Face Editing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21022--21031},
}
Tiny Updater: Towards Efficient Neural Network-Driven Software Updating: Linfeng Zhang,

Kaisheng Ma; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Linfeng and Ma, Kaisheng},
  title     = {Tiny Updater: Towards Efficient Neural Network-Driven Software Updating},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23447--23459},
}
INT2: Interactive Trajectory Prediction at Intersections: Zhijie Yan,

Pengfei Li,

Zheng Fu,

Shaocong Xu,

Yongliang Shi,

Xiaoxue Chen,

Yuhang Zheng,

Yang Li,

Tianyu Liu,

Chuxuan Li,

Nairui Luo,

Xu Gao,

Yilun Chen,

Zuoxu Wang,

Yifeng Shi,

Pengfei Huang,

Zhengxiao Han,

Jirui Yuan,

Jiangtao Gong,

Guyue Zhou,

Hang Zhao,

Hao Zhao; [pdf]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Zhijie and Li, Pengfei and Fu, Zheng and Xu, Shaocong and Shi, Yongliang and Chen, Xiaoxue and Zheng, Yuhang and Li, Yang and Liu, Tianyu and Li, Chuxuan and Luo, Nairui and Gao, Xu and Chen, Yilun and Wang, Zuoxu and Shi, Yifeng and Huang, Pengfei and Han, Zhengxiao and Yuan, Jirui and Gong, Jiangtao and Zhou, Guyue and Zhao, Hang and Zhao, Hao},
  title     = {{INT2}: Interactive Trajectory Prediction at Intersections},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8536--8547},
}
MapPrior: Bird's-Eye View Map Layout Estimation with Generative Models: Xiyue Zhu,

Vlas Zyrianov,

Zhijian Liu,

Shenlong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Xiyue and Zyrianov, Vlas and Liu, Zhijian and Wang, Shenlong},
  title     = {{MapPrior}: Bird's-Eye View Map Layout Estimation with Generative Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8228--8239},
}
CAD-Estate: Large-scale CAD Model Annotation in RGB Videos: Kevis-Kokitsi Maninis,

Stefan Popov,

Matthias Nießner,

Vittorio Ferrari; [pdf]
[bibtex]
@InProceedings{Maninis_2023_ICCV,
  author    = {Maninis, Kevis-Kokitsi and Popov, Stefan and Nie{\ss}ner, Matthias and Ferrari, Vittorio},
  title     = {{CAD-Estate}: Large-scale {CAD} Model Annotation in {RGB} Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20189--20199},
}
Conditional Cross Attention Network for Multi-Space Embedding without Entanglement in Only a SINGLE Network: Chull Hwan Song,

Taebaek Hwang,

Jooyoung Yoon,

Shunghyun Choi,

Yeong Hyeon Gu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Chull Hwan and Hwang, Taebaek and Yoon, Jooyoung and Choi, Shunghyun and Gu, Yeong Hyeon},
  title     = {Conditional Cross Attention Network for Multi-Space Embedding without Entanglement in Only a {SINGLE} Network},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11112--11121},
}
MB-TaylorFormer: Multi-Branch Efficient Transformer Expanded by Taylor Formula for Image Dehazing: Yuwei Qiu,

Kaihao Zhang,

Chenxi Wang,

Wenhan Luo,

Hongdong Li,

Zhi Jin; [pdf] [supp]
[bibtex]
@InProceedings{Qiu_2023_ICCV,
  author    = {Qiu, Yuwei and Zhang, Kaihao and Wang, Chenxi and Luo, Wenhan and Li, Hongdong and Jin, Zhi},
  title     = {{MB-TaylorFormer}: Multi-Branch Efficient Transformer Expanded by {Taylor} Formula for Image Dehazing},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12802--12813},
}
X-Mesh: Towards Fast and Accurate Text-driven 3D Stylization via Dynamic Textual Guidance: Yiwei Ma,

Xiaoqing Zhang,

Xiaoshuai Sun,

Jiayi Ji,

Haowei Wang,

Guannan Jiang,

Weilin Zhuang,

Rongrong Ji; [pdf]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Yiwei and Zhang, Xiaoqing and Sun, Xiaoshuai and Ji, Jiayi and Wang, Haowei and Jiang, Guannan and Zhuang, Weilin and Ji, Rongrong},
  title     = {{X-Mesh}: Towards Fast and Accurate Text-driven {3D} Stylization via Dynamic Textual Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2749--2760},
}
Muscles in Action: Mia Chiquier,

Carl Vondrick; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chiquier_2023_ICCV,
  author    = {Chiquier, Mia and Vondrick, Carl},
  title     = {Muscles in Action},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22091--22101},
}
Large-Scale Person Detection and Localization Using Overhead Fisheye Cameras: Lu Yang,

Liulei Li,

Xueshi Xin,

Yifan Sun,

Qing Song,

Wenguan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Lu and Li, Liulei and Xin, Xueshi and Sun, Yifan and Song, Qing and Wang, Wenguan},
  title     = {Large-Scale Person Detection and Localization Using Overhead Fisheye Cameras},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19961--19971},
}
ViLTA: Enhancing Vision-Language Pre-training through Textual Augmentation: Weihan Wang,

Zhen Yang,

Bin Xu,

Juanzi Li,

Yankui Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Weihan and Yang, Zhen and Xu, Bin and Li, Juanzi and Sun, Yankui},
  title     = {{ViLTA}: Enhancing Vision-Language Pre-training through Textual Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3158--3169},
}
All-to-Key Attention for Arbitrary Style Transfer: Mingrui Zhu,

Xiao He,

Nannan Wang,

Xiaoyu Wang,

Xinbo Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Mingrui and He, Xiao and Wang, Nannan and Wang, Xiaoyu and Gao, Xinbo},
  title     = {All-to-Key Attention for Arbitrary Style Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {23109--23119},
}
Learning to Distill Global Representation for Sparse-View CT: Zilong Li,

Chenglong Ma,

Jie Chen,

Junping Zhang,

Hongming Shan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zilong and Ma, Chenglong and Chen, Jie and Zhang, Junping and Shan, Hongming},
  title     = {Learning to Distill Global Representation for Sparse-View {CT}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21196--21207},
}
FocalFormer3D: Focusing on Hard Instance for 3D Object Detection: Yilun Chen,

Zhiding Yu,

Yukang Chen,

Shiyi Lan,

Anima Anandkumar,

Jiaya Jia,

Jose M. Alvarez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Yilun and Yu, Zhiding and Chen, Yukang and Lan, Shiyi and Anandkumar, Anima and Jia, Jiaya and Alvarez, Jose M.},
  title     = {{FocalFormer3D}: Focusing on Hard Instance for {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8394--8405},
}
Not Every Side Is Equal: Localization Uncertainty Estimation for Semi-Supervised 3D Object Detection: Chuxin Wang,

Wenfei Yang,

Tianzhu Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Chuxin and Yang, Wenfei and Zhang, Tianzhu},
  title     = {Not Every Side Is Equal: Localization Uncertainty Estimation for Semi-Supervised {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3814--3824},
}
Teaching CLIP to Count to Ten: Roni Paiss,

Ariel Ephrat,

Omer Tov,

Shiran Zada,

Inbar Mosseri,

Michal Irani,

Tali Dekel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Paiss_2023_ICCV,
  author    = {Paiss, Roni and Ephrat, Ariel and Tov, Omer and Zada, Shiran and Mosseri, Inbar and Irani, Michal and Dekel, Tali},
  title     = {Teaching {CLIP} to Count to Ten},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3170--3180},
}
TEMPO: Efficient Multi-View Pose Estimation, Tracking, and Forecasting: Rohan Choudhury,

Kris M. Kitani,

László A. Jeni; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Choudhury_2023_ICCV,
  author    = {Choudhury, Rohan and Kitani, Kris M. and Jeni, L{\'a}szl{\'o} A.},
  title     = {{TEMPO}: Efficient Multi-View Pose Estimation, Tracking, and Forecasting},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14750--14760},
}
SparseMAE: Sparse Training Meets Masked Autoencoders: Aojun Zhou,

Yang Li,

Zipeng Qin,

Jianbo Liu,

Junting Pan,

Renrui Zhang,

Rui Zhao,

Peng Gao,

Hongsheng Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Aojun and Li, Yang and Qin, Zipeng and Liu, Jianbo and Pan, Junting and Zhang, Renrui and Zhao, Rui and Gao, Peng and Li, Hongsheng},
  title     = {{SparseMAE}: Sparse Training Meets Masked Autoencoders},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16176--16186},
}
DiffPose: SpatioTemporal Diffusion Model for Video-Based Human Pose Estimation: Runyang Feng,

Yixing Gao,

Tze Ho Elden Tse,

Xueqing Ma,

Hyung Jin Chang; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Runyang and Gao, Yixing and Tse, Tze Ho Elden and Ma, Xueqing and Chang, Hyung Jin},
  title     = {{DiffPose}: SpatioTemporal Diffusion Model for Video-Based Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14861--14872},
}
ELITE: Encoding Visual Concepts into Textual Embeddings for Customized Text-to-Image Generation: Yuxiang Wei,

Yabo Zhang,

Zhilong Ji,

Jinfeng Bai,

Lei Zhang,

Wangmeng Zuo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yuxiang and Zhang, Yabo and Ji, Zhilong and Bai, Jinfeng and Zhang, Lei and Zuo, Wangmeng},
  title     = {{ELITE}: Encoding Visual Concepts into Textual Embeddings for Customized Text-to-Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15943--15953},
}
Text2Performer: Text-Driven Human Video Generation: Yuming Jiang,

Shuai Yang,

Tong Liang Koh,

Wayne Wu,

Chen Change Loy,

Ziwei Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Yuming and Yang, Shuai and Koh, Tong Liang and Wu, Wayne and Loy, Chen Change and Liu, Ziwei},
  title     = {{Text2Performer}: Text-Driven Human Video Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22747--22757},
}
A Simple Recipe to Meta-Learn Forward and Backward Transfer: Edoardo Cetin,

Antonio Carta,

Oya Celiktutan; [pdf] [supp]
[bibtex]
@InProceedings{Cetin_2023_ICCV,
  author    = {Cetin, Edoardo and Carta, Antonio and Celiktutan, Oya},
  title     = {A Simple Recipe to Meta-Learn Forward and Backward Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18732--18742},
}
4D Myocardium Reconstruction with Decoupled Motion and Shape Model: Xiaohan Yuan,

Cong Liu,

Yangang Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Xiaohan and Liu, Cong and Wang, Yangang},
  title     = {{4D} Myocardium Reconstruction with Decoupled Motion and Shape Model},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21252--21262},
}
IntentQA: Context-aware Video Intent Reasoning: Jiapeng Li,

Ping Wei,

Wenjuan Han,

Lifeng Fan; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Jiapeng and Wei, Ping and Han, Wenjuan and Fan, Lifeng},
  title     = {{IntentQA}: Context-aware Video Intent Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11963--11974},
}
LiDAR-UDA: Self-ensembling Through Time for Unsupervised LiDAR Domain Adaptation: Amirreza Shaban,

JoonHo Lee,

Sanghun Jung,

Xiangyun Meng,

Byron Boots; [pdf] [supp]
[bibtex]
@InProceedings{Shaban_2023_ICCV,
  author    = {Shaban, Amirreza and Lee, JoonHo and Jung, Sanghun and Meng, Xiangyun and Boots, Byron},
  title     = {{LiDAR-UDA}: Self-ensembling Through Time for Unsupervised {LiDAR} Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19784--19794},
}
Robust Monocular Depth Estimation under Challenging Conditions: Stefano Gasperini,

Nils Morbitzer,

HyunJun Jung,

Nassir Navab,

Federico Tombari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gasperini_2023_ICCV,
  author    = {Gasperini, Stefano and Morbitzer, Nils and Jung, HyunJun and Navab, Nassir and Tombari, Federico},
  title     = {Robust Monocular Depth Estimation under Challenging Conditions},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8177--8186},
}
Parametric Depth Based Feature Representation Learning for Object Detection and Segmentation in Bird's-Eye View: Jiayu Yang,

Enze Xie,

Miaomiao Liu,

Jose M. Alvarez; [pdf]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Jiayu and Xie, Enze and Liu, Miaomiao and Alvarez, Jose M.},
  title     = {Parametric Depth Based Feature Representation Learning for Object Detection and Segmentation in Bird's-Eye View},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8483--8492},
}
MSI: Maximize Support-Set Information for Few-Shot Segmentation: Seonghyeon Moon,

Samuel S. Sohn,

Honglu Zhou,

Sejong Yoon,

Vladimir Pavlovic,

Muhammad Haris Khan,

Mubbasir Kapadia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moon_2023_ICCV,
  author    = {Moon, Seonghyeon and Sohn, Samuel S. and Zhou, Honglu and Yoon, Sejong and Pavlovic, Vladimir and Khan, Muhammad Haris and Kapadia, Mubbasir},
  title     = {{MSI}: Maximize Support-Set Information for Few-Shot Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19266--19276},
}
Global Features are All You Need for Image Retrieval and Reranking: Shihao Shao,

Kaifeng Chen,

Arjun Karpur,

Qinghua Cui,

André Araujo,

Bingyi Cao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shao_2023_ICCV,
  author    = {Shao, Shihao and Chen, Kaifeng and Karpur, Arjun and Cui, Qinghua and Araujo, Andr{\'e} and Cao, Bingyi},
  title     = {Global Features are All You Need for Image Retrieval and Reranking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11036--11046},
}
DPF-Net: Combining Explicit Shape Priors in Deformable Primitive Field for Unsupervised Structural Reconstruction of 3D Objects: Qingyao Shuai,

Chi Zhang,

Kaizhi Yang,

Xuejin Chen; [pdf] [supp]
[bibtex]
@InProceedings{Shuai_2023_ICCV,
  author    = {Shuai, Qingyao and Zhang, Chi and Yang, Kaizhi and Chen, Xuejin},
  title     = {{DPF-Net}: Combining Explicit Shape Priors in Deformable Primitive Field for Unsupervised Structural Reconstruction of {3D} Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14321--14329},
}
CORE: Co-planarity Regularized Monocular Geometry Estimation with Weak Supervision: Yuguang Li,

Kai Wang,

Hui Li,

Seon-Min Rhee,

Seungju Han,

Jihye Kim,

Min Yang,

Ran Yang,

Feng Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yuguang and Wang, Kai and Li, Hui and Rhee, Seon-Min and Han, Seungju and Kim, Jihye and Yang, Min and Yang, Ran and Zhu, Feng},
  title     = {{CORE}: Co-planarity Regularized Monocular Geometry Estimation with Weak Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8796--8805},
}
A Sentence Speaks a Thousand Images: Domain Generalization through Distilling CLIP with Language Guidance: Zeyi Huang,

Andy Zhou,

Zijian Ling,

Mu Cai,

Haohan Wang,

Yong Jae Lee; [pdf]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zeyi and Zhou, Andy and Ling, Zijian and Cai, Mu and Wang, Haohan and Lee, Yong Jae},
  title     = {A Sentence Speaks a Thousand Images: Domain Generalization through Distilling {CLIP} with Language Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11685--11695},
}
H3WB: Human3.6M 3D WholeBody Dataset and Benchmark: Yue Zhu,

Nermin Samet,

David Picard; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Yue and Samet, Nermin and Picard, David},
  title     = {{H3WB}: {Human3.6M} {3D} {WholeBody} Dataset and Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20166--20177},
}
Yes, we CANN: Constrained Approximate Nearest Neighbors for Local Feature-Based Visual Localization: Dror Aiger,

Andre Araujo,

Simon Lynen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Aiger_2023_ICCV,
  author    = {Aiger, Dror and Araujo, Andre and Lynen, Simon},
  title     = {Yes, we {CANN}: Constrained Approximate Nearest Neighbors for Local Feature-Based Visual Localization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13339--13349},
}
Multi-Object Navigation with Dynamically Learned Neural Implicit Representations: Pierre Marza,

Laetitia Matignon,

Olivier Simonin,

Christian Wolf; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Marza_2023_ICCV,
  author    = {Marza, Pierre and Matignon, Laetitia and Simonin, Olivier and Wolf, Christian},
  title     = {Multi-Object Navigation with Dynamically Learned Neural Implicit Representations},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11004--11015},
}
NPC: Neural Point Characters from Video: Shih-Yang Su,

Timur Bagautdinov,

Helge Rhodin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Su_2023_ICCV,
  author    = {Su, Shih-Yang and Bagautdinov, Timur and Rhodin, Helge},
  title     = {{NPC}: Neural Point Characters from Video},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14795--14805},
}
LDP-Feat: Image Features with Local Differential Privacy: Francesco Pittaluga,

Bingbing Zhuang; [pdf] [supp]
[bibtex]
@InProceedings{Pittaluga_2023_ICCV,
  author    = {Pittaluga, Francesco and Zhuang, Bingbing},
  title     = {{LDP-Feat}: Image Features with Local Differential Privacy},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17580--17590},
}
Pre-Training-Free Image Manipulation Localization through Non-Mutually Exclusive Contrastive Learning: Jizhe Zhou,

Xiaochen Ma,

Xia Du,

Ahmed Y. Alhammadi,

Wentao Feng; [pdf]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Jizhe and Ma, Xiaochen and Du, Xia and Alhammadi, Ahmed Y. and Feng, Wentao},
  title     = {Pre-Training-Free Image Manipulation Localization through Non-Mutually Exclusive Contrastive Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22346--22356},
}
MRN: Multiplexed Routing Network for Incremental Multilingual Text Recognition: Tianlun Zheng,

Zhineng Chen,

Bingchen Huang,

Wei Zhang,

Yu-Gang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Tianlun and Chen, Zhineng and Huang, Bingchen and Zhang, Wei and Jiang, Yu-Gang},
  title     = {{MRN}: Multiplexed Routing Network for Incremental Multilingual Text Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18644--18653},
}
Domain Generalization Guided by Gradient Signal to Noise Ratio of Parameters: Mateusz Michalkiewicz,

Masoud Faraki,

Xiang Yu,

Manmohan Chandraker,

Mahsa Baktashmotlagh; [pdf] [supp]
[bibtex]
@InProceedings{Michalkiewicz_2023_ICCV,
  author    = {Michalkiewicz, Mateusz and Faraki, Masoud and Yu, Xiang and Chandraker, Manmohan and Baktashmotlagh, Mahsa},
  title     = {Domain Generalization Guided by Gradient Signal to Noise Ratio of Parameters},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6177--6188},
}
Counterfactual-based Saliency Map: Towards Visual Contrastive Explanations for Neural Networks: Xue Wang,

Zhibo Wang,

Haiqin Weng,

Hengchang Guo,

Zhifei Zhang,

Lu Jin,

Tao Wei,

Kui Ren; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Xue and Wang, Zhibo and Weng, Haiqin and Guo, Hengchang and Zhang, Zhifei and Jin, Lu and Wei, Tao and Ren, Kui},
  title     = {Counterfactual-based Saliency Map: Towards Visual Contrastive Explanations for Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2042--2051},
}
MST-compression: Compressing and Accelerating Binary Neural Networks with Minimum Spanning Tree: Quang Hieu Vo,

Linh-Tam Tran,

Sung-Ho Bae,

Lok-Won Kim,

Choong Seon Hong; [pdf] [supp]
[bibtex]
@InProceedings{Vo_2023_ICCV,
  author    = {Vo, Quang Hieu and Tran, Linh-Tam and Bae, Sung-Ho and Kim, Lok-Won and Hong, Choong Seon},
  title     = {{MST-compression}: Compressing and Accelerating Binary Neural Networks with Minimum Spanning Tree},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6091--6100},
}
MOST: Multiple Object Localization with Self-Supervised Transformers for Object Discovery: Sai Saketh Rambhatla,

Ishan Misra,

Rama Chellappa,

Abhinav Shrivastava; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rambhatla_2023_ICCV,
  author    = {Rambhatla, Sai Saketh and Misra, Ishan and Chellappa, Rama and Shrivastava, Abhinav},
  title     = {{MOST}: Multiple Object Localization with Self-Supervised Transformers for Object Discovery},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15823--15834},
}
IIEU: Rethinking Neural Feature Activation from Decision-Making: Sudong Cai; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Sudong},
  title     = {{IIEU}: Rethinking Neural Feature Activation from Decision-Making},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5796--5806},
}
Integrally Migrating Pre-trained Transformer Encoder-decoders for Visual Object Detection: Feng Liu,

Xiaosong Zhang,

Zhiliang Peng,

Zonghao Guo,

Fang Wan,

Xiangyang Ji,

Qixiang Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Feng and Zhang, Xiaosong and Peng, Zhiliang and Guo, Zonghao and Wan, Fang and Ji, Xiangyang and Ye, Qixiang},
  title     = {Integrally Migrating Pre-trained Transformer Encoder-decoders for Visual Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6825--6834},
}
V-FUSE: Volumetric Depth Map Fusion with Long-Range Constraints: Nathaniel Burgdorfer,

Philippos Mordohai; [pdf] [supp]
[bibtex]
@InProceedings{Burgdorfer_2023_ICCV,
  author    = {Burgdorfer, Nathaniel and Mordohai, Philippos},
  title     = {{V-FUSE}: Volumetric Depth Map Fusion with Long-Range Constraints},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3449--3458},
}
CrossLoc3D: Aerial-Ground Cross-Source 3D Place Recognition: Tianrui Guan,

Aswath Muthuselvam,

Montana Hoover,

Xijun Wang,

Jing Liang,

Adarsh Jagan Sathyamoorthy,

Damon Conover,

Dinesh Manocha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guan_2023_ICCV,
  author    = {Guan, Tianrui and Muthuselvam, Aswath and Hoover, Montana and Wang, Xijun and Liang, Jing and Sathyamoorthy, Adarsh Jagan and Conover, Damon and Manocha, Dinesh},
  title     = {{CrossLoc3D}: Aerial-Ground Cross-Source {3D} Place Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11335--11344},
}
Recursive Video Lane Detection: Dongkwon Jin,

Dahyun Kim,

Chang-Su Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2023_ICCV,
  author    = {Jin, Dongkwon and Kim, Dahyun and Kim, Chang-Su},
  title     = {Recursive Video Lane Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8473--8482},
}
GECCO: Geometrically-Conditioned Point Diffusion Models: Michał J Tyszkiewicz,

Pascal Fua,

Eduard Trulls; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tyszkiewicz_2023_ICCV,
  author    = {Tyszkiewicz, Micha{\l} J and Fua, Pascal and Trulls, Eduard},
  title     = {{GECCO}: Geometrically-Conditioned Point Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2128--2138},
}
Unsupervised Self-Driving Attention Prediction via Uncertainty Mining and Knowledge Embedding: Pengfei Zhu,

Mengshi Qi,

Xia Li,

Weijian Li,

Huadong Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Pengfei and Qi, Mengshi and Li, Xia and Li, Weijian and Ma, Huadong},
  title     = {Unsupervised Self-Driving Attention Prediction via Uncertainty Mining and Knowledge Embedding},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8558--8568},
}
PETRv2: A Unified Framework for 3D Perception from Multi-Camera Images: Yingfei Liu,

Junjie Yan,

Fan Jia,

Shuailin Li,

Aqi Gao,

Tiancai Wang,

Xiangyu Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yingfei and Yan, Junjie and Jia, Fan and Li, Shuailin and Gao, Aqi and Wang, Tiancai and Zhang, Xiangyu},
  title     = {{PETRv2}: A Unified Framework for {3D} Perception from Multi-Camera Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3262--3272},
}
Out-of-Domain GAN Inversion via Invertibility Decomposition for Photo-Realistic Human Face Manipulation: Xin Yang,

Xiaogang Xu,

Yingcong Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Xin and Xu, Xiaogang and Chen, Yingcong},
  title     = {Out-of-Domain {GAN} Inversion via Invertibility Decomposition for Photo-Realistic Human Face Manipulation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7492--7501},
}
SAFE: Machine Unlearning With Shard Graphs: Yonatan Dukler,

Benjamin Bowman,

Alessandro Achille,

Aditya Golatkar,

Ashwin Swaminathan,

Stefano Soatto; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dukler_2023_ICCV,
  author    = {Dukler, Yonatan and Bowman, Benjamin and Achille, Alessandro and Golatkar, Aditya and Swaminathan, Ashwin and Soatto, Stefano},
  title     = {{SAFE}: Machine Unlearning With Shard Graphs},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17108--17118},
}
Learning Trajectory-Word Alignments for Video-Language Tasks: Xu Yang,

Zhangzikang Li,

Haiyang Xu,

Hanwang Zhang,

Qinghao Ye,

Chenliang Li,

Ming Yan,

Yu Zhang,

Fei Huang,

Songfang Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Xu and Li, Zhangzikang and Xu, Haiyang and Zhang, Hanwang and Ye, Qinghao and Li, Chenliang and Yan, Ming and Zhang, Yu and Huang, Fei and Huang, Songfang},
  title     = {Learning Trajectory-Word Alignments for Video-Language Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2504--2514},
}
OrthoPlanes: A Novel Representation for Better 3D-Awareness of GANs: Honglin He,

Zhuoqian Yang,

Shikai Li,

Bo Dai,

Wayne Wu; [pdf] [supp]
[bibtex]
@InProceedings{He_2023_ICCV,
  author    = {He, Honglin and Yang, Zhuoqian and Li, Shikai and Dai, Bo and Wu, Wayne},
  title     = {{OrthoPlanes}: A Novel Representation for Better {3D-Awareness} of {GANs}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22996--23007},
}
Geometry-guided Feature Learning and Fusion for Indoor Scene Reconstruction: Ruihong Yin,

Sezer Karaoglu,

Theo Gevers; [pdf] [supp]
[bibtex]
@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Ruihong and Karaoglu, Sezer and Gevers, Theo},
  title     = {Geometry-guided Feature Learning and Fusion for Indoor Scene Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3652--3661},
}
Atmospheric Transmission and Thermal Inertia Induced Blind Road Segmentation with a Large-Scale Dataset TBRSD: Junzhang Chen,

Xiangzhi Bai; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Junzhang and Bai, Xiangzhi},
  title     = {Atmospheric Transmission and Thermal Inertia Induced Blind Road Segmentation with a Large-Scale Dataset {TBRSD}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1053--1063},
}
NeTO: Neural Reconstruction of Transparent Objects with Self-Occlusion Aware Refraction-Tracing: Zongcheng Li,

Xiaoxiao Long,

Yusen Wang,

Tuo Cao,

Wenping Wang,

Fei Luo,

Chunxia Xiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zongcheng and Long, Xiaoxiao and Wang, Yusen and Cao, Tuo and Wang, Wenping and Luo, Fei and Xiao, Chunxia},
  title     = {{NeTO}: Neural Reconstruction of Transparent Objects with Self-Occlusion Aware Refraction-Tracing},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18547--18557},
}
Boosting 3-DoF Ground-to-Satellite Camera Localization Accuracy via Geometry-Guided Cross-View Transformer: Yujiao Shi,

Fei Wu,

Akhil Perincherry,

Ankit Vora,

Hongdong Li; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Yujiao and Wu, Fei and Perincherry, Akhil and Vora, Ankit and Li, Hongdong},
  title     = {Boosting {3-DoF} Ground-to-Satellite Camera Localization Accuracy via Geometry-Guided Cross-View Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21516--21526},
}
Efficient-VQGAN: Towards High-Resolution Image Generation with Efficient Vision Transformers: Shiyue Cao,

Yueqin Yin,

Lianghua Huang,

Yu Liu,

Xin Zhao,

Deli Zhao,

Kaigi Huang; [pdf]
[bibtex]
@InProceedings{Cao_2023_ICCV,
  author    = {Cao, Shiyue and Yin, Yueqin and Huang, Lianghua and Liu, Yu and Zhao, Xin and Zhao, Deli and Huang, Kaigi},
  title     = {{Efficient-VQGAN}: Towards High-Resolution Image Generation with Efficient Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7368--7377},
}
DLGSANet: Lightweight Dynamic Local and Global Self-Attention Networks for Image Super-Resolution: Xiang Li,

Jiangxin Dong,

Jinhui Tang,

Jinshan Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiang and Dong, Jiangxin and Tang, Jinhui and Pan, Jinshan},
  title     = {{DLGSANet}: Lightweight Dynamic Local and Global Self-Attention Networks for Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12792--12801},
}
Adaptive Reordering Sampler with Neurally Guided MAGSAC: Tong Wei,

Jiri Matas,

Daniel Barath; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Tong and Matas, Jiri and Barath, Daniel},
  title     = {Adaptive Reordering Sampler with Neurally Guided {MAGSAC}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18163--18173},
}
Learning Cross-Representation Affinity Consistency for Sparsely Supervised Biomedical Instance Segmentation: Xiaoyu Liu,

Wei Huang,

Zhiwei Xiong,

Shenglong Zhou,

Yueyi Zhang,

Xuejin Chen,

Zheng-Jun Zha,

Feng Wu; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xiaoyu and Huang, Wei and Xiong, Zhiwei and Zhou, Shenglong and Zhang, Yueyi and Chen, Xuejin and Zha, Zheng-Jun and Wu, Feng},
  title     = {Learning Cross-Representation Affinity Consistency for Sparsely Supervised Biomedical Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21107--21117},
}
Black-Box Unsupervised Domain Adaptation with Bi-Directional Atkinson-Shiffrin Memory: Jingyi Zhang,

Jiaxing Huang,

Xueying Jiang,

Shijian Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jingyi and Huang, Jiaxing and Jiang, Xueying and Lu, Shijian},
  title     = {Black-Box Unsupervised Domain Adaptation with Bi-Directional {Atkinson-Shiffrin} Memory},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11771--11782},
}
Towards Fair and Comprehensive Comparisons for Image-Based 3D Object Detection: Xinzhu Ma,

Yongtao Wang,

Yinmin Zhang,

Zhiyi Xia,

Yuan Meng,

Zhihui Wang,

Haojie Li,

Wanli Ouyang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Xinzhu and Wang, Yongtao and Zhang, Yinmin and Xia, Zhiyi and Meng, Yuan and Wang, Zhihui and Li, Haojie and Ouyang, Wanli},
  title     = {Towards Fair and Comprehensive Comparisons for Image-Based {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6425--6435},
}
Disentangling Spatial and Temporal Learning for Efficient Image-to-Video Transfer Learning: Zhiwu Qing,

Shiwei Zhang,

Ziyuan Huang,

Yingya Zhang,

Changxin Gao,

Deli Zhao,

Nong Sang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qing_2023_ICCV,
  author    = {Qing, Zhiwu and Zhang, Shiwei and Huang, Ziyuan and Zhang, Yingya and Gao, Changxin and Zhao, Deli and Sang, Nong},
  title     = {Disentangling Spatial and Temporal Learning for Efficient Image-to-Video Transfer Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13934--13944},
}
A Skeletonization Algorithm for Gradient-Based Optimization: Martin J. Menten,

Johannes C. Paetzold,

Veronika A. Zimmer,

Suprosanna Shit,

Ivan Ezhov,

Robbie Holland,

Monika Probst,

Julia A. Schnabel,

Daniel Rueckert; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Menten_2023_ICCV,
  author    = {Menten, Martin J. and Paetzold, Johannes C. and Zimmer, Veronika A. and Shit, Suprosanna and Ezhov, Ivan and Holland, Robbie and Probst, Monika and Schnabel, Julia A. and Rueckert, Daniel},
  title     = {A Skeletonization Algorithm for Gradient-Based Optimization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21394--21403},
}
V3Det: Vast Vocabulary Visual Detection Dataset: Jiaqi Wang,

Pan Zhang,

Tao Chu,

Yuhang Cao,

Yujie Zhou,

Tong Wu,

Bin Wang,

Conghui He,

Dahua Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jiaqi and Zhang, Pan and Chu, Tao and Cao, Yuhang and Zhou, Yujie and Wu, Tong and Wang, Bin and He, Conghui and Lin, Dahua},
  title     = {{V3Det}: Vast Vocabulary Visual Detection Dataset},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19844--19854},
}
Coarse-to-Fine: Learning Compact Discriminative Representation for Single-Stage Image Retrieval: Yunquan Zhu,

Xinkai Gao,

Bo Ke,

Ruizhi Qiao,

Xing Sun; [pdf]
[bibtex]
@InProceedings{Zhu_2023_ICCV,
  author    = {Zhu, Yunquan and Gao, Xinkai and Ke, Bo and Qiao, Ruizhi and Sun, Xing},
  title     = {Coarse-to-Fine: Learning Compact Discriminative Representation for Single-Stage Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11260--11269},
}
Multi-weather Image Restoration via Domain Translation: Prashant W. Patil,

Sunil Gupta,

Santu Rana,

Svetha Venkatesh,

Subrahmanyam Murala; [pdf] [supp]
[bibtex]
@InProceedings{Patil_2023_ICCV,
  author    = {Patil, Prashant W. and Gupta, Sunil and Rana, Santu and Venkatesh, Svetha and Murala, Subrahmanyam},
  title     = {Multi-weather Image Restoration via Domain Translation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21696--21705},
}
Deep Fusion Transformer Network with Weighted Vector-Wise Keypoints Voting for Robust 6D Object Pose Estimation: Jun Zhou,

Kai Chen,

Linlin Xu,

Qi Dou,

Jing Qin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Jun and Chen, Kai and Xu, Linlin and Dou, Qi and Qin, Jing},
  title     = {Deep Fusion Transformer Network with Weighted Vector-Wise Keypoints Voting for Robust {6D} Object Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13967--13977},
}
BT^2: Backward-compatible Training with Basis Transformation: Yifei Zhou,

Zilu Li,

Abhinav Shrivastava,

Hengshuang Zhao,

Antonio Torralba,

Taipeng Tian,

Ser-Nam Lim; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yifei and Li, Zilu and Shrivastava, Abhinav and Zhao, Hengshuang and Torralba, Antonio and Tian, Taipeng and Lim, Ser-Nam},
  title     = {{BT{\textasciicircum}2}: Backward-compatible Training with Basis Transformation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11229--11238},
}
ViperGPT: Visual Inference via Python Execution for Reasoning: Dídac Surís,

Sachit Menon,

Carl Vondrick; [pdf] [supp]
[bibtex]
@InProceedings{Suris_2023_ICCV,
  author    = {Sur{\'\i}s, D{\'\i}dac and Menon, Sachit and Vondrick, Carl},
  title     = {{ViperGPT}: Visual Inference via {Python} Execution for Reasoning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11888--11898},
}
Improving Unsupervised Visual Program Inference with Code Rewriting Families: Aditya Ganeshan,

R. Kenny Jones,

Daniel Ritchie; [pdf] [supp]
[bibtex]
@InProceedings{Ganeshan_2023_ICCV,
  author    = {Ganeshan, Aditya and Jones, R. Kenny and Ritchie, Daniel},
  title     = {Improving Unsupervised Visual Program Inference with Code Rewriting Families},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15791--15801},
}
Essential Matrix Estimation using Convex Relaxations in Orthogonal Space: Arman Karimian,

Roberto Tron; [pdf] [supp]
[bibtex]
@InProceedings{Karimian_2023_ICCV,
  author    = {Karimian, Arman and Tron, Roberto},
  title     = {Essential Matrix Estimation using Convex Relaxations in Orthogonal Space},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17142--17152},
}
Concept-wise Fine-tuning Matters in Preventing Negative Transfer: Yunqiao Yang,

Long-Kai Huang,

Ying Wei; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Yunqiao and Huang, Long-Kai and Wei, Ying},
  title     = {Concept-wise Fine-tuning Matters in Preventing Negative Transfer},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18753--18763},
}
Learning Human Dynamics in Autonomous Driving Scenarios: Jingbo Wang,

Ye Yuan,

Zhengyi Luo,

Kevin Xie,

Dahua Lin,

Umar Iqbal,

Sanja Fidler,

Sameh Khamis; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Jingbo and Yuan, Ye and Luo, Zhengyi and Xie, Kevin and Lin, Dahua and Iqbal, Umar and Fidler, Sanja and Khamis, Sameh},
  title     = {Learning Human Dynamics in Autonomous Driving Scenarios},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20796--20806},
}
Fine-grained Visible Watermark Removal: Li Niu,

Xing Zhao,

Bo Zhang,

Liqing Zhang; [pdf]
[bibtex]
@InProceedings{Niu_2023_ICCV,
  author    = {Niu, Li and Zhao, Xing and Zhang, Bo and Zhang, Liqing},
  title     = {Fine-grained Visible Watermark Removal},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12770--12779},
}
DDP: Diffusion Model for Dense Visual Prediction: Yuanfeng Ji,

Zhe Chen,

Enze Xie,

Lanqing Hong,

Xihui Liu,

Zhaoqiang Liu,

Tong Lu,

Zhenguo Li,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ji_2023_ICCV,
  author    = {Ji, Yuanfeng and Chen, Zhe and Xie, Enze and Hong, Lanqing and Liu, Xihui and Liu, Zhaoqiang and Lu, Tong and Li, Zhenguo and Luo, Ping},
  title     = {{DDP}: Diffusion Model for Dense Visual Prediction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21741--21752},
}
Semantics-Consistent Feature Search for Self-Supervised Visual Representation Learning: Kaiyou Song,

Shan Zhang,

Zimeng Luo,

Tong Wang,

Jin Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Kaiyou and Zhang, Shan and Luo, Zimeng and Wang, Tong and Xie, Jin},
  title     = {Semantics-Consistent Feature Search for Self-Supervised Visual Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16099--16108},
}
GridMM: Grid Memory Map for Vision-and-Language Navigation: Zihan Wang,

Xiangyang Li,

Jiahao Yang,

Yeqi Liu,

Shuqiang Jiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Zihan and Li, Xiangyang and Yang, Jiahao and Liu, Yeqi and Jiang, Shuqiang},
  title     = {{GridMM}: Grid Memory Map for Vision-and-Language Navigation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15625--15636},
}
Probabilistic Modeling of Inter- and Intra-observer Variability in Medical Image Segmentation: Arne Schmidt,

Pablo Morales-Álvarez,

Rafael Molina; [pdf]
[bibtex]
@InProceedings{Schmidt_2023_ICCV,
  author    = {Schmidt, Arne and Morales-{\'A}lvarez, Pablo and Molina, Rafael},
  title     = {Probabilistic Modeling of Inter- and Intra-observer Variability in Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21097--21106},
}
LAC - Latent Action Composition for Skeleton-based Action Segmentation: Di Yang,

Yaohui Wang,

Antitza Dantcheva,

Quan Kong,

Lorenzo Garattoni,

Gianpiero Francesca,

Francois Bremond; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Di and Wang, Yaohui and Dantcheva, Antitza and Kong, Quan and Garattoni, Lorenzo and Francesca, Gianpiero and Bremond, Francois},
  title     = {{LAC} - Latent Action Composition for Skeleton-based Action Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13679--13690},
}
Learning Vision-and-Language Navigation from YouTube Videos: Kunyang Lin,

Peihao Chen,

Diwei Huang,

Thomas H. Li,

Mingkui Tan,

Chuang Gan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Kunyang and Chen, Peihao and Huang, Diwei and Li, Thomas H. and Tan, Mingkui and Gan, Chuang},
  title     = {Learning Vision-and-Language Navigation from {YouTube} Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8317--8326},
}
Total-Recon: Deformable Scene Reconstruction for Embodied View Synthesis: Chonghyuk Song,

Gengshan Yang,

Kangle Deng,

Jun-Yan Zhu,

Deva Ramanan; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Chonghyuk and Yang, Gengshan and Deng, Kangle and Zhu, Jun-Yan and Ramanan, Deva},
  title     = {{Total-Recon}: Deformable Scene Reconstruction for Embodied View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17671--17682},
}
AdaNIC: Towards Practical Neural Image Compression via Dynamic Transform Routing: Lvfang Tao,

Wei Gao,

Ge Li,

Chenhao Zhang; [pdf]
[bibtex]
@InProceedings{Tao_2023_ICCV,
  author    = {Tao, Lvfang and Gao, Wei and Li, Ge and Zhang, Chenhao},
  title     = {{AdaNIC}: Towards Practical Neural Image Compression via Dynamic Transform Routing},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16879--16888},
}
Uncertainty-aware State Space Transformer for Egocentric 3D Hand Trajectory Forecasting: Wentao Bao,

Lele Chen,

Libing Zeng,

Zhong Li,

Yi Xu,

Junsong Yuan,

Yu Kong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bao_2023_ICCV,
  author    = {Bao, Wentao and Chen, Lele and Zeng, Libing and Li, Zhong and Xu, Yi and Yuan, Junsong and Kong, Yu},
  title     = {Uncertainty-aware State Space Transformer for Egocentric {3D} Hand Trajectory Forecasting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13702--13711},
}
Pretrained Language Models as Visual Planners for Human Assistance: Dhruvesh Patel,

Hamid Eghbalzadeh,

Nitin Kamra,

Michael Louis Iuzzolino,

Unnat Jain,

Ruta Desai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Patel_2023_ICCV,
  author    = {Patel, Dhruvesh and Eghbalzadeh, Hamid and Kamra, Nitin and Iuzzolino, Michael Louis and Jain, Unnat and Desai, Ruta},
  title     = {Pretrained Language Models as Visual Planners for Human Assistance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {15302--15314},
}
Dynamic Point Fields: Sergey Prokudin,

Qianli Ma,

Maxime Raafat,

Julien Valentin,

Siyu Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Prokudin_2023_ICCV,
  author    = {Prokudin, Sergey and Ma, Qianli and Raafat, Maxime and Valentin, Julien and Tang, Siyu},
  title     = {Dynamic Point Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7964--7976},
}
Lip2Vec: Efficient and Robust Visual Speech Recognition via Latent-to-Latent Visual to Audio Representation Mapping: Yasser Abdelaziz Dahou Djilali,

Sanath Narayan,

Haithem Boussaid,

Ebtessam Almazrouei,

Merouane Debbah; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Djilali_2023_ICCV,
  author    = {Djilali, Yasser Abdelaziz Dahou and Narayan, Sanath and Boussaid, Haithem and Almazrouei, Ebtessam and Debbah, Merouane},
  title     = {{Lip2Vec}: Efficient and Robust Visual Speech Recognition via Latent-to-Latent Visual to Audio Representation Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13790--13801},
}
Privacy Preserving Localization via Coordinate Permutations: Linfei Pan,

Johannes L. Schönberger,

Viktor Larsson,

Marc Pollefeys; [pdf] [supp]
[bibtex]
@InProceedings{Pan_2023_ICCV,
  author    = {Pan, Linfei and Sch{\"o}nberger, Johannes L. and Larsson, Viktor and Pollefeys, Marc},
  title     = {Privacy Preserving Localization via Coordinate Permutations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18174--18183},
}
Random Boxes Are Open-world Object Detectors: Yanghao Wang,

Zhongqi Yue,

Xian-Sheng Hua,

Hanwang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yanghao and Yue, Zhongqi and Hua, Xian-Sheng and Zhang, Hanwang},
  title     = {Random Boxes Are Open-world Object Detectors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6233--6243},
}
DiffDreamer: Towards Consistent Unsupervised Single-view Scene Extrapolation with Conditional Diffusion Models: Shengqu Cai,

Eric Ryan Chan,

Songyou Peng,

Mohamad Shahbazi,

Anton Obukhov,

Luc Van Gool,

Gordon Wetzstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Shengqu and Chan, Eric Ryan and Peng, Songyou and Shahbazi, Mohamad and Obukhov, Anton and Van Gool, Luc and Wetzstein, Gordon},
  title     = {{DiffDreamer}: Towards Consistent Unsupervised Single-view Scene Extrapolation with Conditional Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2139--2150},
}
Spectral Graphormer: Spectral Graph-Based Transformer for Egocentric Two-Hand Reconstruction using Multi-View Color Images: Tze Ho Elden Tse,

Franziska Mueller,

Zhengyang Shen,

Danhang Tang,

Thabo Beeler,

Mingsong Dou,

Yinda Zhang,

Sasa Petrovic,

Hyung Jin Chang,

Jonathan Taylor,

Bardia Doosti; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tse_2023_ICCV,
  author    = {Tse, Tze Ho Elden and Mueller, Franziska and Shen, Zhengyang and Tang, Danhang and Beeler, Thabo and Dou, Mingsong and Zhang, Yinda and Petrovic, Sasa and Chang, Hyung Jin and Taylor, Jonathan and Doosti, Bardia},
  title     = {Spectral {Graphormer}: Spectral Graph-Based Transformer for Egocentric Two-Hand Reconstruction using Multi-View Color Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14666--14677},
}
SMMix: Self-Motivated Image Mixing for Vision Transformers: Mengzhao Chen,

Mingbao Lin,

Zhihang Lin,

Yuxin Zhang,

Fei Chao,

Rongrong Ji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Mengzhao and Lin, Mingbao and Lin, Zhihang and Zhang, Yuxin and Chao, Fei and Ji, Rongrong},
  title     = {{SMMix}: Self-Motivated Image Mixing for Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17260--17270},
}
Enhancing Adversarial Robustness in Low-Label Regime via Adaptively Weighted Regularization and Knowledge Distillation: Dongyoon Yang,

Insung Kong,

Yongdai Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Dongyoon and Kong, Insung and Kim, Yongdai},
  title     = {Enhancing Adversarial Robustness in Low-Label Regime via Adaptively Weighted Regularization and Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4552--4561},
}
Recovering a Molecule's 3D Dynamics from Liquid-phase Electron Microscopy Movies: Enze Ye,

Yuhang Wang,

Hong Zhang,

Yiqin Gao,

Huan Wang,

He Sun; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Enze and Wang, Yuhang and Zhang, Hong and Gao, Yiqin and Wang, Huan and Sun, He},
  title     = {Recovering a Molecule's {3D} Dynamics from Liquid-phase Electron Microscopy Movies},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10767--10777},
}
Reconciling Object-Level and Global-Level Objectives for Long-Tail Detection: Shaoyu Zhang,

Chen Chen,

Silong Peng; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Shaoyu and Chen, Chen and Peng, Silong},
  title     = {Reconciling Object-Level and Global-Level Objectives for Long-Tail Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18982--18992},
}
In-Style: Bridging Text and Uncurated Videos with Style Transfer for Text-Video Retrieval: Nina Shvetsova,

Anna Kukleva,

Bernt Schiele,

Hilde Kuehne; [pdf] [supp]
[bibtex]
@InProceedings{Shvetsova_2023_ICCV,
  author    = {Shvetsova, Nina and Kukleva, Anna and Schiele, Bernt and Kuehne, Hilde},
  title     = {{In-Style}: Bridging Text and Uncurated Videos with Style Transfer for Text-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21981--21992},
}
MIMO-NeRF: Fast Neural Rendering with Multi-input Multi-output Neural Radiance Fields: Takuhiro Kaneko; [pdf] [supp]
[bibtex]
@InProceedings{Kaneko_2023_ICCV,
  author    = {Kaneko, Takuhiro},
  title     = {{MIMO-NeRF}: Fast Neural Rendering with Multi-input Multi-output Neural Radiance Fields},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3273--3283},
}
Instance Neural Radiance Field: Yichen Liu,

Benran Hu,

Junkai Huang,

Yu-Wing Tai,

Chi-Keung Tang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yichen and Hu, Benran and Huang, Junkai and Tai, Yu-Wing and Tang, Chi-Keung},
  title     = {Instance Neural Radiance Field},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {787--796},
}
One-bit Flip is All You Need: When Bit-flip Attack Meets Model Training: Jianshuo Dong,

Han Qiu,

Yiming Li,

Tianwei Zhang,

Yuanjie Li,

Zeqi Lai,

Chao Zhang,

Shu-Tao Xia; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV,
  author    = {Dong, Jianshuo and Qiu, Han and Li, Yiming and Zhang, Tianwei and Li, Yuanjie and Lai, Zeqi and Zhang, Chao and Xia, Shu-Tao},
  title     = {One-bit Flip is All You Need: When Bit-flip Attack Meets Model Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4688--4698},
}
CLIPTER: Looking at the Bigger Picture in Scene Text Recognition: Aviad Aberdam,

David Bensaid,

Alona Golts,

Roy Ganz,

Oren Nuriel,

Royee Tichauer,

Shai Mazor,

Ron Litman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Aberdam_2023_ICCV,
  author    = {Aberdam, Aviad and Bensaid, David and Golts, Alona and Ganz, Roy and Nuriel, Oren and Tichauer, Royee and Mazor, Shai and Litman, Ron},
  title     = {{CLIPTER}: Looking at the Bigger Picture in Scene Text Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21706--21717},
}
Revisiting Scene Text Recognition: A Data Perspective: Qing Jiang,

Jiapeng Wang,

Dezhi Peng,

Chongyu Liu,

Lianwen Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Qing and Wang, Jiapeng and Peng, Dezhi and Liu, Chongyu and Jin, Lianwen},
  title     = {Revisiting Scene Text Recognition: A Data Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20543--20554},
}
Improving CLIP Fine-tuning Performance: Yixuan Wei,

Han Hu,

Zhenda Xie,

Ze Liu,

Zheng Zhang,

Yue Cao,

Jianmin Bao,

Dong Chen,

Baining Guo; [pdf] [supp]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yixuan and Hu, Han and Xie, Zhenda and Liu, Ze and Zhang, Zheng and Cao, Yue and Bao, Jianmin and Chen, Dong and Guo, Baining},
  title     = {Improving {CLIP} Fine-tuning Performance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5439--5449},
}
The Power of Sound (TPoS): Audio Reactive Video Generation with Stable Diffusion: Yujin Jeong,

Wonjeong Ryoo,

Seunghyun Lee,

Dabin Seo,

Wonmin Byeon,

Sangpil Kim,

Jinkyu Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jeong_2023_ICCV,
  author    = {Jeong, Yujin and Ryoo, Wonjeong and Lee, Seunghyun and Seo, Dabin and Byeon, Wonmin and Kim, Sangpil and Kim, Jinkyu},
  title     = {The Power of Sound ({TPoS}): Audio Reactive Video Generation with {Stable Diffusion}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7822--7832},
}
SOCS: Semantically-Aware Object Coordinate Space for Category-Level 6D Object Pose Estimation under Large Shape Variations: Boyan Wan,

Yifei Shi,

Kai Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wan_2023_ICCV,
  author    = {Wan, Boyan and Shi, Yifei and Xu, Kai},
  title     = {{SOCS}: Semantically-Aware Object Coordinate Space for Category-Level {6D} Object Pose Estimation under Large Shape Variations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14065--14074},
}
NeRF-LOAM: Neural Implicit Representation for Large-Scale Incremental LiDAR Odometry and Mapping: Junyuan Deng,

Qi Wu,

Xieyuanli Chen,

Songpengcheng Xia,

Zhen Sun,

Guoqing Liu,

Wenxian Yu,

Ling Pei; [pdf] [supp]
[bibtex]
@InProceedings{Deng_2023_ICCV,
  author    = {Deng, Junyuan and Wu, Qi and Chen, Xieyuanli and Xia, Songpengcheng and Sun, Zhen and Liu, Guoqing and Yu, Wenxian and Pei, Ling},
  title     = {{NeRF-LOAM}: Neural Implicit Representation for Large-Scale Incremental {LiDAR} Odometry and Mapping},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8218--8227},
}
DINAR: Diffusion Inpainting of Neural Textures for One-Shot Human Avatars: David Svitov,

Dmitrii Gudkov,

Renat Bashirov,

Victor Lempitsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Svitov_2023_ICCV,
  author    = {Svitov, David and Gudkov, Dmitrii and Bashirov, Renat and Lempitsky, Victor},
  title     = {{DINAR}: Diffusion Inpainting of Neural Textures for One-Shot Human Avatars},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7062--7072},
}
DPM-OT: A New Diffusion Probabilistic Model Based on Optimal Transport: Zezeng Li,

Shenghao Li,

Zhanpeng Wang,

Na Lei,

Zhongxuan Luo,

David Xianfeng Gu; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Zezeng and Li, Shenghao and Wang, Zhanpeng and Lei, Na and Luo, Zhongxuan and Gu, David Xianfeng},
  title     = {{DPM-OT}: A New Diffusion Probabilistic Model Based on Optimal Transport},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22624--22633},
}
ElasticViT: Conflict-aware Supernet Training for Deploying Fast Vision Transformer on Diverse Mobile Devices: Chen Tang,

Li Lyna Zhang,

Huiqiang Jiang,

Jiahang Xu,

Ting Cao,

Quanlu Zhang,

Yuqing Yang,

Zhi Wang,

Mao Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Chen and Zhang, Li Lyna and Jiang, Huiqiang and Xu, Jiahang and Cao, Ting and Zhang, Quanlu and Yang, Yuqing and Wang, Zhi and Yang, Mao},
  title     = {{ElasticViT}: Conflict-aware Supernet Training for Deploying Fast Vision Transformer on Diverse Mobile Devices},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5829--5840},
}
OmniLabel: A Challenging Benchmark for Language-Based Object Detection: Samuel Schulter,

Vijay Kumar B G,

Yumin Suh,

Konstantinos M. Dafnis,

Zhixing Zhang,

Shiyu Zhao,

Dimitris Metaxas; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Schulter_2023_ICCV,
  author    = {Schulter, Samuel and G, Vijay Kumar B and Suh, Yumin and Dafnis, Konstantinos M. and Zhang, Zhixing and Zhao, Shiyu and Metaxas, Dimitris},
  title     = {{OmniLabel}: A Challenging Benchmark for Language-Based Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11953--11962},
}
Noise-Aware Learning from Web-Crawled Image-Text Data for Image Captioning: Wooyoung Kang,

Jonghwan Mun,

Sungjun Lee,

Byungseok Roh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2023_ICCV,
  author    = {Kang, Wooyoung and Mun, Jonghwan and Lee, Sungjun and Roh, Byungseok},
  title     = {Noise-Aware Learning from Web-Crawled Image-Text Data for Image Captioning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2942--2952},
}
Divide&Classify: Fine-Grained Classification for City-Wide Visual Geo-Localization: Gabriele Trivigno,

Gabriele Berton,

Juan Aragon,

Barbara Caputo,

Carlo Masone; [pdf] [supp]
[bibtex]
@InProceedings{Trivigno_2023_ICCV,
  author    = {Trivigno, Gabriele and Berton, Gabriele and Aragon, Juan and Caputo, Barbara and Masone, Carlo},
  title     = {{Divide\&Classify}: Fine-Grained Classification for City-Wide Visual Geo-Localization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11142--11152},
}
3D Semantic Subspace Traverser: Empowering 3D Generative Model with Shape Editing Capability: Ruowei Wang,

Yu Liu,

Pei Su,

Jianwei Zhang,

Qijun Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ruowei and Liu, Yu and Su, Pei and Zhang, Jianwei and Zhao, Qijun},
  title     = {{3D} Semantic Subspace Traverser: Empowering {3D} Generative Model with Shape Editing Capability},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14406--14417},
}
Inherent Redundancy in Spiking Neural Networks: Man Yao,

Jiakui Hu,

Guangshe Zhao,

Yaoyuan Wang,

Ziyang Zhang,

Bo Xu,

Guoqi Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yao_2023_ICCV,
  author    = {Yao, Man and Hu, Jiakui and Zhao, Guangshe and Wang, Yaoyuan and Zhang, Ziyang and Xu, Bo and Li, Guoqi},
  title     = {Inherent Redundancy in Spiking Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16924--16934},
}
Text2Room: Extracting Textured 3D Meshes from 2D Text-to-Image Models: Lukas Höllein,

Ang Cao,

Andrew Owens,

Justin Johnson,

Matthias Nießner; [pdf] [supp]
[bibtex]
@InProceedings{Hollein_2023_ICCV,
  author    = {H{\"o}llein, Lukas and Cao, Ang and Owens, Andrew and Johnson, Justin and Nie{\ss}ner, Matthias},
  title     = {{Text2Room}: Extracting Textured {3D} Meshes from {2D} Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {7909--7920},
}
On the Robustness of Normalizing Flows for Inverse Problems in Imaging: Seongmin Hong,

Inbum Park,

Se Young Chun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2023_ICCV,
  author    = {Hong, Seongmin and Park, Inbum and Chun, Se Young},
  title     = {On the Robustness of Normalizing Flows for Inverse Problems in Imaging},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10745--10755},
}
FastRecon: Few-shot Industrial Anomaly Detection via Fast Feature Reconstruction: Zheng Fang,

Xiaoyang Wang,

Haocheng Li,

Jiejie Liu,

Qiugui Hu,

Jimin Xiao; [pdf]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Zheng and Wang, Xiaoyang and Li, Haocheng and Liu, Jiejie and Hu, Qiugui and Xiao, Jimin},
  title     = {{FastRecon}: Few-shot Industrial Anomaly Detection via Fast Feature Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17481--17490},
}
Local or Global: Selective Knowledge Assimilation for Federated Learning with Limited Labels: Yae Jee Cho,

Gauri Joshi,

Dimitrios Dimitriadis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2023_ICCV,
    author    = {Cho, Yae Jee and Joshi, Gauri and Dimitriadis, Dimitrios},
    title     = {Local or Global: Selective Knowledge Assimilation for Federated Learning with Limited Labels},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17087--17096}
}
DistillBEV: Boosting Multi-Camera 3D Object Detection with Cross-Modal Knowledge Distillation: Zeyu Wang,

Dingwen Li,

Chenxu Luo,

Cihang Xie,

Xiaodong Yang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Zeyu and Li, Dingwen and Luo, Chenxu and Xie, Cihang and Yang, Xiaodong},
    title     = {{DistillBEV}: Boosting Multi-Camera {3D} Object Detection with Cross-Modal Knowledge Distillation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {8637--8646}
}
PoseFix: Correcting 3D Human Poses with Natural Language: Ginger Delmas,

Philippe Weinzaepfel,

Francesc Moreno-Noguer,

Grégory Rogez; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Delmas_2023_ICCV,
    author    = {Delmas, Ginger and Weinzaepfel, Philippe and Moreno-Noguer, Francesc and Rogez, Gr{\'e}gory},
    title     = {{PoseFix}: Correcting {3D} Human Poses with Natural Language},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15018--15028}
}
TAPIR: Tracking Any Point with Per-Frame Initialization and Temporal Refinement: Carl Doersch,

Yi Yang,

Mel Vecerik,

Dilara Gokay,

Ankush Gupta,

Yusuf Aytar,

Joao Carreira,

Andrew Zisserman; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Doersch_2023_ICCV,
    author    = {Doersch, Carl and Yang, Yi and Vecerik, Mel and Gokay, Dilara and Gupta, Ankush and Aytar, Yusuf and Carreira, Joao and Zisserman, Andrew},
    title     = {{TAPIR}: Tracking Any Point with Per-Frame Initialization and Temporal Refinement},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {10061--10072}
}
SwinLSTM: Improving Spatiotemporal Prediction Accuracy using Swin Transformer and LSTM: Song Tang,

Chuang Li,

Pu Zhang,

RongNian Tang; [pdf] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
    author    = {Tang, Song and Li, Chuang and Zhang, Pu and Tang, RongNian},
    title     = {{SwinLSTM}: Improving Spatiotemporal Prediction Accuracy using {Swin} Transformer and {LSTM}},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13470--13479}
}
Detecting Objects with Context-Likelihood Graphs and Graph Refinement: Aritra Bhowmik,

Yu Wang,

Nora Baka,

Martin R. Oswald,

Cees G. M. Snoek; [pdf]
[bibtex]
@InProceedings{Bhowmik_2023_ICCV,
    author    = {Bhowmik, Aritra and Wang, Yu and Baka, Nora and Oswald, Martin R. and Snoek, Cees G. M.},
    title     = {Detecting Objects with Context-Likelihood Graphs and Graph Refinement},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6524--6533}
}
Coarse-to-Fine Amodal Segmentation with Shape Prior: Jianxiong Gao,

Xuelin Qian,

Yikai Wang,

Tianjun Xiao,

Tong He,

Zheng Zhang,

Yanwei Fu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV,
    author    = {Gao, Jianxiong and Qian, Xuelin and Wang, Yikai and Xiao, Tianjun and He, Tong and Zhang, Zheng and Fu, Yanwei},
    title     = {Coarse-to-Fine Amodal Segmentation with Shape Prior},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1262--1271}
}
DEDRIFT: Robust Similarity Search under Content Drift: Dmitry Baranchuk,

Matthijs Douze,

Yash Upadhyay,

I. Zeki Yalniz; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Baranchuk_2023_ICCV,
    author    = {Baranchuk, Dmitry and Douze, Matthijs and Upadhyay, Yash and Yalniz, I. Zeki},
    title     = {{DEDRIFT}: Robust Similarity Search under Content Drift},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11026--11035}
}
Learning Pseudo-Relations for Cross-domain Semantic Segmentation: Dong Zhao,

Shuang Wang,

Qi Zang,

Dou Quan,

Xiutiao Ye,

Rui Yang,

Licheng Jiao; [pdf] [supp]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
    author    = {Zhao, Dong and Wang, Shuang and Zang, Qi and Quan, Dou and Ye, Xiutiao and Yang, Rui and Jiao, Licheng},
    title     = {Learning Pseudo-Relations for Cross-domain Semantic Segmentation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19191--19203}
}
AdVerb: Visually Guided Audio Dereverberation: Sanjoy Chowdhury,

Sreyan Ghosh,

Subhrajyoti Dasgupta,

Anton Ratnarajah,

Utkarsh Tyagi,

Dinesh Manocha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chowdhury_2023_ICCV,
    author    = {Chowdhury, Sanjoy and Ghosh, Sreyan and Dasgupta, Subhrajyoti and Ratnarajah, Anton and Tyagi, Utkarsh and Manocha, Dinesh},
    title     = {{AdVerb}: Visually Guided Audio Dereverberation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7884--7896}
}
Audio-Enhanced Text-to-Video Retrieval using Text-Conditioned Feature Alignment: Sarah Ibrahimi,

Xiaohang Sun,

Pichao Wang,

Amanmeet Garg,

Ashutosh Sanan,

Mohamed Omar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ibrahimi_2023_ICCV,
    author    = {Ibrahimi, Sarah and Sun, Xiaohang and Wang, Pichao and Garg, Amanmeet and Sanan, Ashutosh and Omar, Mohamed},
    title     = {Audio-Enhanced Text-to-Video Retrieval using Text-Conditioned Feature Alignment},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12054--12064}
}
Open-vocabulary Object Segmentation with Diffusion Models: Ziyi Li,

Qinye Zhou,

Xiaoyun Zhang,

Ya Zhang,

Yanfeng Wang,

Weidi Xie; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Ziyi and Zhou, Qinye and Zhang, Xiaoyun and Zhang, Ya and Wang, Yanfeng and Xie, Weidi},
    title     = {Open-vocabulary Object Segmentation with Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7667--7676}
}
Human-centric Scene Understanding for 3D Large-scale Scenarios: Yiteng Xu,

Peishan Cong,

Yichen Yao,

Runnan Chen,

Yuenan Hou,

Xinge Zhu,

Xuming He,

Jingyi Yu,

Yuexin Ma; [pdf] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Yiteng and Cong, Peishan and Yao, Yichen and Chen, Runnan and Hou, Yuenan and Zhu, Xinge and He, Xuming and Yu, Jingyi and Ma, Yuexin},
    title     = {Human-centric Scene Understanding for {3D} Large-scale Scenarios},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20349--20359}
}
With a Little Help from Your Own Past: Prototypical Memory Networks for Image Captioning: Manuele Barraco,

Sara Sarto,

Marcella Cornia,

Lorenzo Baraldi,

Rita Cucchiara; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Barraco_2023_ICCV,
    author    = {Barraco, Manuele and Sarto, Sara and Cornia, Marcella and Baraldi, Lorenzo and Cucchiara, Rita},
    title     = {With a Little Help from Your Own Past: Prototypical Memory Networks for Image Captioning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3021--3031}
}
SimMatchV2: Semi-Supervised Learning with Graph Consistency: Mingkai Zheng,

Shan You,

Lang Huang,

Chen Luo,

Fei Wang,

Chen Qian,

Chang Xu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Mingkai and You, Shan and Huang, Lang and Luo, Chen and Wang, Fei and Qian, Chen and Xu, Chang},
    title     = {{SimMatchV2}: Semi-Supervised Learning with Graph Consistency},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {16432--16442}
}
Reinforced Disentanglement for Face Swapping without Skip Connection: Xiaohang Ren,

Xingyu Chen,

Pengfei Yao,

Heung-Yeung Shum,

Baoyuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV,
    author    = {Ren, Xiaohang and Chen, Xingyu and Yao, Pengfei and Shum, Heung-Yeung and Wang, Baoyuan},
    title     = {Reinforced Disentanglement for Face Swapping without Skip Connection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20665--20675}
}
PDiscoNet: Semantically consistent part discovery for fine-grained recognition: Robert van der Klis,

Stephan Alaniz,

Massimiliano Mancini,

Cassio F. Dantas,

Dino Ienco,

Zeynep Akata,

Diego Marcos; [pdf] [arXiv]
[bibtex]
@InProceedings{van_der_Klis_2023_ICCV,
    author    = {van der Klis, Robert and Alaniz, Stephan and Mancini, Massimiliano and Dantas, Cassio F. and Ienco, Dino and Akata, Zeynep and Marcos, Diego},
    title     = {{PDiscoNet}: Semantically consistent part discovery for fine-grained recognition},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1866--1876}
}
Privacy-Preserving Face Recognition Using Random Frequency Components: Yuxi Mi,

Yuge Huang,

Jiazhen Ji,

Minyi Zhao,

Jiaxiang Wu,

Xingkun Xu,

Shouhong Ding,

Shuigeng Zhou; [pdf] [arXiv]
[bibtex]
@InProceedings{Mi_2023_ICCV,
    author    = {Mi, Yuxi and Huang, Yuge and Ji, Jiazhen and Zhao, Minyi and Wu, Jiaxiang and Xu, Xingkun and Ding, Shouhong and Zhou, Shuigeng},
    title     = {Privacy-Preserving Face Recognition Using Random Frequency Components},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19673--19684}
}
Vision Transformer Adapters for Generalizable Multitask Learning: Deblina Bhattacharjee,

Sabine Süsstrunk,

Mathieu Salzmann; [pdf] [supp]
[bibtex]
@InProceedings{Bhattacharjee_2023_ICCV,
    author    = {Bhattacharjee, Deblina and S{\"u}sstrunk, Sabine and Salzmann, Mathieu},
    title     = {Vision Transformer Adapters for Generalizable Multitask Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {19015--19026}
}
How to Choose your Best Allies for a Transferable Attack?: Thibault Maho,

Seyed-Mohsen Moosavi-Dezfooli,

Teddy Furon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Maho_2023_ICCV,
    author    = {Maho, Thibault and Moosavi-Dezfooli, Seyed-Mohsen and Furon, Teddy},
    title     = {How to Choose your Best Allies for a Transferable Attack?},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4542--4551}
}
CVRecon: Rethinking 3D Geometric Feature Learning For Neural Reconstruction: Ziyue Feng,

Liang Yang,

Pengsheng Guo,

Bing Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
    author    = {Feng, Ziyue and Yang, Liang and Guo, Pengsheng and Li, Bing},
    title     = {{CVRecon}: Rethinking {3D} Geometric Feature Learning For Neural Reconstruction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17750--17760}
}
Self-Supervised Object Detection from Egocentric Videos: Peri Akiva,

Jing Huang,

Kevin J Liang,

Rama Kovvuri,

Xingyu Chen,

Matt Feiszli,

Kristin Dana,

Tal Hassner; [pdf] [supp]
[bibtex]
@InProceedings{Akiva_2023_ICCV,
    author    = {Akiva, Peri and Huang, Jing and Liang, Kevin J and Kovvuri, Rama and Chen, Xingyu and Feiszli, Matt and Dana, Kristin and Hassner, Tal},
    title     = {Self-Supervised Object Detection from Egocentric Videos},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5225--5237}
}
Prior-guided Source-free Domain Adaptation for Human Pose Estimation: Dripta S. Raychaudhuri,

Calvin-Khang Ta,

Arindam Dutta,

Rohit Lal,

Amit K. Roy-Chowdhury; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Raychaudhuri_2023_ICCV,
    author    = {Raychaudhuri, Dripta S. and Ta, Calvin-Khang and Dutta, Arindam and Lal, Rohit and Roy-Chowdhury, Amit K.},
    title     = {Prior-guided Source-free Domain Adaptation for Human Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14996--15006}
}
ClothesNet: An Information-Rich 3D Garment Model Repository with Simulated Clothes Environment: Bingyang Zhou,

Haoyu Zhou,

Tianhai Liang,

Qiaojun Yu,

Siheng Zhao,

Yuwei Zeng,

Jun Lv,

Siyuan Luo,

Qiancai Wang,

Xinyuan Yu,

Haonan Chen,

Cewu Lu,

Lin Shao; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Bingyang and Zhou, Haoyu and Liang, Tianhai and Yu, Qiaojun and Zhao, Siheng and Zeng, Yuwei and Lv, Jun and Luo, Siyuan and Wang, Qiancai and Yu, Xinyuan and Chen, Haonan and Lu, Cewu and Shao, Lin},
    title     = {{ClothesNet}: An Information-Rich {3D} Garment Model Repository with Simulated Clothes Environment},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {20428--20438}
}
Auxiliary Tasks Benefit 3D Skeleton-based Human Motion Prediction: Chenxin Xu,

Robby T. Tan,

Yuhong Tan,

Siheng Chen,

Xinchao Wang,

Yanfeng Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
    author    = {Xu, Chenxin and Tan, Robby T. and Tan, Yuhong and Chen, Siheng and Wang, Xinchao and Wang, Yanfeng},
    title     = {Auxiliary Tasks Benefit {3D} Skeleton-based Human Motion Prediction},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9509--9520}
}
Measuring Asymmetric Gradient Discrepancy in Parallel Continual Learning: Fan Lyu,

Qing Sun,

Fanhua Shang,

Liang Wan,

Wei Feng; [pdf] [supp]
[bibtex]
@InProceedings{Lyu_2023_ICCV,
    author    = {Lyu, Fan and Sun, Qing and Shang, Fanhua and Wan, Liang and Feng, Wei},
    title     = {Measuring Asymmetric Gradient Discrepancy in Parallel Continual Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {11411--11420}
}
StyleLipSync: Style-based Personalized Lip-sync Video Generation: Taekyung Ki,

Dongchan Min; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ki_2023_ICCV,
    author    = {Ki, Taekyung and Min, Dongchan},
    title     = {{StyleLipSync}: Style-based Personalized Lip-sync Video Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22841--22850}
}
Cross Contrasting Feature Perturbation for Domain Generalization: Chenming Li,

Daoan Zhang,

Wenjian Huang,

Jianguo Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Chenming and Zhang, Daoan and Huang, Wenjian and Zhang, Jianguo},
    title     = {Cross Contrasting Feature Perturbation for Domain Generalization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1327--1337}
}
DiffusionRet: Generative Text-Video Retrieval with Diffusion Model: Peng Jin,

Hao Li,

Zesen Cheng,

Kehan Li,

Xiangyang Ji,

Chang Liu,

Li Yuan,

Jie Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2023_ICCV,
    author    = {Jin, Peng and Li, Hao and Cheng, Zesen and Li, Kehan and Ji, Xiangyang and Liu, Chang and Yuan, Li and Chen, Jie},
    title     = {{DiffusionRet}: Generative Text-Video Retrieval with Diffusion Model},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2470--2481}
}
Efficient 3D Semantic Segmentation with Superpoint Transformer: Damien Robert,

Hugo Raguet,

Loic Landrieu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Robert_2023_ICCV,
    author    = {Robert, Damien and Raguet, Hugo and Landrieu, Loic},
    title     = {Efficient {3D} Semantic Segmentation with Superpoint Transformer},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17195--17204}
}
Adversarial Finetuning with Latent Representation Constraint to Mitigate Accuracy-Robustness Tradeoff: Satoshi Suzuki,

Shin'ya Yamaguchi,

Shoichiro Takeda,

Sekitoshi Kanai,

Naoki Makishima,

Atsushi Ando,

Ryo Masumura; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Suzuki_2023_ICCV,
    author    = {Suzuki, Satoshi and Yamaguchi, Shin'ya and Takeda, Shoichiro and Kanai, Sekitoshi and Makishima, Naoki and Ando, Atsushi and Masumura, Ryo},
    title     = {Adversarial Finetuning with Latent Representation Constraint to Mitigate Accuracy-Robustness Tradeoff},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4390--4401}
}
HyperDiffusion: Generating Implicit Neural Fields with Weight-Space Diffusion: Ziya Erkoç,

Fangchang Ma,

Qi Shan,

Matthias Nießner,

Angela Dai; [pdf] [supp]
[bibtex]
@InProceedings{Erkoc_2023_ICCV,
    author    = {Erko{\c{c}}, Ziya and Ma, Fangchang and Shan, Qi and Nie{\ss}ner, Matthias and Dai, Angela},
    title     = {{HyperDiffusion}: Generating Implicit Neural Fields with Weight-Space Diffusion},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14300--14310}
}
Retinexformer: One-stage Retinex-based Transformer for Low-light Image Enhancement: Yuanhao Cai,

Hao Bian,

Jing Lin,

Haoqian Wang,

Radu Timofte,

Yulun Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Cai_2023_ICCV,
    author    = {Cai, Yuanhao and Bian, Hao and Lin, Jing and Wang, Haoqian and Timofte, Radu and Zhang, Yulun},
    title     = {Retinexformer: One-stage {Retinex}-based Transformer for Low-light Image Enhancement},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12504--12513}
}
Minimum Latency Deep Online Video Stabilization: Zhuofan Zhang,

Zhen Liu,

Ping Tan,

Bing Zeng,

Shuaicheng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
    author    = {Zhang, Zhuofan and Liu, Zhen and Tan, Ping and Zeng, Bing and Liu, Shuaicheng},
    title     = {Minimum Latency Deep Online Video Stabilization},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23030--23039}
}
Speech2Lip: High-fidelity Speech to Lip Generation by Learning from a Short Video: Xiuzhe Wu,

Pengfei Hu,

Yang Wu,

Xiaoyang Lyu,

Yan-Pei Cao,

Ying Shan,

Wenming Yang,

Zhongqian Sun,

Xiaojuan Qi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
    author    = {Wu, Xiuzhe and Hu, Pengfei and Wu, Yang and Lyu, Xiaoyang and Cao, Yan-Pei and Shan, Ying and Yang, Wenming and Sun, Zhongqian and Qi, Xiaojuan},
    title     = {{Speech2Lip}: High-fidelity Speech to Lip Generation by Learning from a Short Video},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22168--22177}
}
UHDNeRF: Ultra-High-Definition Neural Radiance Fields: Quewei Li,

Feichao Li,

Jie Guo,

Yanwen Guo; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Quewei and Li, Feichao and Guo, Jie and Guo, Yanwen},
    title     = {{UHDNeRF}: Ultra-High-Definition Neural Radiance Fields},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23097--23108}
}
Linear Spaces of Meanings: Compositional Structures in Vision-Language Models: Matthew Trager,

Pramuditha Perera,

Luca Zancato,

Alessandro Achille,

Parminder Bhatia,

Stefano Soatto; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Trager_2023_ICCV,
    author    = {Trager, Matthew and Perera, Pramuditha and Zancato, Luca and Achille, Alessandro and Bhatia, Parminder and Soatto, Stefano},
    title     = {Linear Spaces of Meanings: Compositional Structures in Vision-Language Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15395--15404}
}
MULLER: Multilayer Laplacian Resizer for Vision: Zhengzhong Tu,

Peyman Milanfar,

Hossein Talebi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tu_2023_ICCV,
    author    = {Tu, Zhengzhong and Milanfar, Peyman and Talebi, Hossein},
    title     = {{MULLER}: Multilayer {Laplacian} Resizer for Vision},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {6877--6887}
}
X-VoE: Measuring eXplanatory Violation of Expectation in Physical Events: Bo Dai,

Linge Wang,

Baoxiong Jia,

Zeyu Zhang,

Song-Chun Zhu,

Chi Zhang,

Yixin Zhu; [pdf] [supp]
[bibtex]
@InProceedings{Dai_2023_ICCV,
    author    = {Dai, Bo and Wang, Linge and Jia, Baoxiong and Zhang, Zeyu and Zhu, Song-Chun and Zhang, Chi and Zhu, Yixin},
    title     = {{X-VoE}: Measuring {eXplanatory} Violation of Expectation in Physical Events},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {3992--4002}
}
Tracking by Natural Language Specification with Long Short-term Context Decoupling: Ding Ma,

Xiangqian Wu; [pdf]
[bibtex]
@InProceedings{Ma_2023_ICCV,
    author    = {Ma, Ding and Wu, Xiangqian},
    title     = {Tracking by Natural Language Specification with Long Short-term Context Decoupling},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14012--14021}
}
COOP: Decoupling and Coupling of Whole-Body Grasping Pose Generation: Yanzhao Zheng,

Yunzhou Shi,

Yuhao Cui,

Zhongzhou Zhao,

Zhiling Luo,

Wei Zhou; [pdf]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
    author    = {Zheng, Yanzhao and Shi, Yunzhou and Cui, Yuhao and Zhao, Zhongzhou and Luo, Zhiling and Zhou, Wei},
    title     = {{COOP}: Decoupling and Coupling of Whole-Body Grasping Pose Generation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {2163--2173}
}
Pyramid Dual Domain Injection Network for Pan-sharpening: Xuanhua He,

Keyu Yan,

Rui Li,

Chengjun Xie,

Jie Zhang,

Man Zhou; [pdf]
[bibtex]
@InProceedings{He_2023_ICCV,
    author    = {He, Xuanhua and Yan, Keyu and Li, Rui and Xie, Chengjun and Zhang, Jie and Zhou, Man},
    title     = {Pyramid Dual Domain Injection Network for Pan-sharpening},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {12908--12917}
}
Why do networks have inhibitory/negative connections?: Qingyang Wang,

Mike A. Powell,

Ali Geisa,

Eric Bridgeford,

Carey E. Priebe,

Joshua T. Vogelstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
    author    = {Wang, Qingyang and Powell, Mike A. and Geisa, Ali and Bridgeford, Eric and Priebe, Carey E. and Vogelstein, Joshua T.},
    title     = {Why do networks have inhibitory/negative connections?},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22551--22559}
}
Ordinal Label Distribution Learning: Changsong Wen,

Xin Zhang,

Xingxu Yao,

Jufeng Yang; [pdf]
[bibtex]
@InProceedings{Wen_2023_ICCV,
    author    = {Wen, Changsong and Zhang, Xin and Yao, Xingxu and Yang, Jufeng},
    title     = {Ordinal Label Distribution Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {23481--23491}
}
Model Calibration in Dense Classification with Adaptive Label Perturbation: Jiawei Liu,

Changkun Ye,

Shan Wang,

Ruikai Cui,

Jing Zhang,

Kaihao Zhang,

Nick Barnes; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
    author    = {Liu, Jiawei and Ye, Changkun and Wang, Shan and Cui, Ruikai and Zhang, Jing and Zhang, Kaihao and Barnes, Nick},
    title     = {Model Calibration in Dense Classification with Adaptive Label Perturbation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {1173--1184}
}
Boosting Multi-modal Model Performance with Adaptive Gradient Modulation: Hong Li,

Xingyu Li,

Pengbo Hu,

Yinuo Lei,

Chunxiao Li,

Yi Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Hong and Li, Xingyu and Hu, Pengbo and Lei, Yinuo and Li, Chunxiao and Zhou, Yi},
    title     = {Boosting Multi-modal Model Performance with Adaptive Gradient Modulation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22214--22224}
}
Semantic Information in Contrastive Learning: Shengjiang Quan,

Masahiro Hirano,

Yuji Yamakawa; [pdf] [supp]
[bibtex]
@InProceedings{Quan_2023_ICCV,
    author    = {Quan, Shengjiang and Hirano, Masahiro and Yamakawa, Yuji},
    title     = {Semantic Information in Contrastive Learning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {5686--5696}
}
Structure and Content-Guided Video Synthesis with Diffusion Models: Patrick Esser,

Johnathan Chiu,

Parmida Atighehchian,

Jonathan Granskog,

Anastasis Germanidis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Esser_2023_ICCV,
    author    = {Esser, Patrick and Chiu, Johnathan and Atighehchian, Parmida and Granskog, Jonathan and Germanidis, Anastasis},
    title     = {Structure and Content-Guided Video Synthesis with Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {7346--7356}
}
NeSS-ST: Detecting Good and Stable Keypoints with a Neural Stability Score and the Shi-Tomasi detector: Konstantin Pakulev,

Alexander Vakhitov,

Gonzalo Ferrer; [pdf] [supp]
[bibtex]
@InProceedings{Pakulev_2023_ICCV,
    author    = {Pakulev, Konstantin and Vakhitov, Alexander and Ferrer, Gonzalo},
    title     = {{NeSS-ST}: Detecting Good and Stable Keypoints with a Neural Stability Score and the {Shi-Tomasi} detector},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9578--9588}
}
Beyond Skin Tone: A Multidimensional Measure of Apparent Skin Color: William Thong,

Przemyslaw Joniak,

Alice Xiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Thong_2023_ICCV,
    author    = {Thong, William and Joniak, Przemyslaw and Xiang, Alice},
    title     = {Beyond Skin Tone: A Multidimensional Measure of Apparent Skin Color},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {4903--4913}
}
PODA: Prompt-driven Zero-shot Domain Adaptation: Mohammad Fahes,

Tuan-Hung Vu,

Andrei Bursuc,

Patrick Pérez,

Raoul de Charette; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Fahes_2023_ICCV,
    author    = {Fahes, Mohammad and Vu, Tuan-Hung and Bursuc, Andrei and P{\'e}rez, Patrick and de Charette, Raoul},
    title     = {{PODA}: Prompt-driven Zero-shot Domain Adaptation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {18623--18633}
}
Video Action Segmentation via Contextually Refined Temporal Keypoints: Borui Jiang,

Yang Jin,

Zhentao Tan,

Yadong Mu; [pdf] [supp]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
    author    = {Jiang, Borui and Jin, Yang and Tan, Zhentao and Mu, Yadong},
    title     = {Video Action Segmentation via Contextually Refined Temporal Keypoints},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {13836--13845}
}
Shatter and Gather: Learning Referring Image Segmentation with Text Supervision: Dongwon Kim,

Namyup Kim,

Cuiling Lan,

Suha Kwak; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2023_ICCV,
    author    = {Kim, Dongwon and Kim, Namyup and Lan, Cuiling and Kwak, Suha},
    title     = {Shatter and Gather: Learning Referring Image Segmentation with Text Supervision},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {15547--15557}
}
Two-in-One Depth: Bridging the Gap Between Monocular and Binocular Self-Supervised Depth Estimation: Zhengming Zhou,

Qiulei Dong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Zhengming and Dong, Qiulei},
    title     = {Two-in-One Depth: Bridging the Gap Between Monocular and Binocular Self-Supervised Depth Estimation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9411--9421}
}
SAFL-Net: Semantic-Agnostic Feature Learning Network with Auxiliary Plugins for Image Manipulation Detection: Zhihao Sun,

Haoran Jiang,

Danding Wang,

Xirong Li,

Juan Cao; [pdf] [supp]
[bibtex]
@InProceedings{Sun_2023_ICCV,
    author    = {Sun, Zhihao and Jiang, Haoran and Wang, Danding and Li, Xirong and Cao, Juan},
    title     = {{SAFL-Net}: Semantic-Agnostic Feature Learning Network with Auxiliary Plugins for Image Manipulation Detection},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {22424--22433}
}
DataDAM: Efficient Dataset Distillation with Attention Matching: Ahmad Sajedi,

Samir Khaki,

Ehsan Amjadian,

Lucy Z. Liu,

Yuri A. Lawryshyn,

Konstantinos N. Plataniotis; [pdf] [supp]
[bibtex]
@InProceedings{Sajedi_2023_ICCV,
    author    = {Sajedi, Ahmad and Khaki, Samir and Amjadian, Ehsan and Liu, Lucy Z. and Lawryshyn, Yuri A. and Plataniotis, Konstantinos N.},
    title     = {{DataDAM}: Efficient Dataset Distillation with Attention Matching},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {17097--17107}
}
Rethinking Pose Estimation in Crowds: Overcoming the Detection Information Bottleneck and Ambiguity: Mu Zhou,

Lucas Stoffl,

Mackenzie Weygandt Mathis,

Alexander Mathis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
    author    = {Zhou, Mu and Stoffl, Lucas and Mathis, Mackenzie Weygandt and Mathis, Alexander},
    title     = {Rethinking Pose Estimation in Crowds: Overcoming the Detection Information Bottleneck and Ambiguity},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {14689--14699}
}
Social Diffusion: Long-term Multiple Human Motion Anticipation: Julian Tanke,

Linguang Zhang,

Amy Zhao,

Chengcheng Tang,

Yujun Cai,

Lezi Wang,

Po-Chen Wu,

Juergen Gall,

Cem Keskin; [pdf] [supp]
[bibtex]
@InProceedings{Tanke_2023_ICCV,
    author    = {Tanke, Julian and Zhang, Linguang and Zhao, Amy and Tang, Chengcheng and Cai, Yujun and Wang, Lezi and Wu, Po-Chen and Gall, Juergen and Keskin, Cem},
    title     = {Social Diffusion: Long-term Multiple Human Motion Anticipation},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    month     = oct,
    year      = {2023},
    pages     = {9601--9611}
}
Synchronize Feature Extracting and Matching: A Single Branch Framework for 3D Object Tracking: Teli Ma,

Mengmeng Wang,

Jimin Xiao,

Huifeng Wu,

Yong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Teli and Wang, Mengmeng and Xiao, Jimin and Wu, Huifeng and Liu, Yong},
  title     = {Synchronize Feature Extracting and Matching: A Single Branch Framework for {3D} Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9953--9963},
}
Leveraging Intrinsic Properties for Non-Rigid Garment Alignment: Siyou Lin,

Boyao Zhou,

Zerong Zheng,

Hongwen Zhang,

Yebin Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2023_ICCV,
  author    = {Lin, Siyou and Zhou, Boyao and Zheng, Zerong and Zhang, Hongwen and Liu, Yebin},
  title     = {Leveraging Intrinsic Properties for Non-Rigid Garment Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14485--14496},
}
NeILF++: Inter-Reflectable Light Fields for Geometry and Material Estimation: Jingyang Zhang,

Yao Yao,

Shiwei Li,

Jingbo Liu,

Tian Fang,

David McKinnon,

Yanghai Tsin,

Long Quan; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Jingyang and Yao, Yao and Li, Shiwei and Liu, Jingbo and Fang, Tian and McKinnon, David and Tsin, Yanghai and Quan, Long},
  title     = {{NeILF++}: Inter-Reflectable Light Fields for Geometry and Material Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3601--3610},
}
MAGI: Multi-Annotated Explanation-Guided Learning: Yifei Zhang,

Siyi Gu,

Yuyang Gao,

Bo Pan,

Xiaofeng Yang,

Liang Zhao; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Yifei and Gu, Siyi and Gao, Yuyang and Pan, Bo and Yang, Xiaofeng and Zhao, Liang},
  title     = {{MAGI}: Multi-Annotated Explanation-Guided Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1977--1987},
}
Adaptive Positional Encoding for Bundle-Adjusting Neural Radiance Fields: Zelin Gao,

Weichen Dai,

Yu Zhang; [pdf]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Zelin and Dai, Weichen and Zhang, Yu},
  title     = {Adaptive Positional Encoding for Bundle-Adjusting Neural Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3284--3294},
}
Inducing Neural Collapse to a Fixed Hierarchy-Aware Frame for Reducing Mistake Severity: Tong Liang,

Jim Davis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liang_2023_ICCV,
  author    = {Liang, Tong and Davis, Jim},
  title     = {Inducing Neural Collapse to a Fixed Hierarchy-Aware Frame for Reducing Mistake Severity},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1443--1452},
}
PlanarTrack: A Large-scale Challenging Benchmark for Planar Object Tracking: Xinran Liu,

Xiaoqiong Liu,

Ziruo Yi,

Xin Zhou,

Thanh Le,

Libo Zhang,

Yan Huang,

Qing Yang,

Heng Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Xinran and Liu, Xiaoqiong and Yi, Ziruo and Zhou, Xin and Le, Thanh and Zhang, Libo and Huang, Yan and Yang, Qing and Fan, Heng},
  title     = {{PlanarTrack}: A Large-scale Challenging Benchmark for Planar Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20449--20458},
}
Factorized Inverse Path Tracing for Efficient and Accurate Material-Lighting Estimation: Liwen Wu,

Rui Zhu,

Mustafa B. Yaldiz,

Yinhao Zhu,

Hong Cai,

Janarbek Matai,

Fatih Porikli,

Tzu-Mao Li,

Manmohan Chandraker,

Ravi Ramamoorthi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Liwen and Zhu, Rui and Yaldiz, Mustafa B. and Zhu, Yinhao and Cai, Hong and Matai, Janarbek and Porikli, Fatih and Li, Tzu-Mao and Chandraker, Manmohan and Ramamoorthi, Ravi},
  title     = {Factorized Inverse Path Tracing for Efficient and Accurate Material-Lighting Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3848--3858},
}
P2C: Self-Supervised Point Cloud Completion from Single Partial Clouds: Ruikai Cui,

Shi Qiu,

Saeed Anwar,

Jiawei Liu,

Chaoyue Xing,

Jing Zhang,

Nick Barnes; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cui_2023_ICCV,
  author    = {Cui, Ruikai and Qiu, Shi and Anwar, Saeed and Liu, Jiawei and Xing, Chaoyue and Zhang, Jing and Barnes, Nick},
  title     = {{P2C}: Self-Supervised Point Cloud Completion from Single Partial Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14351--14360},
}
Overwriting Pretrained Bias with Finetuning Data: Angelina Wang,

Olga Russakovsky; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Angelina and Russakovsky, Olga},
  title     = {Overwriting Pretrained Bias with Finetuning Data},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3957--3968},
}
Anti-DreamBooth: Protecting Users from Personalized Text-to-image Synthesis: Thanh Van Le,

Hao Phung,

Thuan Hoang Nguyen,

Quan Dao,

Ngoc N. Tran,

Anh Tran; [pdf] [supp]
[bibtex]
@InProceedings{Van_Le_2023_ICCV,
  author    = {Van Le, Thanh and Phung, Hao and Nguyen, Thuan Hoang and Dao, Quan and Tran, Ngoc N. and Tran, Anh},
  title     = {{Anti-DreamBooth}: Protecting Users from Personalized Text-to-image Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2116--2127},
}
Contrastive Continuity on Augmentation Stability Rehearsal for Continual Self-Supervised Learning: Haoyang Cheng,

Haitao Wen,

Xiaoliang Zhang,

Heqian Qiu,

Lanxiao Wang,

Hongliang Li; [pdf] [supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Haoyang and Wen, Haitao and Zhang, Xiaoliang and Qiu, Heqian and Wang, Lanxiao and Li, Hongliang},
  title     = {Contrastive Continuity on Augmentation Stability Rehearsal for Continual Self-Supervised Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5707--5717},
}
Treating Pseudo-labels Generation as Image Matting for Weakly Supervised Semantic Segmentation: Changwei Wang,

Rongtao Xu,

Shibiao Xu,

Weiliang Meng,

Xiaopeng Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Changwei and Xu, Rongtao and Xu, Shibiao and Meng, Weiliang and Zhang, Xiaopeng},
  title     = {Treating Pseudo-labels Generation as Image Matting for Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {755--765},
}
Structural Alignment for Network Pruning through Partial Regularization: Shangqian Gao,

Zeyu Zhang,

Yanfu Zhang,

Feihu Huang,

Heng Huang; [pdf] [supp]
[bibtex]
@InProceedings{Gao_2023_ICCV,
  author    = {Gao, Shangqian and Zhang, Zeyu and Zhang, Yanfu and Huang, Feihu and Huang, Heng},
  title     = {Structural Alignment for Network Pruning through Partial Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17402--17412},
}
Learning Long-Range Information with Dual-Scale Transformers for Indoor Scene Completion: Ziqi Wang,

Fei Luo,

Xiaoxiao Long,

Wenxiao Zhang,

Chunxia Xiao; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ziqi and Luo, Fei and Long, Xiaoxiao and Zhang, Wenxiao and Xiao, Chunxia},
  title     = {Learning Long-Range Information with Dual-Scale Transformers for Indoor Scene Completion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18569--18579},
}
A Game of Bundle Adjustment - Learning Efficient Convergence: Amir Belder,

Refael Vivanti,

Ayellet Tal; [pdf]
[bibtex]
@InProceedings{Belder_2023_ICCV,
  author    = {Belder, Amir and Vivanti, Refael and Tal, Ayellet},
  title     = {A Game of Bundle Adjustment - Learning Efficient Convergence},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8428--8437},
}
Learning Correction Filter via Degradation-Adaptive Regression for Blind Single Image Super-Resolution: Hongyang Zhou,

Xiaobin Zhu,

Jianqing Zhu,

Zheng Han,

Shi-Xue Zhang,

Jingyan Qin,

Xu-Cheng Yin; [pdf] [supp]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Hongyang and Zhu, Xiaobin and Zhu, Jianqing and Han, Zheng and Zhang, Shi-Xue and Qin, Jingyan and Yin, Xu-Cheng},
  title     = {Learning Correction Filter via Degradation-Adaptive Regression for Blind Single Image Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12365--12375},
}
UMFuse: Unified Multi View Fusion for Human Editing Applications: Rishabh Jain,

Mayur Hemani,

Duygu Ceylan,

Krishna Kumar Singh,

Jingwan Lu,

Mausoom Sarkar,

Balaji Krishnamurthy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jain_2023_ICCV,
  author    = {Jain, Rishabh and Hemani, Mayur and Ceylan, Duygu and Singh, Krishna Kumar and Lu, Jingwan and Sarkar, Mausoom and Krishnamurthy, Balaji},
  title     = {{UMFuse}: Unified Multi View Fusion for Human Editing Applications},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7182--7191},
}
CROSSFIRE: Camera Relocalization On Self-Supervised Features from an Implicit Representation: Arthur Moreau,

Nathan Piasco,

Moussab Bennehar,

Dzmitry Tsishkou,

Bogdan Stanciulescu,

Arnaud de La Fortelle; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moreau_2023_ICCV,
  author    = {Moreau, Arthur and Piasco, Nathan and Bennehar, Moussab and Tsishkou, Dzmitry and Stanciulescu, Bogdan and de La Fortelle, Arnaud},
  title     = {{CROSSFIRE}: Camera Relocalization On Self-Supervised Features from an Implicit Representation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {252--262},
}
Discriminative Class Tokens for Text-to-Image Diffusion Models: Idan Schwartz,

Vésteinn Snæbjarnarson,

Hila Chefer,

Serge Belongie,

Lior Wolf,

Sagie Benaim; [pdf] [supp]
[bibtex]
@InProceedings{Schwartz_2023_ICCV,
  author    = {Schwartz, Idan and Sn{\ae}bjarnarson, V{\'e}steinn and Chefer, Hila and Belongie, Serge and Wolf, Lior and Benaim, Sagie},
  title     = {Discriminative Class Tokens for Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22725--22735},
}
SINC: Spatial Composition of 3D Human Motions for Simultaneous Action Generation: Nikos Athanasiou,

Mathis Petrovich,

Michael J. Black,

Gül Varol; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Athanasiou_2023_ICCV,
  author    = {Athanasiou, Nikos and Petrovich, Mathis and Black, Michael J. and Varol, G{\"u}l},
  title     = {{SINC}: Spatial Composition of {3D} Human Motions for Simultaneous Action Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9984--9995},
}
ORC: Network Group-based Knowledge Distillation using Online Role Change: Junyong Choi,

Hyeon Cho,

Seokhwa Cheung,

Wonjun Hwang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Choi_2023_ICCV,
  author    = {Choi, Junyong and Cho, Hyeon and Cheung, Seokhwa and Hwang, Wonjun},
  title     = {{ORC}: Network Group-based Knowledge Distillation using Online Role Change},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17381--17390},
}
Audiovisual Masked Autoencoders: Mariana-Iuliana Georgescu,

Eduardo Fonseca,

Radu Tudor Ionescu,

Mario Lucic,

Cordelia Schmid,

Anurag Arnab; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Georgescu_2023_ICCV,
  author    = {Georgescu, Mariana-Iuliana and Fonseca, Eduardo and Ionescu, Radu Tudor and Lucic, Mario and Schmid, Cordelia and Arnab, Anurag},
  title     = {Audiovisual Masked Autoencoders},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16144--16154},
}
MV-DeepSDF: Implicit Modeling with Multi-Sweep Point Clouds for 3D Vehicle Reconstruction in Autonomous Driving: Yibo Liu,

Kelly Zhu,

Guile Wu,

Yuan Ren,

Bingbing Liu,

Yang Liu,

Jinjun Shan; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yibo and Zhu, Kelly and Wu, Guile and Ren, Yuan and Liu, Bingbing and Liu, Yang and Shan, Jinjun},
  title     = {{MV-DeepSDF}: Implicit Modeling with Multi-Sweep Point Clouds for {3D} Vehicle Reconstruction in Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8306--8316},
}
CHORD: Category-level Hand-held Object Reconstruction via Shape Deformation: Kailin Li,

Lixin Yang,

Haoyu Zhen,

Zenan Lin,

Xinyu Zhan,

Licheng Zhong,

Jian Xu,

Kejian Wu,

Cewu Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Kailin and Yang, Lixin and Zhen, Haoyu and Lin, Zenan and Zhan, Xinyu and Zhong, Licheng and Xu, Jian and Wu, Kejian and Lu, Cewu},
  title     = {{CHORD}: Category-level Hand-held Object Reconstruction via Shape Deformation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9444--9454},
}
Unmasking Anomalies in Road-Scene Segmentation: Shyam Nandan Rai,

Fabio Cermelli,

Dario Fontanel,

Carlo Masone,

Barbara Caputo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rai_2023_ICCV,
  author    = {Rai, Shyam Nandan and Cermelli, Fabio and Fontanel, Dario and Masone, Carlo and Caputo, Barbara},
  title     = {Unmasking Anomalies in Road-Scene Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4037--4046},
}
DomainDrop: Suppressing Domain-Sensitive Channels for Domain Generalization: Jintao Guo,

Lei Qi,

Yinghuan Shi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Jintao and Qi, Lei and Shi, Yinghuan},
  title     = {{DomainDrop}: Suppressing Domain-Sensitive Channels for Domain Generalization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19114--19124},
}
Towards Universal LiDAR-Based 3D Object Detection by Multi-Domain Knowledge Transfer: Guile Wu,

Tongtong Cao,

Bingbing Liu,

Xingxin Chen,

Yuan Ren; [pdf]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Guile and Cao, Tongtong and Liu, Bingbing and Chen, Xingxin and Ren, Yuan},
  title     = {Towards Universal {LiDAR}-Based {3D} Object Detection by Multi-Domain Knowledge Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8669--8678},
}
StyleInV: A Temporal Style Modulated Inversion Network for Unconditional Video Generation: Yuhan Wang,

Liming Jiang,

Chen Change Loy; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yuhan and Jiang, Liming and Loy, Chen Change},
  title     = {{StyleInV}: A Temporal Style Modulated Inversion Network for Unconditional Video Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22851--22861},
}
Self-Calibrated Cross Attention Network for Few-Shot Segmentation: Qianxiong Xu,

Wenting Zhao,

Guosheng Lin,

Cheng Long; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xu_2023_ICCV,
  author    = {Xu, Qianxiong and Zhao, Wenting and Lin, Guosheng and Long, Cheng},
  title     = {Self-Calibrated Cross Attention Network for Few-Shot Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {655--665},
}
Anatomical Invariance Modeling and Semantic Alignment for Self-supervised Learning in 3D Medical Image Analysis: Yankai Jiang,

Mingze Sun,

Heng Guo,

Xiaoyu Bai,

Ke Yan,

Le Lu,

Minfeng Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Yankai and Sun, Mingze and Guo, Heng and Bai, Xiaoyu and Yan, Ke and Lu, Le and Xu, Minfeng},
  title     = {Anatomical Invariance Modeling and Semantic Alignment for Self-supervised Learning in {3D} Medical Image Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15859--15869},
}
Towards High-Fidelity Text-Guided 3D Face Generation and Manipulation Using only Images: Cuican Yu,

Guansong Lu,

Yihan Zeng,

Jian Sun,

Xiaodan Liang,

Huibin Li,

Zongben Xu,

Songcen Xu,

Wei Zhang,

Hang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Cuican and Lu, Guansong and Zeng, Yihan and Sun, Jian and Liang, Xiaodan and Li, Huibin and Xu, Zongben and Xu, Songcen and Zhang, Wei and Xu, Hang},
  title     = {Towards High-Fidelity Text-Guided {3D} Face Generation and Manipulation Using only Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15326--15337},
}
SSDA: Secure Source-Free Domain Adaptation: Sabbir Ahmed,

Abdullah Al Arafat,

Mamshad Nayeem Rizve,

Rahim Hossain,

Zhishan Guo,

Adnan Siraj Rakin; [pdf] [supp]
[bibtex]
@InProceedings{Ahmed_2023_ICCV,
  author    = {Ahmed, Sabbir and Al Arafat, Abdullah and Rizve, Mamshad Nayeem and Hossain, Rahim and Guo, Zhishan and Rakin, Adnan Siraj},
  title     = {{SSDA}: Secure Source-Free Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19180--19190},
}
ENTL: Embodied Navigation Trajectory Learner: Klemen Kotar,

Aaron Walsman,

Roozbeh Mottaghi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kotar_2023_ICCV,
  author    = {Kotar, Klemen and Walsman, Aaron and Mottaghi, Roozbeh},
  title     = {{ENTL}: Embodied Navigation Trajectory Learner},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10863--10872},
}
AGG-Net: Attention Guided Gated-Convolutional Network for Depth Image Completion: Dongyue Chen,

Tingxuan Huang,

Zhimin Song,

Shizhuo Deng,

Tong Jia; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Dongyue and Huang, Tingxuan and Song, Zhimin and Deng, Shizhuo and Jia, Tong},
  title     = {{AGG-Net}: Attention Guided Gated-Convolutional Network for Depth Image Completion},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8853--8862},
}
Learning Global-aware Kernel for Image Harmonization: Xintian Shen,

Jiangning Zhang,

Jun Chen,

Shipeng Bai,

Yue Han,

Yabiao Wang,

Chengjie Wang,

Yong Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Shen_2023_ICCV,
  author    = {Shen, Xintian and Zhang, Jiangning and Chen, Jun and Bai, Shipeng and Han, Yue and Wang, Yabiao and Wang, Chengjie and Liu, Yong},
  title     = {Learning Global-aware Kernel for Image Harmonization},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7535--7544},
}
Real-Time Neural Rasterization for Large Scenes: Jeffrey Yunfan Liu,

Yun Chen,

Ze Yang,

Jingkang Wang,

Sivabalan Manivasagam,

Raquel Urtasun; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jeffrey Yunfan and Chen, Yun and Yang, Ze and Wang, Jingkang and Manivasagam, Sivabalan and Urtasun, Raquel},
  title     = {Real-Time Neural Rasterization for Large Scenes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8416--8427},
}
ESTextSpotter: Towards Better Scene Text Spotting with Explicit Synergy in Transformer: Mingxin Huang,

Jiaxin Zhang,

Dezhi Peng,

Hao Lu,

Can Huang,

Yuliang Liu,

Xiang Bai,

Lianwen Jin; [pdf] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Mingxin and Zhang, Jiaxin and Peng, Dezhi and Lu, Hao and Huang, Can and Liu, Yuliang and Bai, Xiang and Jin, Lianwen},
  title     = {{ESTextSpotter}: Towards Better Scene Text Spotting with Explicit Synergy in Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19495--19505},
}
UGC: Unified GAN Compression for Efficient Image-to-Image Translation: Yuxi Ren,

Jie Wu,

Peng Zhang,

Manlin Zhang,

Xuefeng Xiao,

Qian He,

Rui Wang,

Min Zheng,

Xin Pan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ren_2023_ICCV,
  author    = {Ren, Yuxi and Wu, Jie and Zhang, Peng and Zhang, Manlin and Xiao, Xuefeng and He, Qian and Wang, Rui and Zheng, Min and Pan, Xin},
  title     = {{UGC}: Unified {GAN} Compression for Efficient Image-to-Image Translation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17281--17291},
}
Efficient View Synthesis with Neural Radiance Distribution Field: Yushuang Wu,

Xiao Li,

Jinglu Wang,

Xiaoguang Han,

Shuguang Cui,

Yan Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Yushuang and Li, Xiao and Wang, Jinglu and Han, Xiaoguang and Cui, Shuguang and Lu, Yan},
  title     = {Efficient View Synthesis with Neural Radiance Distribution Field},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18506--18515},
}
MixSpeech: Cross-Modality Self-Learning with Audio-Visual Stream Mixup for Visual Speech Translation and Recognition: Xize Cheng,

Tao Jin,

Rongjie Huang,

Linjun Li,

Wang Lin,

Zehan Wang,

Ye Wang,

Huadai Liu,

Aoxiong Yin,

Zhou Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Xize and Jin, Tao and Huang, Rongjie and Li, Linjun and Lin, Wang and Wang, Zehan and Wang, Ye and Liu, Huadai and Yin, Aoxiong and Zhao, Zhou},
  title     = {{MixSpeech}: Cross-Modality Self-Learning with Audio-Visual Stream Mixup for Visual Speech Translation and Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15735--15745},
}
Chordal Averaging on Flag Manifolds and Its Applications: Nathan Mankovich,

Tolga Birdal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mankovich_2023_ICCV,
  author    = {Mankovich, Nathan and Birdal, Tolga},
  title     = {Chordal Averaging on Flag Manifolds and Its Applications},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3881--3890},
}
Towards Building More Robust Models with Frequency Bias: Qingwen Bu,

Dong Huang,

Heming Cui; [pdf] [arXiv]
[bibtex]
@InProceedings{Bu_2023_ICCV,
  author    = {Bu, Qingwen and Huang, Dong and Cui, Heming},
  title     = {Towards Building More Robust Models with Frequency Bias},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4402--4411},
}
SparseBEV: High-Performance Sparse 3D Object Detection from Multi-Camera Videos: Haisong Liu,

Yao Teng,

Tao Lu,

Haiguang Wang,

Limin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Haisong and Teng, Yao and Lu, Tao and Wang, Haiguang and Wang, Limin},
  title     = {{SparseBEV}: High-Performance Sparse {3D} Object Detection from Multi-Camera Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18580--18590},
}
Boosting Whole Slide Image Classification from the Perspectives of Distribution, Correlation and Magnification: Linhao Qu,

Zhiwei Yang,

Minghong Duan,

Yingfan Ma,

Shuo Wang,

Manning Wang,

Zhijian Song; [pdf]
[bibtex]
@InProceedings{Qu_2023_ICCV,
  author    = {Qu, Linhao and Yang, Zhiwei and Duan, Minghong and Ma, Yingfan and Wang, Shuo and Wang, Manning and Song, Zhijian},
  title     = {Boosting Whole Slide Image Classification from the Perspectives of Distribution, Correlation and Magnification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21463--21473},
}
PolicyCleanse: Backdoor Detection and Mitigation for Competitive Reinforcement Learning: Junfeng Guo,

Ang Li,

Lixu Wang,

Cong Liu; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Junfeng and Li, Ang and Wang, Lixu and Liu, Cong},
  title     = {{PolicyCleanse}: Backdoor Detection and Mitigation for Competitive Reinforcement Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4699--4708},
}
Ref-NeuS: Ambiguity-Reduced Neural Implicit Surface Learning for Multi-View Reconstruction with Reflection: Wenhang Ge,

Tao Hu,

Haoyu Zhao,

Shu Liu,

Ying-Cong Chen; [pdf] [supp]
[bibtex]
@InProceedings{Ge_2023_ICCV,
  author    = {Ge, Wenhang and Hu, Tao and Zhao, Haoyu and Liu, Shu and Chen, Ying-Cong},
  title     = {{Ref-NeuS}: Ambiguity-Reduced Neural Implicit Surface Learning for Multi-View Reconstruction with Reflection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4251--4260},
}
Innovating Real Fisheye Image Correction with Dual Diffusion Architecture: Shangrong Yang,

Chunyu Lin,

Kang Liao,

Yao Zhao; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Shangrong and Lin, Chunyu and Liao, Kang and Zhao, Yao},
  title     = {Innovating Real Fisheye Image Correction with Dual Diffusion Architecture},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12699--12708},
}
Global Perception Based Autoregressive Neural Processes: Jinyang Tai; [pdf]
[bibtex]
@InProceedings{Tai_2023_ICCV,
  author    = {Tai, Jinyang},
  title     = {Global Perception Based Autoregressive Neural Processes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10487--10497},
}
Class-incremental Continual Learning for Instance Segmentation with Image-level Weak Supervision: Yu-Hsing Hsieh,

Guan-Sheng Chen,

Shun-Xian Cai,

Ting-Yun Wei,

Huei-Fang Yang,

Chu-Song Chen; [pdf] [supp]
[bibtex]
@InProceedings{Hsieh_2023_ICCV,
  author    = {Hsieh, Yu-Hsing and Chen, Guan-Sheng and Cai, Shun-Xian and Wei, Ting-Yun and Yang, Huei-Fang and Chen, Chu-Song},
  title     = {Class-incremental Continual Learning for Instance Segmentation with Image-level Weak Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1250--1261},
}
When Prompt-based Incremental Learning Does Not Meet Strong Pretraining: Yu-Ming Tang,

Yi-Xing Peng,

Wei-Shi Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Yu-Ming and Peng, Yi-Xing and Zheng, Wei-Shi},
  title     = {When Prompt-based Incremental Learning Does Not Meet Strong Pretraining},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1706--1716},
}
Multimodal High-order Relation Transformer for Scene Boundary Detection: Xi Wei,

Zhangxiang Shi,

Tianzhu Zhang,

Xiaoyuan Yu,

Lei Xiao; [pdf]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Xi and Shi, Zhangxiang and Zhang, Tianzhu and Yu, Xiaoyuan and Xiao, Lei},
  title     = {Multimodal High-order Relation Transformer for Scene Boundary Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22081--22090},
}
Tri-MipRF: Tri-Mip Representation for Efficient Anti-Aliasing Neural Radiance Fields: Wenbo Hu,

Yuling Wang,

Lin Ma,

Bangbang Yang,

Lin Gao,

Xiao Liu,

Yuewen Ma; [pdf]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Wenbo and Wang, Yuling and Ma, Lin and Yang, Bangbang and Gao, Lin and Liu, Xiao and Ma, Yuewen},
  title     = {{Tri-MipRF}: {Tri-Mip} Representation for Efficient Anti-Aliasing Neural Radiance Fields},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19774--19783},
}
LaRS: A Diverse Panoptic Maritime Obstacle Detection Dataset and Benchmark: Lojze Žust,

Janez Perš,

Matej Kristan; [pdf] [supp]
[bibtex]
@InProceedings{Zust_2023_ICCV,
  author    = {{\v{Z}}ust, Lojze and Per{\v{s}}, Janez and Kristan, Matej},
  title     = {{LaRS}: A Diverse Panoptic Maritime Obstacle Detection Dataset and Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20304--20314},
}
Exploring Transformers for Open-world Instance Segmentation: Jiannan Wu,

Yi Jiang,

Bin Yan,

Huchuan Lu,

Zehuan Yuan,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jiannan and Jiang, Yi and Yan, Bin and Lu, Huchuan and Yuan, Zehuan and Luo, Ping},
  title     = {Exploring Transformers for Open-world Instance Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {6611--6621},
}
VQA Therapy: Exploring Answer Differences by Visually Grounding Answers: Chongyan Chen,

Samreen Anjum,

Danna Gurari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Chongyan and Anjum, Samreen and Gurari, Danna},
  title     = {{VQA} Therapy: Exploring Answer Differences by Visually Grounding Answers},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15315--15325},
}
Energy-based Self-Training and Normalization for Unsupervised Domain Adaptation: Samitha Herath,

Basura Fernando,

Ehsan Abbasnejad,

Munawar Hayat,

Shahram Khadivi,

Mehrtash Harandi,

Hamid Rezatofighi,

Gholamreza Haffari; [pdf] [supp]
[bibtex]
@InProceedings{Herath_2023_ICCV,
  author    = {Herath, Samitha and Fernando, Basura and Abbasnejad, Ehsan and Hayat, Munawar and Khadivi, Shahram and Harandi, Mehrtash and Rezatofighi, Hamid and Haffari, Gholamreza},
  title     = {Energy-based Self-Training and Normalization for Unsupervised Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11653--11662},
}
Self-Evolved Dynamic Expansion Model for Task-Free Continual Learning: Fei Ye,

Adrian G. Bors; [pdf] [supp]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Fei and Bors, Adrian G.},
  title     = {Self-Evolved Dynamic Expansion Model for Task-Free Continual Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22102--22112},
}
Adaptive Template Transformer for Mitochondria Segmentation in Electron Microscopy Images: Yuwen Pan,

Naisong Luo,

Rui Sun,

Meng Meng,

Tianzhu Zhang,

Zhiwei Xiong,

Yongdong Zhang; [pdf]
[bibtex]
@InProceedings{Pan_2023_ICCV, author = {Pan, Yuwen and Luo, Naisong and Sun, Rui and Meng, Meng and Zhang, Tianzhu and Xiong, Zhiwei and Zhang, Yongdong}, title = {Adaptive Template Transformer for Mitochondria Segmentation in Electron Microscopy Images}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21474--21484} }
Collaborative Tracking Learning for Frame-Rate-Insensitive Multi-Object Tracking: Yiheng Liu,

Junta Wu,

Yi Fu; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Yiheng and Wu, Junta and Fu, Yi}, title = {Collaborative Tracking Learning for Frame-Rate-Insensitive Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {9964--9973} }
Tangent Model Composition for Ensembling and Continual Fine-tuning: Tian Yu Liu,

Stefano Soatto; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Tian Yu and Soatto, Stefano}, title = {Tangent Model Composition for Ensembling and Continual Fine-tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18676--18686} }
Knowledge-Spreader: Learning Semi-Supervised Facial Action Dynamics by Consistifying Knowledge Granularity: Xiaotian Li,

Xiang Zhang,

Taoyue Wang,

Lijun Yin; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Xiaotian and Zhang, Xiang and Wang, Taoyue and Yin, Lijun}, title = {{Knowledge-Spreader}: Learning Semi-Supervised Facial Action Dynamics by Consistifying Knowledge Granularity}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20979--20989} }
SSF: Accelerating Training of Spiking Neural Networks with Stabilized Spiking Flow: Jingtao Wang,

Zengjie Song,

Yuxi Wang,

Jun Xiao,

Yuran Yang,

Shuqi Mei,

Zhaoxiang Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Jingtao and Song, Zengjie and Wang, Yuxi and Xiao, Jun and Yang, Yuran and Mei, Shuqi and Zhang, Zhaoxiang}, title = {{SSF}: Accelerating Training of Spiking Neural Networks with Stabilized Spiking Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {5982--5991} }
Manipulate by Seeing: Creating Manipulation Controllers from Pre-Trained Representations: Jianren Wang,

Sudeep Dasari,

Mohan Kumar Srirama,

Shubham Tulsiani,

Abhinav Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Jianren and Dasari, Sudeep and Srirama, Mohan Kumar and Tulsiani, Shubham and Gupta, Abhinav}, title = {Manipulate by Seeing: Creating Manipulation Controllers from Pre-Trained Representations}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {3859--3868} }
Learning Human-Human Interactions in Images from Weak Textual Supervision: Morris Alper,

Hadar Averbuch-Elor; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alper_2023_ICCV, author = {Alper, Morris and Averbuch-Elor, Hadar}, title = {Learning Human-Human Interactions in Images from Weak Textual Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2887--2899} }
Prompt-aligned Gradient for Prompt Tuning: Beier Zhu,

Yulei Niu,

Yucheng Han,

Yue Wu,

Hanwang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Beier and Niu, Yulei and Han, Yucheng and Wu, Yue and Zhang, Hanwang}, title = {Prompt-aligned Gradient for Prompt Tuning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15659--15669} }
Aperture Diffraction for Compact Snapshot Spectral Imaging: Tao Lv,

Hao Ye,

Quan Yuan,

Zhan Shi,

Yibo Wang,

Shuming Wang,

Xun Cao; [pdf] [supp]
[bibtex]
@InProceedings{Lv_2023_ICCV, author = {Lv, Tao and Ye, Hao and Yuan, Quan and Shi, Zhan and Wang, Yibo and Wang, Shuming and Cao, Xun}, title = {Aperture Diffraction for Compact Snapshot Spectral Imaging}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {10574--10584} }
Diffusion Action Segmentation: Daochang Liu,

Qiyue Li,

Anh-Dung Dinh,

Tingting Jiang,

Mubarak Shah,

Chang Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Daochang and Li, Qiyue and Dinh, Anh-Dung and Jiang, Tingting and Shah, Mubarak and Xu, Chang}, title = {Diffusion Action Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {10139--10149} }
Prototype Reminiscence and Augmented Asymmetric Knowledge Aggregation for Non-Exemplar Class-Incremental Learning: Wuxuan Shi,

Mang Ye; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV, author = {Shi, Wuxuan and Ye, Mang}, title = {Prototype Reminiscence and Augmented Asymmetric Knowledge Aggregation for Non-Exemplar Class-Incremental Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1772--1781} }
Exemplar-Free Continual Transformer with Convolutions: Anurag Roy,

Vinay K. Verma,

Sravan Voonna,

Kripabandhu Ghosh,

Saptarshi Ghosh,

Abir Das; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Roy_2023_ICCV, author = {Roy, Anurag and Verma, Vinay K. and Voonna, Sravan and Ghosh, Kripabandhu and Ghosh, Saptarshi and Das, Abir}, title = {Exemplar-Free Continual Transformer with Convolutions}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {5897--5907} }
Scalable Video Object Segmentation with Simplified Framework: Qiangqiang Wu,

Tianyu Yang,

Wei Wu,

Antoni B. Chan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Qiangqiang and Yang, Tianyu and Wu, Wei and Chan, Antoni B.}, title = {Scalable Video Object Segmentation with Simplified Framework}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13879--13889} }
Rehearsal-Free Domain Continual Face Anti-Spoofing: Generalize More and Forget Less: Rizhao Cai,

Yawen Cui,

Zhi Li,

Zitong Yu,

Haoliang Li,

Yongjian Hu,

Alex Kot; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_ICCV, author = {Cai, Rizhao and Cui, Yawen and Li, Zhi and Yu, Zitong and Li, Haoliang and Hu, Yongjian and Kot, Alex}, title = {Rehearsal-Free Domain Continual Face Anti-Spoofing: Generalize More and Forget Less}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8037--8048} }
Efficient Decision-based Black-box Patch Attacks on Video Recognition: Kaixun Jiang,

Zhaoyu Chen,

Hao Huang,

Jiafeng Wang,

Dingkang Yang,

Bo Li,

Yan Wang,

Wenqiang Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Kaixun and Chen, Zhaoyu and Huang, Hao and Wang, Jiafeng and Yang, Dingkang and Li, Bo and Wang, Yan and Zhang, Wenqiang}, title = {Efficient Decision-based Black-box Patch Attacks on Video Recognition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4379--4389} }
Kick Back & Relax: Learning to Reconstruct the World by Watching SlowTV: Jaime Spencer,

Chris Russell,

Simon Hadfield,

Richard Bowden; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Spencer_2023_ICCV, author = {Spencer, Jaime and Russell, Chris and Hadfield, Simon and Bowden, Richard}, title = {Kick Back \& Relax: Learning to Reconstruct the World by Watching {SlowTV}}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15768--15779} }
MetaGCD: Learning to Continually Learn in Generalized Category Discovery: Yanan Wu,

Zhixiang Chi,

Yang Wang,

Songhe Feng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Yanan and Chi, Zhixiang and Wang, Yang and Feng, Songhe}, title = {{MetaGCD}: Learning to Continually Learn in Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1655--1665} }
Strip-MLP: Efficient Token Interaction for Vision MLP: Guiping Cao,

Shengda Luo,

Wenjian Huang,

Xiangyuan Lan,

Dongmei Jiang,

Yaowei Wang,

Jianguo Zhang; [pdf]
[bibtex]
@InProceedings{Cao_2023_ICCV, author = {Cao, Guiping and Luo, Shengda and Huang, Wenjian and Lan, Xiangyuan and Jiang, Dongmei and Wang, Yaowei and Zhang, Jianguo}, title = {{Strip-MLP}: Efficient Token Interaction for Vision {MLP}}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1494--1504} }
SAFARI: Versatile and Efficient Evaluations for Robustness of Interpretability: Wei Huang,

Xingyu Zhao,

Gaojie Jin,

Xiaowei Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Wei and Zhao, Xingyu and Jin, Gaojie and Huang, Xiaowei}, title = {{SAFARI}: Versatile and Efficient Evaluations for Robustness of Interpretability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1988--1998} }
ChildPlay: A New Benchmark for Understanding Children's Gaze Behaviour: Samy Tafasca,

Anshul Gupta,

Jean-Marc Odobez; [pdf] [supp]
[bibtex]
@InProceedings{Tafasca_2023_ICCV, author = {Tafasca, Samy and Gupta, Anshul and Odobez, Jean-Marc}, title = {{ChildPlay}: A New Benchmark for Understanding Children's Gaze Behaviour}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20935--20946} }
Towards General Low-Light Raw Noise Synthesis and Modeling: Feng Zhang,

Bin Xu,

Zhiqiang Li,

Xinran Liu,

Qingbo Lu,

Changxin Gao,

Nong Sang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Feng and Xu, Bin and Li, Zhiqiang and Liu, Xinran and Lu, Qingbo and Gao, Changxin and Sang, Nong}, title = {Towards General Low-Light Raw Noise Synthesis and Modeling}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {10820--10830} }
Combating Noisy Labels with Sample Selection by Mining High-Discrepancy Examples: Xiaobo Xia,

Bo Han,

Yibing Zhan,

Jun Yu,

Mingming Gong,

Chen Gong,

Tongliang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Xia_2023_ICCV, author = {Xia, Xiaobo and Han, Bo and Zhan, Yibing and Yu, Jun and Gong, Mingming and Gong, Chen and Liu, Tongliang}, title = {Combating Noisy Labels with Sample Selection by Mining High-Discrepancy Examples}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {1833--1843} }
Beyond the Pixel: a Photometrically Calibrated HDR Dataset for Luminance and Color Prediction: Christophe Bolduc,

Justine Giroux,

Marc Hébert,

Claude Demers,

Jean-François Lalonde; [pdf] [supp]
[bibtex]
@InProceedings{Bolduc_2023_ICCV, author = {Bolduc, Christophe and Giroux, Justine and H{\'e}bert, Marc and Demers, Claude and Lalonde, Jean-Fran{\c{c}}ois}, title = {Beyond the Pixel: a Photometrically Calibrated {HDR} Dataset for Luminance and Color Prediction}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8071--8081} }
What can Discriminator do? Towards Box-free Ownership Verification of Generative Adversarial Networks: Ziheng Huang,

Boheng Li,

Yan Cai,

Run Wang,

Shangwei Guo,

Liming Fang,

Jing Chen,

Lina Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV, author = {Huang, Ziheng and Li, Boheng and Cai, Yan and Wang, Run and Guo, Shangwei and Fang, Liming and Chen, Jing and Wang, Lina}, title = {What can Discriminator do? Towards Box-free Ownership Verification of Generative Adversarial Networks}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {5009--5019} }
When Noisy Labels Meet Long Tail Dilemmas: A Representation Calibration Method: Manyi Zhang,

Xuyang Zhao,

Jun Yao,

Chun Yuan,

Weiran Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV, author = {Zhang, Manyi and Zhao, Xuyang and Yao, Jun and Yuan, Chun and Huang, Weiran}, title = {When Noisy Labels Meet Long Tail Dilemmas: A Representation Calibration Method}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {15890--15900} }
Reinforce Data, Multiply Impact: Improved Model Accuracy and Robustness with Dataset Reinforcement: Fartash Faghri,

Hadi Pouransari,

Sachin Mehta,

Mehrdad Farajtabar,

Ali Farhadi,

Mohammad Rastegari,

Oncel Tuzel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Faghri_2023_ICCV, author = {Faghri, Fartash and Pouransari, Hadi and Mehta, Sachin and Farajtabar, Mehrdad and Farhadi, Ali and Rastegari, Mohammad and Tuzel, Oncel}, title = {Reinforce Data, Multiply Impact: Improved Model Accuracy and Robustness with Dataset Reinforcement}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17032--17043} }
An Adaptive Model Ensemble Adversarial Attack for Boosting Adversarial Transferability: Bin Chen,

Jiali Yin,

Shukai Chen,

Bohao Chen,

Ximeng Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Bin and Yin, Jiali and Chen, Shukai and Chen, Bohao and Liu, Ximeng}, title = {An Adaptive Model Ensemble Adversarial Attack for Boosting Adversarial Transferability}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {4489--4498} }
Incremental Generalized Category Discovery: Bingchen Zhao,

Oisin Mac Aodha; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV, author = {Zhao, Bingchen and Mac Aodha, Oisin}, title = {Incremental Generalized Category Discovery}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19137--19147} }
Prototypical Mixing and Retrieval-Based Refinement for Label Noise-Resistant Image Retrieval: Xinlong Yang,

Haixin Wang,

Jinan Sun,

Shikun Zhang,

Chong Chen,

Xian-Sheng Hua,

Xiao Luo; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV, author = {Yang, Xinlong and Wang, Haixin and Sun, Jinan and Zhang, Shikun and Chen, Chong and Hua, Xian-Sheng and Luo, Xiao}, title = {Prototypical Mixing and Retrieval-Based Refinement for Label Noise-Resistant Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11239--11249} }
AccFlow: Backward Accumulation for Long-Range Optical Flow: Guangyang Wu,

Xiaohong Liu,

Kunming Luo,

Xi Liu,

Qingqing Zheng,

Shuaicheng Liu,

Xinyang Jiang,

Guangtao Zhai,

Wenyi Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV, author = {Wu, Guangyang and Liu, Xiaohong and Luo, Kunming and Liu, Xi and Zheng, Qingqing and Liu, Shuaicheng and Jiang, Xinyang and Zhai, Guangtao and Wang, Wenyi}, title = {{AccFlow}: Backward Accumulation for Long-Range Optical Flow}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12119--12128} }
Guiding Local Feature Matching with Surface Curvature: Shuzhe Wang,

Juho Kannala,

Marc Pollefeys,

Daniel Barath; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Shuzhe and Kannala, Juho and Pollefeys, Marc and Barath, Daniel}, title = {Guiding Local Feature Matching with Surface Curvature}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17981--17991} }
3D-VisTA: Pre-trained Transformer for 3D Vision and Text Alignment: Ziyu Zhu,

Xiaojian Ma,

Yixin Chen,

Zhidong Deng,

Siyuan Huang,

Qing Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Ziyu and Ma, Xiaojian and Chen, Yixin and Deng, Zhidong and Huang, Siyuan and Li, Qing}, title = {{3D-VisTA}: Pre-trained Transformer for {3D} Vision and Text Alignment}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2911--2921} }
Constraining Depth Map Geometry for Multi-View Stereo: A Dual-Depth Approach with Saddle-shaped Depth Cells: Xinyi Ye,

Weiyue Zhao,

Tianqi Liu,

Zihao Huang,

Zhiguo Cao,

Xin Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV, author = {Ye, Xinyi and Zhao, Weiyue and Liu, Tianqi and Huang, Zihao and Cao, Zhiguo and Li, Xin}, title = {Constraining Depth Map Geometry for Multi-View Stereo: A Dual-Depth Approach with Saddle-shaped Depth Cells}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {17661--17670} }
SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining: Saksham Suri,

Saketh Rambhatla,

Rama Chellappa,

Abhinav Shrivastava; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Suri_2023_ICCV, author = {Suri, Saksham and Rambhatla, Saketh and Chellappa, Rama and Shrivastava, Abhinav}, title = {{SparseDet}: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {6770--6781} }
Among Us: Adversarially Robust Collaborative Perception by Consensus: Yiming Li,

Qi Fang,

Jiamu Bai,

Siheng Chen,

Felix Juefei-Xu,

Chen Feng; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV, author = {Li, Yiming and Fang, Qi and Bai, Jiamu and Chen, Siheng and Juefei-Xu, Felix and Feng, Chen}, title = {Among Us: Adversarially Robust Collaborative Perception by Consensus}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {186--195} }
BUS: Efficient and Effective Vision-Language Pre-Training with Bottom-Up Patch Summarization: Chaoya Jiang,

Haiyang Xu,

Wei Ye,

Qinghao Ye,

Chenliang Li,

Ming Yan,

Bin Bi,

Shikun Zhang,

Fei Huang,

Songfang Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV, author = {Jiang, Chaoya and Xu, Haiyang and Ye, Wei and Ye, Qinghao and Li, Chenliang and Yan, Ming and Bi, Bin and Zhang, Shikun and Huang, Fei and Huang, Songfang}, title = {{BUS}: Efficient and Effective Vision-Language Pre-Training with Bottom-Up Patch Summarization}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2900--2910} }
DiffusionDet: Diffusion Model for Object Detection: Shoufa Chen,

Peize Sun,

Yibing Song,

Ping Luo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV, author = {Chen, Shoufa and Sun, Peize and Song, Yibing and Luo, Ping}, title = {{DiffusionDet}: Diffusion Model for Object Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19830--19843} }
Forward Flow for Novel View Synthesis of Dynamic Scenes: Xiang Guo,

Jiadai Sun,

Yuchao Dai,

Guanying Chen,

Xiaoqing Ye,

Xiao Tan,

Errui Ding,

Yumeng Zhang,

Jingdong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV, author = {Guo, Xiang and Sun, Jiadai and Dai, Yuchao and Chen, Guanying and Ye, Xiaoqing and Tan, Xiao and Ding, Errui and Zhang, Yumeng and Wang, Jingdong}, title = {Forward Flow for Novel View Synthesis of Dynamic Scenes}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16022--16033} }
CopyRNeRF: Protecting the CopyRight of Neural Radiance Fields: Ziyuan Luo,

Qing Guo,

Ka Chun Cheung,

Simon See,

Renjie Wan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Luo_2023_ICCV, author = {Luo, Ziyuan and Guo, Qing and Cheung, Ka Chun and See, Simon and Wan, Renjie}, title = {{CopyRNeRF}: Protecting the {CopyRight} of Neural Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {22401--22411} }
Contrastive Model Adaptation for Cross-Condition Robustness in Semantic Segmentation: David Brüggemann,

Christos Sakaridis,

Tim Broedermann,

Luc Van Gool; [pdf] [supp]
[bibtex]
@InProceedings{Bruggemann_2023_ICCV, author = {Br{\"u}ggemann, David and Sakaridis, Christos and Broedermann, Tim and Van Gool, Luc}, title = {Contrastive Model Adaptation for Cross-Condition Robustness in Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11378--11387} }
SegRCDB: Semantic Segmentation via Formula-Driven Supervised Learning: Risa Shinoda,

Ryo Hayamizu,

Kodai Nakashima,

Nakamasa Inoue,

Rio Yokota,

Hirokatsu Kataoka; [pdf] [supp]
[bibtex]
@InProceedings{Shinoda_2023_ICCV, author = {Shinoda, Risa and Hayamizu, Ryo and Nakashima, Kodai and Inoue, Nakamasa and Yokota, Rio and Kataoka, Hirokatsu}, title = {{SegRCDB}: Semantic Segmentation via Formula-Driven Supervised Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20054--20063} }
Creative Birds: Self-Supervised Single-View 3D Style Transfer: Renke Wang,

Guimin Que,

Shuo Chen,

Xiang Li,

Jun Li,

Jian Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV, author = {Wang, Renke and Que, Guimin and Chen, Shuo and Li, Xiang and Li, Jun and Yang, Jian}, title = {Creative Birds: Self-Supervised Single-View {3D} Style Transfer}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8775--8784} }
LoTE-Animal: A Long Time-span Dataset for Endangered Animal Behavior Understanding: Dan Liu,

Jin Hou,

Shaoli Huang,

Jing Liu,

Yuxin He,

Bochuan Zheng,

Jifeng Ning,

Jingdong Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Dan and Hou, Jin and Huang, Shaoli and Liu, Jing and He, Yuxin and Zheng, Bochuan and Ning, Jifeng and Zhang, Jingdong}, title = {{LoTE-Animal}: A Long Time-span Dataset for Endangered Animal Behavior Understanding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {20064--20075} }
DQS3D: Densely-matched Quantization-aware Semi-supervised 3D Detection: Huan-ang Gao,

Beiwen Tian,

Pengfei Li,

Hao Zhao,

Guyue Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gao_2023_ICCV, author = {Gao, Huan-ang and Tian, Beiwen and Li, Pengfei and Zhao, Hao and Zhou, Guyue}, title = {{DQS3D}: Densely-matched Quantization-aware Semi-supervised {3D} Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {21905--21915} }
Towards Inadequately Pre-trained Models in Transfer Learning: Andong Deng,

Xingjian Li,

Di Hu,

Tianyang Wang,

Haoyi Xiong,

Cheng-Zhong Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Deng_2023_ICCV, author = {Deng, Andong and Li, Xingjian and Hu, Di and Wang, Tianyang and Xiong, Haoyi and Xu, Cheng-Zhong}, title = {Towards Inadequately Pre-trained Models in Transfer Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19397--19408} }
Boosting Novel Category Discovery Over Domains with Soft Contrastive Learning and All in One Classifier: Zelin Zang,

Lei Shang,

Senqiao Yang,

Fei Wang,

Baigui Sun,

Xuansong Xie,

Stan Z. Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zang_2023_ICCV, author = {Zang, Zelin and Shang, Lei and Yang, Senqiao and Wang, Fei and Sun, Baigui and Xie, Xuansong and Li, Stan Z.}, title = {Boosting Novel Category Discovery Over Domains with Soft Contrastive Learning and All in One Classifier}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {11858--11867} }
Class-Aware Patch Embedding Adaptation for Few-Shot Image Classification: Fusheng Hao,

Fengxiang He,

Liu Liu,

Fuxiang Wu,

Dacheng Tao,

Jun Cheng; [pdf] [supp]
[bibtex]
@InProceedings{Hao_2023_ICCV, author = {Hao, Fusheng and He, Fengxiang and Liu, Liu and Wu, Fuxiang and Tao, Dacheng and Cheng, Jun}, title = {Class-Aware Patch Embedding Adaptation for Few-Shot Image Classification}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18905--18915} }
SegPrompt: Boosting Open-World Segmentation via Category-Level Prompt Learning: Muzhi Zhu,

Hengtao Li,

Hao Chen,

Chengxiang Fan,

Weian Mao,

Chenchen Jing,

Yifan Liu,

Chunhua Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2023_ICCV, author = {Zhu, Muzhi and Li, Hengtao and Chen, Hao and Fan, Chengxiang and Mao, Weian and Jing, Chenchen and Liu, Yifan and Shen, Chunhua}, title = {{SegPrompt}: Boosting Open-World Segmentation via Category-Level Prompt Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {999--1008} }
Search for or Navigate to? Dual Adaptive Thinking for Object Navigation: Ronghao Dang,

Liuyi Wang,

Zongtao He,

Shuai Su,

Jiagui Tang,

Chengju Liu,

Qijun Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Dang_2023_ICCV, author = {Dang, Ronghao and Wang, Liuyi and He, Zongtao and Su, Shuai and Tang, Jiagui and Liu, Chengju and Chen, Qijun}, title = {Search for or Navigate to? Dual Adaptive Thinking for Object Navigation}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {8250--8259} }
CL-MVSNet: Unsupervised Multi-View Stereo with Dual-Level Contrastive Learning: Kaiqiang Xiong,

Rui Peng,

Zhe Zhang,

Tianxing Feng,

Jianbo Jiao,

Feng Gao,

Ronggang Wang; [pdf] [supp]
[bibtex]
@InProceedings{Xiong_2023_ICCV, author = {Xiong, Kaiqiang and Peng, Rui and Zhang, Zhe and Feng, Tianxing and Jiao, Jianbo and Gao, Feng and Wang, Ronggang}, title = {{CL-MVSNet}: Unsupervised Multi-View Stereo with Dual-Level Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {3769--3780} }
Federated Learning Over Images: Vertical Decompositions and Pre-Trained Backbones Are Difficult to Beat: Erdong Hu,

Yuxin Tang,

Anastasios Kyrillidis,

Chris Jermaine; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV, author = {Hu, Erdong and Tang, Yuxin and Kyrillidis, Anastasios and Jermaine, Chris}, title = {Federated Learning Over Images: Vertical Decompositions and Pre-Trained Backbones Are Difficult to Beat}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {19385--19396} }
HOSNeRF: Dynamic Human-Object-Scene Neural Radiance Fields from a Single Video: Jia-Wei Liu,

Yan-Pei Cao,

Tianyuan Yang,

Zhongcong Xu,

Jussi Keppo,

Ying Shan,

Xiaohu Qie,

Mike Zheng Shou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Jia-Wei and Cao, Yan-Pei and Yang, Tianyuan and Xu, Zhongcong and Keppo, Jussi and Shan, Ying and Qie, Xiaohu and Shou, Mike Zheng}, title = {{HOSNeRF}: Dynamic Human-Object-Scene Neural Radiance Fields from a Single Video}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {18483--18494} }
OmniZoomer: Learning to Move and Zoom in on Sphere at High-Resolution: Zidong Cao,

Hao Ai,

Yan-Pei Cao,

Ying Shan,

Xiaohu Qie,

Lin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cao_2023_ICCV, author = {Cao, Zidong and Ai, Hao and Cao, Yan-Pei and Shan, Ying and Qie, Xiaohu and Wang, Lin}, title = {{OmniZoomer}: Learning to Move and Zoom in on Sphere at High-Resolution}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {12897--12907} }
Knowing Where to Focus: Event-aware Transformer for Video Grounding: Jinhyun Jang,

Jungin Park,

Jin Kim,

Hyeongjun Kwon,

Kwanghoon Sohn; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jang_2023_ICCV, author = {Jang, Jinhyun and Park, Jungin and Kim, Jin and Kwon, Hyeongjun and Sohn, Kwanghoon}, title = {Knowing Where to Focus: Event-aware Transformer for Video Grounding}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13846--13856} }
TF-ICON: Diffusion-Based Training-Free Cross-Domain Image Composition: Shilin Lu,

Yanzhu Liu,

Adams Wai-Kin Kong; [pdf] [supp]
[bibtex]
@InProceedings{Lu_2023_ICCV, author = {Lu, Shilin and Liu, Yanzhu and Kong, Adams Wai-Kin}, title = {{TF-ICON}: Diffusion-Based Training-Free Cross-Domain Image Composition}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2294--2305} }
Landscape Learning for Neural Network Inversion: Ruoshi Liu,

Chengzhi Mao,

Purva Tendulkar,

Hao Wang,

Carl Vondrick; [pdf] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV, author = {Liu, Ruoshi and Mao, Chengzhi and Tendulkar, Purva and Wang, Hao and Vondrick, Carl}, title = {Landscape Learning for Neural Network Inversion}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {2239--2250} }
Movement Enhancement toward Multi-Scale Video Feature Representation for Temporal Action Detection: Zixuan Zhao,

Dongqi Wang,

Xu Zhao; [pdf]
[bibtex]
@InProceedings{Zhao_2023_ICCV, author = {Zhao, Zixuan and Wang, Dongqi and Zhao, Xu}, title = {Movement Enhancement toward Multi-Scale Video Feature Representation for Temporal Action Detection}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {13555--13564} }
Collaborative Propagation on Multiple Instance Graphs for 3D Instance Segmentation with Single-point Supervision: Shichao Dong,

Ruibo Li,

Jiacheng Wei,

Fayao Liu,

Guosheng Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2023_ICCV, author = {Dong, Shichao and Li, Ruibo and Wei, Jiacheng and Liu, Fayao and Lin, Guosheng}, title = {Collaborative Propagation on Multiple Instance Graphs for {3D} Instance Segmentation with Single-point Supervision}, booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)}, month = oct, year = {2023}, pages = {16665--16674} }
PPR: Physically Plausible Reconstruction from Monocular Videos: Gengshan Yang,

Shuo Yang,

John Z. Zhang,

Zachary Manchester,

Deva Ramanan; [pdf] [supp]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Gengshan and Yang, Shuo and Zhang, John Z. and Manchester, Zachary and Ramanan, Deva},
  title     = {{PPR}: Physically Plausible Reconstruction from Monocular Videos},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3914--3924},
}
Single Image Deblurring with Row-dependent Blur Magnitude: Xiang Ji,

Zhixiang Wang,

Shin'ichi Satoh,

Yinqiang Zheng; [pdf] [supp]
[bibtex]
@InProceedings{Ji_2023_ICCV,
  author    = {Ji, Xiang and Wang, Zhixiang and Satoh, Shin'ichi and Zheng, Yinqiang},
  title     = {Single Image Deblurring with Row-dependent Blur Magnitude},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12269--12280},
}
Robust Heterogeneous Federated Learning under Data Corruption: Xiuwen Fang,

Mang Ye,

Xiyuan Yang; [pdf] [supp]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Xiuwen and Ye, Mang and Yang, Xiyuan},
  title     = {Robust Heterogeneous Federated Learning under Data Corruption},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5020--5030},
}
RMP-Loss: Regularizing Membrane Potential Distribution for Spiking Neural Networks: Yufei Guo,

Xiaode Liu,

Yuanpei Chen,

Liwen Zhang,

Weihang Peng,

Yuhan Zhang,

Xuhui Huang,

Zhe Ma; [pdf]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Yufei and Liu, Xiaode and Chen, Yuanpei and Zhang, Liwen and Peng, Weihang and Zhang, Yuhan and Huang, Xuhui and Ma, Zhe},
  title     = {{RMP-Loss}: Regularizing Membrane Potential Distribution for Spiking Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17391--17401},
}
Cyclic-Bootstrap Labeling for Weakly Supervised Object Detection: Yufei Yin,

Jiajun Deng,

Wengang Zhou,

Li Li,

Houqiang Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Yufei and Deng, Jiajun and Zhou, Wengang and Li, Li and Li, Houqiang},
  title     = {Cyclic-Bootstrap Labeling for Weakly Supervised Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7008--7018},
}
Deep Active Contours for Real-time 6-DoF Object Tracking: Long Wang,

Shen Yan,

Jianan Zhen,

Yu Liu,

Maojun Zhang,

Guofeng Zhang,

Xiaowei Zhou; [pdf]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Long and Yan, Shen and Zhen, Jianan and Liu, Yu and Zhang, Maojun and Zhang, Guofeng and Zhou, Xiaowei},
  title     = {Deep Active Contours for Real-time {6-DoF} Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14034--14044},
}
Tangent Sampson Error: Fast Approximate Two-view Reprojection Error for Central Camera Models: Mikhail Terekhov,

Viktor Larsson; [pdf] [supp]
[bibtex]
@InProceedings{Terekhov_2023_ICCV,
  author    = {Terekhov, Mikhail and Larsson, Viktor},
  title     = {Tangent {Sampson} Error: Fast Approximate Two-view Reprojection Error for Central Camera Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3370--3378},
}
Multi-grained Temporal Prototype Learning for Few-shot Video Object Segmentation: Nian Liu,

Kepan Nan,

Wangbo Zhao,

Yuanwei Liu,

Xiwen Yao,

Salman Khan,

Hisham Cholakkal,

Rao Muhammad Anwer,

Junwei Han,

Fahad Shahbaz Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Nian and Nan, Kepan and Zhao, Wangbo and Liu, Yuanwei and Yao, Xiwen and Khan, Salman and Cholakkal, Hisham and Anwer, Rao Muhammad and Han, Junwei and Khan, Fahad Shahbaz},
  title     = {Multi-grained Temporal Prototype Learning for Few-shot Video Object Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18862--18871},
}
Improving 3D Imaging with Pre-Trained Perpendicular 2D Diffusion Models: Suhyeon Lee,

Hyungjin Chung,

Minyoung Park,

Jonghyuk Park,

Wi-Sun Ryu,

Jong Chul Ye; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Suhyeon and Chung, Hyungjin and Park, Minyoung and Park, Jonghyuk and Ryu, Wi-Sun and Ye, Jong Chul},
  title     = {Improving {3D} Imaging with Pre-Trained Perpendicular {2D} Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10710--10720},
}
Time Does Tell: Self-Supervised Time-Tuning of Dense Image Representations: Mohammadreza Salehi,

Efstratios Gavves,

Cees G.M. Snoek,

Yuki M. Asano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Salehi_2023_ICCV,
  author    = {Salehi, Mohammadreza and Gavves, Efstratios and Snoek, Cees G. M. and Asano, Yuki M.},
  title     = {Time Does Tell: Self-Supervised Time-Tuning of Dense Image Representations},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16536--16547},
}
CroCo v2: Improved Cross-view Completion Pre-training for Stereo Matching and Optical Flow: Philippe Weinzaepfel,

Thomas Lucas,

Vincent Leroy,

Yohann Cabon,

Vaibhav Arora,

Romain Brégier,

Gabriela Csurka,

Leonid Antsfeld,

Boris Chidlovskii,

Jerome Revaud; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Weinzaepfel_2023_ICCV,
  author    = {Weinzaepfel, Philippe and Lucas, Thomas and Leroy, Vincent and Cabon, Yohann and Arora, Vaibhav and Br{\'e}gier, Romain and Csurka, Gabriela and Antsfeld, Leonid and Chidlovskii, Boris and Revaud, Jerome},
  title     = {{CroCo} v2: Improved Cross-view Completion Pre-training for Stereo Matching and Optical Flow},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17969--17980},
}
ExBluRF: Efficient Radiance Fields for Extreme Motion Blurred Images: Dongwoo Lee,

Jeongtaek Oh,

Jaesung Rim,

Sunghyun Cho,

Kyoung Mu Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2023_ICCV,
  author    = {Lee, Dongwoo and Oh, Jeongtaek and Rim, Jaesung and Cho, Sunghyun and Lee, Kyoung Mu},
  title     = {{ExBluRF}: Efficient Radiance Fields for Extreme Motion Blurred Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17639--17648},
}
MPCViT: Searching for Accurate and Efficient MPC-Friendly Vision Transformer with Heterogeneous Attention: Wenxuan Zeng,

Meng Li,

Wenjie Xiong,

Tong Tong,

Wen-jie Lu,

Jin Tan,

Runsheng Wang,

Ru Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zeng_2023_ICCV,
  author    = {Zeng, Wenxuan and Li, Meng and Xiong, Wenjie and Tong, Tong and Lu, Wen-jie and Tan, Jin and Wang, Runsheng and Huang, Ru},
  title     = {{MPCViT}: Searching for Accurate and Efficient {MPC}-Friendly Vision Transformer with Heterogeneous Attention},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5052--5063},
}
Online Class Incremental Learning on Stochastic Blurry Task Boundary via Mask and Visual Prompt Tuning: Jun-Yeong Moon,

Keon-Hee Park,

Jung Uk Kim,

Gyeong-Moon Park; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Moon_2023_ICCV,
  author    = {Moon, Jun-Yeong and Park, Keon-Hee and Kim, Jung Uk and Park, Gyeong-Moon},
  title     = {Online Class Incremental Learning on Stochastic Blurry Task Boundary via Mask and Visual Prompt Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {11731--11741},
}
Text2Video-Zero: Text-to-Image Diffusion Models are Zero-Shot Video Generators: Levon Khachatryan,

Andranik Movsisyan,

Vahram Tadevosyan,

Roberto Henschel,

Zhangyang Wang,

Shant Navasardyan,

Humphrey Shi; [pdf] [supp]
[bibtex]
@InProceedings{Khachatryan_2023_ICCV,
  author    = {Khachatryan, Levon and Movsisyan, Andranik and Tadevosyan, Vahram and Henschel, Roberto and Wang, Zhangyang and Navasardyan, Shant and Shi, Humphrey},
  title     = {{Text2Video-Zero}: Text-to-Image Diffusion Models are Zero-Shot Video Generators},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15954--15964},
}
Masked Spiking Transformer: Ziqing Wang,

Yuetong Fang,

Jiahang Cao,

Qiang Zhang,

Zhongrui Wang,

Renjing Xu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ziqing and Fang, Yuetong and Cao, Jiahang and Zhang, Qiang and Wang, Zhongrui and Xu, Renjing},
  title     = {Masked Spiking Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1761--1771},
}
Exploring Video Quality Assessment on User Generated Contents from Aesthetic and Technical Perspectives: Haoning Wu,

Erli Zhang,

Liang Liao,

Chaofeng Chen,

Jingwen Hou,

Annan Wang,

Wenxiu Sun,

Qiong Yan,

Weisi Lin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Haoning and Zhang, Erli and Liao, Liang and Chen, Chaofeng and Hou, Jingwen and Wang, Annan and Sun, Wenxiu and Yan, Qiong and Lin, Weisi},
  title     = {Exploring Video Quality Assessment on User Generated Contents from Aesthetic and Technical Perspectives},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20144--20154},
}
Distributed Bundle Adjustment with Block-Based Sparse Matrix Compression for Super Large Scale Datasets: Maoteng Zheng,

Nengcheng Chen,

Junfeng Zhu,

Xiaoru Zeng,

Huanbin Qiu,

Yuyao Jiang,

Xingyue Lu,

Hao Qu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Maoteng and Chen, Nengcheng and Zhu, Junfeng and Zeng, Xiaoru and Qiu, Huanbin and Jiang, Yuyao and Lu, Xingyue and Qu, Hao},
  title     = {Distributed Bundle Adjustment with Block-Based Sparse Matrix Compression for Super Large Scale Datasets},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18152--18162},
}
SCANet: Scene Complexity Aware Network for Weakly-Supervised Video Moment Retrieval: Sunjae Yoon,

Gwanhyeong Koo,

Dahyun Kim,

Chang D. Yoo; [pdf] [supp]
[bibtex]
@InProceedings{Yoon_2023_ICCV,
  author    = {Yoon, Sunjae and Koo, Gwanhyeong and Kim, Dahyun and Yoo, Chang D.},
  title     = {{SCANet}: Scene Complexity Aware Network for Weakly-Supervised Video Moment Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13576--13586},
}
Neural Interactive Keypoint Detection: Jie Yang,

Ailing Zeng,

Feng Li,

Shilong Liu,

Ruimao Zhang,

Lei Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Jie and Zeng, Ailing and Li, Feng and Liu, Shilong and Zhang, Ruimao and Zhang, Lei},
  title     = {Neural Interactive Keypoint Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15122--15132},
}
Joint Implicit Neural Representation for High-fidelity and Compact Vector Fonts: Chia-Hao Chen,

Ying-Tian Liu,

Zhifei Zhang,

Yuan-Chen Guo,

Song-Hai Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Chia-Hao and Liu, Ying-Tian and Zhang, Zhifei and Guo, Yuan-Chen and Zhang, Song-Hai},
  title     = {Joint Implicit Neural Representation for High-fidelity and Compact Vector Fonts},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5538--5548},
}
Spurious Features Everywhere - Large-Scale Detection of Harmful Spurious Features in ImageNet: Yannic Neuhaus,

Maximilian Augustin,

Valentyn Boreiko,

Matthias Hein; [pdf] [supp]
[bibtex]
@InProceedings{Neuhaus_2023_ICCV,
  author    = {Neuhaus, Yannic and Augustin, Maximilian and Boreiko, Valentyn and Hein, Matthias},
  title     = {Spurious Features Everywhere - Large-Scale Detection of Harmful Spurious Features in {ImageNet}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20235--20246},
}
Knowledge-Aware Prompt Tuning for Generalizable Vision-Language Models: Baoshuo Kan,

Teng Wang,

Wenpeng Lu,

Xiantong Zhen,

Weili Guan,

Feng Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kan_2023_ICCV,
  author    = {Kan, Baoshuo and Wang, Teng and Lu, Wenpeng and Zhen, Xiantong and Guan, Weili and Zheng, Feng},
  title     = {Knowledge-Aware Prompt Tuning for Generalizable Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {15670--15680},
}
Delicate Textured Mesh Recovery from NeRF via Adaptive Surface Refinement: Jiaxiang Tang,

Hang Zhou,

Xiaokang Chen,

Tianshu Hu,

Errui Ding,

Jingdong Wang,

Gang Zeng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Jiaxiang and Zhou, Hang and Chen, Xiaokang and Hu, Tianshu and Ding, Errui and Wang, Jingdong and Zeng, Gang},
  title     = {Delicate Textured Mesh Recovery from {NeRF} via Adaptive Surface Refinement},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17739--17749},
}
Leveraging Inpainting for Single-Image Shadow Removal: Xiaoguang Li,

Qing Guo,

Rabab Abdelfattah,

Di Lin,

Wei Feng,

Ivor Tsang,

Song Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xiaoguang and Guo, Qing and Abdelfattah, Rabab and Lin, Di and Feng, Wei and Tsang, Ivor and Wang, Song},
  title     = {Leveraging Inpainting for Single-Image Shadow Removal},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {13055--13064},
}
Neural Characteristic Function Learning for Conditional Image Generation: Shengxi Li,

Jialu Zhang,

Yifei Li,

Mai Xu,

Xin Deng,

Li Li; [pdf] [supp]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Shengxi and Zhang, Jialu and Li, Yifei and Xu, Mai and Deng, Xin and Li, Li},
  title     = {Neural Characteristic Function Learning for Conditional Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {7204--7214},
}
Accurate 3D Face Reconstruction with Facial Component Tokens: Tianke Zhang,

Xuangeng Chu,

Yunfei Liu,

Lijian Lin,

Zhendong Yang,

Zhengzhuo Xu,

Chengkun Cao,

Fei Yu,

Changyin Zhou,

Chun Yuan,

Yu Li; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Tianke and Chu, Xuangeng and Liu, Yunfei and Lin, Lijian and Yang, Zhendong and Xu, Zhengzhuo and Cao, Chengkun and Yu, Fei and Zhou, Changyin and Yuan, Chun and Li, Yu},
  title     = {Accurate {3D} Face Reconstruction with Facial Component Tokens},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9033--9042},
}
Holistic Label Correction for Noisy Multi-Label Classification: Xiaobo Xia,

Jiankang Deng,

Wei Bao,

Yuxuan Du,

Bo Han,

Shiguang Shan,

Tongliang Liu; [pdf] [supp]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Xiaobo and Deng, Jiankang and Bao, Wei and Du, Yuxuan and Han, Bo and Shan, Shiguang and Liu, Tongliang},
  title     = {Holistic Label Correction for Noisy Multi-Label Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {1483--1493},
}
Probabilistic Precision and Recall Towards Reliable Evaluation of Generative Models: Dogyun Park,

Suhyun Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Dogyun and Kim, Suhyun},
  title     = {Probabilistic Precision and Recall Towards Reliable Evaluation of Generative Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {20099--20109},
}
Deep Multitask Learning with Progressive Parameter Sharing: Haosen Shi,

Shen Ren,

Tianwei Zhang,

Sinno Jialin Pan; [pdf] [supp]
[bibtex]
@InProceedings{Shi_2023_ICCV,
  author    = {Shi, Haosen and Ren, Shen and Zhang, Tianwei and Pan, Sinno Jialin},
  title     = {Deep Multitask Learning with Progressive Parameter Sharing},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19924--19935},
}
Personalized Semantics Excitation for Federated Image Classification: Haifeng Xia,

Kai Li,

Zhengming Ding; [pdf]
[bibtex]
@InProceedings{Xia_2023_ICCV,
  author    = {Xia, Haifeng and Li, Kai and Ding, Zhengming},
  title     = {Personalized Semantics Excitation for Federated Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {19301--19310},
}
Unified Data-Free Compression: Pruning and Quantization without Fine-Tuning: Shipeng Bai,

Jun Chen,

Xintian Shen,

Yixuan Qian,

Yong Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bai_2023_ICCV,
  author    = {Bai, Shipeng and Chen, Jun and Shen, Xintian and Qian, Yixuan and Liu, Yong},
  title     = {Unified Data-Free Compression: Pruning and Quantization without Fine-Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5876--5885},
}
SurroundOcc: Multi-camera 3D Occupancy Prediction for Autonomous Driving: Yi Wei,

Linqing Zhao,

Wenzhao Zheng,

Zheng Zhu,

Jie Zhou,

Jiwen Lu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2023_ICCV,
  author    = {Wei, Yi and Zhao, Linqing and Zheng, Wenzhao and Zhu, Zheng and Zhou, Jie and Lu, Jiwen},
  title     = {{SurroundOcc}: Multi-camera {3D} Occupancy Prediction for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {21729--21740},
}
Temporal Enhanced Training of Multi-view 3D Object Detector via Historical Object Prediction: Zhuofan Zong,

Dongzhi Jiang,

Guanglu Song,

Zeyue Xue,

Jingyong Su,

Hongsheng Li,

Yu Liu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zong_2023_ICCV,
  author    = {Zong, Zhuofan and Jiang, Dongzhi and Song, Guanglu and Xue, Zeyue and Su, Jingyong and Li, Hongsheng and Liu, Yu},
  title     = {Temporal Enhanced Training of Multi-view {3D} Object Detector via Historical Object Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3781--3790},
}
PARIS: Part-level Reconstruction and Motion Analysis for Articulated Objects: Jiayi Liu,

Ali Mahdavi-Amiri,

Manolis Savva; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Jiayi and Mahdavi-Amiri, Ali and Savva, Manolis},
  title     = {{PARIS}: Part-level Reconstruction and Motion Analysis for Articulated Objects},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {352--363},
}
OnlineRefer: A Simple Online Baseline for Referring Video Object Segmentation: Dongming Wu,

Tiancai Wang,

Yuang Zhang,

Xiangyu Zhang,

Jianbing Shen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Dongming and Wang, Tiancai and Zhang, Yuang and Zhang, Xiangyu and Shen, Jianbing},
  title     = {{OnlineRefer}: A Simple Online Baseline for Referring Video Object Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2761--2770},
}
Implicit Neural Representation for Cooperative Low-light Image Enhancement: Shuzhou Yang,

Moxuan Ding,

Yanmin Wu,

Zihan Li,

Jian Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2023_ICCV,
  author    = {Yang, Shuzhou and Ding, Moxuan and Wu, Yanmin and Li, Zihan and Zhang, Jian},
  title     = {Implicit Neural Representation for Cooperative Low-light Image Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {12918--12927},
}
Environment Agnostic Representation for Visual Reinforcement Learning: Hyesong Choi,

Hunsang Lee,

Seongwon Jeong,

Dongbo Min; [pdf] [supp]
[bibtex]
@InProceedings{Choi_2023_ICCV,
  author    = {Choi, Hyesong and Lee, Hunsang and Jeong, Seongwon and Min, Dongbo},
  title     = {Environment Agnostic Representation for Visual Reinforcement Learning},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {263--273},
}
Deep Multiview Clustering by Contrasting Cluster Assignments: Jie Chen,

Hua Mao,

Wai Lok Woo,

Xi Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Jie and Mao, Hua and Woo, Wai Lok and Peng, Xi},
  title     = {Deep Multiview Clustering by Contrasting Cluster Assignments},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16752--16761},
}
Mimic3D: Thriving 3D-Aware GANs via 3D-to-2D Imitation: Xingyu Chen,

Yu Deng,

Baoyuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Xingyu and Deng, Yu and Wang, Baoyuan},
  title     = {{Mimic3D}: Thriving {3D}-Aware {GANs} via {3D-to-2D} Imitation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {2338--2348},
}
Look at the Neighbor: Distortion-aware Unsupervised Domain Adaptation for Panoramic Semantic Segmentation: Xu Zheng,

Tianbo Pan,

Yunhao Luo,

Lin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Xu and Pan, Tianbo and Luo, Yunhao and Wang, Lin},
  title     = {Look at the Neighbor: Distortion-aware Unsupervised Domain Adaptation for Panoramic Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18687--18698},
}
Rethinking Safe Semi-supervised Learning: Transferring the Open-set Problem to A Close-set One: Qiankun Ma,

Jiyao Gao,

Bo Zhan,

Yunpeng Guo,

Jiliu Zhou,

Yan Wang; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Qiankun and Gao, Jiyao and Zhan, Bo and Guo, Yunpeng and Zhou, Jiliu and Wang, Yan},
  title     = {Rethinking Safe Semi-supervised Learning: Transferring the Open-set Problem to A Close-set One},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {16370--16379},
}
Does Physical Adversarial Example Really Matter to Autonomous Driving? Towards System-Level Effect of Adversarial Object Evasion Attack: Ningfei Wang,

Yunpeng Luo,

Takami Sato,

Kaidi Xu,

Qi Alfred Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Ningfei and Luo, Yunpeng and Sato, Takami and Xu, Kaidi and Chen, Qi Alfred},
  title     = {Does Physical Adversarial Example Really Matter to Autonomous Driving? Towards System-Level Effect of Adversarial Object Evasion Attack},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4412--4423},
}
ReLeaPS : Reinforcement Learning-based Illumination Planning for Generalized Photometric Stereo: Jun Hoong Chan,

Bohan Yu,

Heng Guo,

Jieji Ren,

Zongqing Lu,

Boxin Shi; [pdf] [supp]
[bibtex]
@InProceedings{Chan_2023_ICCV,
  author    = {Chan, Jun Hoong and Yu, Bohan and Guo, Heng and Ren, Jieji and Lu, Zongqing and Shi, Boxin},
  title     = {{ReLeaPS} : Reinforcement Learning-based Illumination Planning for Generalized Photometric Stereo},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9167--9175},
}
Learning Foresightful Dense Visual Affordance for Deformable Object Manipulation: Ruihai Wu,

Chuanruo Ning,

Hao Dong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Ruihai and Ning, Chuanruo and Dong, Hao},
  title     = {Learning Foresightful Dense Visual Affordance for Deformable Object Manipulation},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {10947--10956},
}
Generalizable Neural Fields as Partially Observed Neural Processes: Jeffrey Gu,

Kuan-Chieh Wang,

Serena Yeung; [pdf] [arXiv]
[bibtex]
@InProceedings{Gu_2023_ICCV,
  author    = {Gu, Jeffrey and Wang, Kuan-Chieh and Yeung, Serena},
  title     = {Generalizable Neural Fields as Partially Observed Neural Processes},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5330--5339},
}
CiteTracker: Correlating Image and Text for Visual Tracking: Xin Li,

Yuqing Huang,

Zhenyu He,

Yaowei Wang,

Huchuan Lu,

Ming-Hsuan Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Xin and Huang, Yuqing and He, Zhenyu and Wang, Yaowei and Lu, Huchuan and Yang, Ming-Hsuan},
  title     = {{CiteTracker}: Correlating Image and Text for Visual Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {9974--9983},
}
Adding Conditional Control to Text-to-Image Diffusion Models: Lvmin Zhang,

Anyi Rao,

Maneesh Agrawala; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Lvmin and Rao, Anyi and Agrawala, Maneesh},
  title     = {Adding Conditional Control to Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {3836--3847},
}
3D Instance Segmentation via Enhanced Spatial and Semantic Supervision: Salwa Al Khatib,

Mohamed El Amine Boudjoghra,

Jean Lahoud,

Fahad Shahbaz Khan; [pdf]
[bibtex]
@InProceedings{Al_Khatib_2023_ICCV,
  author    = {Al Khatib, Salwa and El Amine Boudjoghra, Mohamed and Lahoud, Jean and Khan, Fahad Shahbaz},
  title     = {{3D} Instance Segmentation via Enhanced Spatial and Semantic Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {541--550},
}
Unleashing Text-to-Image Diffusion Models for Visual Perception: Wenliang Zhao,

Yongming Rao,

Zuyan Liu,

Benlin Liu,

Jie Zhou,

Jiwen Lu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Wenliang and Rao, Yongming and Liu, Zuyan and Liu, Benlin and Zhou, Jie and Lu, Jiwen},
  title     = {Unleashing Text-to-Image Diffusion Models for Visual Perception},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5729--5739},
}
Iterative Superquadric Recomposition of 3D Objects from Multiple Views: Stephan Alaniz,

Massimiliano Mancini,

Zeynep Akata; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Alaniz_2023_ICCV,
  author    = {Alaniz, Stephan and Mancini, Massimiliano and Akata, Zeynep},
  title     = {Iterative Superquadric Recomposition of {3D} Objects from Multiple Views},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {18013--18023},
}
PHRIT: Parametric Hand Representation with Implicit Template: Zhisheng Huang,

Yujin Chen,

Di Kang,

Jinlu Zhang,

Zhigang Tu; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhisheng and Chen, Yujin and Kang, Di and Zhang, Jinlu and Tu, Zhigang},
  title     = {{PHRIT}: Parametric Hand Representation with Implicit Template},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {14974--14984},
}
BEVPlace: Learning LiDAR-based Place Recognition using Bird's Eye View Images: Lun Luo,

Shuhang Zheng,

Yixuan Li,

Yongzhi Fan,

Beinan Yu,

Si-Yuan Cao,

Junwei Li,

Hui-Liang Shen; [pdf] [supp]
[bibtex]
@InProceedings{Luo_2023_ICCV,
  author    = {Luo, Lun and Zheng, Shuhang and Li, Yixuan and Fan, Yongzhi and Yu, Beinan and Cao, Si-Yuan and Li, Junwei and Shen, Hui-Liang},
  title     = {{BEVPlace}: Learning {LiDAR}-based Place Recognition using Bird's Eye View Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8700--8709},
}
Transferable Adversarial Attack for Both Vision Transformers and Convolutional Networks via Momentum Integrated Gradients: Wenshuo Ma,

Yidong Li,

Xiaofeng Jia,

Wei Xu; [pdf] [supp]
[bibtex]
@InProceedings{Ma_2023_ICCV,
  author    = {Ma, Wenshuo and Li, Yidong and Jia, Xiaofeng and Xu, Wei},
  title     = {Transferable Adversarial Attack for Both Vision Transformers and Convolutional Networks via Momentum Integrated Gradients},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {4630--4639},
}
TrajPAC: Towards Robustness Verification of Pedestrian Trajectory Prediction Models: Liang Zhang,

Nathaniel Xu,

Pengfei Yang,

Gaojie Jin,

Cheng-Chao Huang,

Lijun Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Liang and Xu, Nathaniel and Yang, Pengfei and Jin, Gaojie and Huang, Cheng-Chao and Zhang, Lijun},
  title     = {{TrajPAC}: Towards Robustness Verification of Pedestrian Trajectory Prediction Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {8327--8339},
}
Adaptive Image Anonymization in the Context of Image Classification with Neural Networks: Nadiya Shvai,

Arcadi Llanza Carmona,

Amir Nakib; [pdf]
[bibtex]
@InProceedings{Shvai_2023_ICCV,
  author    = {Shvai, Nadiya and Carmona, Arcadi Llanza and Nakib, Amir},
  title     = {Adaptive Image Anonymization in the Context of Image Classification with Neural Networks},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {5074--5083},
}
SiLK: Simple Learned Keypoints: Pierre Gleize,

Weiyao Wang,

Matt Feiszli; [pdf] [supp]
[bibtex]
@InProceedings{Gleize_2023_ICCV,
  author    = {Gleize, Pierre and Wang, Weiyao and Feiszli, Matt},
  title     = {{SiLK}: Simple Learned Keypoints},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {22499--22508},
}
EfficientViT: Lightweight Multi-Scale Attention for High-Resolution Dense Prediction: Han Cai,

Junyan Li,

Muyan Hu,

Chuang Gan,

Song Han; [pdf]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Han and Li, Junyan and Hu, Muyan and Gan, Chuang and Han, Song},
  title     = {{EfficientViT}: Lightweight Multi-Scale Attention for High-Resolution Dense Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  month     = oct,
  year      = {2023},
  pages     = {17302--17313},
}
Efficient Neural Supersampling on a Novel Gaming Dataset: Antoine Mercier,

Ruan Erasmus,

Yashesh Savani,

Manik Dhingra,

Fatih Porikli,

Guillaume Berger; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mercier_2023_ICCV,
  author    = {Mercier, Antoine and Erasmus, Ruan and Savani, Yashesh and Dhingra, Manik and Porikli, Fatih and Berger, Guillaume},
  title     = {Efficient Neural Supersampling on a Novel Gaming Dataset},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {296--306},
}
Rapid Adaptation in Online Continual Learning: Are We Evaluating It Right?: Hasan Abed Al Kader Hammoud,

Ameya Prabhu,

Ser-Nam Lim,

Philip H.S. Torr,

Adel Bibi,

Bernard Ghanem; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Al_Kader_Hammoud_2023_ICCV,
  author    = {Al Kader Hammoud, Hasan Abed and Prabhu, Ameya and Lim, Ser-Nam and Torr, Philip H. S. and Bibi, Adel and Ghanem, Bernard},
  title     = {Rapid Adaptation in Online Continual Learning: Are We Evaluating It Right?},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18852--18861},
}
Label-Efficient Online Continual Object Detection in Streaming Video: Jay Zhangjie Wu,

David Junhao Zhang,

Wynne Hsu,

Mengmi Zhang,

Mike Zheng Shou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2023_ICCV,
  author    = {Wu, Jay Zhangjie and Zhang, David Junhao and Hsu, Wynne and Zhang, Mengmi and Shou, Mike Zheng},
  title     = {Label-Efficient Online Continual Object Detection in Streaming Video},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19246--19255},
}
Learning Point Cloud Completion without Complete Point Clouds: A Pose-Aware Approach: Jihun Kim,

Hyeokjun Kweon,

Yunseo Yang,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2023_ICCV,
  author    = {Kim, Jihun and Kweon, Hyeokjun and Yang, Yunseo and Yoon, Kuk-Jin},
  title     = {Learning Point Cloud Completion without Complete Point Clouds: A Pose-Aware Approach},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14203--14213},
}
Frequency Guidance Matters in Few-Shot Learning: Hao Cheng,

Siyuan Yang,

Joey Tianyi Zhou,

Lanqing Guo,

Bihan Wen; [pdf] [supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Hao and Yang, Siyuan and Zhou, Joey Tianyi and Guo, Lanqing and Wen, Bihan},
  title     = {Frequency Guidance Matters in Few-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {11814--11824},
}
Walking Your LiDOG: A Journey Through Multiple Domains for LiDAR Semantic Segmentation: Cristiano Saltori,

Aljosa Osep,

Elisa Ricci,

Laura Leal-Taixé; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Saltori_2023_ICCV,
  author    = {Saltori, Cristiano and Osep, Aljosa and Ricci, Elisa and Leal-Taix{\'e}, Laura},
  title     = {Walking Your {LiDOG}: A Journey Through Multiple Domains for {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {196--206},
}
Diverse Cotraining Makes Strong Semi-Supervised Segmentor: Yijiang Li,

Xinjiang Wang,

Lihe Yang,

Litong Feng,

Wayne Zhang,

Ying Gao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Yijiang and Wang, Xinjiang and Yang, Lihe and Feng, Litong and Zhang, Wayne and Gao, Ying},
  title     = {Diverse Cotraining Makes Strong Semi-Supervised Segmentor},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16055--16067},
}
Spherical Space Feature Decomposition for Guided Depth Map Super-Resolution: Zixiang Zhao,

Jiangshe Zhang,

Xiang Gu,

Chengli Tan,

Shuang Xu,

Yulun Zhang,

Radu Timofte,

Luc Van Gool; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Zixiang and Zhang, Jiangshe and Gu, Xiang and Tan, Chengli and Xu, Shuang and Zhang, Yulun and Timofte, Radu and Van Gool, Luc},
  title     = {Spherical Space Feature Decomposition for Guided Depth Map Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12547--12558},
}
Tiled Multiplane Images for Practical 3D Photography: Numair Khan,

Lei Xiao,

Douglas Lanman; [pdf] [arXiv]
[bibtex]
@InProceedings{Khan_2023_ICCV,
  author    = {Khan, Numair and Xiao, Lei and Lanman, Douglas},
  title     = {Tiled Multiplane Images for Practical {3D} Photography},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10454--10464},
}
VQA-GNN: Reasoning with Multimodal Knowledge via Graph Neural Networks for Visual Question Answering: Yanan Wang,

Michihiro Yasunaga,

Hongyu Ren,

Shinya Wada,

Jure Leskovec; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2023_ICCV,
  author    = {Wang, Yanan and Yasunaga, Michihiro and Ren, Hongyu and Wada, Shinya and Leskovec, Jure},
  title     = {{VQA-GNN}: Reasoning with Multimodal Knowledge via Graph Neural Networks for Visual Question Answering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21582--21592},
}
Unmasked Teacher: Towards Training-Efficient Video Foundation Models: Kunchang Li,

Yali Wang,

Yizhuo Li,

Yi Wang,

Yinan He,

Limin Wang,

Yu Qiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Kunchang and Wang, Yali and Li, Yizhuo and Wang, Yi and He, Yinan and Wang, Limin and Qiao, Yu},
  title     = {Unmasked Teacher: Towards Training-Efficient Video Foundation Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19948--19960},
}
Explore and Tell: Embodied Visual Captioning in 3D Environments: Anwen Hu,

Shizhe Chen,

Liang Zhang,

Qin Jin; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Anwen and Chen, Shizhe and Zhang, Liang and Jin, Qin},
  title     = {Explore and Tell: Embodied Visual Captioning in {3D} Environments},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2482--2491},
}
FastViT: A Fast Hybrid Vision Transformer Using Structural Reparameterization: Pavan Kumar Anasosalu Vasu,

James Gabriel,

Jeff Zhu,

Oncel Tuzel,

Anurag Ranjan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vasu_2023_ICCV,
  author    = {Vasu, Pavan Kumar Anasosalu and Gabriel, James and Zhu, Jeff and Tuzel, Oncel and Ranjan, Anurag},
  title     = {{FastViT}: A Fast Hybrid Vision Transformer Using Structural Reparameterization},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5785--5795},
}
OFVL-MS: Once for Visual Localization across Multiple Indoor Scenes: Tao Xie,

Kun Dai,

Siyi Lu,

Ke Wang,

Zhiqiang Jiang,

Jinghan Gao,

Dedong Liu,

Jie Xu,

Lijun Zhao,

Ruifeng Li; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Tao and Dai, Kun and Lu, Siyi and Wang, Ke and Jiang, Zhiqiang and Gao, Jinghan and Liu, Dedong and Xu, Jie and Zhao, Lijun and Li, Ruifeng},
  title     = {{OFVL-MS}: Once for Visual Localization across Multiple Indoor Scenes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {5516--5526},
}
HTML: Hybrid Temporal-scale Multimodal Learning Framework for Referring Video Object Segmentation: Mingfei Han,

Yali Wang,

Zhihui Li,

Lina Yao,

Xiaojun Chang,

Yu Qiao; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Mingfei and Wang, Yali and Li, Zhihui and Yao, Lina and Chang, Xiaojun and Qiao, Yu},
  title     = {{HTML}: Hybrid Temporal-scale Multimodal Learning Framework for Referring Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {13414--13423},
}
SQAD: Automatic Smartphone Camera Quality Assessment and Benchmarking: Zilin Fang,

Andrey Ignatov,

Eduard Zamfir,

Radu Timofte; [pdf] [supp]
[bibtex]
@InProceedings{Fang_2023_ICCV,
  author    = {Fang, Zilin and Ignatov, Andrey and Zamfir, Eduard and Timofte, Radu},
  title     = {{SQAD}: Automatic Smartphone Camera Quality Assessment and Benchmarking},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20532--20542},
}
PointDC: Unsupervised Semantic Segmentation of 3D Point Clouds via Cross-Modal Distillation and Super-Voxel Clustering: Zisheng Chen,

Hongbin Xu,

Weitao Chen,

Zhipeng Zhou,

Haihong Xiao,

Baigui Sun,

Xuansong Xie,

Wenxiong Kang; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zisheng and Xu, Hongbin and Chen, Weitao and Zhou, Zhipeng and Xiao, Haihong and Sun, Baigui and Xie, Xuansong and Kang, Wenxiong},
  title     = {{PointDC}: Unsupervised Semantic Segmentation of {3D} Point Clouds via Cross-Modal Distillation and Super-Voxel Clustering},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14290--14299},
}
MV-Map: Offboard HD-Map Generation with Multi-view Consistency: Ziyang Xie,

Ziqi Pang,

Yu-Xiong Wang; [pdf] [supp]
[bibtex]
@InProceedings{Xie_2023_ICCV,
  author    = {Xie, Ziyang and Pang, Ziqi and Wang, Yu-Xiong},
  title     = {{MV-Map}: Offboard {HD-Map} Generation with Multi-view Consistency},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8658--8668},
}
Multi-view Self-supervised Disentanglement for General Image Denoising: Hao Chen,

Chenyuan Qu,

Yu Zhang,

Chen Chen,

Jianbo Jiao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Hao and Qu, Chenyuan and Zhang, Yu and Chen, Chen and Jiao, Jianbo},
  title     = {Multi-view Self-supervised Disentanglement for General Image Denoising},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12281--12291},
}
Inter-Realization Channels: Unsupervised Anomaly Detection Beyond One-Class Classification: Declan McIntosh,

Alexandra Branzan Albu; [pdf] [supp]
[bibtex]
@InProceedings{McIntosh_2023_ICCV,
  author    = {McIntosh, Declan and Albu, Alexandra Branzan},
  title     = {Inter-Realization Channels: Unsupervised Anomaly Detection Beyond One-Class Classification},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {6285--6295},
}
Multi-Event Video-Text Retrieval: Gengyuan Zhang,

Jisen Ren,

Jindong Gu,

Volker Tresp; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Gengyuan and Ren, Jisen and Gu, Jindong and Tresp, Volker},
  title     = {Multi-Event Video-Text Retrieval},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {22113--22123},
}
SHERF: Generalizable Human NeRF from a Single Image: Shoukang Hu,

Fangzhou Hong,

Liang Pan,

Haiyi Mei,

Lei Yang,

Ziwei Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hu_2023_ICCV,
  author    = {Hu, Shoukang and Hong, Fangzhou and Pan, Liang and Mei, Haiyi and Yang, Lei and Liu, Ziwei},
  title     = {{SHERF}: Generalizable Human {NeRF} from a Single Image},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9352--9364},
}
MVPSNet: Fast Generalizable Multi-view Photometric Stereo: Dongxu Zhao,

Daniel Lichy,

Pierre-Nicolas Perrin,

Jan-Michael Frahm,

Soumyadip Sengupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Dongxu and Lichy, Daniel and Perrin, Pierre-Nicolas and Frahm, Jan-Michael and Sengupta, Soumyadip},
  title     = {{MVPSNet}: Fast Generalizable Multi-view Photometric Stereo},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12525--12536},
}
High Quality Entity Segmentation: Lu Qi,

Jason Kuen,

Tiancheng Shen,

Jiuxiang Gu,

Wenbo Li,

Weidong Guo,

Jiaya Jia,

Zhe Lin,

Ming-Hsuan Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qi_2023_ICCV,
  author    = {Qi, Lu and Kuen, Jason and Shen, Tiancheng and Gu, Jiuxiang and Li, Wenbo and Guo, Weidong and Jia, Jiaya and Lin, Zhe and Yang, Ming-Hsuan},
  title     = {High Quality Entity Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {4047--4056},
}
CoTDet: Affordance Knowledge Prompting for Task Driven Object Detection: Jiajin Tang,

Ge Zheng,

Jingyi Yu,

Sibei Yang; [pdf] [arXiv]
[bibtex]
@InProceedings{Tang_2023_ICCV,
  author    = {Tang, Jiajin and Zheng, Ge and Yu, Jingyi and Yang, Sibei},
  title     = {{CoTDet}: Affordance Knowledge Prompting for Task Driven Object Detection},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3068--3078},
}
You Never Get a Second Chance To Make a Good First Impression: Seeding Active Learning for 3D Semantic Segmentation: Nermin Samet,

Oriane Siméoni,

Gilles Puy,

Georgy Ponimatkin,

Renaud Marlet,

Vincent Lepetit; [pdf] [supp]
[bibtex]
@InProceedings{Samet_2023_ICCV,
  author    = {Samet, Nermin and Sim{\'e}oni, Oriane and Puy, Gilles and Ponimatkin, Georgy and Marlet, Renaud and Lepetit, Vincent},
  title     = {You Never Get a Second Chance To Make a Good First Impression: Seeding Active Learning for {3D} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18445--18457},
}
Scalable Multi-Temporal Remote Sensing Change Data Generation via Simulating Stochastic Change Process: Zhuo Zheng,

Shiqi Tian,

Ailong Ma,

Liangpei Zhang,

Yanfei Zhong; [pdf] [supp]
[bibtex]
@InProceedings{Zheng_2023_ICCV,
  author    = {Zheng, Zhuo and Tian, Shiqi and Ma, Ailong and Zhang, Liangpei and Zhong, Yanfei},
  title     = {Scalable Multi-Temporal Remote Sensing Change Data Generation via Simulating Stochastic Change Process},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21818--21827},
}
Human from Blur: Human Pose Tracking from Blurry Images: Yiming Zhao,

Denys Rozumnyi,

Jie Song,

Otmar Hilliges,

Marc Pollefeys,

Martin R. Oswald; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2023_ICCV,
  author    = {Zhao, Yiming and Rozumnyi, Denys and Song, Jie and Hilliges, Otmar and Pollefeys, Marc and Oswald, Martin R.},
  title     = {Human from Blur: Human Pose Tracking from Blurry Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14905--14915},
}
NerfAcc: Efficient Sampling Accelerates NeRFs: Ruilong Li,

Hang Gao,

Matthew Tancik,

Angjoo Kanazawa; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
  author    = {Li, Ruilong and Gao, Hang and Tancik, Matthew and Kanazawa, Angjoo},
  title     = {{NerfAcc}: Efficient Sampling Accelerates {NeRFs}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18537--18546},
}
A2Q: Accumulator-Aware Quantization with Guaranteed Overflow Avoidance: Ian Colbert,

Alessandro Pappalardo,

Jakoba Petri-Koenig; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Colbert_2023_ICCV,
  author    = {Colbert, Ian and Pappalardo, Alessandro and Petri-Koenig, Jakoba},
  title     = {{A2Q}: Accumulator-Aware Quantization with Guaranteed Overflow Avoidance},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {16989--16998},
}
Uni-3D: A Universal Model for Panoptic 3D Scene Reconstruction: Xiang Zhang,

Zeyuan Chen,

Fangyin Wei,

Zhuowen Tu; [pdf]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Xiang and Chen, Zeyuan and Wei, Fangyin and Tu, Zhuowen},
  title     = {{Uni-3D}: A Universal Model for Panoptic {3D} Scene Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9256--9266},
}
ARNOLD: A Benchmark for Language-Grounded Task Learning with Continuous States in Realistic 3D Scenes: Ran Gong,

Jiangyong Huang,

Yizhou Zhao,

Haoran Geng,

Xiaofeng Gao,

Qingyang Wu,

Wensi Ai,

Ziheng Zhou,

Demetri Terzopoulos,

Song-Chun Zhu,

Baoxiong Jia,

Siyuan Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Gong_2023_ICCV,
  author    = {Gong, Ran and Huang, Jiangyong and Zhao, Yizhou and Geng, Haoran and Gao, Xiaofeng and Wu, Qingyang and Ai, Wensi and Zhou, Ziheng and Terzopoulos, Demetri and Zhu, Song-Chun and Jia, Baoxiong and Huang, Siyuan},
  title     = {{ARNOLD}: A Benchmark for Language-Grounded Task Learning with Continuous States in Realistic {3D} Scenes},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20483--20495},
}
Full-Body Articulated Human-Object Interaction: Nan Jiang,

Tengyu Liu,

Zhexuan Cao,

Jieming Cui,

Zhiyuan Zhang,

Yixin Chen,

He Wang,

Yixin Zhu,

Siyuan Huang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jiang_2023_ICCV,
  author    = {Jiang, Nan and Liu, Tengyu and Cao, Zhexuan and Cui, Jieming and Zhang, Zhiyuan and Chen, Yixin and Wang, He and Zhu, Yixin and Huang, Siyuan},
  title     = {Full-Body Articulated Human-Object Interaction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9365--9376},
}
FeatureNeRF: Learning Generalizable NeRFs by Distilling Foundation Models: Jianglong Ye,

Naiyan Wang,

Xiaolong Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Jianglong and Wang, Naiyan and Wang, Xiaolong},
  title     = {{FeatureNeRF}: Learning Generalizable {NeRFs} by Distilling Foundation Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8962--8973},
}
SRFormer: Permuted Self-Attention for Single Image Super-Resolution: Yupeng Zhou,

Zhen Li,

Chun-Le Guo,

Song Bai,

Ming-Ming Cheng,

Qibin Hou; [pdf] [arXiv]
[bibtex]
@InProceedings{Zhou_2023_ICCV,
  author    = {Zhou, Yupeng and Li, Zhen and Guo, Chun-Le and Bai, Song and Cheng, Ming-Ming and Hou, Qibin},
  title     = {{SRFormer}: Permuted Self-Attention for Single Image Super-Resolution},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {12780--12791},
}
Deep Homography Mixture for Single Image Rolling Shutter Correction: Weilong Yan,

Robby T. Tan,

Bing Zeng,

Shuaicheng Liu; [pdf]
[bibtex]
@InProceedings{Yan_2023_ICCV,
  author    = {Yan, Weilong and Tan, Robby T. and Zeng, Bing and Liu, Shuaicheng},
  title     = {Deep Homography Mixture for Single Image Rolling Shutter Correction},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {9868--9877},
}
Audio-Visual Glance Network for Efficient Video Recognition: Muhammad Adi Nugroho,

Sangmin Woo,

Sumin Lee,

Changick Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nugroho_2023_ICCV,
  author    = {Nugroho, Muhammad Adi and Woo, Sangmin and Lee, Sumin and Kim, Changick},
  title     = {Audio-Visual Glance Network for Efficient Video Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10150--10159},
}
CLNeRF: Continual Learning Meets NeRF: Zhipeng Cai,

Matthias Müller; [pdf] [supp]
[bibtex]
@InProceedings{Cai_2023_ICCV,
  author    = {Cai, Zhipeng and M{\"u}ller, Matthias},
  title     = {{CLNeRF}: Continual Learning Meets {NeRF}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23185--23194},
}
Rendering Humans from Object-Occluded Monocular Videos: Tiange Xiang,

Adam Sun,

Jiajun Wu,

Ehsan Adeli,

Li Fei-Fei; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Xiang_2023_ICCV,
  author    = {Xiang, Tiange and Sun, Adam and Wu, Jiajun and Adeli, Ehsan and Fei-Fei, Li},
  title     = {Rendering Humans from Object-Occluded Monocular Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {3239--3250},
}
CrossMatch: Source-Free Domain Adaptive Semantic Segmentation via Cross-Modal Consistency Training: Yifang Yin,

Wenmiao Hu,

Zhenguang Liu,

Guanfeng Wang,

Shili Xiang,

Roger Zimmermann; [pdf]
[bibtex]
@InProceedings{Yin_2023_ICCV,
  author    = {Yin, Yifang and Hu, Wenmiao and Liu, Zhenguang and Wang, Guanfeng and Xiang, Shili and Zimmermann, Roger},
  title     = {{CrossMatch}: Source-Free Domain Adaptive Semantic Segmentation via Cross-Modal Consistency Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21786--21796},
}
Out-of-Distribution Detection for Monocular Depth Estimation: Julia Hornauer,

Adrian Holzbock,

Vasileios Belagiannis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hornauer_2023_ICCV,
  author    = {Hornauer, Julia and Holzbock, Adrian and Belagiannis, Vasileios},
  title     = {Out-of-Distribution Detection for Monocular Depth Estimation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {1911--1921},
}
STEPs: Self-Supervised Key Step Extraction and Localization from Unlabeled Procedural Videos: Anshul Shah,

Benjamin Lundell,

Harpreet Sawhney,

Rama Chellappa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shah_2023_ICCV,
  author    = {Shah, Anshul and Lundell, Benjamin and Sawhney, Harpreet and Chellappa, Rama},
  title     = {{STEPs}: Self-Supervised Key Step Extraction and Localization from Unlabeled Procedural Videos},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {10375--10387},
}
Improving Equivariance in State-of-the-Art Supervised Depth and Normal Predictors: Yuanyi Zhong,

Anand Bhattad,

Yu-Xiong Wang,

David Forsyth; [pdf] [supp]
[bibtex]
@InProceedings{Zhong_2023_ICCV,
  author    = {Zhong, Yuanyi and Bhattad, Anand and Wang, Yu-Xiong and Forsyth, David},
  title     = {Improving Equivariance in State-of-the-Art Supervised Depth and Normal Predictors},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21775--21785},
}
Towards Robust and Smooth 3D Multi-Person Pose Estimation from Monocular Videos in the Wild: Sungchan Park,

Eunyi You,

Inhoe Lee,

Joonseok Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2023_ICCV,
  author    = {Park, Sungchan and You, Eunyi and Lee, Inhoe and Lee, Joonseok},
  title     = {Towards Robust and Smooth {3D} Multi-Person Pose Estimation from Monocular Videos in the Wild},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {14772--14782},
}
Reducing Training Time in Cross-Silo Federated Learning Using Multigraph Topology: Tuong Do,

Binh X. Nguyen,

Vuong Pham,

Toan Tran,

Erman Tjiputra,

Quang D. Tran,

Anh Nguyen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Do_2023_ICCV,
  author    = {Do, Tuong and Nguyen, Binh X. and Pham, Vuong and Tran, Toan and Tjiputra, Erman and Tran, Quang D. and Nguyen, Anh},
  title     = {Reducing Training Time in Cross-Silo Federated Learning Using Multigraph Topology},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {19409--19419},
}
Counting Crowds in Bad Weather: Zhi-Kai Huang,

Wei-Ting Chen,

Yuan-Chun Chiang,

Sy-Yen Kuo,

Ming-Hsuan Yang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
  author    = {Huang, Zhi-Kai and Chen, Wei-Ting and Chiang, Yuan-Chun and Kuo, Sy-Yen and Yang, Ming-Hsuan},
  title     = {Counting Crowds in Bad Weather},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23308--23319},
}
FreeDoM: Training-Free Energy-Guided Conditional Diffusion Model: Jiwen Yu,

Yinhuai Wang,

Chen Zhao,

Bernard Ghanem,

Jian Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yu_2023_ICCV,
  author    = {Yu, Jiwen and Wang, Yinhuai and Zhao, Chen and Ghanem, Bernard and Zhang, Jian},
  title     = {{FreeDoM}: Training-Free Energy-Guided Conditional Diffusion Model},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {23174--23184},
}
UniT3D: A Unified Transformer for 3D Dense Captioning and Visual Grounding: Zhenyu Chen,

Ronghang Hu,

Xinlei Chen,

Matthias Nießner,

Angel X. Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Zhenyu and Hu, Ronghang and Chen, Xinlei and Nie{\ss}ner, Matthias and Chang, Angel X.},
  title     = {{UniT3D}: A Unified Transformer for {3D} Dense Captioning and Visual Grounding},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18109--18119},
}
SKiT: a Fast Key Information Video Transformer for Online Surgical Phase Recognition: Yang Liu,

Jiayu Huo,

Jingjing Peng,

Rachel Sparks,

Prokar Dasgupta,

Alejandro Granados,

Sebastien Ourselin; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2023_ICCV,
  author    = {Liu, Yang and Huo, Jiayu and Peng, Jingjing and Sparks, Rachel and Dasgupta, Prokar and Granados, Alejandro and Ourselin, Sebastien},
  title     = {{SKiT}: a Fast Key Information Video Transformer for Online Surgical Phase Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21074--21084},
}
Clustering based Point Cloud Representation Learning for 3D Analysis: Tuo Feng,

Wenguan Wang,

Xiaohan Wang,

Yi Yang,

Qinghua Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Feng_2023_ICCV,
  author    = {Feng, Tuo and Wang, Wenguan and Wang, Xiaohan and Yang, Yi and Zheng, Qinghua},
  title     = {Clustering based Point Cloud Representation Learning for {3D} Analysis},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8283--8294},
}
Automatic Network Pruning via Hilbert-Schmidt Independence Criterion Lasso under Information Bottleneck Principle: Song Guo,

Lei Zhang,

Xiawu Zheng,

Yan Wang,

Yuchao Li,

Fei Chao,

Chenglin Wu,

Shengchuan Zhang,

Rongrong Ji; [pdf] [supp]
[bibtex]
@InProceedings{Guo_2023_ICCV,
  author    = {Guo, Song and Zhang, Lei and Zheng, Xiawu and Wang, Yan and Li, Yuchao and Chao, Fei and Wu, Chenglin and Zhang, Shengchuan and Ji, Rongrong},
  title     = {Automatic Network Pruning via {Hilbert-Schmidt} Independence Criterion Lasso under Information Bottleneck Principle},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {17458--17469},
}
Forecast-MAE: Self-supervised Pre-training for Motion Forecasting with Masked Autoencoders: Jie Cheng,

Xiaodong Mei,

Ming Liu; [pdf] [supp]
[bibtex]
@InProceedings{Cheng_2023_ICCV,
  author    = {Cheng, Jie and Mei, Xiaodong and Liu, Ming},
  title     = {{Forecast-MAE}: Self-supervised Pre-training for Motion Forecasting with Masked Autoencoders},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8679--8689},
}
Efficient Transformer-based 3D Object Detection with Dynamic Token Halting: Mao Ye,

Gregory P. Meyer,

Yuning Chai,

Qiang Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ye_2023_ICCV,
  author    = {Ye, Mao and Meyer, Gregory P. and Chai, Yuning and Liu, Qiang},
  title     = {Efficient Transformer-based {3D} Object Detection with Dynamic Token Halting},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {8438--8450},
}
Neglected Free Lunch - Learning Image Classifiers Using Annotation Byproducts: Dongyoon Han,

Junsuk Choe,

Seonghyeok Chun,

John Joon Young Chung,

Minsuk Chang,

Sangdoo Yun,

Jean Y. Song,

Seong Joon Oh; [pdf] [supp]
[bibtex]
@InProceedings{Han_2023_ICCV,
  author    = {Han, Dongyoon and Choe, Junsuk and Chun, Seonghyeok and Chung, John Joon Young and Chang, Minsuk and Yun, Sangdoo and Song, Jean Y. and Oh, Seong Joon},
  title     = {Neglected Free Lunch -- Learning Image Classifiers Using Annotation Byproducts},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20200--20212},
}
Rethinking the Role of Pre-Trained Networks in Source-Free Domain Adaptation: Wenyu Zhang,

Li Shen,

Chuan-Sheng Foo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Wenyu and Shen, Li and Foo, Chuan-Sheng},
  title     = {Rethinking the Role of Pre-Trained Networks in Source-Free Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {18841--18851},
}
RLIPv2: Fast Scaling of Relational Language-Image Pre-Training: Hangjie Yuan,

Shiwei Zhang,

Xiang Wang,

Samuel Albanie,

Yining Pan,

Tao Feng,

Jianwen Jiang,

Dong Ni,

Yingya Zhang,

Deli Zhao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yuan_2023_ICCV,
  author    = {Yuan, Hangjie and Zhang, Shiwei and Wang, Xiang and Albanie, Samuel and Pan, Yining and Feng, Tao and Jiang, Jianwen and Ni, Dong and Zhang, Yingya and Zhao, Deli},
  title     = {{RLIPv2}: Fast Scaling of Relational Language-Image Pre-Training},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {21649--21661},
}
TransFace: Calibrating Transformer Training for Face Recognition from a Data-Centric Perspective: Jun Dan,

Yang Liu,

Haoyu Xie,

Jiankang Deng,

Haoran Xie,

Xuansong Xie,

Baigui Sun; [pdf] [arXiv]
[bibtex]
@InProceedings{Dan_2023_ICCV,
  author    = {Dan, Jun and Liu, Yang and Xie, Haoyu and Deng, Jiankang and Xie, Haoran and Xie, Xuansong and Sun, Baigui},
  title     = {{TransFace}: Calibrating Transformer Training for Face Recognition from a Data-Centric Perspective},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {20642--20653},
}
LLM-Planner: Few-Shot Grounded Planning for Embodied Agents with Large Language Models: Chan Hee Song,

Jiaman Wu,

Clayton Washington,

Brian M. Sadler,

Wei-Lun Chao,

Yu Su; [pdf] [supp]
[bibtex]
@InProceedings{Song_2023_ICCV,
  author    = {Song, Chan Hee and Wu, Jiaman and Washington, Clayton and Sadler, Brian M. and Chao, Wei-Lun and Su, Yu},
  title     = {{LLM-Planner}: Few-Shot Grounded Planning for Embodied Agents with Large Language Models},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
  month     = oct,
  year      = {2023},
  pages     = {2998--3009},
}
Exploring Model Transferability through the Lens of Potential Energy: Xiaotong Li,

Zixuan Hu,

Yixiao Ge,

Ying Shan,

Ling-Yu Duan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Li_2023_ICCV,
    author    = {Li, Xiaotong and Hu, Zixuan and Ge, Yixiao and Shan, Ying and Duan, Ling-Yu},
    title     = {Exploring Model Transferability through the Lens of Potential Energy},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {5429--5438},
}
Video Task Decathlon: Unifying Image and Video Tasks in Autonomous Driving: Thomas E. Huang,

Yifan Liu,

Luc Van Gool,

Fisher Yu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Huang_2023_ICCV,
    author    = {Huang, Thomas E. and Liu, Yifan and Van Gool, Luc and Yu, Fisher},
    title     = {Video Task Decathlon: Unifying Image and Video Tasks in Autonomous Driving},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {8647--8657},
}
Aria Digital Twin: A New Benchmark Dataset for Egocentric 3D Machine Perception: Xiaqing Pan,

Nicholas Charron,

Yongqian Yang,

Scott Peters,

Thomas Whelan,

Chen Kong,

Omkar Parkhi,

Richard Newcombe,

Yuheng (Carl) Ren; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Pan_2023_ICCV,
    author    = {Pan, Xiaqing and Charron, Nicholas and Yang, Yongqian and Peters, Scott and Whelan, Thomas and Kong, Chen and Parkhi, Omkar and Newcombe, Richard and Ren, Yuheng (Carl)},
    title     = {{Aria} Digital Twin: A New Benchmark Dataset for Egocentric {3D} Machine Perception},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {20133--20143},
}
PreSTU: Pre-Training for Scene-Text Understanding: Jihyung Kil,

Soravit Changpinyo,

Xi Chen,

Hexiang Hu,

Sebastian Goodman,

Wei-Lun Chao,

Radu Soricut; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kil_2023_ICCV,
    author    = {Kil, Jihyung and Changpinyo, Soravit and Chen, Xi and Hu, Hexiang and Goodman, Sebastian and Chao, Wei-Lun and Soricut, Radu},
    title     = {{PreSTU}: Pre-Training for Scene-Text Understanding},
    booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    month     = oct,
    year      = {2023},
    pages     = {15270--15280},
}; Back