Papers
- Back
ATM: Enhanced Alignment for Text-to-Motion Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2026_WACV,
    author    = {Han, Ke and Lyu, Yueming and Yu, Weichen and Sebe, Nicu},
    title     = {{ATM}: Enhanced Alignment for Text-to-Motion Generation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6862--6872}
}
Contrastive Integrated Gradients: A Feature Attribution-Based Method for Explaining Whole Slide Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vu_2026_WACV,
    author    = {Vu, Anh Mai and Vo, Tuan L. and Bui, Ngoc Lam Quang and Le, Nam N. B. and Awasthi, Akash and Vo, Huy Q. and Nguyen, Thanh-Huy and Han, Zhu and Mohan, Chandra and Van Nguyen, Hien},
    title     = {Contrastive Integrated Gradients: A Feature Attribution-Based Method for Explaining Whole Slide Image Classification},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1201--1210}
}
Forget Less by Learning Together through Concept Consolidation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kaushik_2026_WACV,
    author    = {Kaushik, Arjun Ramesh and Devulapally, Naresh Kumar and Lokhande, Vishnu Suresh and Ratha, Nalini and Govindaraju, Venu},
    title     = {Forget Less by Learning Together through Concept Consolidation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {265--275}
}
GFT: Graph Feature Tuning for Efficient Point Cloud Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhakal_2026_WACV,
    author    = {Dhakal, Manish and Dasari, Venkat R. and Sunderraman, Rajshekhar and Ding, Yi},
    title     = {{GFT}: Graph Feature Tuning for Efficient Point Cloud Analysis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7955--7964}
}
Scalpel: Fine-Grained Alignment of Attention Activation Manifolds via Mixture Gaussian Bridges to Mitigate Multimodal Hallucination-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shi_2026_WACV,
    author    = {Shi, Ziqiang and Liu, Rujie and Yu, Shanshan and Munakata, Satoshi and Shirahata, Koichi},
    title     = {Scalpel: Fine-Grained Alignment of Attention Activation Manifolds via Mixture {Gaussian} Bridges to Mitigate Multimodal Hallucination},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2964--2973}
}
MMCM: Multimodality-aware Metric using Clustering-based Modes for Probabilistic Human Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tokoro_2026_WACV,
    author    = {Tokoro, Kyotaro and Taketsugu, Hiromu and Ukita, Norimichi},
    title     = {{MMCM}: Multimodality-aware Metric using Clustering-based Modes for Probabilistic Human Motion Prediction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2637--2647}
}
ScoliGaitX: A Deep Multi-Modal Fusion Network for Scoliosis Assessment via Gait Video Analysis-
[pdf]
[bibtex]@InProceedings{Vishwakarma_2026_WACV,
    author    = {Vishwakarma, Kaushik and Nigam, Aditya},
    title     = {{ScoliGaitX}: A Deep Multi-Modal Fusion Network for Scoliosis Assessment via Gait Video Analysis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2404--2413}
}
OpenCowID: Zero-Shot Visual Identification of Dairy Cows-
[pdf]
[bibtex]@InProceedings{Prabhune_2026_WACV,
    author    = {Prabhune, Omkar and Kim, Younghyun},
    title     = {{OpenCowID}: Zero-Shot Visual Identification of Dairy Cows},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1491--1500}
}
FG-TRACER: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Saporita_2026_WACV,
    author    = {Saporita, Alessia and Pipoli, Vittorio and Bolelli, Federico and Baraldi, Lorenzo and Acquaviva, Andrea and Ficarra, Elisa},
    title     = {{FG-TRACER}: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7903--7912}
}
SpikeRain: Towards Energy-Efficient Single Image Deraining with Spiking Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Islam_2026_WACV,
    author    = {Islam, Md Tanvir and Alam, Inzamamul and Bakshi, Sambit and Muhammad, Khan and Del Ser, Javier and Ahn, Sangtae},
    title     = {{SpikeRain}: Towards Energy-Efficient Single Image Deraining with Spiking Neural Networks},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1094--1105}
}
CAST: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores-
[pdf]
[bibtex]@InProceedings{Bai_2026_WACV,
    author    = {Bai, Jin and Hager, Gregory D.},
    title     = {{CAST}: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7260--7268}
}
NavMapFusion: Diffusion-based Fusion of Navigation Maps for Online Vectorized HD Map Construction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Monninger_2026_WACV,
    author    = {Monninger, Thomas and Zhang, Zihan and Staab, Steffen and Ding, Sihao},
    title     = {{NavMapFusion}: Diffusion-based Fusion of Navigation Maps for Online Vectorized {HD} Map Construction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7945--7954}
}
DREAM: Dynamic Prompts and GuidedMix for Efficient Continual Adaptation of Visual-Language Models-
[pdf]
[bibtex]@InProceedings{Chee_2026_WACV,
    author    = {Chee, Evelyn and Lee, Mong Li and Hsu, Wynne},
    title     = {{DREAM}: Dynamic Prompts and {GuidedMix} for Efficient Continual Adaptation of Visual-Language Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5853--5863}
}
SynPlay: Large-Scale Synthetic Human Data with Real-World Diversity for Aerial-View Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yim_2026_WACV,
    author    = {Yim, Jinsub and Lee, Hyungtae and Eum, Sungmin and Shen, Yi-Ting and Zhang, Yan and Kwon, Heesung and Bhattacharyya, Shuvra S.},
    title     = {{SynPlay}: Large-Scale Synthetic Human Data with Real-World Diversity for Aerial-View Perception},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {938--947}
}
Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2026_WACV,
    author    = {Song, Liyang and Bishnoi, Hardik and Manne, Sai Kumar Reddy and Ostadabbas, Sarah and Taylor, Briana J. and Wan, Michael},
    title     = {Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6340--6349}
}
SIAM: Synchronous Interaction Attention for Human Mesh Recovery-
[pdf]
[supp]
[bibtex]@InProceedings{Ahmad_2026_WACV,
    author    = {Ahmad, Niaz and Ullah, Saif and Lee, Youngmoon and Wang, Guanghui},
    title     = {{SIAM}: Synchronous Interaction Attention for Human Mesh Recovery},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4535--4545}
}
OW-Rep: Open World Object Detection with Instance Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV,
    author    = {Lee, Sunoh and Jeon, Minsik and Min, Jihong and Seo, Junwon},
    title     = {{OW-Rep}: Open World Object Detection with Instance Representation Learning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {339--349}
}
Training-free Multi-view 4D Human Motion Reconstruction Virtual Reality System-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV,
    author    = {Li, Yijie and Zheng, Ce and He, Yijie and Julin, Joel and Ichikari, Ryosuke and Ogiso, Satoki and Nakae, Satoshi and Sato, Akihiro and Kurata, Takeshi and Jeni, Laszlo A.},
    title     = {Training-free Multi-view {4D} Human Motion Reconstruction Virtual Reality System},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {318--327}
}
Beyond the Encoder: Joint Encoder-Decoder Contrastive Pre-Training Improves Dense Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Quetin_2026_WACV,
    author    = {Quetin, S{\'e}bastien and Ghosh, Tapotosh and Maleki, Farhad},
    title     = {Beyond the Encoder: Joint Encoder-Decoder Contrastive Pre-Training Improves Dense Prediction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1000--1010}
}
Discrete Facial Encoding: A Framework for Data-driven Facial Display Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tran_2026_WACV,
    author    = {Tran, Minh and Siniukov, Maksim and Jin, Zhangyu and Soleymani, Mohammad},
    title     = {Discrete Facial Encoding: A Framework for Data-driven Facial Display Discovery},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2348--2358}
}
Zero-shot Hierarchical Plant Segmentation via Foundation Segmentation Models and Text-to-image Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xing_2026_WACV,
    author    = {Xing, Junhao and Miyakawa, Ryohei and Yang, Yang and Liu, Xinpeng and Shinoda, Risa and Santo, Hiroaki and Toda, Yosuke and Okura, Fumio},
    title     = {Zero-shot Hierarchical Plant Segmentation via Foundation Segmentation Models and Text-to-image Attention},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2510--2519}
}
Semi-supervised Domain Adaptation via Mutual Alignment through Joint Error-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2026_WACV,
    author    = {Zhang, Dexuan and Westfechtel, Thomas and Harada, Tatsuya},
    title     = {Semi-supervised Domain Adaptation via Mutual Alignment through Joint Error},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5426--5436}
}
Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Suzuki_2026_WACV,
    author    = {Suzuki, Satoshi and Yamaguchi, Shin'ya and Takeda, Shoichiro and Kaneko, Takuhiro and Orihashi, Shota and Masumura, Ryo},
    title     = {Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6464--6473}
}
VISTA: A Vision and Intent-Aware Social Attention Framework for Multi-Agent Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Da_Silva_Martins_2026_WACV,
    author    = {Da Silva Martins, Stephane and Aldea, Emanuel and Le H{\'e}garat-Mascle, Sylvie},
    title     = {{VISTA}: A Vision and Intent-Aware Social Attention Framework for Multi-Agent Trajectory Prediction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {287--296}
}
IMKD: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mishra_2026_WACV,
    author    = {Mishra, Shashank and Patil, Karan and Stricker, Didier and Rambach, Jason},
    title     = {{IMKD}: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6027--6038}
}
WWE-UIE: A Wavelet & White Balance Efficient Network for Underwater Image Enhancement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV,
    author    = {Cheng, Ching-Heng and Lee, Jen-Wei and Lee, Chia-Ming and Hsu, Chih-Chung},
    title     = {{WWE-UIE}: A Wavelet \& White Balance Efficient Network for Underwater Image Enhancement},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2135--2145}
}
Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Laria_2026_WACV,
    author    = {Laria, H{\'e}ctor and Gomez-Villa, Alexandra and Qin, Jiang and Butt, Muhammad Atif and Raducanu, Bogdan and Vazquez-Corral, Javier and van de Weijer, Joost and Wang, Kai},
    title     = {Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7689--7698}
}
ForestSplats: Deformable Transient Field for Gaussian Splatting in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV,
    author    = {Park, Wongi and Nam, Myeongseok and Kim, Siwon and Jo, Sangwoo and Lee, Soomok},
    title     = {{ForestSplats}: Deformable Transient Field for {Gaussian} Splatting in the Wild},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6978--6987}
}
3D Cell Oversegmentation Correction via Geo-Wasserstein Divergence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV,
    author    = {Chen, Peter and Chang, Bryan and Creasey, Olivia A. and Sneddon, Julie Beth and Gartner, Zev J. and Liu, Yining},
    title     = {{3D} Cell Oversegmentation Correction via {Geo-Wasserstein} Divergence},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7534--7543}
}
STRinGS: Selective Text Refinement in Gaussian Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Raundhal_2026_WACV,
    author    = {Raundhal, Abhinav and Behera, Gaurav and Narayanan, P. J. and Sarvadevabhatla, Ravi Kiran and Tapaswi, Makarand},
    title     = {{STRinGS}: Selective Text Refinement in {Gaussian} Splatting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8574--8583}
}
DARB-Splatting: Generalizing Splatting with Decaying Anisotropic Radial Basis Functions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pramuditha_2026_WACV,
    author    = {Pramuditha, Hashiru and Viruthshaan, Vinasirajan and Arunan, Vishagar and Nazar, Saeedha and Ramasinghe, Sameera and Lucey, Simon and Rodrigo, Ranga},
    title     = {{DARB-Splatting}: Generalizing Splatting with Decaying Anisotropic Radial Basis Functions},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4504--4514}
}
DenseBEV: Transforming BEV Grid Cells into 3D Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Dahling_2026_WACV,
    author    = {D{\"a}hling, Marius and Krebs, Sebastian and Z{\"o}llner, J. Marius},
    title     = {{DenseBEV}: Transforming {BEV} Grid Cells into {3D} Objects},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2370--2379}
}
Sun-E: Dataset and Benchmark for Event-Based Sun Sensing-
[pdf]
[bibtex]@InProceedings{Dolan_2026_WACV,
    author    = {Dolan, Sydney and Golkar, Alessandro},
    title     = {{Sun-E}: Dataset and Benchmark for Event-Based Sun Sensing},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4818--4826}
}
SceneEdited: A City-Scale Benchmark for 3D HD Map Updating via Image-Guided Change Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV,
    author    = {Lin, Chun-Jung and Chin, Tat-Jun and Garg, Sourav and Dayoub, Feras},
    title     = {{SceneEdited}: A City-Scale Benchmark for {3D} {HD} Map Updating via Image-Guided Change Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6330--6339}
}
Learning from Unknown for Open-Set Test-Time Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Rafi_2026_WACV,
    author    = {Rafi, Taki Hasan and Agarwal, Amit and Patel, Hitesh L. and Chae, Dong-Kyu},
    title     = {Learning from Unknown for Open-Set Test-Time Adaptation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2993--3004}
}
Enhanced Back-Projection of Vision Features for 3D Symmetry Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Aguirre_2026_WACV,
    author    = {Aguirre, Isaac and Sipiran, Ivan},
    title     = {Enhanced Back-Projection of Vision Features for {3D} Symmetry Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {66--76}
}
START: Spatial and Textual Learning for Chart Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV,
    author    = {Liu, Zhuoming and Gao, Xiaofeng and Niu, Feiyang and Gao, Qiaozi and Liu, Liu and Piramuthu, Robinson},
    title     = {{START}: Spatial and Textual Learning for Chart Understanding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8146--8156}
}
Tables Guide Vision: Learning to See the Heart through Tabular Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hasny_2026_WACV,
    author    = {Hasny, Marta and Di Folco, Maxime and Bressem, Keno and Schnabel, Julia},
    title     = {Tables Guide Vision: Learning to See the Heart through Tabular Data},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1716--1725}
}
Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Honda_2026_WACV,
    author    = {Honda, Hiroto},
    title     = {Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7493--7502}
}
AugMapNet: Improving Spatial Latent Structure via BEV Grid Augmentation for Enhanced Vectorized Online HD Map Construction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Monninger_2026_WACV_AugMapNet,
    author    = {Monninger, Thomas and Anwar, Md Zafar and Antol, Stanislaw and Staab, Steffen and Ding, Sihao},
    title     = {{AugMapNet}: Improving Spatial Latent Structure via {BEV} Grid Augmentation for Enhanced Vectorized Online {HD} Map Construction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8541--8550}
}
Sketch-guided Cage-based 3D Gaussian Splatting Deformation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xie_2026_WACV,
    author    = {Xie, Tianhao and Aigerman, Noam and Belilovsky, Eugene and Popa, Tiberiu},
    title     = {Sketch-guided Cage-based {3D} {Gaussian} Splatting Deformation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3658--3667}
}
Mem-MLP: Real-Time 3D Human Motion Generation from Sparse Inputs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mutlu_2026_WACV,
    author    = {Mutlu, Sinan and Angelis, Georgios F. and Ozkan, Savas and Wisbey, Paul and Drosou, Anastasios and Ozay, Mete},
    title     = {{Mem-MLP}: Real-Time {3D} Human Motion Generation from Sparse Inputs},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8343--8352}
}
RapidMV: Leveraging Spatio-Angular Latent Space for Efficient and Consistent Text-to-Multi-View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
    author    = {Kim, Seungwook and Shi, Yichun and Li, Kejie and Cho, Minsu and Wang, Peng},
    title     = {{RapidMV}: Leveraging Spatio-Angular Latent Space for Efficient and Consistent Text-to-Multi-View Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1674--1684}
}
BrandFusion: Aligning Image Generation with Brand Styles-
[pdf]
[supp]
[bibtex]@InProceedings{Gupta_2026_WACV,
    author    = {Gupta, Parul and Khurana, Varun and Singla, Yaman Kumar and Krishnamurthy, Balaji and Dhall, Abhinav},
    title     = {{BrandFusion}: Aligning Image Generation with Brand Styles},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2316--2326}
}
SurgXBench: Explainable Vision-Language Model Benchmark for Surgery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV_SurgXBench,
    author    = {Cheng, Jiajun and Zhao, Xianwu and Liu, Sainan and Yu, Xiaofan and Prakash, Ravi and Codd, Patrick J. and Katz, Jonathan Elliott and Lin, Shan},
    title     = {{SurgXBench}: Explainable Vision-Language Model Benchmark for Surgery},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8188--8198}
}
SCALEX: Scalable Concept and Latent Exploration for Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zeng_2026_WACV,
    author    = {Zeng, E. Zhixuan and Chen, Yuhao and Wong, Alexander},
    title     = {{SCALEX}: Scalable Concept and Latent Exploration for Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3617--3627}
}
CanKD: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2026_WACV,
    author    = {Sun, Shizhe and Ohyama, Wataru},
    title     = {{CanKD}: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8606--8616}
}
Reverse Personalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kung_2026_WACV,
    author    = {Kung, Han-Wei and Varanka, Tuomas and Sebe, Nicu},
    title     = {Reverse Personalization},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {988--999}
}
HumanBench: Two Heads, No Legs, But Mostly Human, the State of Generative Capabilities in T2I Models-
[pdf]
[supp]
[bibtex]@InProceedings{Jain_2026_WACV,
    author    = {Jain, Anubhooti and Vatsa, Mayank and Singh, Richa},
    title     = {{HumanBench}: Two Heads, No Legs, But Mostly Human, the State of Generative Capabilities in {T2I} Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4087--4096}
}
SmokeBench: Evaluating Multimodal Large Language Models for Wildfire Smoke Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qi_2026_WACV,
    author    = {Qi, Tianye and Li, Weihao and Barnes, Nick},
    title     = {{SmokeBench}: Evaluating Multimodal Large Language Models for Wildfire Smoke Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1043--1053}
}
ObjectCore - Efficient Few-shot Logical Anomaly Detection using Object Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Fucka_2026_WACV,
    author    = {Fu{\v{c}}ka, Matic and Zavrtanik, Vitjan and Sko{\v{c}}aj, Danijel},
    title     = {{ObjectCore} - Efficient Few-shot Logical Anomaly Detection using Object Representations},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3857--3867}
}
CLIP-IT: CLIP-based Pairing of Histology Images with Privileged Textual Information-
[pdf]
[supp]
[bibtex]@InProceedings{Karimian_2026_WACV,
    author    = {Karimian, Banafsheh and Avanzato, Giulia and Belharbi, Soufiane and Guichemerre, Alexis and McCaffrey, Luke and Shateri, Mohammadhadi and Granger, Eric},
    title     = {{CLIP-IT}: {CLIP-based} Pairing of Histology Images with Privileged Textual Information},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3700--3709}
}
UniTabBank: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Mondal_2026_WACV,
    author    = {Mondal, Ajoy and Mundra, Saumya and Dasgupta, Avijit and Jawahar, C. V.},
    title     = {{UniTabBank}: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6486--6495}
}
Temporal Object Captioning for Street Scene Videos from LiDAR Tracks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gopinathan_2026_WACV,
    author    = {Gopinathan, Vignesh and Zimmermann, Urs and Arnold, Michael and Rottmann, Matthias},
    title     = {Temporal Object Captioning for Street Scene Videos from {LiDAR} Tracks},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {2848--2857}
}
MDUNet: Multimodal Decoding UNet for Passive Occluder-Aided Non-line-of-sight 3D Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Raji_2026_WACV,
    author    = {Raji, Fadlullah and Murray-Bruce, John},
    title     = {{MDUNet}: Multimodal Decoding {UNet} for Passive Occluder-Aided Non-line-of-sight {3D} Imaging},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {461--471}
}
Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations-
[pdf]
[bibtex]@InProceedings{Jha_2026_WACV,
    author    = {Jha, Prachi and Bhatia, Sumit and Bedathur, Srikanta},
    title     = {Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7832--7841}
}
Gaussian Swaying: Surface-Based Framework for Aerodynamic Simulation with 3D Gaussians-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2026_WACV,
    author    = {Yan, Hongru and Zhang, Xiang and Chen, Zeyuan and Wei, Fangyin and Tu, Zhuowen},
    title     = {{Gaussian} Swaying: Surface-Based Framework for Aerodynamic Simulation with {3D} {Gaussians}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4932--4942}
}
Enhancing Vision Language Corruption Robustness using Cross-Distribution & Prompted Denoisers-
[pdf]
[supp]
[bibtex]@InProceedings{Latif_2026_WACV,
    author    = {Latif, Sameer Shafayet and Shiper, Sadab and Kiran, K. M. Rahiduzzaman and Ishmam, Md Farhan and Hossain, Md Azam and Kamal, Abu Raihan Mostofa and Ashmafee, Md Hamjajul},
    title     = {Enhancing Vision Language Corruption Robustness using Cross-Distribution \& Prompted Denoisers},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5754--5765}
}
FALCONEye: Finding Answers and Localizing Content in ONE-hour-long videos with multi-modal LLMs-
[pdf]
[supp]
[bibtex]@InProceedings{Plou_2026_WACV,
    author    = {Plou, Carlos and Borja, Cesar and Martinez-Cantin, Ruben and Murillo, Ana C.},
    title     = {{FALCONEye}: Finding Answers and Localizing Content in {ONE-hour-long} videos with multi-modal {LLMs}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {1334--1344}
}
WALDO: Where Unseen Model-based 6D Pose Estimation Meets Occlusion-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pakdamansavoji_2026_WACV,
    author    = {Pakdamansavoji, Sajjad and Ma, Yintao and Rasouli, Amir and Cao, Tongtong},
    title     = {{WALDO}: Where Unseen Model-based {6D} Pose Estimation Meets Occlusion},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {4067--4076}
}
Enabling High-Quality In-the-Wild Imaging from Severely Aberrated Metalens Bursts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mandal_2026_WACV,
    author    = {Mandal, Debabrata and Peng, Zhihan and Wang, Yujie and Chakravarthula, Praneeth},
    title     = {Enabling High-Quality In-the-Wild Imaging from Severely Aberrated Metalens Bursts},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {849--859}
}
CORA: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Howlader_2026_WACV,
    author    = {Howlader, Prantik and Nguyen-Canh, Hoang and Das, Srijan and Xu, Jingyi and Le, Hieu and Samaras, Dimitris},
    title     = {{CORA}: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5934--5944}
}
Gradient-Free Classifier Guidance for Diffusion Model Sampling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shenoy_2026_WACV,
    author    = {Shenoy, Rahul and Pan, Zhihong and Balakrishnan, Kaushik and Cheng, Qiseng and Jeon, Yongmoon and Yang, Heejune and Kim, Jaewon},
    title     = {Gradient-Free Classifier Guidance for Diffusion Model Sampling},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3162--3171}
}
Point2Pose: A Generative Framework for 3D Human Pose Estimation with Multi-View Point Cloud Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV_Point2Pose,
    author    = {Lee, Hyunsoo and Jeon, Daeum and Oh, Hyeokjae},
    title     = {{Point2Pose}: A Generative Framework for {3D} Human Pose Estimation with Multi-View Point Cloud Dataset},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6744--6753}
}
GDoFS: Gaussian DoF Separation for Plausible 3D Geometry in Sparse-View 3DGS-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV_GDoFS,
    author    = {Kim, Yongsung and Choi, Jooyoung and Yoon, Sungroh},
    title     = {{GDoFS}: {Gaussian} {DoF} Separation for Plausible {3D} Geometry in Sparse-View {3DGS}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6643--6652}
}
Gen-AFFECT: Generation of Avatar Fine-grained Facial Expressions with Consistent identiTy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2026_WACV,
    author    = {Yu, Hao and Mallick, Rupayan and Betke, Margrit and Bargal, Sarah Adel},
    title     = {{Gen-AFFECT}: Generation of Avatar Fine-grained Facial Expressions with Consistent {identiTy}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {3889--3899}
}
Distilling Offline Action Detection Models into Real-Time Streaming Models-
[pdf]
[bibtex]@InProceedings{Patel_2026_WACV, author = {Patel, Deep and Babazaki, Yasunori and Nagase, Yasuto and Melvin, Iain and Min, Martin Renqiang}, title = {Distilling Offline Action Detection Models into Real-Time Streaming Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6205-6214} }
From Bands to Depth: Understanding Bathymetry Decisions on Sentinel-2-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chowdhury_2026_WACV, author = {Chowdhury, Satyaki Roy and Radhakrishnan, Aswathnarayan and Subramoni, Hari}, title = {From Bands to Depth: Understanding Bathymetry Decisions on Sentinel-2}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2063-2072} }
Remote Sensing Forestry Similarity Convolution-
[pdf]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Shikuan and Chen, Yuangong and Gong, Jianzhou and Meng, Lingyi and Wu, Mengquan and Liu, Longxing and Yuan, Haiwei and Guo, Mingbin}, title = {Remote Sensing Forestry Similarity Convolution}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7565-7575} }
Conjuring Positive Pairs for Efficient Unification of Representation Learning and Image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Estepa_2026_WACV, author = {Estepa, Imanol G. and Rodr{\'\i}guez-de-Vera, Jes{\'u}s M. and Saras{\'u}a, Ignacio and Nagarajan, Bhalaji and Radeva, Petia}, title = {Conjuring Positive Pairs for Efficient Unification of Representation Learning and Image Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {751-761} }
Root Completion from Intraoral Scans of Tooth Crowns using Diffusion with Patch Perturbation-
[pdf]
[bibtex]@InProceedings{Jang_2026_WACV, author = {Jang, Yohan and Song, In-Seok and Baek, Seung Jun}, title = {Root Completion from Intraoral Scans of Tooth Crowns using Diffusion with Patch Perturbation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {483-492} }
Multimodal Graph Representation Learning over Arbitrary Sets of Modalities-
[pdf]
[supp]
[bibtex]@InProceedings{Patapati_2026_WACV, author = {Patapati, Santosh and Srinivasan, Trisanth}, title = {Multimodal Graph Representation Learning over Arbitrary Sets of Modalities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7104-7115} }
FlowMorph: Revealing an Optimizable Flow Latent Space for Controlled Image Morphing-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2026_WACV, author = {Zheng, Yan and Yang, Yi and Guo, Lanqing and Wang, Zhangyang}, title = {FlowMorph: Revealing an Optimizable Flow Latent Space for Controlled Image Morphing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2455-2464} }
Crafting Descriptive Information for a Zero-shot Method to Improve Knowledge-Based Visual Question Answering Performance-
[pdf]
[supp]
[bibtex]@InProceedings{Moradi_2026_WACV, author = {Moradi, Mohammad Mahdi and Mudur, Sudhir}, title = {Crafting Descriptive Information for a Zero-shot Method to Improve Knowledge-Based Visual Question Answering Performance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3120-3128} }
Boosting Medical Vision-Language Pretraining via Momentum Self-Distillation under Limited Computing Resources-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pham_2026_WACV, author = {Pham, Phuc and Pham, Nhu and Ly, Ngoc Quoc}, title = {Boosting Medical Vision-Language Pretraining via Momentum Self-Distillation under Limited Computing Resources}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {860-868} }
Uncertainty-Aware Vision-Language Segmentation for Medical Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Das_2026_WACV, author = {Das, Aryan and Rachamalla, Tanishq and Biswas, Koushik and Roy, Swalpa Kumar and Verma, Vinay Kumar}, title = {Uncertainty-Aware Vision-Language Segmentation for Medical Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8490-8499} }
MR-Pruner: Training-free Multi-resolution Visual Token Pruning for Multi-modal Large Language Models-
[pdf]
[bibtex]@InProceedings{Han_2026_WACV, author = {Han, Seunghoon and Lee, Hyewon and Park, Soyoung and Lee, Jong-Ryul and Lim, Sungsu}, title = {MR-Pruner: Training-free Multi-resolution Visual Token Pruning for Multi-modal Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1084-1093} }
SeqFeedNet: Sequential Feature Feedback Network for Background Subtraction-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Yu-Shun and Guo, Jing-Ming and Yang, Yi-Xiang}, title = {SeqFeedNet: Sequential Feature Feedback Network for Background Subtraction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8199-8208} }
Crash2DocAI: Automated Integration of Post-Crash Car Part Images into Technical Reports-
[pdf]
[bibtex]@InProceedings{Divis_2026_WACV, author = {Divis, Vaclav and Giovagnola, Jessica and Ben Chikha, Khalil and Hr{\'u}z, Marek}, title = {Crash2DocAI: Automated Integration of Post-Crash Car Part Images into Technical Reports}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8272-8281} }
CoL2A: Convolution-free Local Linear Attention for SpatioTemporal Event Processing-
[pdf]
[supp]
[bibtex]@InProceedings{Sekikawa_2026_WACV, author = {Sekikawa, Yusuke and Nagata, Jun and Araki, Itsumi and Girbau, Andreu}, title = {CoL2A: Convolution-free Local Linear Attention for SpatioTemporal Event Processing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4869-4880} }
From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Atighehchian_2026_WACV, author = {Atighehchian, Parmida and Wang, Henry and Kapustin, Andrei and Lerner, Boris and Jiang, Tiancheng and Jensen, Taylor and Sokhandan, Negin}, title = {From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6818-6826} }
2S-CEDiff: A Two-Stage Diffusion Framework for Generating High-Fidelity Contrast-Enhanced CT Images from Non-Contrast Scans-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Yibang and Wang, Tzung-Dau and Lai, Shang-Hong}, title = {2S-CEDiff: A Two-Stage Diffusion Framework for Generating High-Fidelity Contrast-Enhanced CT Images from Non-Contrast Scans}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3918-3927} }
Descrip3D: Enhancing Large Language Model-based 3D Scene Understanding with Object-Level Text Descriptions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xue_2026_WACV, author = {Xue, Jintang and Zhao, Ganning and Yao, Jie-En and Chen, Hong-En and Hu, Yue and Chen, Meida and You, Suya and Kuo, C.-C. Jay}, title = {Descrip3D: Enhancing Large Language Model-based 3D Scene Understanding with Object-Level Text Descriptions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1746-1756} }
Unconditional Priors Matter! Improving Conditional Generation of Fine-Tuned Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Phunyaphibarn_2026_WACV, author = {Phunyaphibarn, Prin and Lee, Phillip Y. and Kim, Jaihoon and Sung, Minhyuk}, title = {Unconditional Priors Matter! Improving Conditional Generation of Fine-Tuned Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3982-3992} }
MuseDance: A Diffusion-based Music-Driven Image Animation System-
[pdf]
[bibtex]@InProceedings{Dong_2026_WACV, author = {Dong, Zhikang and Hao, Weituo and Wang, Ju-Chiang and Zhang, Peng and Polak, Pawel}, title = {MuseDance: A Diffusion-based Music-Driven Image Animation System}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3813-3824} }
1LoRA: Summation Compression for Very Low-Rank Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Quercia_2026_WACV, author = {Quercia, Alessio and Cao, Zhuo and Bangun, Arya and Paul, Richard D. and Morrison, Abigail and Assent, Ira and Scharr, Hanno}, title = {1LoRA: Summation Compression for Very Low-Rank Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2253-2262} }
MaxInfo: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Pengyi and Abdullaeva, Irina and Gambashidze, Alexander and Kuznetsov, Andrey and Oseledets, Ivan}, title = {MaxInfo: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7198-7207} }
Conditional Text-to-Image Generation with Reference Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Taewook and Wang, Ze and Yang, Zhengyuan and Wang, Jiang and Wang, Lijuan and Liu, Zicheng and Qiu, Qiang}, title = {Conditional Text-to-Image Generation with Reference Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2879-2889} }
SDT-6D: Fully Sparse Depth-Transformer for Staged End-to-End 6D Pose Estimation in Industrial Multi-View Bin Picking-
[pdf]
[bibtex]@InProceedings{Leuze_2026_WACV, author = {Leuze, Nico and Hoh, Maximilian and Do{\u{g}}an, Samed and R.-Pe{\~n}a, Nicolas and Schoettl, Alfred}, title = {SDT-6D: Fully Sparse Depth-Transformer for Staged End-to-End 6D Pose Estimation in Industrial Multi-View Bin Picking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8406-8415} }
VideoSketcher: A Training-Free Approach for Coherent Video Sketch Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Huining and Liu, Bangzhen and Yang, Rui and Zhou, Yang and Xu, Chenshu and Pang, Xufang and He, Shengfeng}, title = {VideoSketcher: A Training-Free Approach for Coherent Video Sketch Transfer}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7333-7343} }
From Darkness to Detail: Frequency-Aware SSMs for Low-Light Vision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adhikarla_2026_WACV, author = {Adhikarla, Eashan and Zhang, Kai and Chen, Gong and Nicholson, John and Davison, Brian D.}, title = {From Darkness to Detail: Frequency-Aware SSMs for Low-Light Vision}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6956-6967} }
Deepfake Detection that Generalizes Across Benchmarks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yermakov_2026_WACV, author = {Yermakov, Andrii and Cech, Jan and Matas, Jiri and Fritz, Mario}, title = {Deepfake Detection that Generalizes Across Benchmarks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {773-783} }
Mean-Shift Distillation for Diffusion Mode Seeking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thamizharasan_2026_WACV, author = {Thamizharasan, Vikas and Chatzis, Nikitas and Georgiev, Iliyan and Fisher, Matthew and Kalogerakis, Evangelos and Liu, Difan and Zhao, Nanxuan and Luk{\'a}{\v{c}}, Michal}, title = {Mean-Shift Distillation for Diffusion Mode Seeking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6537-6546} }
ISALux: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement-
[pdf]
[supp]
[bibtex]@InProceedings{Balmez_2026_WACV, author = {Balmez, Raul and Brateanu, Alexandru and Orhei, Ciprian and Ancuti, Codruta O. and Ancuti, Cosmin}, title = {ISALux: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7862-7872} }
CycleSL: Server-Client Cyclical Update Driven Scalable Split Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Mengdi and Bozkir, Efe and Kasneci, Enkelejda}, title = {CycleSL: Server-Client Cyclical Update Driven Scalable Split Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1841-1851} }
MagicDrive3D: Controllable 3D Generation for Any-View Rendering in Street Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Ruiyuan and Chen, Kai and Li, Zhihao and Hong, Lanqing and Li, Zhenguo and Xu, Qiang}, title = {MagicDrive3D: Controllable 3D Generation for Any-View Rendering in Street Scenes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5724-5733} }
SVS-GAN for Semantic Synthesis of Traffic Videos for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Seyam_2026_WACV, author = {Seyam, Khaled M. and Wiederer, Julian and Braun, Markus and Yang, Bin}, title = {SVS-GAN for Semantic Synthesis of Traffic Videos for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8650-8659} }
From SAM to DINOv2: Towards Distilling Foundation Models to Lightweight Baselines for Generalized Polyp Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Agnihotri_2026_WACV, author = {Agnihotri, Shivanshu and Majhi, Snehashis and Nayak, Deepak Ranjan and Jha, Debesh}, title = {From SAM to DINOv2: Towards Distilling Foundation Models to Lightweight Baselines for Generalized Polyp Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1757-1766} }
One-shot Portrait Stylization via Geometric Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Xinrui and Guo, Zilin and Li, Zhuoru and Yu, Jinze and Zhang, Heng and Iwasawa, Yusuke and Matsuo, Yutaka and Guo, Jiaxian}, title = {One-shot Portrait Stylization via Geometric Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4964-4973} }
Decoupling Shape and Texture in SAM-2 via Controlled Texture Replacement-
[pdf]
[supp]
[bibtex]@InProceedings{Cohen_2026_WACV, author = {Cohen, Inbal and Meivar, Boaz and Tu, Peihan and Avidan, Shai and Oren, Gal}, title = {Decoupling Shape and Texture in SAM-2 via Controlled Texture Replacement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4077-4086} }
Graph-Based Spectral Attention with Multi-Spectral Images for Illuminant Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Kang_2026_WACV, author = {Kang, Dong-Hoon and Baek, Seung-Yeop and Kim, Jong-Ok}, title = {Graph-Based Spectral Attention with Multi-Spectral Images for Illuminant Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2912-2922} }
Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation-
[pdf]
[supp]
[bibtex]@InProceedings{Mathur_2026_WACV, author = {Mathur, Praful and Iftekhar, Mohsin and Sharma, Aman and Tiwari, Sarvesh and Deka, Meghali and Cherukuri, Sathish and Sheshadri, K Roopa and Valusa, Rakesh}, title = {Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6873-6882} }
Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2026_WACV, author = {Lu, Kaixuan and Kaya, Mehmet Onurcan and Papadopoulos, Dim P.}, title = {Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7387-7397} }
Test Time Adaptation Using Adaptive Quantile Recalibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehrbod_2026_WACV, author = {Mehrbod, Paria and Vianna, Pedro and Nanfack, Geraldin and Wolf, Guy and Belilovsky, Eugene}, title = {Test Time Adaptation Using Adaptive Quantile Recalibration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5986-5995} }
Knowledge to Sight: Reasoning over Visual Attributes via Knowledge Decomposition for Abnormality Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Jun and Liu, Che and Bai, Wenjia and Liu, Mingxuan and Arcucci, Rossella and Bercea, Cosmin I. and Schnabel, Julia}, title = {Knowledge to Sight: Reasoning over Visual Attributes via Knowledge Decomposition for Abnormality Grounding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2359-2369} }
SceneEval: Evaluating Semantic Coherence in Text-Conditioned 3D Indoor Scene Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tam_2026_WACV, author = {Tam, Hou In Ivan and Pun, Hou In Derek and Wang, Austin T. and Chang, Angel X. and Savva, Manolis}, title = {SceneEval: Evaluating Semantic Coherence in Text-Conditioned 3D Indoor Scene Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7355-7365} }
MAFM3: Modular Adaptation of Foundation Models for Multi-Modal Medical AI-
[pdf]
[bibtex]@InProceedings{Qazi_2026_WACV, author = {Qazi, Mohammad Areeb and Nwadike, Munachiso S and Almakky, Ibrahim and Yaqub, Mohammad and Saeed, Numan}, title = {MAFM3: Modular Adaptation of Foundation Models for Multi-Modal Medical AI}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3494-3503} }
4D-Animal: Freely Reconstructing Animatable 3D Animals from Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2026_WACV, author = {Zhong, Shanshan and Peng, Jiawei and Zheng, Zehan and Huang, Zhongzhan and Ma, Wufei and Zhang, Guofeng and Liu, Qihao and Yuille, Alan and Chen, Jieneng}, title = {4D-Animal: Freely Reconstructing Animatable 3D Animals from Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {602-612} }
PVeRA: Probabilistic Vector-Based Random Matrix Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Fillioux_2026_WACV, author = {Fillioux, Leo and Ferrante, Enzo and Courn{\`e}de, Paul-Henry and Vakalopoulou, Maria and Christodoulidis, Stergios}, title = {PVeRA: Probabilistic Vector-Based Random Matrix Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2465-2474} }
Rethinking Latent Variable in Learned Image Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Yi_2026_WACV, author = {Yi, Fangzhou and Gong, Zhicheng and Zeng, Hui}, title = {Rethinking Latent Variable in Learned Image Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8531-8540} }
Stroke Modeling Enables Vectorized Character Generation with Large Vectorized Glyph Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Xinyue and Li, Haolong and Ma, Jiawei and Ye, Chen}, title = {Stroke Modeling Enables Vectorized Character Generation with Large Vectorized Glyph Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3401-3410} }
DCText: Scheduled Attention Masking for Visual Text Generation via Divide-and-Conquer Strategy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2026_WACV, author = {Song, Jaewoo and Choi, Jooyoung and Baek, Kanghyun and Lee, Sangyub and Park, Daemin and Yoon, Sungroh}, title = {DCText: Scheduled Attention Masking for Visual Text Generation via Divide-and-Conquer Strategy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4305-4314} }
Improved Wildfire Spread Prediction with Time-Series Data and the WSTS+ Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lahrichi_2026_WACV, author = {Lahrichi, Saad and Bova, Jake and Johnson, Jesse and Malof, Jordan}, title = {Improved Wildfire Spread Prediction with Time-Series Data and the WSTS+ Benchmark}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2890-2900} }
CADE: Continual Weakly-supervised Video Anomaly Detection with Ensembles-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hashimoto_2026_WACV, author = {Hashimoto, Satoshi and Konishi, Tatsuya and Kaichi, Tomoya and Matsumoto, Kazunori and Kurokawa, Mori}, title = {CADE: Continual Weakly-supervised Video Anomaly Detection with Ensembles}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {708-717} }
DOODLE: Diffusion-based Out-of-Distribution Learning for Open-set LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2026_WACV, author = {Oh, Changgyoon and Kim, Hyeonseong and We, Daehyun and Jeong, Jongoh and Chae, Yujeong and Yoon, Kuk-Jin}, title = {DOODLE: Diffusion-based Out-of-Distribution Learning for Open-set LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2273-2283} }
MUSE: Model-based Uncertainty-aware Similarity Estimation for zero-shot 2D Object Detection and Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2026_WACV, author = {Cho, Sungmin and Park, Sungbum and Oh, Insoo}, title = {MUSE: Model-based Uncertainty-aware Similarity Estimation for zero-shot 2D Object Detection and Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6090-6100} }
HistoMILKD: A Multiple Instance Learning based Multi-Teacher Knowledge Distillation Framework for Whole Slide Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Mallya_2026_WACV, author = {Mallya, Mayur and Mirabadi, Ali Khajegili and Farahani, Hossein and Bashashati, Ali}, title = {HistoMILKD: A Multiple Instance Learning based Multi-Teacher Knowledge Distillation Framework for Whole Slide Image Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3390-3400} }
RobustFormer: Noise-Robust Pre-training for Images and Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bastola_2026_WACV, author = {Bastola, Ashish and Luitel, Nishant and Wang, Hao and Paudel, Danda Pani and Poudel, Roshni and Razi, Abolfazl}, title = {RobustFormer: Noise-Robust Pre-training for Images and Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2284-2294} }
Modeling and Learning Multiple Hypotheses for Monocular 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Hyeonjeong and Xiong, Peixi and Yu, Pei and Tang, Wei}, title = {Modeling and Learning Multiple Hypotheses for Monocular 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7040-7050} }
Context-Preserving Dermoscopic Editing: Mask-Guided Lesion-Aware Diffusion for Attribute Modification-
[pdf]
[bibtex]@InProceedings{Sun_2026_WACV, author = {Sun, Tao and Jiang, Yun and Jin, Yarong and Guo, Huanting and Zhang, Zequn}, title = {Context-Preserving Dermoscopic Editing: Mask-Guided Lesion-Aware Diffusion for Attribute Modification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5364-5373} }
Guided Texture Segmentation via Coordinate-Aware Class-Ratio Mapping-
[pdf]
[bibtex]@InProceedings{Swain_2026_WACV, author = {Swain, Bishal Ranjan and Cheoi, Kyung Joo and Ko, Jaepil}, title = {Guided Texture Segmentation via Coordinate-Aware Class-Ratio Mapping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4253-4261} }
SD-CSFL: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Alharbi_2026_WACV, author = {Alharbi, Ebtisaam and Kerim, Abdulrahman and Marcolino, Leandro Soriano and Ni, Qiang}, title = {SD-CSFL: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6903-6912} }
Patch-wise Retrieval: A Bag of Practical Techniques for Instance-level Matching-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Wonseok and Lim, Sohwi and Hyeon-Woo, Nam and Ye-Bin, Moon and Jeong, Dong-Ju and Hwang, Jinyoung and Oh, Tae-Hyun}, title = {Patch-wise Retrieval: A Bag of Practical Techniques for Instance-level Matching}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4922-4931} }
Reviving Unsupervised Optical Flow: Concept Reevaluation, Multi-Scale Advances and Full Open-Source Release-
[pdf]
[supp]
[bibtex]@InProceedings{Jahedi_2026_WACV, author = {Jahedi, Azin and Rivinius, Marc and Senn, Noah Berenguel and Bruhn, Andres}, title = {Reviving Unsupervised Optical Flow: Concept Reevaluation, Multi-Scale Advances and Full Open-Source Release}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1533-1542} }
STARS: Self-supervised Tuning for 3D Action Recognition in Skeleton Sequences-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehraban_2026_WACV, author = {Mehraban, Soroush and Rajabi, Mohammad Javad and Iaboni, Andrea and Taati, Babak}, title = {STARS: Self-supervised Tuning for 3D Action Recognition in Skeleton Sequences}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2858-2868} }
MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sheikh_2026_WACV, author = {Sheikh, Tooba Tehreem and Lahoud, Jean and Anwer, Rao Muhammad and Khan, Fahad Shahbaz and Khan, Salman and Cholakkal, Hisham}, title = {MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8628-8638} }
ConsensusXAI: A Framework to Examine Class-wise Agreement in Medical Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Haider_2026_WACV, author = {Haider, Abbas and Wright, David and Hogg, Ruth and Wang, Hui and Peto, Tunde and Gault, Richard}, title = {ConsensusXAI: A Framework to Examine Class-wise Agreement in Medical Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2661-2669} }
Towards Unconstrained Cross-View Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Wollam_2026_WACV, author = {Wollam, Alexander and Ashley, Kyle and Shugaev, Maxim and Arend, Oliver and Semenov, Ilya and Dashtestani, Hadis and Ravi, Sumved and Jacobs, Nathan}, title = {Towards Unconstrained Cross-View Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8448-8457} }
Towards Egocentric 3D Hand Pose Estimation in Unseen Domains-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mucha_2026_WACV, author = {Mucha, Wiktor and Wray, Michael and Kampel, Martin}, title = {Towards Egocentric 3D Hand Pose Estimation in Unseen Domains}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5776-5786} }
Anatomy-VLM: A Fine-grained Vision-Language Model for Medical Interpretation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV, author = {Gu, Difei and Gao, Yunhe and Zhou, Mu and Metaxas, Dimitris}, title = {Anatomy-VLM: A Fine-grained Vision-Language Model for Medical Interpretation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2838-2847} }
FocalComm: Hard Instance-Aware Multi-Agent Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shenkut_2026_WACV, author = {Shenkut, Dereje and Bhagavatula, Vijayakumar}, title = {FocalComm: Hard Instance-Aware Multi-Agent Perception}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6277-6286} }
SeaClips: A Video Dataset for Maritime Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Denk_2026_WACV, author = {Denk, Franziska and Rankl, Christian and Almouahed, Shaban and Moser, David and Sablatnig, Robert}, title = {SeaClips: A Video Dataset for Maritime Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4599-4610} }
Video and Language Alignment in 2D Systems for 3D Multi-object Scenes with Multi-Information Derivative-Free Control-
[pdf]
[supp]
[bibtex]@InProceedings{Armitage_2026_WACV, author = {Armitage, Jason and Sennrich, Rico}, title = {Video and Language Alignment in 2D Systems for 3D Multi-object Scenes with Multi-Information Derivative-Free Control}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6266-6276} }
AGENet: Adaptive Edge-aware Geodesic Distance Learning for Few-Shot Medical Image Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Ziyuan}, title = {AGENet: Adaptive Edge-aware Geodesic Distance Learning for Few-Shot Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4285-4294} }
GaussianHeadTalk: Wobble-Free 3D Talking Heads with Audio Driven Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Agarwal_2026_WACV, author = {Agarwal, Madhav and Zhang, Mingtian and Sevilla-Lara, Laura and McDonagh, Steven}, title = {GaussianHeadTalk: Wobble-Free 3D Talking Heads with Audio Driven Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8017-8027} }
SVD-Det: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2026_WACV, author = {Yang, Tsung-Shan and Zhang, Tianyu and Qian, Feng and Yan, Bing and Kuo, C.-C. Jay}, title = {SVD-Det: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7616-7625} }
milliMamba: Specular-Aware Human Pose Estimation via Dual mmWave Radar with Multi-Frame Mamba Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kini_2026_WACV, author = {Kini, Niraj Prakash and Tsai, Shiau-Rung and Lin, Guan-Hsun and Peng, Wen-Hsiao and Ma, Ching-Wen and Hwang, Jenq-Neng}, title = {milliMamba: Specular-Aware Human Pose Estimation via Dual mmWave Radar with Multi-Frame Mamba Fusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1481-1490} }
One-Cycle Structured Pruning via Stability-Driven Subnetwork Search-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghimire_2026_WACV, author = {Ghimire, Deepak and Kil, Dayoung and Jeong, Seonghwan and Park, Jaesik and Kim, Seong-heum}, title = {One-Cycle Structured Pruning via Stability-Driven Subnetwork Search}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5467-5476} }
Hestia: Voxel-Face-Aware Hierarchical Next-Best-View Acquisition for Efficient 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2026_WACV, author = {Lu, Cheng-You and Zhuang, Zhuoli and Le, Nguyen Thanh Trung and Xiao, Da and Chang, Yu-Cheng and Do, Thomas and Sridhar, Srinath and Lin, Chin-Teng}, title = {Hestia: Voxel-Face-Aware Hierarchical Next-Best-View Acquisition for Efficient 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5302-5312} }
MIX-based Foreground and Background Patch Augmentation Guided by Physics and Material Properties for X-ray Detection-
[pdf]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Xintong and Chang, Dongliang and Tong, Yujun and Ma, Zhanyu}, title = {MIX-based Foreground and Background Patch Augmentation Guided by Physics and Material Properties for X-ray Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {977-987} }
SGPMIL: Sparse Gaussian Process Multiple Instance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lolos_2026_WACV, author = {Lolos, Andreas and Christodoulidis, Stergios and Moustakas, Aris L. and Dolz, Jose and Vakalopoulou, Maria}, title = {SGPMIL: Sparse Gaussian Process Multiple Instance Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {503-513} }
Beyond Real Weights: Hypercomplex Representations for Stable Quantization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ibn_Ahad_2026_WACV, author = {Ibn Ahad, Jawad and Rahman, Maisha and Biswas, Amrijit and Kabir, Muhammad Rafsan and Krambroeckers, Robin and Momen, Sifat and Mohammed, Nabeel and Rahman, Shafin}, title = {Beyond Real Weights: Hypercomplex Representations for Stable Quantization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1180-1190} }
Uncertainty-Aware Subset Selection for Robust Visual Explainability under Distribution Shifts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2026_WACV, author = {Gupta, Madhav and Prasad, Vishak and Ramakrishnan, Ganesh}, title = {Uncertainty-Aware Subset Selection for Robust Visual Explainability under Distribution Shifts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1643-1652} }
FastHMR: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehraban_2026_WACV, author = {Mehraban, Soroush and Iaboni, Andrea and Taati, Babak}, title = {FastHMR: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6733-6743} }
See, Think, Learn: A Self-Taught Multimodal Reasoner-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sharma_2026_WACV, author = {Sharma, Sourabh and Gupta, Sonam and Sadbhawna, Sadbhawna}, title = {See, Think, Learn: A Self-Taught Multimodal Reasoner}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8313-8322} }
CSF-Net: Context-Semantic Fusion Network for Large Mask Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Heo_2026_WACV, author = {Heo, Chae-Yeon and Cho, Yeong-Jun}, title = {CSF-Net: Context-Semantic Fusion Network for Large Mask Inpainting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8292-8301} }
Virtually Unrolling the Herculaneum Papyri by Diffeomorphic Spiral Fitting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Henderson_2026_WACV, author = {Henderson, Paul}, title = {Virtually Unrolling the Herculaneum Papyri by Diffeomorphic Spiral Fitting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6401-6411} }
Joint Modeling of Corruption-Driven and Information-Limited Uncertainty for Robust 3D Gaussian Splatting-
[pdf]
[bibtex]@InProceedings{Hui_2026_WACV, author = {Hui, Zeji and Gostar, Amirali Khodadadian and Chuah, WeiQin and Bab-Hadiashar, Alireza and Tennakoon, Ruwan}, title = {Joint Modeling of Corruption-Driven and Information-Limited Uncertainty for Robust 3D Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {688-697} }
TalkingHeadBench: A Multi-Modal Benchmark & Analysis of Talking-Head DeepFake Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiong_2026_WACV, author = {Xiong, Xinqi and Patel, Prakrut and Fan, Qingyuan and Wadhwa, Amisha and Selvam, Sarathy and Guo, Xiao and Qi, Luchao and Liu, Xiaoming and Sengupta, Roni}, title = {TalkingHeadBench: A Multi-Modal Benchmark \& Analysis of Talking-Head DeepFake Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4139-4149} }
SOAF: Scene Occlusion-aware Neural Acoustic Field-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2026_WACV_SOAF, author = {Gao, Huiyu and Ma, Jiahao and Ahmedt-Aristizabal, David and Nguyen, Chuong and Liu, Miaomiao}, title = {SOAF: Scene Occlusion-aware Neural Acoustic Field}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4097-4107} }
Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data-
[pdf]
[supp]
[bibtex]@InProceedings{Dey_2026_WACV, author = {Dey, Aritra and Adak, Chandranath and Priya, Kumari and Chattopadhyay, Soumi and Chanda, Sukalpa}, title = {Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7178-7187} }
QC-SF: Improving Computer Vision for Airborne LiDAR Point Clouds of Boreal Forests with Quebec Simulated Forest Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Stocker_2026_WACV, author = {Stocker, Olivier and Kouhi, Reza Mahmoudi and Gahrouei, Omid Reisi and Badard, Thierry and Guilbert, Eric}, title = {QC-SF: Improving Computer Vision for Airborne LiDAR Point Clouds of Boreal Forests with Quebec Simulated Forest Dataset}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5026-5036} }
Grounding Descriptions in Images informs Zero-Shot Visual Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Halbe_2026_WACV, author = {Halbe, Shaunak and Tian, Junjiao and Joseph, K J and Smith, James Seale and Stevo, Katherine and Balasubramanian, Vineeth N. and Kira, Zsolt}, title = {Grounding Descriptions in Images informs Zero-Shot Visual Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5672-5681} }
iMotion-LLM: Instruction-Conditioned Trajectory Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Felemban_2026_WACV, author = {Felemban, Abdulwahab and Hroub, Nussair and Ding, Jian and Abdelrahman, Eslam and Shen, Xiaoqian and Mohamed, Abduallah and Elhoseiny, Mohamed}, title = {iMotion-LLM: Instruction-Conditioned Trajectory Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2710-2720} }
Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Prasad_2026_WACV, author = {Prasad, Neelima and Reynolds, Jarek and Karsanbhai, Neel and Sharma, Tanusree and Zhang, Lotus and Stangl, Abigale and Wang, Yang and Findlater, Leah and Gurari, Danna}, title = {Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5945-5955} }
Inpaint360GS: Efficient Object-Aware 3D Inpainting via Gaussian Splatting for 360° Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Shaoxiang and Zhang, Shihong and Millerdurai, Christen and Westermann, R{\"u}diger and Stricker, Didier and Pagani, Alain}, title = {Inpaint360GS: Efficient Object-Aware 3D Inpainting via Gaussian Splatting for 360{\textdegree} Scenes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {117-127} }
Model-free Domain Adaptation for Concealed Multimodal Large-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Mitsuzumi_2026_WACV, author = {Mitsuzumi, Yu and Kimura, Akisato and Kashima, Hisashi}, title = {Model-free Domain Adaptation for Concealed Multimodal Large-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1231-1241} }
Photo Dating by Facial Age Aggregation-
[pdf]
[supp]
[bibtex]@InProceedings{Paplham_2026_WACV, author = {Paplh{\'a}m, Jakub and Franc, Vojt{\v{e}}ch}, title = {Photo Dating by Facial Age Aggregation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8103-8112} }
Test-Time Consistency in Vision Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chou_2026_WACV, author = {Chou, Shih-Han and Chandhok, Shivam and Little, James J. and Sigal, Leonid}, title = {Test-Time Consistency in Vision Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7789-7798} }
CSGaussian: Progressive Rate-Distortion Compression and Segmentation for 3D Gaussian Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tseng_2026_WACV, author = {Tseng, Yu-Jen and Kao, Chia-Hao and Chen, Jing-Zhong and Gnutti, Alessandro and Lo, Shao-Yuan and Lin, Yen-Yu and Peng, Wen-Hsiao}, title = {CSGaussian: Progressive Rate-Distortion Compression and Segmentation for 3D Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6883-6892} }
Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Haochen and Sinha, Animesh and Juefei-Xu, Felix and Ma, Haoyu and Li, Kunpeng and Fan, Zhipeng and Dai, Xiaoliang and Hou, Tingbo and Zhang, Peizhao and He, Zecheng}, title = {Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8282-8291} }
PhyEduVideo: A Benchmark for Evaluating Text-to-Video Models for Physics Education-
[pdf]
[supp]
[bibtex]@InProceedings{K.M_2026_WACV, author = {K.M, Megha Mariam and Arun, Aditya and Laskar, Zakaria and Jawahar, C. V.}, title = {PhyEduVideo: A Benchmark for Evaluating Text-to-Video Models for Physics Education}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8690-8699} }
PEaRL: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Majumder_2026_WACV, author = {Majumder, Sejuti and Kapse, Saarthak and Bhattacharya, Moinak and Xu, Xuan and Yurovsky, Alisa and Prasanna, Prateek}, title = {PEaRL: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8052-8062} }
Automated Pore Detection from In-Situ FDM 3D Printing Video: A Comparative Evaluation of Modern Segmentation Models-
[pdf]
[bibtex]@InProceedings{Al_Ahad_Khan_2026_WACV, author = {Al Ahad Khan, Abdullah and Islam, Md Shariful and Li, Lin and Jiang, Lai and Ghaffari, Noushin}, title = {Automated Pore Detection from In-Situ FDM 3D Printing Video: A Comparative Evaluation of Modern Segmentation Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4673-4681} }
AD2: Analysis and Detection of Adversarial Threats in Visual Perception for End-to-End Autonomous Driving Systems-
[pdf]
[supp]
[bibtex]@InProceedings{Sahu_2026_WACV, author = {Sahu, Ishan and Hazra, Somnath and Aditya, Somak and Dey, Soumyajit}, title = {AD2: Analysis and Detection of Adversarial Threats in Visual Perception for End-to-End Autonomous Driving Systems}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1695-1704} }
FastPose-ViT: A Vision Transformer for Real-Time Spacecraft Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ancey_2026_WACV, author = {Ancey, Pierre and Price, Andrew and Javed, Saqib and Salzmann, Mathieu}, title = {FastPose-ViT: A Vision Transformer for Real-Time Spacecraft Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7873-7882} }
BiPO: Bidirectional Partial Occlusion Network for Text-to-Motion Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2026_WACV, author = {Hong, Seong-Eun and Lim, SooBin and Hwang, JuYeong and Chang, Minwook and Kang, HyeongYeop}, title = {BiPO: Bidirectional Partial Occlusion Network for Text-to-Motion Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {32-42} }
Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mishra_2026_WACV, author = {Mishra, Ujjwal and Shukla, Vinita and Hambarde, Praful and Shukla, Amit}, title = {Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7605-7615} }
How I Met Your Bias: Investigating Bias Amplification in Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roos_2026_WACV, author = {Roos, Nathan and Iakovleva, Ekaterina and Gjergji, Ani and Pastore, Vito Paolo and Tartaglione, Enzo}, title = {How I Met Your Bias: Investigating Bias Amplification in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5374-5383} }
Color Bind: Exploring Color Perception in Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Shomer-Chai_2026_WACV, author = {Shomer-Chai, Shay and Peng, Wenxuan and Hariharan, Bharath and Averbuch-Elor, Hadar}, title = {Color Bind: Exploring Color Perception in Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1916-1925} }
Learning Subglacial Bed Topography from Sparse Radar with Physics-Guided Residuals-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tama_2026_WACV, author = {Tama, Bayu Adhi and Wang, Jianwu and Janeja, Vandana and Cham, Mostafa}, title = {Learning Subglacial Bed Topography from Sparse Radar with Physics-Guided Residuals}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5447-5456} }
From Lightweight CNNs to SpikeNets: Benchmarking Accuracy-Energy Tradeoffs with Pruned Spiking SqueezeNet-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bin_Kabir_2026_WACV, author = {Bin Kabir, Radib and Dipto, Tawsif Tashwar and Ahamed, Mehedi and Ahmed, Sabbir and Kabir, Md Hasanul}, title = {From Lightweight CNNs to SpikeNets: Benchmarking Accuracy-Energy Tradeoffs with Pruned Spiking SqueezeNet}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1137-1146} }
Zero-LEAD: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation-
[pdf]
[bibtex]@InProceedings{El-Sayed_2026_WACV, author = {El-Sayed, Ahmed and Torki, Marwan}, title = {Zero-LEAD: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6715-6723} }
Cross-Modal Event Encoder: Bridging Image-Text Knowledge to Event Streams-
[pdf]
[supp]
[bibtex]@InProceedings{Jeong_2026_WACV, author = {Jeong, Sungheon and Chen, Hanning and Yun, Sanggeon and Cho, Suhyeon and Huang, Wenjun and Liu, Xiangjian and Imani, Mohsen}, title = {Cross-Modal Event Encoder: Bridging Image-Text Knowledge to Event Streams}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3213-3222} }
Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care-
[pdf]
[bibtex]@InProceedings{Nan_2026_WACV, author = {Nan, Ke and Samaan, Maggie and Burns, Benjamin and Ning, Xia and Han, Yuchi and Xue, Yuan}, title = {Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8700-8710} }
Procedure Learning via Regularized Gromov-Wasserstein Optimal Transport-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mahmood_2026_WACV, author = {Mahmood, Syed Ahmed and Ali, Ali Shah and Ahmed, Umer and Fateh, Fawad Javed and Zia, M. Zeeshan and Tran, Quoc-Huy}, title = {Procedure Learning via Regularized Gromov-Wasserstein Optimal Transport}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6925-6935} }
PDV: Prompt Directional Vectors for Zero-shot Composed Image Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tursun_2026_WACV, author = {Tursun, Osman and Kalkan, Sinan and Denman, Simon and Fookes, Clinton}, title = {PDV: Prompt Directional Vectors for Zero-shot Composed Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7740-7749} }
Any Detector Can Detect Anything-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Thomas E. and Li, Siyuan and Danelljan, Martin and Ding, Henghui and Van Gool, Luc and Yu, Fisher}, title = {Any Detector Can Detect Anything}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8437-8447} }
Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria-
[pdf]
[bibtex]@InProceedings{Deo_2026_WACV, author = {Deo, Atharva Sunil and Pasupulety, Ujjwal and Matsumoto, Nicholas and Moran, Jay and Yang, Cherine and Kim, Jeanine and Kocielnik, Rafal Dariusz and Naser-Tavakolian, Aurash and Hung, Andrew}, title = {Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7218-7228} }
Efficient Text-Guided Convolutional Adapter for the Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Das_2026_WACV, author = {Das, Aryan and Biswas, Koushik and Roy, Swalpa Kumar and Patro, Badri Narayana and Verma, Vinay Kumar}, title = {Efficient Text-Guided Convolutional Adapter for the Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4015-4024} }
Enhancing Object Detection Training via Joint Image-Annotation Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Uziel_2026_WACV, author = {Uziel, Roy and Bialer, Oded}, title = {Enhancing Object Detection Training via Joint Image-Annotation Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1736-1745} }
Direct Visual Grounding by Directing Attention of Visual Tokens-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Esmaeilkhani_2026_WACV, author = {Esmaeilkhani, Parsa and Latecki, Longin Jan}, title = {Direct Visual Grounding by Directing Attention of Visual Tokens}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5787-5797} }
Anatomically-guided Masked Autoencoder Pre-training for Aneurysm Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Arroyo_2026_WACV, author = {Arroyo, Alberto M. Ceballos and Kim, Jisoo and Lin, Chu-Hsuan and Qin, Lei and Young, Geoffrey S. and Jiang, Huaizu}, title = {Anatomically-guided Masked Autoencoder Pre-training for Aneurysm Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5693-5702} }
DreamAnywhere: Object-Centric Panoramic 3D Scene Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Dominici_2026_WACV, author = {Dominici, Edoardo A. and Hladk{\'y}, Jozef and Verhoeven, Floor and Radl, Lukas and Deixelberger, Thomas and Ainetter, Stefan and Drescher, Philipp and Hauswiesner, Stefan and Coomans, Arno and Nazzaro, Giacomo and Vardis, Konstantinos and Steinberger, Markus}, title = {DreamAnywhere: Object-Centric Panoramic 3D Scene Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1-11} }
Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghafouri_2026_WACV, author = {Ghafouri, Saeid and Fayyaz, Mohsen and Li, Xiangchen and John, Deepu and Ji, Bo and Nikolopoulos, Dimitrios S. and Vandierendonck, Hans}, title = {Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6432-6441} }
KD360-VoxelBEV: LiDAR and 360-degree Camera Cross Modality Knowledge Distillation for Bird's-Eye-View Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{E_2026_WACV, author = {E, Wenke and Sun, Yixin and Liu, Jiaxu and Shum, Hubert P. H. and Atapour-Abarghouei, Amir and Breckon, Toby P.}, title = {KD360-VoxelBEV: LiDAR and 360-degree Camera Cross Modality Knowledge Distillation for Bird's-Eye-View Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3483-3493} }
WSSSP-Net: Weakly Supervised Semantic Segmentation Plugin Network for Face Anti-Spoofing-
[pdf]
[supp]
[bibtex]@InProceedings{Galus_2026_WACV, author = {Galus, Krzysztof and Syga, Piotr and Kawa, Piotr}, title = {WSSSP-Net: Weakly Supervised Semantic Segmentation Plugin Network for Face Anti-Spoofing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5247-5257} }
DiT-VTON: Diffusion Transformer Framework for Unified Multi-Category Virtual Try-On and Virtual Try-All with Integrated Image Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Qi and Qiu, Shuwen and Koo, Kee Kiat and Han, Julien and Bouyarmane, Karim}, title = {DiT-VTON: Diffusion Transformer Framework for Unified Multi-Category Virtual Try-On and Virtual Try-All with Integrated Image Editing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {202-211} }
VectorSynth: Fine-Grained Satellite Image Synthesis with Structured Semantics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cher_2026_WACV, author = {Cher, Daniel and Wei, Brian and Sastry, Srikumar and Jacobs, Nathan}, title = {VectorSynth: Fine-Grained Satellite Image Synthesis with Structured Semantics}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7019-7029} }
FlowEO: Generative Unsupervised Domain Adaptation for Earth Observation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_Bellier_2026_WACV, author = {Le Bellier, Georges and Audebert, Nicolas}, title = {FlowEO: Generative Unsupervised Domain Adaptation for Earth Observation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3900-3907} }
Pose-Diverse Multi-View Virtual Try-on from a Single Frontal Image via Diffusion Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2026_WACV_TryOn, author = {Han, Seonghee and Chung, Minchang and Cho, Gyeongsu and Joo, Kyungdon and Kim, Taehwan}, title = {Pose-Diverse Multi-View Virtual Try-on from a Single Frontal Image via Diffusion Transformer}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3310-3319} }
ObjectMeshDeform: Towards Recovering Precise 3D Geometry of Real Objects via Image-guided Mesh Deformation of 3D Generative Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Katageri_2026_WACV, author = {Katageri, Siddharth and Sinha, Sanjana and Ghosh, Sourav and Maity, Soumyadip and Bhowmick, Brojeshwar}, title = {ObjectMeshDeform: Towards Recovering Precise 3D Geometry of Real Objects via Image-guided Mesh Deformation of 3D Generative Priors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2585-2595} }
Cluster-based Pseudo-labeling for Semi-Supervised LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2026_WACV, author = {Guo, Qingju and Li, Shuang and Geng, Jing and Xie, Binhui and Shan, Jiawei and Li, Wei}, title = {Cluster-based Pseudo-labeling for Semi-Supervised LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {623-634} }
Memory-Augmented Representation for Efficient Event-based Visuomotor Policy Learning with Adaptive Perception and Control-
[pdf]
[bibtex]@InProceedings{Kamal_2026_WACV, author = {Kamal, Uday and Mukhopadhyay, Saibal}, title = {Memory-Augmented Representation for Efficient Event-based Visuomotor Policy Learning with Adaptive Perception and Control}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2596-2605} }
DiffRegCD: Integrated Registration and Change Detection with Diffusion Features-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madani_2026_WACV, author = {Madani, Seyedehanita and Chellappa, Rama and Patel, Vishal M.}, title = {DiffRegCD: Integrated Registration and Change Detection with Diffusion Features}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7503-7512} }
LangPose: Language-Aligned Motion for Robust 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2026_WACV, author = {Liao, Longyun and Zheng, Rong}, title = {LangPose: Language-Aligned Motion for Robust 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8073-8083} }
Accelerated Dose Generation in Gamma Knife Radiosurgery Using a Wavelet Diffusion Model for Sparse Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Sangyoon and Mishra, Shubuendu and Watanabe, Yoichi}, title = {Accelerated Dose Generation in Gamma Knife Radiosurgery Using a Wavelet Diffusion Model for Sparse Representation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {917-926} }
Lorentz Entailment Cone for Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Hasan_2026_WACV, author = {Hasan, Zahid and Ahmed, Masud and Roy, Nirmalya}, title = {Lorentz Entailment Cone for Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5216-5225} }
Can We Challenge Open-Vocabulary Object Detectors with Generated Content in Street Scenes?-
[pdf]
[supp]
[bibtex]@InProceedings{Mutze_2026_WACV, author = {M\"utze, Annika and Ilyas, Sadia and D\"orpelkus, Christian and Rottmann, Matthias}, title = {Can We Challenge Open-Vocabulary Object Detectors with Generated Content in Street Scenes?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {740-750} }
Lose Your Self (LoYS): An Adversarial Entropy-based Unsupervised Approach for Model Debiasing-
[pdf]
[supp]
[bibtex]@InProceedings{Pastore_2026_WACV, author = {Pastore, Vito Paolo and Ciranni, Massimiliano and Murino, Vittorio}, title = {Lose Your Self (LoYS): An Adversarial Entropy-based Unsupervised Approach for Model Debiasing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5714-5723} }
Autocorrelation-based Fiducial Markers for Traceability-
[pdf]
[supp]
[bibtex]@InProceedings{Bencheikh_2026_WACV, author = {Bencheikh, Ismail and Dunitz, Max and d'Autume, Marie and Meinhardt-Llopis, Enric and Pic, Marc and Facciolo, Gabriele and Mus\'e, Pablo}, title = {Autocorrelation-based Fiducial Markers for Traceability}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1345-1354} }
AutoSew: A Geometric Approach to Stitching Prediction with Graph Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Rios-Navarro_2026_WACV, author = {R{\'\i}os-Navarro, Pablo and Garces, Elena and Lopez-Moreno, Jorge}, title = {AutoSew: A Geometric Approach to Stitching Prediction with Graph Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1374-1383} }
Color Preserving CMOS-SPAD Fusion for Multi-Frame HDR-
[pdf]
[bibtex]@InProceedings{Suonsivu_2026_WACV, author = {Suonsivu, Aleksi and Salmela, Lauri and Helin, Lassi and Uosukainen, Leevi and Boracchi, Giacomo}, title = {Color Preserving CMOS-SPAD Fusion for Multi-Frame HDR}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5100-5109} }
CLIP-UP: CLIP-Based Unanswerable Problem Detection for Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vardi_2026_WACV, author = {Vardi, Ben and Nir, Oron and Shamir, Ariel}, title = {CLIP-UP: CLIP-Based Unanswerable Problem Detection for Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5898-5908} }
BoxSplitGen: A Generative Model for 3D Part Bounding Boxes in Varying Granularity-
[pdf]
[supp]
[bibtex]@InProceedings{Koo_2026_WACV, author = {Koo, Juil and Lin, Wei-Tung and Park, Chanho and Park, Chanhyeok and Sung, Minhyuk}, title = {BoxSplitGen: A Generative Model for 3D Part Bounding Boxes in Varying Granularity}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1777-1787} }
Beyond Paired Data: Self-Supervised UAV Geo-Localization from Reference Imagery Alone-
[pdf]
[supp]
[bibtex]@InProceedings{Amadei_2026_WACV, author = {Amadei, Tristan and Meinhardt-Llopis, Enric and Bascle, Benedicte and Abgrall, Corentin and Facciolo, Gabriele}, title = {Beyond Paired Data: Self-Supervised UAV Geo-Localization from Reference Imagery Alone}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7409-7419} }
Improving Animal Pose Estimation through Species Similarity Measures and Rigorous Label Definition-
[pdf]
[supp]
[bibtex]@InProceedings{Parhy_2026_WACV, author = {Parhy, Medhashree and Chanchani, Shaan and Kim, Claire and Mansky, Josh and Pan, Zian and Thakre, Parth and Chen, Haoyu and Reibman, Amy R.}, title = {Improving Animal Pose Estimation through Species Similarity Measures and Rigorous Label Definition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5662-5671} }
Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting-
[pdf]
[bibtex]@InProceedings{Yoon_2026_WACV, author = {Yoon, Euihyun and Park, Taejin and Lee, Jaekoo}, title = {Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6517-6526} }
SynchroRaMa: Lip-Synchronized and Emotion-Aware Talking Face Generation via Multi-Modal Emotion Embedding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yee_2026_WACV, author = {Yee, Phyo Thet and Kollias, Dimitrios and Mishra, Sudeepta and Dhall, Abhinav}, title = {SynchroRaMa: Lip-Synchronized and Emotion-Aware Talking Face Generation via Multi-Modal Emotion Embedding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4546-4555} }
HDR Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2026_WACV, author = {Lin, Yo-Tin and Chen, Su-Kai and Hu, Hou-Ning and Lin, Yen-Yu and Liu, Yu-Lun}, title = {HDR Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7513-7523} }
Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data-
[pdf]
[supp]
[bibtex]@InProceedings{Bueno_2026_WACV, author = {Bueno, Ivo and Hou, Ruikun and B\"uhler, Babette and F\"utterer, Tim and Drimalla, James and Foster, Jonathan K. and Youngs, Peter and Gerjets, Peter and Trautwein, Ulrich and Kasneci, Enkelejda}, title = {Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6806-6817} }
GeoHSAF: Geometric Hippocampus Shape Analysis Framework for Longitudinal Alzheimer's Disease Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Olaoluwa_2026_WACV, author = {Olaoluwa, Mubarak and Loukil, Heni and Sbei, Arafet and Drira, Hassen}, title = {GeoHSAF: Geometric Hippocampus Shape Analysis Framework for Longitudinal Alzheimer's Disease Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2156-2167} }
Power of Boundary and Reflection: Semantic Transparent Object Segmentation using Pyramid Vision Transformer with Transparent Cues-
[pdf]
[supp]
[bibtex]@InProceedings{Vu_2026_WACV, author = {Vu, Tuan-Anh and Nguyen-Truong, Hai and Zheng, Ziqiang and Hua, Binh-Son and Guo, Qing and Tsang, Ivor W. and Yeung, Sai-Kit}, title = {Power of Boundary and Reflection: Semantic Transparent Object Segmentation using Pyramid Vision Transformer with Transparent Cues}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3360-3369} }
SCAdapter: Content-Style Disentanglement for Diffusion Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Trinh_2026_WACV, author = {Trinh, Luan Thanh}, title = {SCAdapter: Content-Style Disentanglement for Diffusion Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7312-7321} }
Equivariant Sampling for Improving Diffusion Model-based Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Chenxu and Kong, Qingpeng and Zhao, Peiang and Yang, Wendi and Ma, Wenxin and Tang, Fenghe and Jiang, Zihang and Zhou, S. Kevin}, title = {Equivariant Sampling for Improving Diffusion Model-based Image Restoration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6827-6839} }
Generalization of Real World Video Deblurring By Image-to-Image Translation-
[pdf]
[supp]
[bibtex]@InProceedings{Aitbek_2026_WACV, author = {Aitbek, Kassymzhomart and Yang, Seungjoon}, title = {Generalization of Real World Video Deblurring By Image-to-Image Translation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4705-4714} }
CRISP: Cylindrical Rendering for In-Stream Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Kang_2026_WACV, author = {Kang, Hyungwoo and Jang, Seonyoung and Yoon, Yeojun and Oh, Byung Tae}, title = {CRISP: Cylindrical Rendering for In-Stream Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5550-5559} }
ProSkill: Segment-Level Skill Assessment in Procedural Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mazzamuto_2026_WACV, author = {Mazzamuto, Michele and Di Mauro, Daniele and Francesca, Gianpiero and Farinella, Giovanni Maria and Furnari, Antonino}, title = {ProSkill: Segment-Level Skill Assessment in Procedural Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4849-4858} }
SilverLining: Data-First Mitigation of Spatial and Spectral Shortcuts Without Introducing New Confounders-
[pdf]
[supp]
[bibtex]@InProceedings{Unnikrishnan_2026_WACV, author = {Unnikrishnan, Balagopal and Brudno, Michael and McIntosh, Chris}, title = {SilverLining: Data-First Mitigation of Spatial and Spectral Shortcuts Without Introducing New Confounders}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1294-1303} }
Real-Time Tracking of Flexible Markers in Low-Contrast Fluoroscopy Using a Deep Neural Network Trained Solely on Synthetic Data-
[pdf]
[supp]
[bibtex]@InProceedings{Uchiyama_2026_WACV, author = {Uchiyama, Tomoki and Sakata, Yukinobu and Hirai, Ryusuke and Ishikawa, Hitoshi and Mori, Shinichiro}, title = {Real-Time Tracking of Flexible Markers in Low-Contrast Fluoroscopy Using a Deep Neural Network Trained Solely on Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2670-2679} }
Ordinal-Aware Multimodal Engagement Recognition for Collaborative Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Nha and Ly, Dat and Ta, Phi and Nguyen, Hung and Nguyen, Hien D.}, title = {Ordinal-Aware Multimodal Engagement Recognition for Collaborative Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2424-2433} }
AuViRe: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Koutlis_2026_WACV, author = {Koutlis, Christos and Papadopoulos, Symeon}, title = {AuViRe: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7168-7177} }
DOTGraph: CLIP-Driven Feature Disentanglement and Optimal Transport based Graph Learning for Few-Shot Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Biswas_2026_WACV, author = {Biswas, Shreya and Yin, Zhaozheng}, title = {DOTGraph: CLIP-Driven Feature Disentanglement and Optimal Transport based Graph Learning for Few-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3638-3647} }
TA-Prompting: Enhancing Video Large Language Models for Dense Video Captioning via Temporal Anchors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV, author = {Cheng, Wei-Yuan and Chang, Kai-Po and Huang, Chi-Pin and Yang, Fu-En and Wang, Yu-Chiang Frank}, title = {TA-Prompting: Enhancing Video Large Language Models for Dense Video Captioning via Temporal Anchors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {225-235} }
Predicting Task fMRI Contrasts from Resting-State fMRI Using Sparse 3D Convolutions-
[pdf]
[bibtex]@InProceedings{Sviridov_2026_WACV, author = {Sviridov, Ivan and Boyko, Maria and Sharaev, Maksim}, title = {Predicting Task fMRI Contrasts from Resting-State fMRI Using Sparse 3D Convolutions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6320-6329} }
Causality-Driven Audits of Model Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Drenkow_2026_WACV, author = {Drenkow, Nathan and Paul, William and Ribaudo, Chris and Unberath, Mathias}, title = {Causality-Driven Audits of Model Robustness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5956-5966} }
Harnessing Object Grounding for Time-Sensitive Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Tz-Ying and Sridhar, Sharath Nittur and Tripathi, Subarna}, title = {Harnessing Object Grounding for Time-Sensitive Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2475-2484} }
Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Thang-Anh-Quan and Caraffa, Laurent and Tarel, Jean-Philippe and Br\'emond, Roland}, title = {Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6360-6370} }
Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations-
[pdf]
[supp]
[bibtex]@InProceedings{Ai_2026_WACV, author = {Ai, Wenjie and Nguyen, Cuong C. and Hilton, Adrian and Carneiro, Gustavo}, title = {Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8376-8385} }
OracleGS: Grounding Generative Priors for Sparse-View Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Topaloglu_2026_WACV, author = {Topalo{\u{g}}lu, Atakan and Li, Kunyi and Niemeyer, Michael and Navab, Nassir and Tekalp, A. Murat and Tombari, Federico}, title = {OracleGS: Grounding Generative Priors for Sparse-View Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {77-87} }
DICE: Discrete Inversion Enabling Controllable Editing for Masked Generative Models-
[pdf]
[supp]
[bibtex]@InProceedings{He_2026_WACV, author = {He, Xiaoxiao and Dao, Quan and Han, Ligong and Wen, Song and Bai, Minhao and Liu, Di and Zhang, Han and Juefei-Xu, Felix and Tan, Chaowei and Liu, Bo and Min, Martin Renqiang and Li, Kang and Ahmed, Faez and Srivastava, Akash and Li, Hongdong and Huang, Junzhou and Metaxas, Dimitris N.}, title = {DICE: Discrete Inversion Enabling Controllable Editing for Masked Generative Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {762-772} }
Human Pose Aggregation for Multi-View Temporal Video Alignment-
[pdf]
[bibtex]@InProceedings{Delattre_2026_WACV, author = {Delattre, Fabien and Huang, Tsung-Wei and Su, Guan-Ming and Learned-Miller, Erik}, title = {Human Pose Aggregation for Multi-View Temporal Video Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {635-646} }
RampWatch: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels-
[pdf]
[supp]
[bibtex]@InProceedings{Asim_2026_WACV, author = {Asim, Malik Muhammad and Smallwood, Claire B. and Tariq, Abdullah and Lo, Johnny and Gilani, Syed Zulqarnain}, title = {RampWatch: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7576-7585} }
How to Design and Train Your Implicit Neural Representation for Video Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gwilliam_2026_WACV, author = {Gwilliam, Matthew and Zhang, Roy and Padmanabhan, Namitha and Du, Hongyang and Shrivastava, Abhinav}, title = {How to Design and Train Your Implicit Neural Representation for Video Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {729-739} }
Q-Former Autoencoder: A Modern Framework for Medical Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dalmonte_2026_WACV, author = {Dalmonte, Francesco and Bayar, Emirhan and Akbas, Emre and Georgescu, Mariana-Iuliana}, title = {Q-Former Autoencoder: A Modern Framework for Medical Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7985-7995} }
Latent Uncertainty-Aware Multi-View SDF Scan Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Zakeri_2026_WACV, author = {Zakeri, Faezeh and Ruppert, Lukas and Braun, Raphael and Lensch, Hendrik P. A.}, title = {Latent Uncertainty-Aware Multi-View SDF Scan Completion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3556-3566} }
MoSCo: Real-time and Efficient Text-to-Motion Synthesis via Delta Training-
[pdf]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Zhiyuan and Liu, Lingqiao}, title = {MoSCo: Real-time and Efficient Text-to-Motion Synthesis via Delta Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6298-6308} }
DPBridge: Latent Diffusion Bridge for Dense Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ji_2026_WACV, author = {Ji, Haorui and Lin, Taojun and Li, Hongdong}, title = {DPBridge: Latent Diffusion Bridge for Dense Prediction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5520-5530} }
CraftSVG: Multi-Object Text-to-SVG Synthesis via Layout Guided Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Ayan and Mathur, Nityanand and Llados, Josep and Pal, Umapada and Dutta, Anjan}, title = {CraftSVG: Multi-Object Text-to-SVG Synthesis via Layout Guided Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2564-2574} }
Streaming Real-Time Trajectory Prediction Using Endpoint-Aware Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Prutsch_2026_WACV, author = {Prutsch, Alexander and Schinagl, David and Possegger, Horst}, title = {Streaming Real-Time Trajectory Prediction Using Endpoint-Aware Modeling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3005-3014} }
Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chien_2026_WACV, author = {Chien, Hao-Jen and Huang, Yi-Chuan and Wu, Chung-Ho and Chao, Wei-Lun and Liu, Yu-Lun}, title = {Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8028-8040} }
Trajectory Tactics: When Transformers Learn Exploration to Generate Online Signature-
[pdf]
[bibtex]@InProceedings{Pandey_2026_WACV, author = {Pandey, Anurag and Nigam, Aditya and Bhavsar, Arnav and Sharma, Ashutosh and Verma, Basu and Acharya, Divya and Amir, Mohd}, title = {Trajectory Tactics: When Transformers Learn Exploration to Generate Online Signature}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2306-2315} }
Hybrid State Representation for Video Procedure Planning-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Woo Suk and Jang, Youwon and Lee, Minsu and Zhang, Byoung-Tak}, title = {Hybrid State Representation for Video Procedure Planning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6507-6516} }
MageBench: Bridging Large Multimodal Models to Agents-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Miaosen and Dai, Qi and Yang, Yifan and Bao, Jianmin and Chen, Dongdong and Qiu, Kai and Luo, Chong and Geng, Xin and Guo, Baining}, title = {MageBench: Bridging Large Multimodal Models to Agents}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1415-1427} }
Diagnose Like A REAL Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2026_WACV, author = {Hong, Sungrae and Lee, Sol and Shin, Jisu and Jeong, Jiwon and Yi, Mun Yong}, title = {Diagnose Like A REAL Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6132-6141} }
Curve Skeletonization in Continuous domain for Meshes and Point Clouds-
[pdf]
[supp]
[bibtex]@InProceedings{Bardhan_2026_WACV, author = {Bardhan, Jai and Hebbalaguppe, Ramya and Udupa, Aravind}, title = {Curve Skeletonization in Continuous domain for Meshes and Point Clouds}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5079-5089} }
NerVast: Compression-Efficient Scaling of Implicit Neural Video Representations via Scene-based Parameter-sharing-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Yunheon and Ye, Juncheol and Kim, Jaehong and Han, Dongsu}, title = {NerVast: Compression-Efficient Scaling of Implicit Neural Video Representations via Scene-based Parameter-sharing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2616-2625} }
Align Video Diffusion Model with Online Video-Centric Preference Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Jiacheng and Wu, Jie and Chen, Weifeng and Ji, Yatai and Xiao, Xuefeng and Huang, Weilin and Han, Kai}, title = {Align Video Diffusion Model with Online Video-Centric Preference Optimization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6142-6152} }
SSMRadNet: A Sample-wise State-Space Framework for Efficient and Ultra-Light Radar Segmentation and Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Sen_2026_WACV, author = {Sen, Anuvab and Mohammad, Mir Sayeed and Mukhopadhyay, Saibal}, title = {SSMRadNet: A Sample-wise State-Space Framework for Efficient and Ultra-Light Radar Segmentation and Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4365-4374} }
CAMP-VQA: Caption-Embedded Multimodal Perception for No-Reference Quality Assessment of Compressed Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Xinyi and Katsenou, Angeliki and Shen, Junxiao and Bull, David}, title = {CAMP-VQA: Caption-Embedded Multimodal Perception for No-Reference Quality Assessment of Compressed Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2042-2051} }
HyperPose: Hyper-pose Embeddings for 3D-Aware Generative Models with Self-Supervised Disentangling of Pose and Scene-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Mijeong and Kim, Namgi and Han, Bohyung}, title = {HyperPose: Hyper-pose Embeddings for 3D-Aware Generative Models with Self-Supervised Disentangling of Pose and Scene}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1011-1021} }
AortaDiff: A Unified Multitask Diffusion Framework for Contrast-Free AAA Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ou_2026_WACV, author = {Ou, Yuxuan and Bi, Ning and Pan, Jiazhen and Yang, Jiancheng and Yu, Boliang and Zidan, Usama and Lee, Regent and Grau, Vicente}, title = {AortaDiff: A Unified Multitask Diffusion Framework for Contrast-Free AAA Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8242-8251} }
Beyond Faces: A Multimodal Person Clustering for Unconstrained Environments-
[pdf]
[bibtex]@InProceedings{Yoo_2026_WACV, author = {Yoo, Sahngmin and Lee, Sangwon and Jo, Seongin}, title = {Beyond Faces: A Multimodal Person Clustering for Unconstrained Environments}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4631-4640} }
High-Rate Mixout: Revisiting Mixout for Robust Domain Generalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aminbeidokhti_2026_WACV, author = {Aminbeidokhti, Masih and Medeiros, Heitor Rapela and Muralidharan, Srikanth and Granger, Eric and Pedersoli, Marco}, title = {High-Rate Mixout: Revisiting Mixout for Robust Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3803-3812} }
High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments-
[pdf]
[bibtex]@InProceedings{Bonyani_2026_WACV, author = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao}, title = {High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6527-6536} }
BiNAR: A Bi-Modal Framework for Non-Aligned RGB-IR 3D Reconstruction via Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Zhongwen and Ling, Han and Zhang, Weihao and Sun, Yinghui and Sun, Quansen}, title = {BiNAR: A Bi-Modal Framework for Non-Aligned RGB-IR 3D Reconstruction via Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4407-4416} }
Timestamp Query Transformer for Temporal Action Segmentation-
[pdf]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Tieqiao and Todorovic, Sinisa}, title = {Timestamp Query Transformer for Temporal Action Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5016-5025} }
Mitigating Backdoor Attacks via Trigger Reconstruction and Model Hardening-
[pdf]
[supp]
[bibtex]@InProceedings{Tao_2026_WACV, author = {Tao, Guanhong and Cheng, Siyuan and Shen, Guangyu and Liu, Yingqi and An, Shengwei and Zhang, Zhuo and Wang, Zhenting and Guo, Hanxi and Zhang, Xiangyu}, title = {Mitigating Backdoor Attacks via Trigger Reconstruction and Model Hardening}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {580-590} }
Visibility guided Self-Supervised Occlusion-Resilient Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Dutta_2026_WACV, author = {Dutta, Arindam and Bose, Sarosij and Kundu, Rohit and Ta, Calvin-Khang and Bachu, Saketh and Karydis, Konstantinos and Roy-Chowdhury, Amit K.}, title = {Visibility guided Self-Supervised Occlusion-Resilient Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1054-1063} }
Feature-Disentangling RGB-NIR Fusion Network for Remote Driver Physiological Measurement-
[pdf]
[supp]
[bibtex]@InProceedings{Bouraffa_2026_WACV, author = {Bouraffa, Tayssir and Wang, Ziyuan and Str\"uber, Daniel}, title = {Feature-Disentangling RGB-NIR Fusion Network for Remote Driver Physiological Measurement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {657-666} }
VividAnimator: An End-to-End Audio and Pose-driven Half-Body Human Animation Framework-
[pdf]
[arXiv]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Donglin and Li, Yongyuan and Liu, Tianhang and Huang, Junming and Yang, Xiaoda and Wang, Chi and Xu, Weiwei}, title = {VividAnimator: An End-to-End Audio and Pose-driven Half-Body Human Animation Framework}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4325-4334} }
Delta-LLaVA: Base-then-Specialize Alignment for Token-Efficient Vision-Language Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zamini_2026_WACV, author = {Zamini, Mohamad and Shukla, Diksha}, title = {Delta-LLaVA: Base-then-Specialize Alignment for Token-Efficient Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3648-3657} }
CommonForms: A Large, Diverse Dataset for Form Field Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Barrow_2026_WACV, author = {Barrow, Joe}, title = {CommonForms: A Large, Diverse Dataset for Form Field Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1170-1179} }
OpenLVLM-MIA: A Controlled Benchmark Revealing the Limits of Membership Inference Attacks on Large Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Miyamoto_2026_WACV, author = {Miyamoto, Ryoto and Fan, Xin and Kido, Fuyuko and Matsumoto, Tsuneo and Yamana, Hayato}, title = {OpenLVLM-MIA: A Controlled Benchmark Revealing the Limits of Membership Inference Attacks on Large Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2680-2689} }
AusSmoke meets MultiNatSmoke: a fully-labelled diverse smoke segmentation dataset-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Weihao and Zhao, Hongjin and Zhu, Gao and Ji, Ge-Peng and Wilson, Nicholas and Yebra, Marta and Barnes, Nick}, title = {AusSmoke meets MultiNatSmoke: a fully-labelled diverse smoke segmentation dataset}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7996-8006} }
MVAT: Multi-View Aware Teacher for Weakly Supervised 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Lahlali_2026_WACV, author = {Lahlali, Saad and Fournier-Mongieux, Alexandre and Granger, Nicolas and Le Borgne, Herv\'e and Pham, Quoc-Cuong}, title = {MVAT: Multi-View Aware Teacher for Weakly Supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6101-6110} }
DreamCatcher: Efficient Multi-Concept Customization via Representation Finetuning-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Jungwon and Lee, Changhun and Park, Eunhyeok}, title = {DreamCatcher: Efficient Multi-Concept Customization via Representation Finetuning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7062-7072} }
GorillaWatch: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring-
[pdf]
[bibtex]@InProceedings{Schall_2026_WACV, author = {Schall, Maximilian and Kn\"ofel, Felix Leonard and K\"onig, Noah Elias and Kubeler, Jan Jonas and von Klinski, Maximilian and Linnemann, Joan Wilhelm and Liu, Xiaoshi and Schlegelmilch, Iven Jelle and Woyciniuk, Ole and Schild, Alexandra and Wasmuht, Dante and Espinet, Magdalena Bermejo and Basas, German Illera and de Melo, Gerard}, title = {GorillaWatch: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8364-8375} }
QCFace: Image Quality Control for boosting Face Representation & Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Doan-Ngo_2026_WACV, author = {Doan-Ngo, Duc-Phuong and Diep, Thanh-Dang and Nguyen-Duc, Thanh and LE, Thanh-Sach and Thoai, Nam}, title = {QCFace: Image Quality Control for boosting Face Representation \& Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1501-1511} }
CLoCKDistill: Consistent Location and Context aware Knowledge Distillation for DETRs-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lan_2026_WACV, author = {Lan, Qizhen and Tian, Qing}, title = {CLoCKDistill: Consistent Location and Context aware Knowledge Distillation for DETRs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7188-7197} }
False Alarm Rectification for Early Smoke Segmentation-
[pdf]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Hongjin and Li, Weihao and Ji, Ge-Peng and Barnes, Nick}, title = {False Alarm Rectification for Early Smoke Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1969-1978} }
NAPP: Noise-Adaptive Prototype Perturbation for Few-Shot Learning-
[pdf]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Ilhwan and Yun, Sangwoo and Lee, Dongheon and Kim, Seongsu and Paik, Joonki}, title = {NAPP: Noise-Adaptive Prototype Perturbation for Few-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8007-8016} }
MemeTAG: Keyword-Driven Meme Classification through Tag Embedding Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Sharma_2026_WACV, author = {Sharma, Akshit and Patil, Prashant W}, title = {MemeTAG: Keyword-Driven Meme Classification through Tag Embedding Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7679-7688} }
DMAT: An End-to-End Framework for Joint Atmospheric Turbulence Mitigation and Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hill_2026_WACV, author = {Hill, Paul and Liu, Zhiming and Achim, Alin and Bull, David and Anantrasirichai, Nantheera}, title = {DMAT: An End-to-End Framework for Joint Atmospheric Turbulence Mitigation and Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2690-2699} }
ViGG: Robust RGB-D Point Cloud Registration using Visual-Geometric Mutual Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Congjia and Yan, Shen and Qu, Yufu}, title = {ViGG: Robust RGB-D Point Cloud Registration using Visual-Geometric Mutual Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {816-826} }
Learning Unified Spatio-temporal Representations for Efficient Compressed Video Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Das_Biswas_2026_WACV, author = {Das Biswas, Shristi and Soufleri, Efstathia and Roy, Arani and Roy, Kaushik}, title = {Learning Unified Spatio-temporal Representations for Efficient Compressed Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4755-4765} }
Hymavi : A Hybrid Mamba-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation-
[pdf]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Sy Dat and Gahm, Jin Kyu}, title = {Hymavi : A Hybrid Mamba-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6006-6015} }
Revisiting Layer Normalization for Point Cloud Test Time Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Yazdanpanah_2026_WACV, author = {Yazdanpanah, Moslem and Bahri, Ali and Noori, Mehrdad and Dastani, Sahar and Barbeau, Samuel and Osowiechi, David and Hakim, Gustavo Adolfo Vargas and Ben Ayed, Ismail and Desrosiers, Christian}, title = {Revisiting Layer Normalization for Point Cloud Test Time Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {537-546} }
LooC: Effective Low-Dimensional Codebook for Compositional Vector Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Jie and Wong, Kwan-Yee K. and Han, Kai}, title = {LooC: Effective Low-Dimensional Codebook for Compositional Vector Quantization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {160-170} }
DocWaveDiff: A Predict-and-Refine approach for Document Image Enhancement with Wavelet U-Nets and Diffusion models-
[pdf]
[supp]
[bibtex]@InProceedings{Marulli_2026_WACV, author = {Marulli, Matteo and Bertini, Marco}, title = {DocWaveDiff: A Predict-and-Refine approach for Document Image Enhancement with Wavelet U-Nets and Diffusion models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8511-8520} }
A-V Representation Learning via Audio Shift Prediction for Multimodal Deepfake Detection and Temporal Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Anshul_2026_WACV, author = {Anshul, Ashutosh and Chng, Eng Siong and Rajan, Deepu}, title = {A-V Representation Learning via Audio Shift Prediction for Multimodal Deepfake Detection and Temporal Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2553-2563} }
3D Gaussian Point Encoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{James_2026_WACV, author = {James, Jim and Wilson, Benjamin and Lucey, Simon and Hays, James}, title = {3D Gaussian Point Encoders}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1788-1797} }
ODEt(ODEl): Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling-
[pdf]
[supp]
[bibtex]@InProceedings{Gudovskiy_2026_WACV, author = {Gudovskiy, Denis and Zheng, Wenzhao and Okuno, Tomoyuki and Nakata, Yohei and Keutzer, Kurt}, title = {ODEt(ODEl): Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6111-6120} }
Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? Forensim: An Attention-Based State-Space Approach-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nandi_2026_WACV, author = {Nandi, Soumyaroop and Natarajan, Prem}, title = {Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? Forensim: An Attention-Based State-Space Approach}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6194-6204} }
Controllable Long-term Motion Generation with Extended Joint Targets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Eunjong and Kim, Eunhee and Hong, Sanghoon and Jung, Eunho and Kim, Jihoon}, title = {Controllable Long-term Motion Generation with Extended Joint Targets}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5164-5173} }
CVP: Central-Peripheral Vision-Inspired Multimodal Model for Spatial Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Zeyuan and Zhang, Xiang and Xu, Haiyang and Xie, Jianwen and Tu, Zhuowen}, title = {CVP: Central-Peripheral Vision-Inspired Multimodal Model for Spatial Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2295-2305} }
TopoRec: Point Cloud Recognition Using Topological Data Analysis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ghosh_2026_WACV, author = {Ghosh, Anirban and Kulbaka, Iliya and Dahlin, Ian and Dutta, Ayan}, title = {TopoRec: Point Cloud Recognition Using Topological Data Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7544-7553} }
SFMNet: Sparse Focal Modulation for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shrout_2026_WACV, author = {Shrout, Oren and Tal, Ayellet}, title = {SFMNet: Sparse Focal Modulation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6287-6297} }
Not Like Transformers: Drop the Beat Representation for Dance Generation with Mamba-Based Diffusion Model-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Sangjune and Choi, Inhyeok and Soon, Donghyeon and Jeon, Youngwoo and Joo, Kyungdon}, title = {Not Like Transformers: Drop the Beat Representation for Dance Generation with Mamba-Based Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1767-1776} }
Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2026_WACV, author = {Tang, Mingwei and Nie, Jiahao and Yang, Guang and Cui, Ziqing and Li, Jie}, title = {Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7668-7678} }
Odo: Depth-Guided Diffusion for Identity-Preserving Body Reshaping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khandelwal_2026_WACV, author = {Khandelwal, Siddharth and Kamath, Sridhar and Jain, Arjun}, title = {Odo: Depth-Guided Diffusion for Identity-Preserving Body Reshaping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {22-31} }
Enhancing Visual Planning with Auxiliary Tasks and Multi-token Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Ce and Song, Yale and Desai, Ruta and Iuzzolino, Michael Louis and Tighe, Joseph and Bertasius, Gedas and Kottur, Satwik}, title = {Enhancing Visual Planning with Auxiliary Tasks and Multi-token Prediction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4190-4200} }
F-INR: Functional Tensor Decomposition for Implicit Neural Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Vemuri_2026_WACV, author = {Vemuri, Sai Karthikeya and B\"uchner, Tim and Denzler, Joachim}, title = {F-INR: Functional Tensor Decomposition for Implicit Neural Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6557-6568} }
Dronaquatics: Real-time Swimming Analytics Using Drone Captured Imagery-
[pdf]
[supp]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Thu and Joseph, Harold Abraham and Lee, Kichang and Choo, Kenny Tsu Wei and Ma, Dong and Foong, Shaohui and Kandappu, Thivya and Ko, Jeonggil and Balan, Rajesh}, title = {Dronaquatics: Real-time Swimming Analytics Using Drone Captured Imagery}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4881-4889} }
GASP: Unifying Geometric and Semantic Self-Supervised Pre-training for Autonomous Driving-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ljungbergh_2026_WACV, author = {Ljungbergh, William and Lilja, Adam and Tonderski, Adam and Ling, Arvid Laveno and Lindstr\"om, Carl and Verbeke, Willem and Fu, Junsheng and Petersson, Christoffer and Hammarstrand, Lars and Felsberg, Michael}, title = {GASP: Unifying Geometric and Semantic Self-Supervised Pre-training for Autonomous Driving}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3077-3087} }
Understanding the Visual Projection Space of Multimodal LLMs-
[pdf]
[bibtex]@InProceedings{Jeong_2026_WACV, author = {Jeong, Sungheon and Song, Yoojeong and Kim, Hyungjoon}, title = {Understanding the Visual Projection Space of Multimodal LLMs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6049-6058} }
WarpRF: Multi-View Consistency for Training-Free Uncertainty Quantification and Applications in Radiance Fields-
[pdf]
[supp]
[bibtex]@InProceedings{Safadoust_2026_WACV, author = {Safadoust, Sadra and Tosi, Fabio and G\"uney, Fatma and Poggi, Matteo}, title = {WarpRF: Multi-View Consistency for Training-Free Uncertainty Quantification and Applications in Radiance Fields}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5226-5235} }
FAST-EQA: Efficient Embodied Question Answering with Global and Local Region Relevancy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Haochen and Savaliya, Nirav and Siddiqui, Faizan and Sachdeva, Enna}, title = {FAST-EQA: Efficient Embodied Question Answering with Global and Local Region Relevancy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1664-1673} }
Flood-LDM: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Neo_2026_WACV, author = {Neo, Sun Han and Seneviratne, Sachith and Herath, Herath Mudiyanselage Viraj Vidura Herath and Saha, Abhishek and Rasnayaka, Sanka and Marshall, Lucy Amanda}, title = {Flood-LDM: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8063-8072} }
Fused Similarity Measure Based Alignment with Dual-Scale Adaptive Selection for Weakly Supervised Video Anomaly Detection-
[pdf]
[bibtex]@InProceedings{Lu_2026_WACV, author = {Lu, Yue-Gao and Xing, Hong-Jie and Li, Chun-Guo}, title = {Fused Similarity Measure Based Alignment with Dual-Scale Adaptive Selection for Weakly Supervised Video Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3193-3202} }
FARF-Net: Frequency-guided Adaptive Receptive Field Network for Edge-enhanced Polyp Segmentation-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Xue and Jiang, Aiwen and Yu, Hongqian and Xiao, Yang}, title = {FARF-Net: Frequency-guided Adaptive Receptive Field Network for Edge-enhanced Polyp Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2338-2347} }
PerVL-Bench: Benchmarking Multimodal Personalization for Large Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Minsung}, title = {PerVL-Bench: Benchmarking Multimodal Personalization for Large Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6696-6704} }
OSEG: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV, author = {Fahim, Masud An Nur Islam and Saqib, Nazmus and Gil, Joon-Min}, title = {OSEG: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5996-6005} }
Detecting Social Engagement of Elderly From Lifelog Image-streams to Identify Effective Cues for Autobiographic Recall-
[pdf]
[supp]
[bibtex]@InProceedings{Subramaniam_2026_WACV, author = {Subramaniam, Vengateswaran and Subbaraju, Vigneshwaran and Roy, Debaditya and Krishna, Pramath and Kandappu, Thivya and Xu, Qianli}, title = {Detecting Social Engagement of Elderly From Lifelog Image-streams to Identify Effective Cues for Autobiographic Recall}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3380-3389} }
Text Slider: Efficient and Plug-and-Play Continuous Concept Control for Image/Video Synthesis via LoRA Adapters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chiu_2026_WACV, author = {Chiu, Pin-Yen and Fang, I-Sheng and Chen, Jun-Cheng}, title = {Text Slider: Efficient and Plug-and-Play Continuous Concept Control for Image/Video Synthesis via LoRA Adapters}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {613-622} }
Motion-Aware Graph Fusion Network for 3D Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Pham_2026_WACV, author = {Pham, Yen and Yuan, Xiaohui and Zhuang, Chengyuan}, title = {Motion-Aware Graph Fusion Network for 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5798-5808} }
Learning Spatio-temporal Feature Representations for Video-based Gaze Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Personnic_2026_WACV, author = {Personnic, Alexandre and Bace, Mihai}, title = {Learning Spatio-temporal Feature Representations for Video-based Gaze Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5121-5130} }
ProtoGMVAE: A Variational Auto-Encoder with True Gaussian Mixture Prior for Prototypical-based Self-Explainability-
[pdf]
[supp]
[bibtex]@InProceedings{Blanchard_2026_WACV, author = {Blanchard, Martin and Ducottet, Christophe and Muselet, Damien and Del\'ezay, Olivier}, title = {ProtoGMVAE: A Variational Auto-Encoder with True Gaussian Mixture Prior for Prototypical-based Self-Explainability}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5396-5405} }
Graph Query Networks for Object Detection with Automotive Radar-
[pdf]
[arXiv]
[bibtex]@InProceedings{Saini_2026_WACV, author = {Saini, Loveneet and Tercan, Hasan and Meisen, Tobias}, title = {Graph Query Networks for Object Detection with Automotive Radar}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6988-6997} }
GroupPortrait: Multi-ID Portrait Generation with High Identity Preservation and Fine-Grained Control-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Meijia and Li, Ruida and Ma, Bing and Jiang, Liangwei and Fang, Shuo and Ma, Chenguang}, title = {GroupPortrait: Multi-ID Portrait Generation with High Identity Preservation and Fine-Grained Control}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6226-6235} }
4D Multimodal Co-attention Fusion Network with Latent Contrastive Alignment for Alzheimer's Diagnosis-
[pdf]
[bibtex]@InProceedings{Wei_2026_WACV, author = {Wei, Yuxiang and Zhang, Yanteng and Xiao, Xi and Wang, Tianyang and Wang, Xiao and Calhoun, Vince D.}, title = {4D Multimodal Co-attention Fusion Network with Latent Contrastive Alignment for Alzheimer's Diagnosis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5457-5466} }
Beyond Realism: Learning the Art of Expressive Composition with StickerNet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2026_WACV, author = {Lu, Haoming and Kocharian, David and Shi, Humphrey}, title = {Beyond Realism: Learning the Art of Expressive Composition with StickerNet}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {869-878} }
ClusterMine: Robust Label-Free Visual Out-Of-Distribution Detection via Concept Mining from Text Corpora-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adaloglou_2026_WACV, author = {Adaloglou, Nikolas and Petrusheva, Diana and Asker, Mohamed and Michels, Felix and Kollmann, Markus}, title = {ClusterMine: Robust Label-Free Visual Out-Of-Distribution Detection via Concept Mining from Text Corpora}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1999-2010} }
FAIR-SIGHT: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair-
[pdf]
[arXiv]
[bibtex]@InProceedings{Fayyazi_2026_WACV, author = {Fayyazi, Arya and Kamal, Mehdi and Pedram, Massoud}, title = {FAIR-SIGHT: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6633-6642} }
T2LF: LLM-Guided Multimodal Diffusion for Text-to-Light Field Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2026_WACV, author = {Yoon, Soyoung and Ahn, Namhyuk and Park, In Kyu}, title = {T2LF: LLM-Guided Multimodal Diffusion for Text-to-Light Field Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7322-7332} }
LENVIZ: A High-Resolution Low-Exposure Night Vision Benchmark Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aithal_2026_WACV, author = {Aithal, Manjushree and VidalMata, Rosaura G and Kartha, Manikandtan and Chen, Gong and Adhikarla, Eashan and Kirsten, Lucas Nedel and Fu, Zhicheng and Madhusudhana, Nikhil Ambha and Nasti, Joseph V.}, title = {LENVIZ: A High-Resolution Low-Exposure Night Vision Benchmark Dataset}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2531-2540} }
Fine-grained Defocus Blur Control for Generative Image Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shrivastava_2026_WACV, author = {Shrivastava, Ayush and Barnes, Connelly and Zhang, Xuaner and Zhang, Lingzhi and Owens, Andrew and Amirghodsi, Sohrab and Shechtman, Eli}, title = {Fine-grained Defocus Blur Control for Generative Image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4335-4344} }
MARS: a Multimodal Alignment and Ranking System for Few-Shot Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Catalano_2026_WACV, author = {Catalano, Nico and Samele, Stefano and Pertino, Paolo and Matteucci, Matteo}, title = {MARS: a Multimodal Alignment and Ranking System for Few-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1284-1293} }
Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kawarada_2026_WACV, author = {Kawarada, Masayuki and Yamada, Kosuke and Tejero-de-Pablos, Antonio and Inoue, Naoto}, title = {Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7636-7646} }
DreamMakeup: Face Makeup Customization using Latent Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Geon Yeong and Han, Inhwa and Yang, Serin and Hong, Yeobin and Jeong, Seongmin and Jeon, Heechan and Goh, Myeongjin and Yi, Sung Won and Nam, Jin and Ye, Jong Chul}, title = {DreamMakeup: Face Makeup Customization using Latent Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {422-430} }
AirLock+: Scaling UAV-to-Satellite Image Registration for Target Geolocalization and Geospatial Augmented Reality-
[pdf]
[bibtex]@InProceedings{Deng_2026_WACV, author = {Deng, Zhiyun and Case, Austin and Sentis, Luis}, title = {AirLock+: Scaling UAV-to-Satellite Image Registration for Target Geolocalization and Geospatial Augmented Reality}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3340-3349} }
Morphing Through Time: Diffusion-Based Bridging of Temporal Gaps for Robust Alignment in Change Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madani_2026_WACV, author = {Madani, Seyedehanita and Patel, Vishal M.}, title = {Morphing Through Time: Diffusion-Based Bridging of Temporal Gaps for Robust Alignment in Change Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {431-439} }
General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Betser_2026_WACV, author = {Betser, Roy and Hofman, Omer and Vainshtein, Roman and Gilboa, Guy}, title = {General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7809-7820} }
Multi-Modal Soccer Scene Analysis with Masked Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peral_2026_WACV, author = {Peral, Marc and Capellera, Guillem and Ferraz, Luis and Rubio, Antonio and Agudo, Antonio}, title = {Multi-Modal Soccer Scene Analysis with Masked Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3536-3545} }
Learning Group Actions In Disentangled Latent Image Representations-
[pdf]
[arXiv]
[bibtex]@InProceedings{Swarnali_2026_WACV, author = {Swarnali, Farhana Hossain and Zhang, Miaomiao and Hossain, Tonmoy}, title = {Learning Group Actions In Disentangled Latent Image Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3140-3149} }
Evaluating the Capability of Video Question Generation for Expert Knowledge Elicitation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Huaying and Hashimoto, Atsushi and Hirasawa, Tosho}, title = {Evaluating the Capability of Video Question Generation for Expert Knowledge Elicitation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3047-3056} }
DiRe: Diversity-promoting Regularization for Dataset Condensation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mohanty_2026_WACV, author = {Mohanty, Saumyaranjan and Reddy, Aravind and Mopuri, Konda Reddy}, title = {DiRe: Diversity-promoting Regularization for Dataset Condensation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2818-2827} }
PredMapNet: Future and Historical Reasoning for Consistent Online HD Vectorized Map Construction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lang_2026_WACV, author = {Lang, Bo and Savaliya, Nirav and Zheng, Zhihao and Feng, Jinglun and Yeh, Zheng-Hang and Chuah, Mooi Choo}, title = {PredMapNet: Future and Historical Reasoning for Consistent Online HD Vectorized Map Construction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5477-5487} }
MM-TS: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data-
[pdf]
[supp]
[bibtex]@InProceedings{Sheludzko_2026_WACV,
  author    = {Sheludzko, Siarhei and Duka, Dhimitrios and Schiele, Bernt and Kuehne, Hilde and Kukleva, Anna},
  title     = {{MM-TS}: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7376--7386},
}
Federated Model Synchronization for Diagnostic Redefinition through a Novel Selective Parameter Unlearning-
[pdf]
[supp]
[bibtex]@InProceedings{Kundalwal_2026_WACV,
  author    = {Kundalwal, Mayank Kumar and Mamta, Mamta and Mishra, Deepak and Ekbal, Asif},
  title     = {Federated Model Synchronization for Diagnostic Redefinition through a Novel Selective Parameter Unlearning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1395--1404},
}
VitaGlyph: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2026_WACV,
  author    = {Feng, Kailai and Zhang, Yabo and Yu, Haodong and Ji, Zhilong and Bai, Jinfeng and Zhang, Hongzhi and Zuo, Wangmeng},
  title     = {{VitaGlyph}: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8220--8230},
}
Feature Inversion as a Lens on Vision Encoders-
[pdf]
[supp]
[bibtex]@InProceedings{Allakhverdov_2026_WACV,
  author    = {Allakhverdov, Eduard and Tarasov, Dmitrii and Goncharova, Elizaveta and Kuznetsov, Andrey},
  title     = {Feature Inversion as a Lens on Vision Encoders},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3598--3605},
}
DTMIR-Pro: Domain Translation with Prompt-based Latent-Space Generalization for Multi-Weather Image Restoration-
[pdf]
[supp]
[bibtex]@InProceedings{Kulkarni_2026_WACV,
  author    = {Kulkarni, Ashutosh and Patil, Prashant W. and Vipparthi, Santosh Kumar and Murala, Subrahmanyam and Raman, Balasubramanian},
  title     = {{DTMIR-Pro}: Domain Translation with Prompt-based Latent-Space Generalization for Multi-Weather Image Restoration},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3846--3856},
}
Diffusion-Based Authentication of Copy Detection Patterns: A Multimodal Framework with Printer Signature Conditioning-
[pdf]
[bibtex]@InProceedings{Atoki_2026_WACV,
  author    = {Atoki, Bolutife and Tkachenko, Iuliia and Kerautret, Bertrand and Junior, Carlos Crispim},
  title     = {Diffusion-Based Authentication of Copy Detection Patterns: A Multimodal Framework with Printer Signature Conditioning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1685--1694},
}
BREEN: Bridge Data-Efficient Encoder-Free Multimodal Learning with Learnable Queries-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Tianle and Rao, Yongming and Hu, Winston and Cheng, Yu},
  title     = {{BREEN}: Bridge Data-Efficient Encoder-Free Multimodal Learning with Learnable Queries},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5384--5395},
}
GHOST: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{VS_2026_WACV,
  author    = {VS, Vibashan and Chang, Nadine and Schmalfuss, Jenny and Patel, Vishal M. and Yu, Zhiding and Alvarez, Jose M.},
  title     = {{GHOST}: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6163--6173},
}
MorphXAI: An Explainable Framework for Morphological Analysis of Parasites in Blood Smear Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yousaf_2026_WACV,
  author    = {Yousaf, Aqsa and Win, Sint Sint and Coffee, Megan and Olufowobi, Habeeb},
  title     = {{MorphXAI}: An Explainable Framework for Morphological Analysis of Parasites in Blood Smear Images},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2125--2134},
}
Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Basu_2026_WACV,
  author    = {Basu, Shamik and Van Gool, Luc and Sakaridis, Christos},
  title     = {Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7524--7533},
}
MuSACo: Multimodal Subject-Specific Selection and Adaptation for Expression Recognition with Co-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zeeshan_2026_WACV,
  author    = {Zeeshan, Muhammad Osama and Gillet, Natacha and Koerich, Alessandro Lameiras and Pedersoli, Marco and Bremond, Francois and Granger, Eric},
  title     = {{MuSACo}: Multimodal Subject-Specific Selection and Adaptation for Expression Recognition with Co-Training},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3606--3616},
}
MANTA: Physics-Informed Generalized Underwater Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Srinath_2026_WACV,
  author    = {Srinath, Suhas and Jamadagni, Hemang and Chandrasekar, Aditya and A P, Prathosh},
  title     = {{MANTA}: Physics-Informed Generalized Underwater Object Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3472--3482},
}
Multimodal Medical Image Binding via Shared Text Embeddings-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV,
  author    = {Liu, Yunhao and Xi, Suyang and Liu, Shiqi and Ding, Hong and Jin, Chicheng and Zhong, Chong and He, Junjun and Liu, Catherine C. and Shen, Yiqing},
  title     = {Multimodal Medical Image Binding via Shared Text Embeddings},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1610--1620},
}
Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV,
  author    = {Lin, Yan-Bo and Lin, Kevin and Yang, Zhengyuan and Li, Linjie and Wang, Jianfeng and Lin, Chung-Ching and Wang, Xiaofei and Bertasius, Gedas and Wang, Lijuan},
  title     = {Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7344--7354},
}
An improved architecture for part-based animal re-identification through semantic segmentation distillation-
[pdf]
[bibtex]@InProceedings{Neto_2026_WACV,
  author    = {Neto, Eug{\^e}nio Dias Ribeiro and Chaumont, Marc and Subsol, G{\'e}rard and De Garine-Wichatitsky, Michel and Guis, H{\'e}l{\`e}ne},
  title     = {An improved architecture for part-based animal re-identification through semantic segmentation distillation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5280--5289},
}
SegMango: Early Deep Mango Yield Prediction based on Flower Segmentation and Weather Data-
[pdf]
[bibtex]@InProceedings{Ven_2026_WACV,
  author    = {Ven, Janaksinh and Sharma, Charu and Syed, Azeemuddin},
  title     = {{SegMango}: Early Deep Mango Yield Prediction based on Flower Segmentation and Weather Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4984--4993},
}
From Detection to Anticipation: Online Understanding of Struggles across Various Tasks and Activities-
[pdf]
[supp]
[bibtex]@InProceedings{Feng_2026_WACV,
  author    = {Feng, Shijia and Wray, Michael and Mayol-Cuevas, Walterio},
  title     = {From Detection to Anticipation: Online Understanding of Struggles across Various Tasks and Activities},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4036--4045},
}
D2Mamba: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement-
[pdf]
[supp]
[bibtex]@InProceedings{Pramanick_2026_WACV,
  author    = {Pramanick, Alik and Roy, Soumajit and Sur, Arijit},
  title     = {{D2Mamba}: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7126--7136},
}
RAT4D: Rig and Animate Objects without Surface Templates in 4D-
[pdf]
[supp]
[bibtex]@InProceedings{Dabhi_2026_WACV,
  author    = {Dabhi, Mosam and Lucey, Simon and Jeni, Laszlo A.},
  title     = {{RAT4D}: Rig and Animate Objects without Surface Templates in {4D}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {393--401},
}
Reinforcement Learning-based Adaptive Control of Classifier-Free Guidance and Timestep Embeddings in Diffusion Models-
[pdf]
[bibtex]@InProceedings{You_2026_WACV,
  author    = {You, Haochen and Liu, Baojing and He, Hongyang},
  title     = {Reinforcement Learning-based Adaptive Control of Classifier-Free Guidance and Timestep Embeddings in Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {43--53},
}
ImageChain: Advancing Sequential Image-to-Text Reasoning in Multimodal Large Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Villegas_2026_WACV,
  author    = {Villegas, Danae Sanchez and Ziegler, Ingo and Elliott, Desmond},
  title     = {{ImageChain}: Advancing Sequential Image-to-Text Reasoning in Multimodal Large Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5131--5141},
}
Blur2Sharp: Human Novel Pose and View Synthesis with Generative Prior Refinement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lai_2026_WACV,
  author    = {Lai, Chia-Hern and Lo, I-Hsuan and Yeh, Yen-Ku and Truong, Thanh-Nguyen and Huang, Ching-Chun},
  title     = {{Blur2Sharp}: Human Novel Pose and View Synthesis with Generative Prior Refinement},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3350--3359},
}
SkelSplat: Robust Multi-view 3D Human Pose Estimation with Differentiable Gaussian Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bragagnolo_2026_WACV,
  author    = {Bragagnolo, Laura and Barcellona, Leonardo and Ghidoni, Stefano},
  title     = {{SkelSplat}: Robust Multi-view {3D} Human Pose Estimation with Differentiable {Gaussian} Rendering},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3036--3046},
}
ControlEvents: Controllable Synthesis of Event Camera Data with Foundational Prior from Image Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2026_WACV,
  author    = {Hu, Yixuan and Xue, Yuxuan and Klenk, Simon and Cremers, Daniel and Pons-Moll, Gerard},
  title     = {{ControlEvents}: Controllable Synthesis of Event Camera Data with Foundational Prior from Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5509--5519},
}
TM-Adapter: Temporal Merge Adapter for Efficient Global Temporal Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Hahm_2026_WACV,
  author    = {Hahm, Woo Joo and Jang, Seungwoo and Kim, Hyeon Tak and Lee, Daeun and Kim, Kwangsu},
  title     = {{TM-Adapter}: Temporal Merge Adapter for Efficient Global Temporal Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6121--6131},
}
From Few-Shot to Zero-Shot Pallet Load Recognition: A Deployed Embedding-Based Vision System for Industrial Logistics-
[pdf]
[supp]
[bibtex]@InProceedings{del_Olmo_2026_WACV,
  author    = {del Olmo, Juan Jes{\'u}s Losada and Ballesteros, Emilio Pardo and L{\'o}pez-de-Teruel, Pedro E. and Ruiz, Alberto},
  title     = {From Few-Shot to Zero-Shot Pallet Load Recognition: A Deployed Embedding-Based Vision System for Industrial Logistics},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2901--2911},
}
AFRAgent : An Adaptive Feature Renormalization Based High Resolution Aware GUI agent-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Anand_2026_WACV,
  author    = {Anand, Neeraj and Jain, Rishabh and Patnaik, Sohan and Krishnamurthy, Balaji and Sarkar, Mausoom},
  title     = {{AFRAgent} : An Adaptive Feature Renormalization Based High Resolution Aware {GUI} agent},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1147--1158},
}
SUGAR: A Sweeter Spot for Generative Unlearning of Many Identities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Dung Thuy and Nguyen, Quang and Robinette, Preston K. and Jiang, Eli and Johnson, Taylor T. and Leach, Kevin},
  title     = {{SUGAR}: A Sweeter Spot for Generative Unlearning of Many Identities},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2731--2740},
}
LASOR: Towards Clinically Transparent and Explainable Ophthalmic Report Generation via Lesion-Aware Segmentation-
[pdf]
[bibtex]@InProceedings{Park_2026_WACV,
  author    = {Park, Jian and Won, Hyunseon and Kim, JeeEun and Hwang, Joon Seo and Han, Jeong Mo and Park, Ji In and Hwang, Daniel Duck-Jin and Han, Jinyoung},
  title     = {{LASOR}: Towards Clinically Transparent and Explainable Ophthalmic Report Generation via Lesion-Aware Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5194--5204},
}
ST-Think: How Multimodal Large Language Models Reason About 4D Worlds from Ego-Centric Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2026_WACV,
  author    = {Wu, Peiran and Liu, Yunze and Liu, Miao and Shen, Junxiao},
  title     = {{ST-Think}: How Multimodal Large Language Models Reason About {4D} Worlds from Ego-Centric Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5174--5183},
}
mmWEAVER: Environment-Specific mmWave Signal Synthesis from a Photo and Activity Description-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Monjur_2026_WACV,
  author    = {Monjur, Mahathir and Nirjon, Shahriar},
  title     = {{mmWEAVER}: Environment-Specific {mmWave} Signal Synthesis from a Photo and Activity Description},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1875--1884},
}
Optimizing LVLMs with On-Policy Data for Effective Hallucination Mitigation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2026_WACV,
  author    = {Yu, Chengzhi and Xu, Yifan and Chen, Yifan and Zhang, Wenyi},
  title     = {Optimizing {LVLMs} with On-Policy Data for Effective Hallucination Mitigation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4733--4743},
}
Overcoming Fine-Grained Visual Challenges in Animal Re-Identification via Semantic Feature Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV,
  author    = {Wu, Yihao and Zhao, Di and Li, Yuzhuo and Alajas, Matthew and Glen, Alistair S. and Zhang, Jingfeng and Dobbie, Gillian and Wilson, Daniel and Koh, Yun Sing},
  title     = {Overcoming Fine-Grained Visual Challenges in Animal Re-Identification via Semantic Feature Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {371--381},
}
Better Safe Than Sorry? Overreaction Problem of Vision Language Models in Visual Emergency Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2026_WACV,
  author    = {Choi, Dasol and Lee, Seunghyun and Song, Youngsook},
  title     = {Better Safe Than Sorry? Overreaction Problem of Vision Language Models in Visual Emergency Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4724--4732},
}
Narrating For You: Prompt-guided Audio-visual Narrating Face Generation Employing Multi-entangled Latent Space-
[pdf]
[supp]
[bibtex]@InProceedings{K_2026_WACV,
  author    = {K, Aashish Chandra and A V, Aashutosh and Das, Abhijit},
  title     = {Narrating For You: Prompt-guided Audio-visual Narrating Face Generation Employing Multi-entangled Latent Space},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1314--1323},
}
Semi-Supervised Hierarchical Open-Set Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wallin_2026_WACV,
  author    = {Wallin, Erik and Kahl, Fredrik and Hammarstrand, Lars},
  title     = {Semi-Supervised Hierarchical Open-Set Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1989--1998},
}
BrightRate: Quality Assessment for User-Generated HDR Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Saini_2026_WACV,
  author    = {Saini, Shreshth and Chen, Bowen and Wang, Yilin and Birkbeck, Neil and Adsumilli, Balu and Bovik, Alan C.},
  title     = {{BrightRate}: Quality Assessment for User-Generated {HDR} Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1522--1532},
}
Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV,
  author    = {Park, Sangha and Kim, Eunji and Oh, Yeongtak and Choi, Jooyoung and Yoon, Sungroh},
  title     = {Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6664--6675},
}
LASER: Lip Landmark Assisted Speaker Detection for Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Le Thien Phuc and Yu, Zhuoran and Lee, Yong Jae},
  title     = {{LASER}: Lip Landmark Assisted Speaker Detection for Robustness},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7291--7300},
}
Spacewalk-18: A Benchmark for Multimodal and Long-form Procedural Video Understanding in Novel Domains-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2026_WACV,
  author    = {Tang, Zitian and Krishnan, Rohan Myer and Yu, Zhiqiu and Sun, Chen},
  title     = {{Spacewalk-18}: A Benchmark for Multimodal and Long-form Procedural Video Understanding in Novel Domains},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4472--4482},
}
Extreme Amodal Face Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2026_WACV,
  author    = {Song, Changlin and Hou, Yunzhong and Barnes, Michael Randall and Shome, Rahul and Campbell, Dylan},
  title     = {Extreme Amodal Face Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2934--2943},
}
Event-based Graph Representation with Spatial and Motion Vectors for Asynchronous Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Verma_2026_WACV,
  author    = {Verma, Aayush Atul and Vaghela, Arpitsinh and Chakravarthi, Bharatesh and Chanda, Kaustav and Yang, Yezhou},
  title     = {Event-based Graph Representation with Spatial and Motion Vectors for Asynchronous Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3781--3791},
}
PHYSPLAT: a Framework for Photorealistic Hybrid Simulation of Real and Synthetic Elements using 3D Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Alfonso-Arsuaga_2026_WACV,
  author    = {Alfonso-Arsuaga, Mario and Dominguez-Elvira, Henar and Casas-Guerrero, Jorge and Castiella-Aguirrezabala, Andrea and Dom{\'\i}nguez, Lorenzo Cost{\'a}bile and Garc{\'\i}a-Gonz{\'a}lez, Jorge and Naranjo-Almeida, Maria and Comino-Trinidad, Marc and Lopez-Moreno, Jorge},
  title     = {{PHYSPLAT}: a Framework for Photorealistic Hybrid Simulation of Real and Synthetic Elements using {3D} {Gaussian} Splatting},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1621--1631},
}
VOCAL: Visual Odometry via ContrAstive Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2026_WACV,
  author    = {Huang, Chi-Yao and Bhatt, Zeel and Yang, Yezhou},
  title     = {{VOCAL}: Visual Odometry via {ContrAstive} Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3297--3309},
}
Multi-view Stereo with Multiple Projectors for Oneshot Entire Shape Scan based on Neural SDF and DSSS Demultiplexing-
[pdf]
[supp]
[bibtex]@InProceedings{Nishihara_2026_WACV,
  author    = {Nishihara, Kota and Furukawa, Ryo and Sagawa, Ryusuke and Kawasaki, Hiroshi},
  title     = {Multi-view Stereo with Multiple Projectors for Oneshot Entire Shape Scan based on Neural {SDF} and {DSSS} Demultiplexing},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5488--5497},
}
Self-Supervised Visual Prompting for Cross-Domain Road Damage Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiao_2026_WACV,
  author    = {Xiao, Xi and Wang, Zhuxuanzi and Mo, Mingqiao and Liu, Chen and Ma, Chenrui and Li, Yanshu and Krishnaswamy, Smita and Wang, Xiao and Wang, Tianyang},
  title     = {Self-Supervised Visual Prompting for Cross-Domain Road Damage Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3514--3524},
}
SpecGen: Neural Spectral BRDF Generation via Spectral-Spatial Tri-plane Aggregation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2026_WACV,
  author    = {Jin, Zhenyu and Li, Wenjie and Ma, Zhanyu and Guo, Heng},
  title     = {{SpecGen}: Neural Spectral {BRDF} Generation via Spectral-Spatial Tri-plane Aggregation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8323--8332},
}
TimeRefine: Temporal Grounding with Time Refining Video LLM-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV,
  author    = {Wang, Xizi and Cheng, Feng and Wang, Ziyang and Wang, Huiyu and Islam, Md Mohaiminul and Torresani, Lorenzo and Bansal, Mohit and Bertasius, Gedas and Crandall, David},
  title     = {{TimeRefine}: Temporal Grounding with Time Refining Video {LLM}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5067--5078},
}
Towards High-Fidelity, Identity-Preserving Real-Time Makeup Transfer: Decoupling Style Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chau_2026_WACV,
  author    = {Chau, Lydia and Yu, Zhi and Jiang, Ruowei},
  title     = {Towards High-Fidelity, Identity-Preserving Real-Time Makeup Transfer: Decoupling Style Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3588--3597},
}
OMeGa: Joint Optimization of Explicit Meshes and Gaussian Splats for Robust Scene-Level Surface Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2026_WACV,
  author    = {Cao, Yuhang and Yan, Haojun and Yao, Danya},
  title     = {{OMeGa}: Joint Optimization of Explicit Meshes and {Gaussian} Splats for Robust Scene-Level Surface Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4386--4395},
}
Feedback Alignment Meets Low-Rank Manifolds: A Structured Recipe for Local Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Roy_2026_WACV,
  author    = {Roy, Arani and Apolinario, Marco P. and Das Biswas, Shristi and Roy, Kaushik},
  title     = {Feedback Alignment Meets Low-Rank Manifolds: A Structured Recipe for Local Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2984--2992},
}
Edge-Aware Image Manipulation via Diffusion Models with a Novel Structure-Preservation Loss-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gong_2026_WACV,
  author    = {Gong, Minsu and Ryu, Nuri and Ok, Jungseul and Cho, Sunghyun},
  title     = {Edge-Aware Image Manipulation via Diffusion Models with a Novel Structure-Preservation Loss},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5142--5153},
}
Comp4D: Compositional 4D Scene Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Liang_2026_WACV,
  author    = {Liang, Hanwen and Xu, Dejia and Bhatt, Neel P. and Hu, Hezhen and Liang, Hanxue and Plataniotis, Konstantinos N.},
  title     = {{Comp4D}: Compositional {4D} Scene Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3567--3577},
}
One-Shot Fine-Grained Re-Identification of Paint Marked Honey Bees using Vision Foundation Models-
[pdf]
[bibtex]@InProceedings{Meyers_2026_WACV,
  author    = {Meyers, Luke and Rodr{\'\i}guez-Cordero, Josu{\'e} A. and M{\'e}gret, R{\'e}mi},
  title     = {One-Shot Fine-Grained Re-Identification of Paint Marked Honey Bees using Vision Foundation Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {560--569},
}
PaRaChute: Pathology-Radiology Cross-Modal Fusion for Missing-Modality-Robust Survival Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Caforio_2026_WACV,
  author    = {Caforio, Pietro and Poles, Isabella and Santambrogio, Marco D.},
  title     = {{PaRaChute}: Pathology-Radiology Cross-Modal Fusion for Missing-Modality-Robust Survival Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {718--728},
}
Zero-Shot Table Extraction in Business Documents: A Unified Benchmark with Error Taxonomy and Ecological Analysis-
[pdf]
[bibtex]@InProceedings{Thomas_2026_WACV,
  author    = {Thomas, Eliott and Coustaty, Mickael and Joseph, Aur{\'e}lie and Pham, Tri-Cong and Deloin, Gaspar and Carel, Elodie and D'andecy, Vincent Poulain and Ogier, Jean-Marc},
  title     = {Zero-Shot Table Extraction in Business Documents: A Unified Benchmark with Error Taxonomy and Ecological Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4974--4983},
}
A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations-
[pdf]
[bibtex]@InProceedings{Yang_2026_WACV,
  author    = {Yang, Chenxi and Xi, Suyang and Ding, Hong and Shen, Yiqing and Liu, Yunhao},
  title     = {A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6442--6452},
}
From Street to Orbit: Training-Free Cross-View Retrieval via Location Semantics and LLM Guidance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Min_2026_WACV,
  author    = {Min, Jeongho and Kim, Dongyoung and Lee, Jaehyup},
  title     = {From Street to Orbit: Training-Free Cross-View Retrieval via Location Semantics and {LLM} Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {570--579},
}
Training-free Detection of Text-to-video Generations via Over-coherence-
[pdf]
[bibtex]@InProceedings{Brokman_2026_WACV,
  author    = {Brokman, Jonathan and Rachmil, Oren and Hofman, Omer and Betser, Roy and Giloni, Amit and Vainshtein, Roman and Kojima, Hisashi},
  title     = {Training-free Detection of Text-to-video Generations via Over-coherence},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3993--4003},
}
Countering Multi-modal Representation Collapse through Rank-targeted Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Seulgi and Kokilepersaud, Kiran and Prabhushankar, Mohit and AlRegib, Ghassan},
  title     = {Countering Multi-modal Representation Collapse through Rank-targeted Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4744--4754},
}
MSRTrack: LLM-Powered Object Tracking with Motion and Semantic Reasoning-
[pdf]
[bibtex]@InProceedings{Shen_2026_WACV,
  author    = {Shen, Tong and Wang, Di and Moura, Jos{\'e} M. F.},
  title     = {{MSRTrack}: {LLM}-Powered Object Tracking with Motion and Semantic Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {838--848},
}
MarineEval: Assessing the Marine Intelligence of Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wong_2026_WACV,
  author    = {Wong, Yuk Kwan and To, Tuan-An and Zhang, Jipeng and Zheng, Ziqiang and Yeung, Sai-Kit},
  title     = {{MarineEval}: Assessing the Marine Intelligence of Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1459--1470},
}
MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kogashi_2026_WACV,
  author    = {Kogashi, Kaen and Cherian, Anoop and Kuo, Meng-Yu Jennifer},
  title     = {{MMHOI}: Modeling Complex {3D} Multi-Human Multi-Object Interactions},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1512--1521},
}
CLIP's Visual Embedding Projector is a Few-shot Cornucopia-
[pdf]
[supp]
[bibtex]@InProceedings{Fahes_2026_WACV,
  author    = {Fahes, Mohammad and Vu, Tuan-Hung and Bursuc, Andrei and Perez, Patrick and De Charette, Raoul},
  title     = {{CLIP}'s Visual Embedding Projector is a Few-shot Cornucopia},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3254--3264},
}
MomentMix Augmentation with Length-Aware DETR for Temporally Robust Moment Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Seojeong and Choi, Jiho and Baek, Kyungjune and Shim, Hyunjung}, title = {{MomentMix} Augmentation with Length-Aware {DETR} for Temporally Robust Moment Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1127--1136} }
IMPACT: Interpretable Most Important Person Analysis and Classification using Transformer-based Models-
[pdf]
[supp]
[bibtex]@InProceedings{Rampuria_2026_WACV, author = {Rampuria, Akshat and Nayak, Kamakshya Prasad and Thakare, Kamalakar Vijay and Joshi, Tushar and Singh, Aditya Dhananjay and Park, Haesol and Choi, Heeseung and Dogra, Debi Prosad and Kim, Ig-Jae}, title = {{IMPACT}: Interpretable Most Important Person Analysis and Classification using Transformer-based Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {8179--8187} }
HOLO: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2026_WACV, author = {Hu, Xiaoyun and Yan, Xiaohan and Wang, Nan and Wei, Gang and Wang, Zhicheng}, title = {{HOLO}: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7719--7729} }
UniVid: Unifying Vision Tasks with Pre-trained Video Generation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Lan and Gu, Yuchao and Mao, Qi}, title = {{UniVid}: Unifying Vision Tasks with Pre-trained Video Generation Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6754--6763} }
Sea-CLIP: Mining Semantic-Aware Representations for Few-Shot Anomaly Detection with CLIP-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2026_WACV, author = {Guo, Xiao and Chen, Zhimin and Castillo, Carlos D. and Wang, Hongcheng and Liu, Xiaoming}, title = {{Sea-CLIP}: Mining Semantic-Aware Representations for Few-Shot Anomaly Detection with {CLIP}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3689--3699} }
CasTex: Cascaded Text-to-Texture Synthesis via Explicit Texture Maps and Physically-Based Shading-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aliev_2026_WACV, author = {Aliev, Mishan and Baranchuk, Dmitry and Struminsky, Kirill}, title = {{CasTex}: Cascaded Text-to-Texture Synthesis via Explicit Texture Maps and Physically-Based Shading}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3411--3420} }
SOPHY: Generating Simulation-Ready Objects with Physical Materials-
[pdf]
[supp]
[bibtex]@InProceedings{Cao_2026_WACV, author = {Cao, Junyi and Kalogerakis, Evangelos}, title = {{SOPHY}: Generating Simulation-Ready Objects with Physical Materials}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4693--4704} }
SasMamba: A Lightweight Structure-Aware Stride State Space Model for 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cui_2026_WACV, author = {Cui, Hu and Hua, Wenqiang and Huang, Renjing and Jia, Shurui and Hayama, Tessai}, title = {{SasMamba}: A Lightweight Structure-Aware Stride State Space Model for {3D} Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2721--2730} }
MedPEFT-CL: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation-
[pdf]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Ziyuan and Morel, Philippe}, title = {{MedPEFT-CL}: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7699--7708} }
ZebraPose: Zebra Detection and Pose Estimation using only Synthetic Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bonetto_2026_WACV, author = {Bonetto, Elia and Ahmad, Aamir}, title = {{ZebraPose}: Zebra Detection and Pose Estimation using only Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6611--6620} }
Action Anticipation at a Glimpse: To What Extent Can Multimodal Cues Replace Video?-
[pdf]
[supp]
[bibtex]@InProceedings{Benavent-Lledo_2026_WACV, author = {Benavent-Lledo, Manuel and Bacharidis, Konstantinos and Manousaki, Victoria and Papoutsakis, Konstantinos and Argyros, Antonis and Garcia-Rodriguez, Jose}, title = {Action Anticipation at a Glimpse: To What Extent Can Multimodal Cues Replace Video?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {276--286} }
Systematic Analysis of the Unintentional CSAM-Generation-Potential of Text-to-Image Models-
[pdf]
[bibtex]@InProceedings{Goller_2026_WACV, author = {G{\"o}ller, Nicolas and Steinebach, Martin}, title = {Systematic Analysis of the Unintentional {CSAM}-Generation-Potential of Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {493--502} }
Inpainting of Sparse Depth Maps from Monocular Depth-from-Focus on Pixel Processor Arrays-
[pdf]
[supp]
[bibtex]@InProceedings{Lewandowski_2026_WACV, author = {Lewandowski, Maciej and Dudek, Piotr}, title = {Inpainting of Sparse Depth Maps from Monocular Depth-from-Focus on Pixel Processor Arrays}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {5612--5622} }
DM3Net: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching-
[pdf]
[supp]
[bibtex]@InProceedings{Guan_2026_WACV, author = {Guan, Cong and Ying, Jiacheng and Ieiri, Yuya and Yoshie, Osamu}, title = {{DM3Net}: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7472--7481} }
Similarity-aware Probabilistic Embeddings Modeling for Video-Text Retrieval-
[pdf]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Yuliang and Wei, Pengxu and Dong, Zhicheng and Lin, Liang}, title = {Similarity-aware Probabilistic Embeddings Modeling for Video-Text Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4451--4460} }
Distilling What and Why: Enhancing Driver Intention Prediction with MLLMs-
[pdf]
[supp]
[bibtex]@InProceedings{Artham_2026_WACV, author = {Artham, Sainithin and Dasgupta, Avijit and Gangisetty, Shankar and Jawahar, C. V.}, title = {Distilling What and Why: Enhancing Driver Intention Prediction with {MLLMs}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7281--7290} }
Towards Fast and Scalable Normal Integration using Continuous Components-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Milano_2026_WACV, author = {Milano, Francesco and Chung, Jen Jen and Ott, Lionel and Siegwart, Roland}, title = {Towards Fast and Scalable Normal Integration using Continuous Components}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {236--244} }
ViSTA: Visual Storytelling using Multi-modal Adapters for Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2026_WACV, author = {Dong, Sibo and Shaheen, Ismail and Shen, Maggie and Mallick, Rupayan and Bargal, Sarah Adel}, title = {{ViSTA}: Visual Storytelling using Multi-modal Adapters for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {12--21} }
Diffusion-Based Action Recognition Generalizes to Untrained Domains-
[pdf]
[supp]
[bibtex]@InProceedings{Guimaraes_2026_WACV, author = {Guimar{\~a}es, Rog{\'e}rio and Xiao, Frank and Perona, Pietro and Marks, Markus}, title = {Diffusion-Based Action Recognition Generalizes to Untrained Domains}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {5919--5933} }
EVTP-IVS: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2026_WACV, author = {Zhu, Wenhui and Chen, Xiwen and Wang, Zhipeng and Tang, Shao and Ghosh, Sayan and Dong, Xuanzhao and Koner, Rajat and Wang, Yalin}, title = {{EVTP-IVS}: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7158--7167} }
Data-Driven Lipschitz Continuity: A Cost-Effective Approach to Improve Adversarial Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Erh-Chung and Chen, Pin-Yu and Chung, I-Hsin and Lee, Che-Rung}, title = {Data-Driven {Lipschitz} Continuity: A Cost-Effective Approach to Improve Adversarial Robustness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {698--707} }
MixER: From Cross-Modal to Mixed-Modal Visible-Infrared Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Alehdaghi_2026_WACV, author = {Alehdaghi, Mahdi and Bhattacharya, Rajarshi and Yannick, Dai and Shamsolmoali, Pourya and Cruz, Rafael M. O. and Granger, Eric}, title = {{MixER}: From Cross-Modal to Mixed-Modal Visible-Infrared Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3431--3440} }
A Fast, Simple, and Flexible Scale Informative Feature Transform Module for Arbitrary Scale Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Kar_2026_WACV, author = {Kar, Aupendu and Biswas, Prabir Kumar}, title = {A Fast, Simple, and Flexible Scale Informative Feature Transform Module for Arbitrary Scale Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1405--1414} }
ReFineVQA: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2026_WACV, author = {Shin, Jeongwan and Hur, Chan and Cho, Seongmin and Choi, Jaeho and Park, Hyeyoung}, title = {{ReFineVQA}: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7647--7657} }
DUDA: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2026_WACV, author = {Kang, Beomseok and Mithun, Niluthpol Chowdhury and Rajvanshi, Abhinav and Chiu, Han-Pang and Samarasekera, Supun}, title = {{DUDA}: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {8124--8135} }
Human Knowledge Integrated Multi-modal Learning for Single Source Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Ayan and Thakur, Kuntal and Gupta, Sandeep}, title = {Human Knowledge Integrated Multi-modal Learning for Single Source Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2380--2391} }
Unified Alignment Protocol: Making Sense of the Unlabeled Data in New Domains-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahmed_2026_WACV, author = {Ahmed, Sabbir and Rizve, Mamshad Nayeem and Al Arafat, Abdullah and Liu, Jacqueline Tiffany and Hossain, Rahim and Al Nahian, Mohaiminul and Rakin, Adnan Siraj}, title = {Unified Alignment Protocol: Making Sense of the Unlabeled Data in New Domains}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2974--2983} }
ART-ASyn: Anatomy-aware Realistic Texture-based Anomaly Synthesis Framework for Chest X-Rays-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cao_2026_WACV, author = {Cao, Qinyi and Fan, Jianan and Cai, Weidong}, title = {{ART-ASyn}: Anatomy-aware Realistic Texture-based Anomaly Synthesis Framework for Chest {X-Rays}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3792--3802} }
OPFormer: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding-
[pdf]
[supp]
[bibtex]@InProceedings{Moroz_2026_WACV, author = {Moroz, Artem and Zeman, V{\'\i}t and Mik{\v{s}}{\'\i}k, Martin and Isianova, Elizaveta and David, Miroslav and Burget, Pavel and Burde, Varun}, title = {{OPFormer}: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6621--6632} }
AnyAnomaly: Zero-Shot Customizable Video Anomaly Detection with LVLM-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahn_2026_WACV, author = {Ahn, Sunghyun and Jo, Youngwan and Lee, Kijung and Kwon, Sein and Hong, Inpyo and Park, Sanghyun}, title = {{AnyAnomaly}: Zero-Shot Customizable Video Anomaly Detection with {LVLM}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3026--3035} }
Global Focal and Radial Distortion Averaging from Radial Fundamental Matrices for Robust Self-Calibration-
[pdf]
[bibtex]@InProceedings{Solonets_2026_WACV, author = {Solonets, Sergei and Sinitsyn, Daniil and Cremers, Daniel}, title = {Global Focal and Radial Distortion Averaging from Radial Fundamental Matrices for Robust Self-Calibration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4777--4786} }
Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection-
[pdf]
[bibtex]@InProceedings{Lim_2026_WACV, author = {Lim, Heechul and Kim, Min-Soo and Lee, Hyun-Boo and Kang, Suk-Ju and Chon, Kang-Wook and Lee, Haeyun}, title = {Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7586--7595} }
AFL-PRF: Adaptive Federated Learning for Low-Quality Data: Enhancing Performance, Robustness, and Fairness-
[pdf]
[bibtex]@InProceedings{Yu_2026_WACV, author = {Yu, Pinrui and Xie, Yiming and Ye, Longtian and Yuan, Geng and Mi, Ningfang and Lin, Xue}, title = {{AFL-PRF}: Adaptive Federated Learning for Low-Quality Data: Enhancing Performance, Robustness, and Fairness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {402--411} }
LightGazeNet: A Lightweight GNN-based Architecture for Gaze Estimation-
[pdf]
[bibtex]@InProceedings{Patel_2026_WACV, author = {Patel, Heena and Chowdhury, Anirban and Choksy, Pooja Jigar and Pachade, Samiksha Pradeep and Puar, Ajinkya}, title = {{LightGazeNet}: A Lightweight {GNN}-based Architecture for Gaze Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3710--3719} }
CountingDINO: A Training-free Pipeline for Class-Agnostic Counting using Unsupervised Backbones-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pacini_2026_WACV, author = {Pacini, Giacomo and Bianchi, Lorenzo and Ciampi, Luca and Messina, Nicola and Amato, Giuseppe and Falchi, Fabrizio}, title = {{CountingDINO}: A Training-free Pipeline for Class-Agnostic Counting using Unsupervised Backbones}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {806--815} }
ENCORE : A Neural Collapse Perspective on Out-of-Distribution Detection in Deep Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Sayyed_2026_WACV, author = {Sayyed, A. Q. M. Sazzad and Bastian, Nathaniel D. and Restuccia, Francesco}, title = {{ENCORE} : A Neural Collapse Perspective on Out-of-Distribution Detection in Deep Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2944--2953} }
FAE-Net: Fashion Attribute Editing via Disentangled Latent Conditioning in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Bhargav_2026_WACV, author = {Bhargav, P. Rajith and Bhattacharya, Gaurab and Vivek, B S and Gubbi, Jayavardhana}, title = {{FAE-Net}: Fashion Attribute Editing via Disentangled Latent Conditioning in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {192--201} }
Robust Multimodal Emotion Recognition from Incomplete Modalities via Query-Based Unimodal and Cross-Modal Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Miyoshi_2026_WACV, author = {Miyoshi, Ryo and Otani, Mayu and Okafuji, Yuki}, title = {Robust Multimodal Emotion Recognition from Incomplete Modalities via Query-Based Unimodal and Cross-Modal Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4901--4911} }
R3: Reconstruction, Raw, and Rain: Deraining Directly in the Bayer Domain-
[pdf]
[bibtex]@InProceedings{Rothschild_2026_WACV, author = {Rothschild, Nate and Kimhi, Moshe and Mendelson, Avi and Baskin, Chaim}, title = {{R3}: Reconstruction, Raw, and Rain: Deraining Directly in the {Bayer} Domain}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {5313--5321} }
Joint Optimization of Camera Model and Deep Neural Network for Image Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Noboru_2026_WACV, author = {Noboru, Youta and Ozasa, Yuko and Tanaka, Masayuki}, title = {Joint Optimization of Camera Model and Deep Neural Network for Image Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7626--7635} }
SCORP: Scene-Consistent Object Refinement via Proxy Generation and Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Ziwei and Liu, Ziling and Huang, Zitong and Gao, Mingqi and Zheng, Feng}, title = {{SCORP}: Scene-Consistent Object Refinement via Proxy Generation and Tuning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {795--805} }
DirectDrag: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2026_WACV, author = {Liao, Sheng-Hao and Chen, Shang-Fu and Huang, Tai-Ming and Cheng, Wen-Huang and Hua, Kai-Lung}, title = {{DirectDrag}: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {8252--8261} }
Single-step Diffusion for Image Compression at Ultra-Low Bitrates-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Chanung and Lee, Joo Chan and Ko, Jong Hwan}, title = {Single-step Diffusion for Image Compression at Ultra-Low Bitrates}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6391--6400} }
TED-4DGS: Temporally Activated and Embedding-based Deformation for 4DGS Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ho_2026_WACV, author = {Ho, Cheng-Yuan and Yang, He-Bi and Chiang, Jui-Chiu and Liu, Yu-Lun and Peng, Wen-Hsiao}, title = {{TED-4DGS}: Temporally Activated and Embedding-based Deformation for {4DGS} Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6371--6380} }
The Perceptual Observatory Characterizing Robustness and Grounding in MLLMs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Anvekar_2026_WACV, author = {Anvekar, Tejas and Bardoliya, Fenil and Turaga, Pavan K. and Baral, Chitta and Gupta, Vivek}, title = {The Perceptual Observatory Characterizing Robustness and Grounding in {MLLMs}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1653--1663} }
Seeing is Believing (and Predicting): Context-Aware Multi-Human Behavior Prediction with Vision Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Panchal_2026_WACV, author = {Panchal, Utsav and Liu, Yuchen and Palmieri, Luigi and Georgievski, Ilche and Aiello, Marco}, title = {Seeing is Believing (and Predicting): Context-Aware Multi-Human Behavior Prediction with Vision Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1959--1968} }
MAESTRO: Masked AutoEncoders for Multimodal, Multitemporal, and Multispectral Earth Observation Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Labatie_2026_WACV, author = {Labatie, Antoine and Vaccaro, Michael and Lardiere, Nina and Garioud, Anatol and Gonthier, Nicolas}, title = {{MAESTRO}: Masked {AutoEncoders} for Multimodal, Multitemporal, and Multispectral {Earth} Observation Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {212--224} }
ASC: Learning Augmentation Severity-Consistent Representations Improves Generalization via Augmentation Search-
[pdf]
[supp]
[bibtex]@InProceedings{Alamdar_2026_WACV, author = {Alamdar, Amirhossein and Jafarinia, Hossein and Noori, Mahdi and Rohban, Mohammad Hossein}, title = {{ASC}: Learning Augmentation Severity-Consistent Representations Improves Generalization via Augmentation Search}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1926--1936} }
View-aware Cross-modal Distillation for Multi-view Action Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Trung Thanh and Kawanishi, Yasutomo and John, Vijay and Komamizu, Takahiro and Ide, Ichiro}, title = {View-aware Cross-modal Distillation for Multi-view Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {7769--7778} }
Autoregressive Styled Text Image Generation, but Make it Reliable-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zaccagnino_2026_WACV, author = {Zaccagnino, Carmine and Quattrini, Fabio and Pippi, Vittorio and Cascianelli, Silvia and Tonioni, Alessio and Cucchiara, Rita}, title = {Autoregressive Styled Text Image Generation, but Make it Reliable}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3668--3678} }
FedEFC: Federated Learning Using Enhanced Forward Correction Against Noisy Labels-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yu_2026_WACV, author = {Yu, Seunghun and Ahn, Jin-Hyun and Kang, Joonhyuk}, title = {{FedEFC}: Federated Learning Using Enhanced Forward Correction Against Noisy Labels}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {8094--8102} }
More Than Memory Savings: Zeroth-Order Optimization Mitigates Forgetting in Continual Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2026_WACV, author = {Yu, Wanhao and Wang, Zheng and Niu, Shuteng and Lin, Sen and Yang, Li}, title = {More Than Memory Savings: Zeroth-Order Optimization Mitigates Forgetting in Continual Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4766--4776} }
Learning to Animate Images from A Few Videos to Portray Delicate Human Actions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Haoxin and Yu, Yingchen and Wu, Qilong and Zhang, Hanwang and Bai, Song and Li, Boyang}, title = {Learning to Animate Images from A Few Videos to Portray Delicate Human Actions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {547--559} }
UniCalib: Targetless LiDAR-camera Calibration via Probabilistic Flow on Unified Depth Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2026_WACV, author = {Han, Shu and Zhu, Xubo and Wu, Ji and Cai, Ximeng and Yang, Wen and Yu, Huai and Xia, Gui-Song}, title = {{UniCalib}: Targetless {LiDAR}-camera Calibration via Probabilistic Flow on Unified Depth Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1906--1915} }
StreetView-Waste: A Multi-Task Dataset for Urban Waste Management-
[pdf]
[supp]
[bibtex]@InProceedings{Paulo_2026_WACV, author = {Paulo, Diogo J. and Martins, Jo{\~a}o and Proen{\c{c}}a, Hugo and Neves, Jo{\~a}o C.}, title = {{StreetView-Waste}: A Multi-Task Dataset for Urban Waste Management}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {3015--3025} }
Beyond the Highlights: Video Retrieval with Salient and Surrounding Contexts-
[pdf]
[supp]
[bibtex]@InProceedings{Bang_2026_WACV, author = {Bang, Jaehun and Ye-Bin, Moon and Oh, Tae-Hyun and Joo, Kyungdon}, title = {Beyond the Highlights: Video Retrieval with Salient and Surrounding Contexts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2188--2197} }
DF-Mamba: Deformable State Space Modeling for 3D Hand Pose Estimation in Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhou_2026_WACV, author = {Zhou, Yifan and Ohkawa, Takehiko and Zhou, Guwenxiao and Goto, Kanoko and Hirose, Takumi and Sekikawa, Yusuke and Inoue, Nakamasa}, title = {{DF-Mamba}: Deformable State Space Modeling for {3D} Hand Pose Estimation in Interactions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {5352--5363} }
Eye-for-an-eye: Appearance Transfer with Dense Semantic Correspondence in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Go_2026_WACV, author = {Go, Sooyeon and Choi, Kyungmook and Shin, Minjung and Uh, Youngjung}, title = {Eye-for-an-eye: Appearance Transfer with Dense Semantic Correspondence in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {4641--4650} }
PiSA: A Self-Augmented Data Engine and Training Strategy for 3D Understanding with Large Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2026_WACV, author = {Guo, Zilu and Lin, Hongbin and Yuan, Zhihao and Zheng, Chaoda and Qiu, Pengshuo and Jiang, Dongzhi and Zhang, Renrui and Feng, Chun-Mei and Li, Zhen}, title = {{PiSA}: A Self-Augmented Data Engine and Training Strategy for {3D} Understanding with Large Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1273--1283} }
Analysis of Text Accuracy and Visual Alignment in Vision-Language Models for Artistic Text Generation-
[pdf]
[bibtex]@InProceedings{Alderazi_2026_WACV, author = {Alderazi, Fatima and Alfarraj, Motaz}, title = {Analysis of Text Accuracy and Visual Alignment in Vision-Language Models for Artistic Text Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {879--887} }
Do Generative Video Models Understand Physical Principles?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Motamed_2026_WACV, author = {Motamed, Saman and Culp, Laura and Swersky, Kevin and Jaini, Priyank and Geirhos, Robert}, title = {Do Generative Video Models Understand Physical Principles?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {948--958} }
AnyBald: Toward Realistic Diffusion-Based Hair Removal In-The-Wild-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Yongjun and Han, Seungoh and Kim, Soomin and Son, Sumin and Rohani, Mohsen and Maucourant, Edgar and Min, Dongbo and Joo, Kyungdon}, title = {{AnyBald}: Toward Realistic Diffusion-Based Hair Removal In-The-Wild}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2220--2230} }
A Multi-Agent Diffusion Approach for MRI Anomaly Segmentation via Modality-Specific LoRA Specialization-
[pdf]
[bibtex]@InProceedings{Al_Ghallabi_2026_WACV, author = {Al Ghallabi, Wafa and Zaheer, Muhammad Zaigham and Thawkar, Ritesh and Thawakar, Omkar and Khan, Salman and Khan, Fahad Shahbaz}, title = {A Multi-Agent Diffusion Approach for {MRI} Anomaly Segmentation via Modality-Specific {LoRA} Specialization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {128--137} }
ZonUI-3B: Competitive GUI Grounding with a 3B VLM Trained on a Single Consumer GPU-
[pdf]
[supp]
[bibtex]@InProceedings{Hsieh_2026_WACV, author = {Hsieh, ZongHan and Yang, ShengJing and Wei, Tzer-Jen}, title = {{ZonUI-3B}: Competitive {GUI} Grounding with a {3B} {VLM} Trained on a Single Consumer {GPU}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {959--966} }
LogicCBMs: Logic-Enhanced Concept-Based Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vemuri_2026_WACV, author = {Vemuri, Deepika SN and Bellamkonda, Gautham and Pola, Aditya and Balasubramanian, Vineeth N}, title = {{LogicCBMs}: Logic-Enhanced Concept-Based Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {6039--6048} }
Sketch2Stitch: GANs for Abstract Sketch-Based Dress Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Khan_2026_WACV, author = {Khan, Faizan Farooq and Bakr, Eslam Abdelrahman and Morelli, Davide and Cornia, Marcella and Cucchiara, Rita and Elhoseiny, Mohamed}, title = {Sketch2Stitch: GANs for Abstract Sketch-Based Dress Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2209-2219} }
GAEA: A Geolocation Aware Conversational Assistant-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Campos_2026_WACV, author = {Campos, Ron and Vayani, Ashmal and Kulkarni, Parth Parag and Gupta, Rohit and Zafar, Aizan and Dutta, Aritra and Shah, Mubarak}, title = {GAEA: A Geolocation Aware Conversational Assistant}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5236-5246} }
FNOPT: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with Fourier Neural Operators-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Ruochen and Tran, Thuy and Parashar, Shaifali}, title = {FNOPT: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with Fourier Neural Operators}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7116-7125} }
You May Speak Freely: Improving the Fine-Grained Visual Recognition Capabilities of Multimodal Large Language Models with Answer Extraction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lawrence_2026_WACV, author = {Lawrence, Logan and Saha, Oindrila and Wei, Megan and Sun, Chen and Maji, Subhransu and Van Horn, Grant}, title = {You May Speak Freely: Improving the Fine-Grained Visual Recognition Capabilities of Multimodal Large Language Models with Answer Extraction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1428-1437} }
Diversity Preserving Coresets for Image Quality Assessment-
[pdf]
[supp]
[bibtex]@InProceedings{Nema_2026_WACV, author = {Nema, Arpita and Zhu, Hanwei and Zhang, Xi and Lin, Weisi}, title = {Diversity Preserving Coresets for Image Quality Assessment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7925-7934} }
Frequency Is What You Need: Considering Word Frequency When Text Masking Benefits Vision-Language Model Pre-training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2026_WACV, author = {Liang, Mingliang and Larson, Martha}, title = {Frequency Is What You Need: Considering Word Frequency When Text Masking Benefits Vision-Language Model Pre-training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3771-3780} }
RoadBench: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xiao_2026_WACV, author = {Xiao, Xi and Zhang, Yunbei and Wang, Janet and Zhao, Lin and Wei, Yuxiang and Li, Hengjia and Li, Yanshu and Wang, Xiao and Roy, Swalpa Kumar and Xu, Hao and Wang, Tianyang}, title = {RoadBench: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6016-6026} }
Evaluating Text-to-Image and Text-to-Video Synthesis with a Conditional Frechet Distance-
[pdf]
[supp]
[bibtex]@InProceedings{Koo_2026_WACV, author = {Koo, Jaywon and Hernandez, Jefferson and Haji-Ali, Moayed and Yang, Ziyan and Ordonez, Vicente}, title = {Evaluating Text-to-Image and Text-to-Video Synthesis with a Conditional Frechet Distance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2052-2062} }
Optimization-Free Style Transfer for 3D Gaussian Splats-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_Sablon_2026_WACV, author = {Du Sablon, Raphael and Hart, David}, title = {Optimization-Free Style Transfer for 3D Gaussian Splats}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8041-8051} }
AEON: Adaptive Embedding Optimized Noise for Robust Watermarking in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Muneer_2026_WACV, author = {Muneer, Muhammad Shahid and Woo, Simon S.}, title = {AEON: Adaptive Embedding Optimized Noise for Robust Watermarking in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5406-5415} }
mEOL: Training-Free Instruction-Guided Multimodal Embedder for Vector Graphics and Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Kyeong Seon and Baek, Seong-Eun and Lee, Jung-Mok and Oh, Tae-Hyun}, title = {mEOL: Training-Free Instruction-Guided Multimodal Embedder for Vector Graphics and Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1191-1200} }
GateFusion: Hierarchical Gated Cross-Modal Fusion for Active Speaker Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Yu and Ha, Juhyung and Ramirez, Frangil M. and Wang, Yuchen and Crandall, David J.}, title = {GateFusion: Hierarchical Gated Cross-Modal Fusion for Active Speaker Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1074-1083} }
From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing-
[pdf]
[bibtex]@InProceedings{Hu_2026_WACV, author = {Hu, Guanyu and Kollias, Dimitrios and Yang, Xinyu}, title = {From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8551-8562} }
Detection-Driven Object Count Optimization for Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zafar_2026_WACV, author = {Zafar, Oz and Cohen, Yuval and Wolf, Lior and Schwartz, Idan}, title = {Detection-Driven Object Count Optimization for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1885-1894} }
PoseAdapt: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit-
[pdf]
[arXiv]
[bibtex]@InProceedings{Khan_2026_WACV_PoseAdapt, author = {Khan, Muhammad Saif Ullah and Stricker, Didier}, title = {PoseAdapt: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6840-6850} }
Fully Unsupervised Self-debiasing of Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vardhana_2026_WACV, author = {Vardhana, Korada Sri and Lolla, Shrikrishna and Biswas, Soma}, title = {Fully Unsupervised Self-debiasing of Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1221-1230} }
Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of C. Elegans-
[pdf]
[supp]
[bibtex]@InProceedings{Stricker_2026_WACV, author = {Stricker, Sebastian and Karg, Christoph and Hutschenreiter, Lisa and Savchynskyy, Bogdan and Kainmueller, Dagmar}, title = {Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of C. Elegans}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7208-7217} }
Online Episodic Memory Visual Query Localization with Egocentric Streaming Object Memory-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Manigrasso_2026_WACV, author = {Manigrasso, Zaira and Dunnhofer, Matteo and Furnari, Antonino and Nottebaum, Moritz and Finocchiaro, Antonio and Marana, Davide and Forte, Rosario and Farinella, Giovanni Maria and Micheloni, Christian}, title = {Online Episodic Memory Visual Query Localization with Egocentric Streaming Object Memory}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3951-3960} }
Visual Detector Compression via Location-Aware Discriminant Analysis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lan_2026_WACV, author = {Lan, Qizhen and Choi, Jung Im and Tian, Qing}, title = {Visual Detector Compression via Location-Aware Discriminant Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3546-3555} }
Salience-SGG: Enhancing Unbiased Scene Graph Generation with Iterative Salience Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qu_2026_WACV, author = {Qu, Runfeng and Hall, Ole and Bideau, Pia K and Ouerfelli-Ethier, Julie and Rolfs, Martin and Obermayer, Klaus and Hellwich, Olaf}, title = {Salience-SGG: Enhancing Unbiased Scene Graph Generation with Iterative Salience Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1032-1042} }
SPAR-Det: Segmentation-guided and Prior-Aided Routing for Small Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Kwon_2026_WACV, author = {Kwon, Seungchan and Lim, Gyuil and Han, Youngjoon}, title = {SPAR-Det: Segmentation-guided and Prior-Aided Routing for Small Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2146-2155} }
Semi-supervised Key-Point Estimation for Echocardiography Video-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2026_WACV, author = {Oh, Seok-Hwan and Lee, Hyeon-Jik and Jung, Guil and Kim, Myeong-Gee and Kim, Young-Min and Kwon, Hyuksool and Bae, Hyeon-Min}, title = {Semi-supervised Key-Point Estimation for Echocardiography Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5682-5692} }
Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Penzel_2026_WACV, author = {Penzel, Niklas and Denzler, Joachim}, title = {Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7398-7408} }
Scalable Video Action Anticipation with Cross Linear Attentive Memory-
[pdf]
[supp]
[bibtex]@InProceedings{Zhong_2026_WACV, author = {Zhong, Zeyun and Martin, Manuel and Schneider, David and Lerch, David J. and Wu, Chengzhi and Diederichs, Frederik and Gall, Juergen and Beyerer, J{\"u}rgen}, title = {Scalable Video Action Anticipation with Cross Linear Attentive Memory}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8113-8123} }
Are All Marine Species Created Equal? Performance Disparities in Underwater Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wille_2026_WACV, author = {Wille, Melanie and Fischer, Tobias and Raine, Scarlett}, title = {Are All Marine Species Created Equal? Performance Disparities in Underwater Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4556-4565} }
MoRe: Monocular Geometry Refinement via Graph Optimization for Cross-View Consistency-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jung_2026_WACV, author = {Jung, Dongki and Choi, Jaehoon and Lee, Yonghan and Eum, Sungmin and Kwon, Heesung and Manocha, Dinesh}, title = {MoRe: Monocular Geometry Refinement via Graph Optimization for Cross-View Consistency}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4838-4848} }
FLARES: Fast and Accurate LiDAR Multi-Range Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2026_WACV, author = {Yang, Bin and Condurache, Alexandru Paul}, title = {FLARES: Fast and Accurate LiDAR Multi-Range Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3451-3461} }
Mitigating the Modality Gap: Few-Shot Out-of-Distribution Detection with Multi-modal Prototypes and Image Bias Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV_Mitigating, author = {Wang, Yimu and Riddell, Evelien and Chow, Adrian and Sedwards, Sean and Czarnecki, Krzysztof}, title = {Mitigating the Modality Gap: Few-Shot Out-of-Distribution Detection with Multi-modal Prototypes and Image Bias Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2741-2751} }
FairVLM: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Rahman_2026_WACV, author = {Rahman, Md Motiur and Rahman, Saeka and Bhatt, Smriti and Faezipour, Miad}, title = {FairVLM: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7450-7460} }
NRGMark: Localized Watermarking for Energy Transparency in Images-
[pdf]
[bibtex]@InProceedings{Agarwal_2026_WACV, author = {Agarwal, Shruti and Michel, {\'E}lie and Asnani, Vishal and Mathern, Tania and Collomosse, John}, title = {NRGMark: Localized Watermarking for Energy Transparency in Images}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7779-7788} }
V2XScene: Multi-View Consistent 3D Scene Simulation for Collaborative Perception-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Yanfei and Gong, Yi and Zeng, Yuan}, title = {V2XScene: Multi-View Consistent 3D Scene Simulation for Collaborative Perception}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6569-6579} }
SymNet: A Multi-Task Network for Joint Radio Map Reconstruction and Transmitter Localization-
[pdf]
[bibtex]@InProceedings{Ye_2026_WACV, author = {Ye, Lyuzhou and Le, Thanh Dat and Huang, Yan}, title = {SymNet: A Multi-Task Network for Joint Radio Map Reconstruction and Transmitter Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {150-159} }
Safe Vision-Language Models via Unsafe Weights Manipulation-
[pdf]
[supp]
[bibtex]@InProceedings{D'inca_2026_WACV, author = {D'inc{\`a}, Moreno and Peruzzo, Elia and Xu, Xingqian and Shi, Humphrey and Sebe, Nicu and Mancini, Massimiliano}, title = {Safe Vision-Language Models via Unsafe Weights Manipulation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4682-4692} }
CONCORD: Concept-Informed Diffusion for Dataset Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV, author = {Gu, Jianyang and Wang, Haonan and Jia, Ruoxi and Vahidian, Saeed and Kungurtsev, Vyacheslav and Jiang, Wei and Chen, Yiran}, title = {CONCORD: Concept-Informed Diffusion for Dataset Distillation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5258-5268} }
CAPE: A CLIP-Aware Pointing Ensemble of Complementary Heatmap Cues for Embodied Reference Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Eyiokur_2026_WACV, author = {Eyiokur, Fevziye Irem and Yaman, Dogucan and Ekenel, Haz{\i}m Kemal and Waibel, Alexander}, title = {CAPE: A CLIP-Aware Pointing Ensemble of Complementary Heatmap Cues for Embodied Reference Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3939-3950} }
Learning Action Hierarchies via Hybrid Geometric Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kaushik_2026_WACV_Learning, author = {Kaushik, Arjun Ramesh and Ratha, Nalini K. and Govindaraju, Venu}, title = {Learning Action Hierarchies via Hybrid Geometric Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3129-3139} }
Advancing Multimodal LLMs by Large-Scale 3D Visual Instruction Dataset Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2026_WACV, author = {He, Liu and Zeng, Xiao and Song, Yizhi and Chen, Albert Y. C. and Xia, Lu and Verma, Shashwat and Dayal, Sankalp and Sun, Min and Kuo, Cheng-Hao and Aliaga, Daniel}, title = {Advancing Multimodal LLMs by Large-Scale 3D Visual Instruction Dataset Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5886-5897} }
Bi-ICE: An Inner Interpretable Framework for Image Classification via Bi-directional Interactions between Concept and Input Embeddings-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2026_WACV, author = {Hong, Jinyung and Kim, Yearim and Park, Keun Hee and Han, Sangyu and Kwak, Nojun and Pavlic, Theodore P.}, title = {Bi-ICE: An Inner Interpretable Framework for Image Classification via Bi-directional Interactions between Concept and Input Embeddings}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3835-3845} }
Transformer-Based Inpainting for Real-Time 3D Streaming in Sparse Multi-Camera Setups-
[pdf]
[supp]
[bibtex]@InProceedings{Van_Holland_2026_WACV, author = {Van Holland, Leif and Zingsheim, Domenic and Takhsha, Mana and Dr{\"o}ge, Hannah and Stotko, Patrick and Plack, Markus and Klein, Reinhard}, title = {Transformer-Based Inpainting for Real-Time 3D Streaming in Sparse Multi-Camera Setups}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4587-4598} }
Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations-
[pdf]
[arXiv]
[bibtex]@InProceedings{Islam_2026_WACV, author = {Islam, Zahidul and Paul, Sujoy and Rochan, Mrigank}, title = {Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6893-6902} }
INRetouch: Context Aware Implicit Neural Representation for Photography Retouching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Elezabi_2026_WACV, author = {Elezabi, Omar and Conde, Marcos V. and Wu, Zongwei and Timofte, Radu}, title = {INRetouch: Context Aware Implicit Neural Representation for Photography Retouching}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5560-5569} }
3DSceneEditor: Controllable 3D Scene Editing with Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2026_WACV, author = {Yan, Ziyang and Shao, Yihua and Liao, Minwen and Chen, Siyu and Wang, Nan and Lin, Muyuan and Hwang, Jenq-Neng and Zhao, Hao and Remondino, Fabio and Li, Lei}, title = {3DSceneEditor: Controllable 3D Scene Editing with Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1852-1863} }
Grounding Degradations in Natural Language for All-In-One Video Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Janjua_2026_WACV, author = {Janjua, Muhammad Kamran and Ghasemabadi, Amirhosein and Zhang, Kunlin and Salameh, Mohammad and Gao, Chao and Niu, Di}, title = {Grounding Degradations in Natural Language for All-In-One Video Restoration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5734-5743} }
Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kook_2026_WACV, author = {Kook, Hyunho and Yu, Byeongho and Oh, Jeong Min and Park, Eunhyeok}, title = {Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8500-8510} }
RegionAligner: Bridging Ego-Exo Views for Object Correspondence via Unified Text-Visual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Su_2026_WACV, author = {Su, Yuhao and Elhamifar, Ehsan}, title = {RegionAligner: Bridging Ego-Exo Views for Object Correspondence via Unified Text-Visual Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3265-3274} }
Matching Semantically Similar Non-Identical Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Marumo_2026_WACV, author = {Marumo, Yusuke and Kawamoto, Kazuhiko and Tanaka, Satomi and Hirano, Shigenobu and Kera, Hiroshi}, title = {Matching Semantically Similar Non-Identical Objects}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2752-2764} }
SphereEdit: Spherical Semantic Editing in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Konate_2026_WACV, author = {Konate, Salamata and Hamidi, Hassan and Dolatabadi, Elham and Rudzicz, Frank and Seyyed-Kalantari, Laleh}, title = {SphereEdit: Spherical Semantic Editing in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8084-8093} }
Pyramidal Spectrum: Frequency-based Hierarchically Vector Quantized VAE for Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Prakash_2026_WACV, author = {Prakash, Tushar and Susladkar, Onkar and Mittal, Sparsh and Dhillon, Inderjit S}, title = {Pyramidal Spectrum: Frequency-based Hierarchically Vector Quantized VAE for Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2073-2082} }
Large Sign Language Models: Toward 3D American Sign Language Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Sen and He, Xiaoxiao and Liu, Di and Xia, Zhaoyang and Zhao, Mingyu and Tan, Chaowei and Li, Vivian and Liu, Bo and Metaxas, Dimitris N. and Kapadia, Mubbasir}, title = {Large Sign Language Models: Toward 3D American Sign Language Translation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3109-3119} }
Learning Mask-Aware Offsets: Two-branch Deformable Attention Networks for Inpainting with Masked Region Avoidance-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2026_WACV_Learning, author = {Oh, Hyeongseok and Paik, Joonki}, title = {Learning Mask-Aware Offsets: Two-branch Deformable Attention Networks for Inpainting with Masked Region Avoidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1022-1031} }
QuadraNet V2: Efficient and Sustainable Training of High-Order Neural Networks with Quadratic Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2026_WACV, author = {Xu, Chenhui and Yu, Fuxun and Xiong, Jinjun and Chen, Xiang}, title = {QuadraNet V2: Efficient and Sustainable Training of High-Order Neural Networks with Quadratic Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1365-1373} }
Occlusion Boundary and Depth: Mutual Enhancement via Multi-Task Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2026_WACV_Occlusion, author = {Xu, Lintao and Wang, Yinghao and Wang, Chaohui}, title = {Occlusion Boundary and Depth: Mutual Enhancement via Multi-Task Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4427-4437} }
3D Superquadric Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{MacSwayne_2026_WACV, author = {MacSwayne, Daniel and Leonardis, Ales and Jiao, Jianbo}, title = {3D Superquadric Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5154-5163} }
S2O: Static to Openable Enhancement for Articulated 3D Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Iliash_2026_WACV, author = {Iliash, Denys and Jiang, Hanxiao and Zhang, Yiming and Savva, Manolis and Chang, Angel X.}, title = {S2O: Static to Openable Enhancement for Articulated 3D Objects}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6785-6795} }
Personalized Image Privacy Advisors via Federated Daisy-Chaining-
[pdf]
[supp]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Sourasekhar and Subramaniam, Vengateswaran and Roy, Debaditya and Subbaraju, Vigneshwaran and Bhuyan, Monowar}, title = {Personalized Image Privacy Advisors via Federated Daisy-Chaining}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2808-2817} }
PoseGaussian: Pose-Driven Novel View Synthesis for Robust 3D Human Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shen_2026_WACV, author = {Shen, Ju and Chen, Chen and Nguyen, Tam V. and Asari, Vijayan K.}, title = {PoseGaussian: Pose-Driven Novel View Synthesis for Robust 3D Human Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5004-5015} }
UniGaze: Towards Universal Gaze Estimation via Large-scale Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qin_2026_WACV, author = {Qin, Jiawei and Zhang, Xucong and Sugano, Yusuke}, title = {UniGaze: Towards Universal Gaze Estimation via Large-scale Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5809-5820} }
One Model, Many Behaviors: Training-Induced Effects on Out-of-Distribution Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Krumpl_2026_WACV, author = {Krumpl, Gerhard and Avenhaus, Henning and Possegger, Horst}, title = {One Model, Many Behaviors: Training-Induced Effects on Out-of-Distribution Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4128-4138} }
DNA: Dual-branch Network with Adaptation for Open-Set Online Handwriting Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Tsai-Ling and Do-Tran, Nhat-Tuong and Le, Ngoc-Hoang-Lam and Shuai, Hong-Han and Huang, Ching-Chun}, title = {DNA: Dual-branch Network with Adaptation for Open-Set Online Handwriting Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4170-4179} }
Universal Neural Architecture Space: Covering ConvNets, Transformers and Everything in Between-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tybl_2026_WACV, author = {Tybl, Ondrej and Neumann, Lukas}, title = {Universal Neural Architecture Space: Covering ConvNets, Transformers and Everything in Between}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3679-3688} }
Splatter Layout: Geometry-embedded 3D Reconstruction via Surface Unfolding-
[pdf]
[supp]
[bibtex]@InProceedings{Heryanto_2026_WACV, author = {Heryanto, Bryan and You, Tackgeun and Kim, Chanwoo and Lim, Hwasup}, title = {Splatter Layout: Geometry-embedded 3D Reconstruction via Surface Unfolding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7709-7718} }
Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods-
[pdf]
[supp]
[bibtex]@InProceedings{Lupascu_2026_WACV, author = {Lupa{\c{s}}cu, Marian and Stupariu, Mihai Sorin}, title = {Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6764-6774} }
Prompt-OT: An Optimal Transport Regularization Paradigm for Knowledge Preservation in Vision-Language Model Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV_PromptOT, author = {Chen, Xiwen and Zhu, Wenhui and Qiu, Peijie and Wang, Hao and Li, Huayu and Wu, Haiyu and Dong, Xuanzhao and Sotiras, Aristeidis and Wang, Yalin and Razi, Abolfazl}, title = {Prompt-OT: An Optimal Transport Regularization Paradigm for Knowledge Preservation in Vision-Language Model Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {667-676} }
Restora-Flow: Mask-Guided Image Restoration with Flow Matching-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hadzic_2026_WACV, author = {Hadzic, Arnela and Thaler, Franz and Bogensperger, Lea and Joham, Simon Johannes and Urschler, Martin}, title = {Restora-Flow: Mask-Guided Image Restoration with Flow Matching}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4943-4952} }
Unsupervised Segmentation by Diffusing, Walking and Cutting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ivanova_2026_WACV, author = {Ivanova, Daniela and Aversa, Marco and Henderson, Paul and Williamson, John}, title = {Unsupervised Segmentation by Diffusing, Walking and Cutting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5110-5120} }
RobuMTL: Enhancing Multi-Task Learning Robustness Against Weather Conditions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shaffee_2026_WACV, author = {Shaffee, Tasneem and Reda, Sherief}, title = {RobuMTL: Enhancing Multi-Task Learning Robustness Against Weather Conditions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5591-5600} }
SCORE: Soft Label Compression-Centric Dataset Condensation via Coding Rate Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2026_WACV,
  author    = {Yuan, Bowen and Fu, Yuxia and Wang, Zijian and Luo, Yadan and Huang, Zi},
  title     = {{SCORE}: Soft Label Compression-Centric Dataset Condensation via Coding Rate Optimization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2198--2208},
}
ICONIC-444: A 3.1-Million-Image Dataset for OOD Detection Research-
[pdf]
[supp]
[bibtex]@InProceedings{Krumpl_2026_WACV,
  author    = {Krumpl, Gerhard and Avenhaus, Henning and Possegger, Horst},
  title     = {{ICONIC-444}: A 3.1-Million-Image Dataset for {OOD} Detection Research},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8427--8436},
}
BAFIS: Dataset + Framework to Assess Occupational Bias and Human Preference in Modern Text-to-image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Klassert_2026_WACV,
  author    = {Klassert, Thomas and Ulges, Adrian and Fu, Biying},
  title     = {{BAFIS}: Dataset + Framework to Assess Occupational Bias and Human Preference in Modern Text-to-image Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2168--2177},
}
Cosine Similarity is Almost All You Need (for Prototypical-Part Models)-
[pdf]
[supp]
[bibtex]@InProceedings{Moffett_2026_WACV,
  author    = {Moffett, Luke and Willard, Frank and Machado, Maximillian and Mokel, Emmanuel and Donnelly, Jon and Guo, Zhicheng and Costarino, Adam and Yang, Julia and Kim, Giyoung and Barnett, Alina Jade and Rudin, Cynthia},
  title     = {Cosine Similarity is Almost All You Need (for Prototypical-Part Models)},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1586--1596},
}
Towards Photorealistic Style Transfer with Multimodal Guidance and Robustness to Content Images in Arbitrary Styles-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2026_WACV,
  author    = {Zhou, Ruikai and Liu, Yating and Xu, Yi},
  title     = {Towards Photorealistic Style Transfer with Multimodal Guidance and Robustness to Content Images in Arbitrary Styles},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4651--4660},
}
Decomposition Sampling for Efficient Region Annotations in Active Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Qiu_2026_WACV,
  author    = {Qiu, Jingna and Wilm, Frauke and {\"O}ttl, Mathias and Utz, Jonas and Schlereth, Maja and Schillinger, Moritz and Aubreville, Marc and Breininger, Katharina},
  title     = {Decomposition Sampling for Efficient Region Annotations in Active Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4160--4169},
}
Codebook Knowledge with Mamba-Transformer For Low-Light Image Enhancement-
[pdf]
[bibtex]@InProceedings{Deng_2026_WACV,
  author    = {Deng, Runhua and Jiang, Aiwen and Peng, Long and Yan, Qiuhai},
  title     = {Codebook Knowledge with {Mamba-Transformer} For Low-Light Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3720--3729},
}
Illuminating Darkness: Learning to Enhance Low-light Images In-the-Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sharif_2026_WACV,
  author    = {Sharif, S. M. A. and Rehman, Abdur and Abidin, Zain Ul and Dharejo, Fayaz Ali and Timofte, Radu and Naqvi, Rizwan Ali},
  title     = {Illuminating Darkness: Learning to Enhance Low-light Images In-the-Wild},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2263--2272},
}
Food Image Generation on Multi-Noun Categories-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pan_2026_WACV,
  author    = {Pan, Xinyue and Chen, Yuhao and He, Jiangpeng and Zhu, Fengqing},
  title     = {Food Image Generation on Multi-Noun Categories},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5581--5590},
}
FuLLaMa: Training-free Diffusion-based Object Removal with Context Preservation-
[pdf]
[supp]
[bibtex]@InProceedings{Demir_2026_WACV,
  author    = {Demir, Ilke and Ciftci, Umur Aybars},
  title     = {{FuLLaMa}: Training-free Diffusion-based Object Removal with Context Preservation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8563--8573},
}
Augmenting with NeRFs: Fast Relocalization on Densified Datasets-
[pdf]
[supp]
[bibtex]@InProceedings{Tomadakis_2026_WACV,
  author    = {Tomadakis, Michael and Borissova, Rebecca and Zhang, Yuxuan and Koppal, Sanjeev},
  title     = {Augmenting with {NeRFs}: Fast Relocalization on Densified Datasets},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3067--3076},
}
FCC: Fully Connected Correlation for One-Shot Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Moon_2026_WACV,
  author    = {Moon, Seonghyeon and Kong, Haein and Khan, Muhammad Haris and Kapadia, Mubbasir and Lin, Yuewei},
  title     = {{FCC}: Fully Connected Correlation for One-Shot Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4827--4837},
}
Imitating the Functionality of Image-to-Image Models Using a Single Example-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Spingarn_2026_WACV,
  author    = {Spingarn, Nurit and Michaeli, Tomer},
  title     = {Imitating the Functionality of Image-to-Image Models Using a Single Example},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2178--2187},
}
Performance of Conformal Prediction in Capturing Aleatoric Uncertainty-
[pdf]
[supp]
[bibtex]@InProceedings{Hagos_2026_WACV,
  author    = {Hagos, Misgina Tsighe and Lundstr{\"o}m, Claes},
  title     = {Performance of Conformal Prediction in Capturing Aleatoric Uncertainty},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2954--2963},
}
HEART-PFL: Stable Personalized Federated Learning under Heterogeneity with Hierarchical Directional Alignment and Adversarial Knowledge Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Minjun and Kim, Minje},
  title     = {{HEART-PFL}: Stable Personalized Federated Learning under Heterogeneity with Hierarchical Directional Alignment and Adversarial Knowledge Transfer},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3370--3379},
}
ArchitectHead: Continuous Level of Detail Control for 3D Gaussian Head Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2026_WACV,
  author    = {Yan, Peizhi and Ward, Rabab and Tang, Qiang and Du, Shan},
  title     = {{ArchitectHead}: Continuous Level of Detail Control for {3D} {Gaussian} Head Avatars},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1632--1642},
}
Where is the Watermark? Interpretable Watermark Detection at the Block Level-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bulychev_2026_WACV,
  author    = {Bulychev, Maria and Marchant, Neil G. and Rubinstein, Benjamin I. P.},
  title     = {Where is the Watermark? Interpretable Watermark Detection at the Block Level},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7420--7429},
}
HABIT: Human Action Benchmark for Interactive Traffic in CARLA-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramesh_2026_WACV,
  author    = {Ramesh, Mohan and Azer, Mark and Flohr, Fabian},
  title     = {{HABIT}: Human Action Benchmark for Interactive Traffic in {CARLA}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7148--7157},
}
SimForce: Force and Surface Electromyography from Full Body Video with Graph Neural Nets-
[pdf]
[bibtex]@InProceedings{Dasgupta_2026_WACV,
  author    = {Dasgupta, Esha and Kim, Boeun and Yeo, Sang Hoon and Chang, Hyung Jin},
  title     = {{SimForce}: Force and Surface Electromyography from Full Body Video with Graph Neural Nets},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3320--3329},
}
SAFER-AiD: Saccade-Assisted Foveal-peripheral vision Enhanced Reconstruction for Adversarial Defense-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV,
  author    = {Liu, Jiayang and Ts'o, Daniel and Bu, Yiming and Qiu, Qinru},
  title     = {{SAFER-AiD}: Saccade-Assisted Foveal-peripheral vision Enhanced Reconstruction for Adversarial Defense},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1726--1735},
}
Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Frolov_2026_WACV,
  author    = {Frolov, Anton and Rodehorst, Volker},
  title     = {Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7913--7924},
}
Structured Context Learning for Generic Event Boundary Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV,
  author    = {Gu, Xin and Li, Congcong and Wang, Xinyao and Hong, Dexiang and Zhang, Libo and Luo, Tiejian and Wen, Longyin and Fan, Heng},
  title     = {Structured Context Learning for Generic Event Boundary Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4808--4817},
}
A Deep Network for Object Detection on Inland Waters-
[pdf]
[supp]
[bibtex]@InProceedings{Griesser_2026_WACV,
  author    = {Griesser, Dennis and Goldluecke, Bastian and Franz, Matthias O. and Umlauf, Georg},
  title     = {A Deep Network for Object Detection on Inland Waters},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6590--6599},
}
Geo3DVQA: Evaluating Vision-Language Models for 3D Geospatial Reasoning from Aerial Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tsujimoto_2026_WACV,
  author    = {Tsujimoto, Mai and Wang, Junjue and Xuan, Weihao and Yokoya, Naoto},
  title     = {{Geo3DVQA}: Evaluating Vision-Language Models for {3D} Geospatial Reasoning from Aerial Imagery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4994--5003},
}
Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance-
[pdf]
[supp]
[bibtex]@InProceedings{Weerasinghe_2026_WACV,
  author    = {Weerasinghe, Thilina and Tennakoon, Ruwan and Chuah, WeiQin and Bab-Hadiashar, Alireza},
  title     = {Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5977--5985},
}
BlendCLIP: Bridging Synthetic and Real Domains for Zero-Shot 3D Object Classification with Multimodal Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khoche_2026_WACV,
  author    = {Khoche, Ajinkya and Nagy, Gerg{\H{o}} L{\'a}szl{\'o} and Wozniak, Maciej and Gustafsson, Thomas and Jensfelt, Patric},
  title     = {{BlendCLIP}: Bridging Synthetic and Real Domains for Zero-Shot {3D} Object Classification with Multimodal Pretraining},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5766--5775},
}
Saliency-Guided DETR for Moment Retrieval and Highlight Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gordeev_2026_WACV,
  author    = {Gordeev, Aleksandr and Dokholyan, Vladimir and Tolstykh, Irina and Kuprashevich, Maksim},
  title     = {Saliency-Guided {DETR} for Moment Retrieval and Highlight Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {907--916},
}
MooTrack360: A Novel Fisheye Camera Dataset for Robust Multi Diary Cow Detection and Tracking-
[pdf]
[bibtex]@InProceedings{Christiansen_2026_WACV,
  author    = {Christiansen, Rasmus Gjerlund K. and Van Nguyen, Toan and Malsk{\ae}r, Lasse Rose and Bodenhagen, Leon and Kraft, Dirk},
  title     = {{MooTrack360}: A Novel Fisheye Camera Dataset for Robust Multi Diary Cow Detection and Tracking},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {451--460},
}
Histopath-C: Towards Realistic Domain Shifts for Histopathology Vision-Language Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Noori_2026_WACV,
  author    = {Noori, Mehrdad and Hakim, Gustavo A. Vargas and Osowiechi, David and Shakeri, Fereshteh and Bahri, Ali and Yazdanpanah, Moslem and Dastani, Sahar and Ben Ayed, Ismail and Desrosiers, Christian},
  title     = {{Histopath-C}: Towards Realistic Domain Shifts for Histopathology Vision-Language Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4890--4900},
}
Tables Decoded: DELTA for Structure, TARQA for Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Rajput_2026_WACV,
  author    = {Rajput, Jahanvi and Kudale, Dhruv and Kasturi, Saikiran and Verma, Utkarsh and Ramakrishnan, Ganesh},
  title     = {Tables Decoded: {DELTA} for Structure, {TARQA} for Understanding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2775--2785},
}
HumanGuideNet: Adapter-Based Alignment of Deep Neural Networks with Human Similarity Judgments-
[pdf]
[supp]
Key disambiguated: Liu_2026_WACV is already used by the SAFER-AiD entry earlier in this file.
[bibtex]@InProceedings{Liu_2026_WACV_HumanGuideNet,
  author    = {Liu, Xufu and Yang, Yifan and Zhang, Zhengxin},
  title     = {{HumanGuideNet}: Adapter-Based Alignment of Deep Neural Networks with Human Similarity Judgments},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1798--1808},
}
Broadcast2Pitch: Game State Reconstruction from Unconstrained Soccer Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Oo_2026_WACV,
  author    = {Oo, Yin May and Hwang, Yewon and Robbani, Muhammad Amrulloh and Chao, Vanyi and Jamsrandorj, Ankhzaya and Nguyen, Hoang Quoc and Mun, Kyung-Ryoul and Kim, Jinwook},
  title     = {{Broadcast2Pitch}: Game State Reconstruction from Unconstrained Soccer Videos},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4483--4493},
}
Mixed Diffusion for 3D Indoor Scene Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2026_WACV,
  author    = {Hu, Siyi and Arroyo, Diego Mart{\'\i}n and Debats, Stephanie and Manhardt, Fabian and Carlone, Luca and Tombari, Federico},
  title     = {Mixed Diffusion for {3D} Indoor Scene Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1262--1272},
}
NERVE: Neighbourhood & Entropy-Guided Random-Walk for Training Free Open-Vocabulary Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mahatha_2026_WACV,
  author    = {Mahatha, Kunal and Dolz, Jose and Desrosiers, Christian},
  title     = {{NERVE}: Neighbourhood \& Entropy-Guided Random-Walk for Training Free Open-Vocabulary Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3243--3253},
}
PSA-MIL: A Probabilistic Spatial Attention-Based Multiple Instance Learning for Whole Slide Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peled_2026_WACV,
  author    = {Peled, Sharon and Maruvka, Yosef E. and Freiman, Moti},
  title     = {{PSA-MIL}: A Probabilistic Spatial Attention-Based Multiple Instance Learning for Whole Slide Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1211--1220},
}
Diverse Sketch Colorization with Content-Enhanced Style Representation and Recolorization Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Mao_2026_WACV,
  author    = {Mao, Shuangming and Zhu, Haixiang},
  title     = {Diverse Sketch Colorization with Content-Enhanced Style Representation and Recolorization Distillation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1064--1073},
}
STEG-AIW: Spatio-Temporal Gating and Adaptive-Timestep Inference for Efficient Spiking Neural Networks-
[pdf]
[bibtex]@InProceedings{Saju_2026_WACV,
  author    = {Saju, Gulfam Ahmed and Spirkin, Anton and Marcelino, Felipe and Chang, Yuchou},
  title     = {{STEG-AIW}: Spatio-Temporal Gating and Adaptive-Timestep Inference for Efficient Spiking Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4180--4189},
}
Perception-Inspired Color Space Design for Photo White Balance Editing-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV,
  author    = {Cheng, Yang and Cui, Ziteng and Gu, Lin and Su, Shenghan and Zhang, Zenghui},
  title     = {Perception-Inspired Color Space Design for Photo White Balance Editing},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3741--3749},
}
A Framework for Real-Time Surgical Phase Recognition with Application to Robot-Assisted Partial Nephrectomy-
[pdf]
[supp]
[bibtex]@InProceedings{Mezzina_2026_WACV,
  author    = {Mezzina, Marco and Vercauteren, Tom and Tuytelaars, Tinne and Blaschko, Matthew B.},
  title     = {A Framework for Real-Time Surgical Phase Recognition with Application to Robot-Assisted Partial Nephrectomy},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {245--254},
}
WiSE-OD: Benchmarking Robustness in Infrared Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Medeiros_2026_WACV,
  author    = {Medeiros, Heitor R. and Belal, Atif and Aminbeidokhti, Masih and Granger, Eric and Pedersoli, Marco},
  title     = {{WiSE-OD}: Benchmarking Robustness in Infrared Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4912--4921},
}
AuthGuard: Generalizable Deepfake Detection via Language Guidance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shen_2026_WACV,
  author    = {Shen, Guangyu and Li, Zhihua and Xu, Xiang and Zhao, Tianchen and Zhang, Zheng and An, Dongsheng and Tu, Zhuowen and Xing, Yifan and Zhang, Qin},
  title     = {{AuthGuard}: Generalizable Deepfake Detection via Language Guidance},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6215--6225},
}
Improving Out-of-Distribution Detection Using Segmented Images and Cross-View Attention Fusion-
[pdf]
[supp]
[bibtex]@InProceedings{Politowicz_2026_WACV,
  author    = {Politowicz, Alexander and Mazumder, Sahisnu and Liu, Bing},
  title     = {Improving Out-of-Distribution Detection Using Segmented Images and Cross-View Attention Fusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5269--5279},
}
VIZOR: Viewpoint-Invariant Zero-Shot Scene Graph Generation for 3D Scene Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madhavaram_2026_WACV,
  author    = {Madhavaram, Vivek and Sengar, Vartika and De, Arkadipta and Sharma, Charu},
  title     = {{VIZOR}: Viewpoint-Invariant Zero-Shot Scene Graph Generation for {3D} Scene Reasoning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8584--8595},
}
Understanding Generative AI Capabilities in Everyday Image Editing Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Collins_2026_WACV,
  author    = {Collins, Brandon and Taesiri, Mohammad Reza and Bolton, Logan and Lai, Viet Dac and Dernoncourt, Franck and Bui, Trung and Nguyen, Anh Totti},
  title     = {Understanding Generative {AI} Capabilities in Everyday Image Editing Tasks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2231--2241},
}
Gaussian Splatting Map Registration with Orthographic Bird's-Eye-View Renderings-
[pdf]
[supp]
[bibtex]@InProceedings{Leblond_2026_WACV,
  author    = {Leblond, H. and Simon, G. and Martins, R. and Demonceaux, C. and Berger, M.-O.},
  title     = {Gaussian Splatting Map Registration with Orthographic Bird's-Eye-View Renderings},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6080--6089},
}
IPCD: Intrinsic Point-Cloud Decomposition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sato_2026_WACV,
  author    = {Sato, Shogo and Kaneko, Takuhiro and Takeda, Shoichiro and Shimada, Tomoyasu and Murasaki, Kazuhiko and Yoshida, Taiga and Tanida, Ryuichi and Kimura, Akisato},
  title     = {{IPCD}: Intrinsic Point-Cloud Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7094--7103},
}
Diffusion Noise Optimization for Synthetic VLM Training-
[pdf]
[supp]
[bibtex]@InProceedings{Ohkubo_2026_WACV,
  author    = {Ohkubo, Ren and Yanagi, Rintaro and Kataoka, Hirokatsu and Satoh, Yutaka},
  title     = {Diffusion Noise Optimization for Synthetic {VLM} Training},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6412--6421},
}
DCSHARP: 3D Gaussian Splatting with Direction Cosine Spherical Harmonics and Shape-Aware Pruning-
[pdf]
[supp]
[bibtex]@InProceedings{Hasssan_2026_WACV,
  author    = {Hasssan, Ahmed and Meng, Jian and Xiangli, Yuanbo and Seo, Jae-sun},
  title     = {{DCSHARP}: {3D} {Gaussian} Splatting with Direction Cosine Spherical Harmonics and Shape-Aware Pruning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3628--3637},
}
Distilling Diversity and Control in Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gandikota_2026_WACV,
  author    = {Gandikota, Rohit and Bau, David},
  title     = {Distilling Diversity and Control in Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1304--1313},
}
KFS-Bench: Comprehensive Evaluation of Key Frame Sampling in Long Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Zongyao and Ishida, Kengo and Yamazaki, Satoshi and Ji, Xiaotong and Liu, Jianquan},
  title     = {{KFS-Bench}: Comprehensive Evaluation of Key Frame Sampling in Long Video Understanding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5643--5652},
}
TacticalCalib: End-to-End 6-DoF Camera Pose Regression for Tactical Camera Calibration-
[pdf]
[bibtex]@InProceedings{Fan_2026_WACV,
  author    = {Fan, Liang and Liu, Xiaoqian and Chen, Zhi and Yang, Lingkai},
  title     = {{TacticalCalib}: End-to-End {6-DoF} Camera Pose Regression for Tactical Camera Calibration},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6547--6556},
}
FlowCLAS: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV,
  author    = {Lee, Chang Won and Leveugle, Selina and Grouchy, Paul and Langley, Chris and Stolpner, Svetlana and Kelly, Jonathan and Waslander, Steven L.},
  title     = {{FlowCLAS}: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6998--7007},
}
SuperRivolution: Fine-Scale Rivers from Coarse Temporal Satellite Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Daroya_2026_WACV,
  author    = {Daroya, Rangel and Maji, Subhransu},
  title     = {{SuperRivolution}: Fine-Scale Rivers from Coarse Temporal Satellite Imagery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7482--7492},
}
Network-agnostic Distortion-robust Projections for Wide-angle Image Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Athwale_2026_WACV,
  author    = {Athwale, Akshaya and Ahmad, Ola and Lalonde, Jean-Francois},
  title     = {Network-agnostic Distortion-robust Projections for Wide-angle Image Understanding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {591--601},
}
Interleaved Vision-and-Language Generation via Generative Voken-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2026_WACV,
  author    = {Zheng, Kaizhi and He, Xuehai and Wang, Xin Eric},
  title     = {Interleaved Vision-and-Language Generation via Generative Voken},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {472--482},
}
R-MMA: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV,
  author    = {Fahim, Md and Ishmam, Md Farhan and Hossain, Mir Sazzat and Amin, M Ashraful and Ali, Amin Ahsan and Rahman, AKM Mahbubur},
  title     = {{R-MMA}: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6496--6506},
}
TRACE: Confounder-free Adversarial Fine-tuning for Robust Object Detection-
[pdf]
[supp]
Key disambiguated: Lee_2026_WACV is already used by the FlowCLAS entry earlier in this file.
[bibtex]@InProceedings{Lee_2026_WACV_TRACE,
  author    = {Lee, Wonho and Lee, Jisu and Na, Hyunsik and Park, Sohee and Choi, Daeseon},
  title     = {{TRACE}: Confounder-free Adversarial Fine-tuning for Robust Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6705--6714},
}
PrevMatch: Revisiting and Maximizing Temporal Knowledge in Semi-Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shin_2026_WACV,
  author    = {Shin, Wooseok and Park, Hyun Joon and Kim, Jin Sob and Yun, Juan and Park, Se Hong and Han, Sung Won},
  title     = {{PrevMatch}: Revisiting and Maximizing Temporal Knowledge in Semi-Supervised Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4953--4963},
}
SaccadeX: Directed Acyclic Graph-based Semi-Supervised Learning of Continuous Ocular Dynamics from Sparse Neuromorphic Streams-
[pdf]
[supp]
[bibtex]@InProceedings{Bandara_2026_WACV,
  author    = {Bandara, Nuwan and Kandappu, Thivya and Misra, Archan},
  title     = {{SaccadeX}: Directed Acyclic Graph-based Semi-Supervised Learning of Continuous Ocular Dynamics from Sparse Neuromorphic Streams},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1384--1394},
}
CAAC: Confidence-Aware Attention Calibration to Reduce Hallucinations in Large Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Fazli_2026_WACV,
  author    = {Fazli, Mehrdad and Wei, Bowen and Sari, Ahmet and Zhu, Ziwei},
  title     = {{CAAC}: Confidence-Aware Attention Calibration to Reduce Hallucinations in Large Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1242--1251},
}
UCDSC: Open Set UnCertainty aware Deep Simplex Classifier for Medical Image Datasets-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aditya_2026_WACV,
  author    = {Aditya, Arnav and Kumar, Nitin and Shigwan, Saurabh},
  title     = {{UCDSC}: Open Set {UnCertainty} aware Deep Simplex Classifier for Medical Image Datasets},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4787--4796},
}
SOLAR: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tareen_2026_WACV,
  author    = {Tareen, Shaharyar Ahmed Khan and Fan, Lei and Yuan, Xiaojing and Lin, Qin and Hu, Bin},
  title     = {{SOLAR}: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7893--7902},
}
Towards Streaming LiDAR Object Detection with Point Clouds as Egocentric Sequences-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV,
  author    = {Zhang, Mellon M. and Chou, Glen and Mukhopadhyay, Saibal},
  title     = {Towards Streaming {LiDAR} Object Detection with Point Clouds as Egocentric Sequences},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3275--3284},
}
Subspace-Guided Knowledge Distillation for Efficient Model Transfer-
[pdf]
[bibtex]@InProceedings{Hayder_2026_WACV,
  author    = {Hayder, Zeeshan and Cheraghian, Ali and Petersson, Lars and Harandi, Mehrtash},
  title     = {Subspace-Guided Knowledge Distillation for Efficient Model Transfer},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5057--5066},
}
DexAvatar: 3D Sign Language Reconstruction with Hand and Body Pose Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Kundu_2026_WACV,
  author    = {Kundu, Kaustubh and Barua, Hrishav Bakul and Robertson-Bell, Lucy and Cai, Zhixi and Stefanov, Kalin},
  title     = {{DexAvatar}: {3D} Sign Language Reconstruction with Hand and Body Pose Priors},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5842--5852},
}
EmojiDiff: Advanced Facial Expression Control with High Identity Preservation in Portrait Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2026_WACV,
  author    = {Jiang, Liangwei and Li, Ruida and Zhang, Zhifeng and Fang, Shuo and Ma, Chenguang},
  title     = {{EmojiDiff}: Advanced Facial Expression Control with High Identity Preservation in Portrait Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {328--338},
}
FairScene: Learning Class-Disentangled 2D/3D Representations for Semantic Scene Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Jia_2026_WACV,
  author    = {Jia, Dian and Yu, Pei and Tang, Wei},
  title     = {{FairScene}: Learning Class-Disentangled {2D/3D} Representations for Semantic Scene Completion},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3760--3770},
}
A Universal Self-Attention Enhancement for Bridging Low-bit Quantization and Vision Transformers-
[pdf]
[bibtex]@InProceedings{Qian_2026_WACV,
  author    = {Qian, Jiahe and Wang, Peisong and Zhuge, Zhengyang and Hu, Qinghao and Cheng, Jian},
  title     = {A Universal Self-Attention Enhancement for Bridging Low-bit Quantization and Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {360--370},
}
SegMo: Segment-aligned Text to 3D Human Motion Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dang_2026_WACV,
  author    = {Dang, Bowen and Wu, Lin and Yang, Xiaohang and Yuan, Zheng and Chen, Zhixiang},
  title     = {{SegMo}: Segment-aligned Text to {3D} Human Motion Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6946--6955},
}
SceneProp: Combining Neural Network and Markov Random Field for Scene-Graph Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Otani_2026_WACV,
  author    = {Otani, Keita and Harada, Tatsuya},
  title     = {{SceneProp}: Combining Neural Network and {Markov} Random Field for Scene-Graph Grounding},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6153--6162},
}
JOCA: Task-Driven Joint Optimisation of Camera Hardware and Adaptive Camera Control Algorithms-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2026_WACV,
  author    = {Yan, Chengyang and Bryson, Mitch and Dansereau, Donald G.},
  title     = {{JOCA}: Task-Driven Joint Optimisation of Camera Hardware and Adaptive Camera Control Algorithms},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3928--3938},
}
TiCLS: Tightly Coupled Language Text Spotter-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jang_2026_WACV,
  author    = {Jang, Leeje and Lin, Yijun and Chiang, Yao-Yi and Weinman, Jerod},
  title     = {{TiCLS}: Tightly Coupled Language Text Spotter},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3730--3740},
}
WiSAR3D - Aerial LiDAR Dataset for 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Shrout_2026_WACV,
  author    = {Shrout, Oren and Nizan, Ori and Ben-Shabat, Yizhak and Tal, Ayellet},
  title     = {{WiSAR3D} - Aerial {LiDAR} Dataset for {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6580--6589},
}
ORCA: Object Recognition and Comprehension for Archiving Marine Species-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wong_2026_WACV,
  author    = {Wong, Yuk-Kwan and Liang, Haixin and Ma, Zeyu and Chen, Yiwei and Zheng, Ziqiang and Gotama, Rinaldi and Sebastian, Pascal and Sparks, Lauren D. and Yeung, Sai-Kit},
  title     = {{ORCA}: Object Recognition and Comprehension for Archiving Marine Species},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1597--1609},
}
Unsupervised Modular Adaptive Region Growing and RegionMix Classification for Wind Turbine Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Perez-Gonzalo_2026_WACV,
  author    = {P{\'e}rez-Gonzalo, Ra{\"u}l and Magro, Riccardo and Espersen, Andreas and Agudo, Antonio},
  title     = {Unsupervised Modular Adaptive Region Growing and {RegionMix} Classification for Wind Turbine Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3878--3888},
}
Learnable Query-Enhanced Pose Transformation-
[pdf]
[bibtex]@InProceedings{Wang_2026_WACV,
  author    = {Wang, Yi-Zhen and Shuai, Hong-Han},
  title     = {Learnable Query-Enhanced Pose Transformation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2032--2041},
}
Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV,
  author    = {Wu, Weiyi and Xu, Xinwen and Gao, Chongyang and Diao, Xingjian and Li, Siting and Gui, Jiang},
  title     = {Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8639--8649},
}
Co-STAR: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dadashzadeh_2026_WACV,
  author    = {Dadashzadeh, Amirhossein and Esmati, Parsa and Mirmehdi, Majid},
  title     = {{Co-STAR}: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7821--7831},
}
A Novel Metric for Detecting Memorization in Generative Models for Brain MRI Synthesis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Scardace_2026_WACV,
  author    = {Scardace, Antonio and Puglisi, Lemuel and Guarnera, Francesco and Battiato, Sebastiano and Ravi, Daniele},
  title     = {A Novel Metric for Detecting Memorization in Generative Models for Brain {MRI} Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3868--3877},
}
FLoMo-Net: A Novel Task-Adaptive Mixture of Experts Routing Framework with Frequency and Uncertainty Correction for Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Ahmed_2026_WACV,
  author    = {Ahmed, Md Rayhan and Lasserre, Patricia},
  title     = {{FLoMo-Net}: A Novel Task-Adaptive Mixture of Experts Routing Framework with Frequency and Uncertainty Correction for Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4025--4035},
}
Detecting Out-of-Distribution Objects through Class-Conditioned Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Quang-Huy and Zhou, Jin Peng and Liu, Zhenzhen and Bui, Khanh-Huyen and Weinberger, Kilian Q. and Chao, Wei-Lun and Le, Dung D.},
  title     = {Detecting Out-of-Distribution Objects through Class-Conditioned Inpainting},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1937--1947},
}
GrounDiff: Diffusion-Based Ground Surface Generation from Digital Surface Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhaouadi_2026_WACV,
  author    = {Dhaouadi, Oussema and Meier, Johannes and Kaiser, Jacques and Cremers, Daniel},
  title     = {{GrounDiff}: Diffusion-Based Ground Surface Generation from Digital Surface Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1355--1364},
}
QuEENet: Quantum-Enhanced Expressive Network for Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Bayal_2026_WACV,
  author    = {Bayal, Shashank and Dawane, Rushikesh Govind and Komal, Komal and Vipparthi, Santosh Kumar and Murala, Subrahmanyam},
  title     = {{QuEENet}: Quantum-Enhanced Expressive Network for Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7883--7892},
}
What Happens When: Learning Temporal Orders of Events in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahn_2026_WACV,
  author    = {Ahn, Daechul and Choi, Yura and Choi, Hyeonbeom and Cho, Seongwon and Kim, San and Choi, Jonghyun},
  title     = {What Happens When: Learning Temporal Orders of Events in Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2786--2796},
}
Identity Verification from Human Scent using Channel Representation of 2D Gas Chromatography-Mass Spectrometry Data-
[pdf]
[supp]
[bibtex]@InProceedings{Spetlik_2026_WACV,
  author    = {Spetlik, Radim and Hlavsa, Jan and {\v{C}}echov{\'a}, Jana and Pojmanov{\'a}, Petra and Matas, Jiri and Urban, {\v{S}}t{\v{e}}p{\'a}n},
  title     = {Identity Verification from Human Scent using Channel Representation of {2D} Gas Chromatography-Mass Spectrometry Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1471--1480},
}
CLUE: Bringing Machine Unlearning to Mobile Devices-
[pdf]
[supp]
[bibtex]@InProceedings{Sayyed_2026_WACV,
  author    = {Sayyed, A. Q. M. Sazzad and Bastian, Nathaniel D. and De Lucia, Michael and Swami, Ananthram and Restuccia, Francesco},
  title     = {{CLUE}: Bringing Machine Unlearning to Mobile Devices},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3750--3759},
}
SHaSaM: Submodular Hard Sample Mining for Fair Facial Attribute Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Majee_2026_WACV,
  author    = {Majee, Anay and Iyer, Rishabh},
  title     = {{SHaSaM}: Submodular Hard Sample Mining for Fair Facial Attribute Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7461--7471},
}
Unified Control for Inference-Time Guidance of Denoising Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Goyal_2026_WACV,
  author    = {Goyal, Maurya and Singh, Anuj and Jamali-Rad, Hadi},
  title     = {Unified Control for Inference-Time Guidance of Denoising Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5437--5446},
}
Hierarchical Adaptive networks with Task vectors for Test-Time Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Ambekar_2026_WACV,
  author    = {Ambekar, Sameer and Hasny, Marta and Daza, Laura Alexandra and Lang, Daniel M. and Schnabel, Julia},
  title     = {Hierarchical Adaptive networks with Task vectors for Test-Time Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4661--4672},
}
SGD-Mix: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2026_WACV,
  author    = {Dong, Yixuan and Su, Fang-Yi and Chiang, Jung-Hsien},
  title     = {{SGD-Mix}: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7051--7061},
}
Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2026_WACV,
  author    = {Yang, Fan and Xie, Quanting and Moteki, Atsunori and Masui, Shoichi and Jiang, Shan and Uchino, Kanji and Bisk, Yonatan and Neubig, Graham},
  title     = {Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5821--5832},
}
DoTA: Latent Distribution Conditioned Data Attribution for Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Joshi_2026_WACV,
  author    = {Joshi, Ninad and Srivastava, Vivek and Karande, Shirish},
  title     = {{DoTA}: Latent Distribution Conditioned Data Attribution for Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2022--2031},
}
Face-LLaVA: Facial Expression and Attribute Understanding through Instruction Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chaubey_2026_WACV,
  author    = {Chaubey, Ashutosh and Guan, Xulang and Soleymani, Mohammad},
  title     = {{Face-LLaVA}: Facial Expression and Attribute Understanding through Instruction Tuning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2648--2660},
}
Revisiting an Old Perspective Projection for Monocular 3D Morphable Models Regression-
[pdf]
[bibtex]@InProceedings{Chong_2026_WACV,
  author    = {Chong, Toby and Nakajima, Ryota},
  title     = {Revisiting an Old Perspective Projection for Monocular {3D} Morphable Models Regression},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7799--7808},
}
SafeguardGS: 3D Gaussian Primitive Pruning While Avoiding Catastrophic Scene Destruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV,
  author    = {Lee, Yongjae and Zhang, Zhaoliang and Fan, Deliang},
  title     = {{SafeguardGS}: {3D} {Gaussian} Primitive Pruning While Avoiding Catastrophic Scene Destruction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8479--8489},
}
UI-Styler: Ultrasound Image Style Transfer with Class-Aware Prompts for Cross-Device Diagnosis Using a Frozen Black-Box Inference Network-
[pdf]
[supp]
[bibtex]@InProceedings{Do-Tran_2026_WACV,
  author    = {Do-Tran, Nhat-Tuong and Le, Ngoc-Hoang-Lam and Huang, Ching-Chun},
  title     = {{UI-Styler}: Ultrasound Image Style Transfer with Class-Aware Prompts for Cross-Device Diagnosis Using a Frozen Black-Box Inference Network},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2765--2774},
}
Dressing the Imagination: A Dataset for AI-Powered Translation of Text into Fashion Outfits and A Novel NeRA Adapter for Enhanced Feature Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deshmukh_2026_WACV,
  author    = {Deshmukh, Gayatri and De, Somsubhra and Sehgal, Chirag and Gupta, Jishu Sen and Mittal, Sparsh},
  title     = {Dressing the Imagination: A Dataset for {AI}-Powered Translation of Text into Fashion Outfits and A Novel {NeRA} Adapter for Enhanced Feature Adaptation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2094--2103},
}
SENCA-st: Integrating Spatial Transcriptomics and Histopathology with Cross Attention Shared Encoder for Region Identification in Cancer Pathology-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liyanaarachchi_2026_WACV,
  author    = {Liyanaarachchi, Shanaka and Wijethunga, Chathurya and Ahamed, Shihab Aaqil and Absar, Akthas and Rodrigo, Ranga},
  title     = {{SENCA-st}: Integrating Spatial Transcriptomics and Histopathology with Cross Attention Shared Encoder for Region Identification in Cancer Pathology},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3578--3587},
}
UniDiff: Parameter-Efficient Adaptation of Diffusion Models for Land Cover Classification with Multi-Modal Remotely Sensed Imagery and Sparse Annotations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2026_WACV,
  author    = {Hu, Yuzhen and Prasad, Saurabh},
  title     = {{UniDiff}: Parameter-Efficient Adaptation of Diffusion Models for Land Cover Classification with Multi-Modal Remotely Sensed Imagery and Sparse Annotations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4611--4620},
}
Show Me: Unifying Instructional Image and Video Generation with Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pu_2026_WACV,
  author    = {Pu, Yujiang and Huang, Zhanbo and Boddeti, Vishnu and Kong, Yu},
  title     = {Show Me: Unifying Instructional Image and Video Generation with Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3285--3296},
}
Marshaled Learning: Bridging Large Neural Networks with Memory-Constrained Trusted Execution Environments in Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ding_2026_WACV,
  author    = {Ding, Shiwei and Yuan, Xiaoyong and Wang, Zhenlin and Zhang, Lan Emily and Ateniese, Giuseppe},
  title     = {Marshaled Learning: Bridging Large Neural Networks with Memory-Constrained Trusted Execution Environments in Federated Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {647--656},
}
Reconstructing Realistic and Relightable Eyes-
[pdf]
[supp]
[bibtex]@InProceedings{Khademi_2026_WACV,
  author    = {Khademi, Wesley and Kundu, Jogendra and An, Yatong and Fix, Alexander and Colmenares, David},
  title     = {Reconstructing Realistic and Relightable Eyes},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2242--2252},
}
Deep Image Decomposition for Medical Imaging Anonymization and Curation-
[pdf]
[supp]
[bibtex]@InProceedings{Elkin_2026_WACV,
  author    = {Elkin, Yael and Ben-Arie, Gal and Riklin-Raviv, Tammy},
  title     = {Deep Image Decomposition for Medical Imaging Anonymization and Curation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7229--7238},
}
An Efficient Multi-Rater Setup Towards Personalized and Diversified Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Almorsy_2026_WACV,
  author    = {Almorsy, Sajed and Khalafallah, Ayman and Torki, Marwan},
  title     = {An Efficient Multi-Rater Setup Towards Personalized and Diversified Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5322--5331},
}
Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images-
[pdf]
[supp]
[bibtex]@InProceedings{Bonyani_2026_WACV,
  author    = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao},
  title     = {Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6936--6945},
}
GRAPE (Gaussian Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Jang_2026_WACV,
  author    = {Jang, Jung In and Jin, Kyong Hwan},
  title     = {{GRAPE} ({Gaussian} Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7750--7758},
}
@comment{NOTE(review): the key Jang_2026_WACV is also used by the TiCLS entry earlier in this listing; disambiguate the keys before loading both entries into one database.}
HodgeFormer: Transformers for Learnable Operators on Triangular Meshes through Data-Driven Hodge Matrices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nousias_2026_WACV,
  author    = {Nousias, Akis and Nousias, Stavros},
  title     = {{HodgeFormer}: Transformers for Learnable Operators on Triangular Meshes through Data-Driven {Hodge} Matrices},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6796--6805},
}
Revisiting Vision-Language Foundations for No-Reference Image Quality Assessment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yadav_2026_WACV,
  author    = {Yadav, Ankit and Huy, Ta Duc and Liu, Lingqiao},
  title     = {Revisiting Vision-Language Foundations for No-Reference Image Quality Assessment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5416--5425},
}
PS3: Part Level Instance Segmentation in 3D-
[pdf]
[supp]
[bibtex]@InProceedings{Yen_2026_WACV,
  author    = {Yen, Hong-Xuan and Chen, Chiamin and Wang, Yanqing and Liu, Yu-Lun and Sun, Min},
  title     = {{PS3}: Part Level Instance Segmentation in {3D}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {898--906},
}
UNO: Unifying One-stage Video Scene Graph Generation via Object-Centric Visual Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_2026_WACV,
  author    = {Le, Huy and Chung, Nhat and Kieu, Tung and Yang, Jingkang and Le, Ngan},
  title     = {{UNO}: Unifying One-stage Video Scene Graph Generation via Object-Centric Visual Representation Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2797--2807},
}
ITSELF: Attention Guided Fine-Grained Alignment for Vision-Language Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Tien-Huy and Tran, Huu-Loc and Ngo, Thanh Duc},
  title     = {{ITSELF}: Attention Guided Fine-Grained Alignment for Vision-Language Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1448--1458},
}
@comment{NOTE(review): the key Nguyen_2026_WACV is also used by the Class-Conditioned Inpainting entry earlier in this listing; disambiguate the keys before loading both entries into one database.}
Structure-Aware Feature Rectification with Region Adjacency Graphs for Training-free Open-Vocabulary Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2026_WACV,
  author    = {Huang, Qiming and Ai, Hao and Jiao, Jianbo},
  title     = {Structure-Aware Feature Rectification with Region Adjacency Graphs for Training-free Open-Vocabulary Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4118--4127},
}
Uplifting Table Tennis: A Robust, Real-World Application for 3D Trajectory and Spin Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kienzle_2026_WACV,
  author    = {Kienzle, Daniel and Ludwig, Katja and Lorenz, Julian and Satoh, Shin'Ichi and Lienhart, Rainer},
  title     = {Uplifting Table Tennis: A Robust, Real-World Application for {3D} Trajectory and Spin Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7440--7449},
}
Empowering Source-Free Domain Adaptation via MLLM-Guided Reliability-Based Curriculum Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV,
  author    = {Chen, Dongjie and Patwari, Kartik and Lai, Zhengfeng and Zhu, Xiaoguang and Cheung, Sen-ching and Chuah, Chen-Nee},
  title     = {Empowering Source-Free Domain Adaptation via {MLLM}-Guided Reliability-Based Curriculum Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4262--4272},
}
LighthouseGS: Indoor Structure-aware 3D Gaussian Splatting for Panorama-Style Mobile Captures-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2026_WACV,
  author    = {Han, Seungoh and Jang, Jaehoon and Kim, Hyunsu and Surh, Jaeheung and Kwak, Junhyung and Ha, Hyowon and Joo, Kyungdon},
  title     = {{LighthouseGS}: Indoor Structure-aware {3D} {Gaussian} Splatting for Panorama-Style Mobile Captures},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3441--3450},
}
@comment{NOTE(review): the key Han_2026_WACV is also used by the ATM text-to-motion entry at the top of this listing; disambiguate the keys before loading both entries into one database.}
Mitigating Object and Action Hallucinations in Multimodal LLMs via Self-Augmented Contrastive Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chang_2026_WACV,
  author    = {Chang, Kai-Po and Cheng, Wei-Yuan and Huang, Chi-Pin and Yang, Fu-En and Wang, Yu-Chiang Frank},
  title     = {Mitigating Object and Action Hallucinations in Multimodal {LLMs} via Self-Augmented Contrastive Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3172--3181},
}
Segmentation-Aware Latent Diffusion for Satellite Image Super-Resolution: Enabling Smallholder Farm Boundary Delineation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Agarwal_2026_WACV,
  author    = {Agarwal, Aditi and Jain, Anjali and Saxena, Nikita and Deshpande, Ishan and Kazmierski, Michal and Annkah, Abigail and Sherman, Nadav and Shanmugam, Karthikeyan and Talekar, Alok and Rajan, Vaibhav},
  title     = {Segmentation-Aware Latent Diffusion for Satellite Image Super-Resolution: Enabling Smallholder Farm Boundary Delineation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1864--1874},
}
Eff-GRot: Efficient and Generalizable Rotation Estimation with Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mathioulakis_2026_WACV,
  author    = {Mathioulakis, Fanis and Radevski, Gorjan and Tuytelaars, Tinne},
  title     = {{Eff-GRot}: Efficient and Generalizable Rotation Estimation with Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {412--421},
}
Roadside Monocular 3D Detection Prompted by 2D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2026_WACV,
  author    = {Ma, Yechi and Hua, Wei and Li, Yanan and Kong, Shu},
  title     = {Roadside Monocular {3D} Detection Prompted by {2D} Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1895--1905},
}
Divide and Refine: Enhancing Multimodal Representation and Explainability for Emotion Recognition in Conversation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mai_2026_WACV,
  author    = {Mai, Anh-Tuan and Nguyen, Cam-Van Thi and Le, Duc-Trong},
  title     = {Divide and Refine: Enhancing Multimodal Representation and Explainability for Emotion Recognition in Conversation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {2700--2709},
}
End-to-End Fine-Tuning of 3D Texture Generation using Differentiable Rewards-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zamani_2026_WACV,
  author    = {Zamani, AmirHossein and Xie, Tianhao and Aghdam, Amir G. and Popa, Tiberiu and Belilovsky, Eugene},
  title     = {End-to-End Fine-Tuning of {3D} Texture Generation using Differentiable Rewards},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {171--180},
}
ImageNet-sES: A First Systematic Study of Sensor-Environment Simulation Anchored by Real Recaptures-
[pdf]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Ji-yoon and Baek, Eunsu and Kim, Hyung-Sin},
  title     = {{ImageNet-sES}: A First Systematic Study of Sensor-Environment Simulation Anchored by Real Recaptures},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1117--1126},
}
LVM-Lite: Training Large Vision Models with Efficient Sequential Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Xianhang and Zhu, Hongru and Ren, Sucheng and Yang, Linjie and Wang, Peng and Wang, Heng and Shen, Xiaohui and Liu, Qing and Xie, Cihang},
  title     = {{LVM-Lite}: Training Large Vision Models with Efficient Sequential Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4566--4576},
}
MEDAL: multi-modal MEta-space Distillation and ALignment for Visual Compatibility Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Sanny_2026_WACV,
  author    = {Sanny, Dween Rabius and Verma, Vinay Kumar and Sircar, Prateek and Gupta, Deepak},
  title     = {{MEDAL}: multi-modal {MEta-space} Distillation and {ALignment} for Visual Compatibility Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {888--897},
}
Rank-based Geographical Regularization: Revisiting Contrastive Self-Supervised Learning for Multispectral Remote Sensing Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Burgert_2026_WACV,
  author    = {Burgert, Tom and Hackel, Leonard and Rota, Paolo and Demir, Beg{\"u}m},
  title     = {Rank-based Geographical Regularization: Revisiting Contrastive Self-Supervised Learning for Multispectral Remote Sensing Imagery},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4375--4385},
}
LiDAR-DHMT: LiDAR-Adaptive Dual Hierarchical Mask Transformer for Robust Freespace Detection and Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Chen_2026_WACV,
  author    = {Chen, Siyu and Han, Ting and Zhang, Changshe and Luo, Xin and Chen, Huan and Wu, Meiliu and Cai, Guorong and Su, Jinhe},
  title     = {{LiDAR-DHMT}: {LiDAR}-Adaptive Dual Hierarchical Mask Transformer for Robust Freespace Detection and Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {1252--1261},
}
@comment{NOTE(review): the key Chen_2026_WACV is also used by the MLLM-Guided Curriculum Learning entry earlier in this listing; disambiguate the keys before loading both entries into one database.}
SCATR: Mitigating New Instance Suppression in LiDAR-based Tracking-by-Attention via Second Chance Assignment and Track Query Dropout-
[pdf]
[supp]
[bibtex]@InProceedings{Cheong_2026_WACV,
  author    = {Cheong, Brian and Wang, Letian and Papais, Sandro and Waslander, Steven L.},
  title     = {{SCATR}: Mitigating New Instance Suppression in {LiDAR}-based Tracking-by-Attention via Second Chance Assignment and Track Query Dropout},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3330--3339},
}
GeneVA: A Dataset of Human Annotations for Generative Text to Video Artifacts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2026_WACV,
  author    = {Kang, Jenna and Silva, Maria Beatriz and Sangkloy, Patsorn and Chen, Kenneth and Williams, Niall L. and Sun, Qi},
  title     = {{GeneVA}: A Dataset of Human Annotations for Generative Text to Video Artifacts},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6174--6183},
}
Domain Generalizing DINO for Visual Regression via Latent Distractor Subspace Consistency-
[pdf]
[supp]
[bibtex]@InProceedings{Reddy_2026_WACV,
  author    = {Reddy, Nikhil and Arora, Chetan and Baktashmotlagh, Mahsa},
  title     = {Domain Generalizing {DINO} for Visual Regression via Latent Distractor Subspace Consistency},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {4057--4066},
}
Dragonite: Single-Step Drag-based Image Editing with Geometric-Semantic Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Jhong_2026_WACV,
  author    = {Jhong, Meng-Ting and Huang, Tai-Ming and Chen, Shang-Fu and Cheng, Wen-Huang and Hua, Kai-Lung},
  title     = {Dragonite: Single-Step Drag-based Image Editing with Geometric-Semantic Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {3057--3066},
}
Synthesizing Compositional Videos from Text Description-
[pdf]
[supp]
[bibtex]@InProceedings{Singh_2026_WACV,
  author    = {Singh, Prajwal and Kulkarni, Kuldeep and Raman, Shanmuganathan and Rangwani, Harsh},
  title     = {Synthesizing Compositional Videos from Text Description},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6775--6784},
}
Layout Anything: One Transformer for Universal Room Layout Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mia_2026_WACV,
  author    = {Mia, Md Sohag and Adnan, Muhammad Abdullah},
  title     = {Layout Anything: One Transformer for Universal Room Layout Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1565--1574},
}
TS-PCI: Point Cloud Frame Interpolation with Time-Aware Point Cloud Sampling and Self-Supervised Learning Strategy-
[pdf]
[bibtex]@InProceedings{Matsuzaki_2026_WACV,
  author    = {Matsuzaki, Kohei and Nonaka, Keisuke},
  title     = {{TS-PCI}: Point Cloud Frame Interpolation with Time-Aware Point Cloud Sampling and Self-Supervised Learning Strategy},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {54--65},
}
UniCoRN: Latent Diffusion-based Unified Controllable Image Restoration Network across Multiple Degradations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mandal_2026_WACV,
  author    = {Mandal, Debabrata and Chattopadhyay, Soumitri and Tong, Guansen and Chakravarthula, Praneeth},
  title     = {{UniCoRN}: Latent Diffusion-based Unified Controllable Image Restoration Network across Multiple Degradations},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1543--1553},
}
MergeSlide: Continual Model Merging and Task-to-Class Prompt-Aligned Inference for Lifelong Learning on Whole Slide Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bui_2026_WACV,
  author    = {Bui, Doanh C. and Ngo, Ba Hung and Pham, Hoai Luan and Nguyen, Khang and Nguyen, Ma{\"\i} K. and Nakashima, Yasuhiko},
  title     = {{MergeSlide}: Continual Model Merging and Task-to-Class Prompt-Aligned Inference for Lifelong Learning on Whole Slide Images},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4859--4868},
}
Quantifying the Limits of Segmentation Foundation Models: Modeling Challenges in Segmenting Tree-Like and Low-Contrast Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV,
  author    = {Zhang, Yixin and Konz, Nicholas and Kramer, Kevin and Mazurowski, Maciej A.},
  title     = {Quantifying the Limits of Segmentation Foundation Models: Modeling Challenges in Segmenting Tree-Like and Low-Contrast Objects},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5205--5215},
}
Spec-Gloss Surfels and Normal-Diffuse Priors for Relightable Glossy Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kouros_2026_WACV,
  author    = {Kouros, Georgios and Wu, Minye and Tuytelaars, Tinne},
  title     = {Spec-Gloss Surfels and Normal-Diffuse Priors for Relightable Glossy Objects},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4417--4426},
}
WorkZone3D: A Multimodal Dataset for 3D Work Zone Perception in Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Sural_2026_WACV,
  author    = {Sural, Shounak and Sahu, Nishad and Rajkumar, Ragunathan},
  title     = {{WorkZone3D}: A Multimodal Dataset for {3D} Work Zone Perception in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3972--3981},
}
Learning Compact Video Representations for Efficient Long-form Video Understanding in Large Multimodal Models-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2026_WACV,
  author    = {Chen, Yuxiao and Wang, Jue and Zhang, Zhikang and Yi, Jingru and Zhang, Xu and Zou, Yang and Cai, Zhaowei and Yuan, Jianbo and Li, Xinyu and Yang, Hao and Modolo, Davide},
  title     = {Learning Compact Video Representations for Efficient Long-form Video Understanding in Large Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4242--4252},
}
CURIO: Curvature-Aligned and Efficient OCR for Low-Resource Historical Manuscripts-
[pdf]
[supp]
[bibtex]@InProceedings{Gunda_2026_WACV,
  author    = {Gunda, Sai Madhusudan and Ghosh, Tathagata and Sandral, Simran Singh and Sarvadevabhatla, Ravi Kiran},
  title     = {{CURIO}: Curvature-Aligned and Efficient {OCR} for Low-Resource Historical Manuscripts},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2011--2021},
}
Surgical Gaussian Surfels: Highly Accurate Real-time Surgical Scene Rendering using Gaussian Surfels-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sunmola_2026_WACV,
  author    = {Sunmola, Idris O. and Zhao, Zhenjun and Schmidgall, Samuel and Wang, Yumeng and Scheikl, Paul Maria and Pham, Viet and Krieger, Axel},
  title     = {Surgical {Gaussian} Surfels: Highly Accurate Real-time Surgical Scene Rendering using {Gaussian} Surfels},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4515--4524},
}
InteracTalker: Prompt-Based Human-Object Interaction with Co-Speech Gesture Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rajan_2026_WACV,
  author    = {Rajan, Sreehari and Bhosikar, Kunal and Sharma, Charu},
  title     = {{InteracTalker}: Prompt-Based Human-Object Interaction with Co-Speech Gesture Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1438--1447},
}
SSMT-Net: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images-
[pdf]
[bibtex]@InProceedings{Farooq_2026_WACV,
  author    = {Farooq, Muhammad Umar and Rehman, Abd Ur and Rehman, Azka and Usman, Muhammad and Chae, Dong-Kyu},
  title     = {{SSMT-Net}: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6069--6079},
}
SAVE: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV,
  author    = {Park, Sangha and Yoo, Seungryong and Mok, Jisoo and Yoon, Sungroh},
  title     = {{SAVE}: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7935--7944},
}
Non-Aligned Reference Image Quality Assessment for Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghildyal_2026_WACV,
  author    = {Ghildyal, Abhijay and Sureddi, Rajesh and Barman, Nabajeet and Zadtootaghaj, Saman and Bovik, Alan C},
  title     = {Non-Aligned Reference Image Quality Assessment for Novel View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6350--6359},
}
PSDiffusion: Harmonized Multi-Layer Image Generation via Layout and Appearance Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2026_WACV,
  author    = {Huang, Dingbang and Li, Wenbo and Zhao, Yifei and Pan, Xinyu and Zeng, Yanhong and Dai, Bo},
  title     = {{PSDiffusion}: Harmonized Multi-Layer Image Generation via Layout and Appearance Alignment},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3233--3242},
}
HiMix : Hierarchical Visual-Textual Mixing Network for Lesion Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Hwang_2026_WACV,
  author    = {Hwang, Soojin and Sim, Jaeyoon and Kim, Won Hwa},
  title     = {{HiMix} : Hierarchical Visual-Textual Mixing Network for Lesion Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5332--5341},
}
EllipssianNet: Image-guided Sampling of 2D Gaussians for Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, MyoungGon and Ahn, JeongHyeon and Park, Seohyeon and Kim, Hyemi and Park, Seunghyun and Hwang, Jung Ho and Han, JungHyun},
  title     = {{EllipssianNet}: Image-guided Sampling of {2D} {Gaussians} for {Gaussian} Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2104--2113},
}
BAFLE-DCT: Bypassing Adversarial Filters via Frequency-Selective Embedding in the DCT Domain-
[pdf]
[bibtex]@InProceedings{Mendis_2026_WACV,
  author    = {Mendis, Thilina and Kandah, Farah and Aakur, Sathyanarayanan N.},
  title     = {{BAFLE-DCT}: Bypassing Adversarial Filters via Frequency-Selective Embedding in the {DCT} Domain},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5967--5976},
}
SSplain: Sparse and Smooth Explainer for Retinopathy of Prematurity Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sunger_2026_WACV,
  author    = {Sunger, Elifnur and Imbiriba, Tales and Campbell, Peter and Erdogmus, Deniz and Ioannidis, Stratis and Dy, Jennifer},
  title     = {{SSplain}: Sparse and Smooth Explainer for Retinopathy of Prematurity Classification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1705--1715},
}
VLMDiff: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hicsonmez_2026_WACV,
  author    = {Hicsonmez, Samet and El Rahman Shabayek, Abd and Aouada, Djamila},
  title     = {{VLMDiff}: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6309--6319},
}
MapVerse: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhat_2026_WACV,
  author    = {Bhat, Sharat and Khandelwal, Harshita and Kataria, Tushar and Gupta, Vivek},
  title     = {{MapVerse}: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8168--8178},
}
Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV,
  author    = {Gu, Pengfei and Li, Huimin and Tang, Haoteng and Xu, Dongkuan and Enriquez, Erik and Kim, DongChul and Fu, Bin and Chen, Danny Z},
  title     = {Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8660--8669},
}
FlyPose: Towards Robust Human Pose Estimation From Aerial Views-
[pdf]
[bibtex]@InProceedings{Farooq_2026_WACV,
  author    = {Farooq, Hassaan and Brenner, Marvin and St{\"u}tz, Peter},
  title     = {{FlyPose}: Towards Robust Human Pose Estimation From Aerial Views},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8617--8627},
}
AdaptViG: Adaptive Vision GNN with Exponential Decay Gating-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Munir_2026_WACV,
  author    = {Munir, Mustafa and Rahman, Md Mostafijur and Marculescu, Radu},
  title     = {{AdaptViG}: Adaptive Vision {GNN} with Exponential Decay Gating},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {440--450},
}
SAVeD: Learning to Denoise Low-SNR Video for Improved Downstream Performance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stathatos_2026_WACV,
  author    = {Stathatos, Suzanne and Hobley, Michael and Perona, Pietro and Marks, Markus},
  title     = {{SAVeD}: Learning to Denoise Low-{SNR} Video for Improved Downstream Performance},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6851--6861},
}
See, Record, Do: Automated Generation of UI Workflows from Tutorial Videos-
[pdf]
[bibtex]@InProceedings{Beauchaine_2026_WACV,
  author    = {Beauchaine, Adam and Shue, Craig},
  title     = {See, Record, Do: Automated Generation of {UI} Workflows from Tutorial Videos},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6256--6265},
}
VADER: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV,
  author    = {Cheng, Ying and Lin, Yu-Ho and Chen, Min-Hung and Yang, Fu-En and Lai, Shang-Hong},
  title     = {{VADER}: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7301--7311},
}
Pretraining Helps When Capacity Allows: Evidence from Ultra-Small ConvNets-
[pdf]
[supp]
[bibtex]@InProceedings{Muralidharan_2026_WACV,
  author    = {Muralidharan, Srikanth and Medeiros, Heitor R. and Aminbeidokhti, Masih and Granger, Eric and Pedersoli, Marco},
  title     = {Pretraining Helps When Capacity Allows: Evidence from Ultra-Small {ConvNets}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8333--8342},
}
SmoothDiffusion-VE: Real-time Generative Video Editing Using Adaptive Feature Cache-
[pdf]
[supp]
[bibtex]@InProceedings{Munir_2026_WACV,
  author    = {Munir, Mustafa and Zalewski, Sophia and Liu, Shiqiu and Tarjan, David and Belede, Sushmitha and Patney, Anjul and Marculescu, Radu},
  title     = {{SmoothDiffusion-VE}: Real-time Generative Video Editing Using Adaptive Feature Cache},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8468--8478},
}
CropAT: Leveraging Diffusion-Generated Target-Like Cropped Objects for Pseudo-Label Refinement in Domain-Adaptive Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV,
  author    = {Huang, Chen-Che and Huang, Tzuhsuan and Chen, Jun-Cheng},
  title     = {{CropAT}: Leveraging Diffusion-Generated Target-Like Cropped Objects for Pseudo-Label Refinement in Domain-Adaptive Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4621--4630},
}
Leveraging Sparsity for Privacy in Collaborative Inference-
[pdf]
[supp]
[bibtex]@InProceedings{Hoefler_2026_WACV,
  author    = {Hoefler, Maximilian Andreas and Mueller, Karsten and Samek, Wojciech},
  title     = {Leveraging Sparsity for Privacy in Collaborative Inference},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7596--7604},
}
Rethinking Real Image Editing: Unleashing Diverse Editing Operators via Multi-Objective Optimization-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_WACV,
  author    = {Wang, Siyuan and Yang, Xi and Zhou, Zihao and Shao, Huiru and Zhang, Rui and Wang, Qiufeng and Cheng, Guangliang and Huang, Kaizhu},
  title     = {Rethinking Real Image Editing: Unleashing Diverse Editing Operators via Multi-Objective Optimization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4150--4159},
}
UltraClean: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2026_WACV,
  author    = {Zhao, Bingyin and Lao, Yingjie},
  title     = {{UltraClean}: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8353--8363},
}
A Little More Like This: Text-to-Image Retrieval with Vision-Language Models Using Relevance Feedback-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khaertdinov_2026_WACV,
  author    = {Khaertdinov, Bulat and Popa, Mirela and Tintarev, Nava},
  title     = {A Little More Like This: Text-to-Image Retrieval with Vision-Language Models Using Relevance Feedback},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3825--3834},
}
CONSTANT: Towards High-Quality One-Shot Handwriting Generation with Patch Contrastive Enhancement and Style-Aware Quantization-
[pdf]
[supp]
[bibtex]@InProceedings{Le_2026_WACV,
  author    = {Le, Anh-Duy and Pham, Van-Linh and Vo, Thanh-Nam and Mai, Xuan Toan and Tran, Tuan-Anh},
  title     = {{CONSTANT}: Towards High-Quality One-Shot Handwriting Generation with Patch Contrastive Enhancement and Style-Aware Quantization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4295--4304},
}
QAL : A Loss for Recall-Precision Balance in 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meshram_2026_WACV,
  author    = {Meshram, Pranay and Turkar, Yash and Singh, Kartikeya and Masilamani, Praveen Raj and Adhivarahan, Charuvahan and Dantu, Karthik},
  title     = {{QAL} : A Loss for Recall-Precision Balance in {3D} Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7965--7974},
}
PADM: A Physics-aware Diffusion Model for Attenuation Correction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pham_2026_WACV,
  author    = {Pham, Trung Kien and Vu, Hoang Minh and Chu, Anh Duc and Nguyen, Dac Thai and Nguyen, Trung Thanh and Truong, Thao Nguyen and Son, Mai Hong and Nguyen, Thanh Trung and Le Nguyen, Phi},
  title     = {{PADM}: A Physics-aware Diffusion Model for Attenuation Correction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2606--2615},
}
FB-4D: Spatial-Temporal Coherent Dynamic 3D Content Generation with Feature Banks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Jinwei and Gao, Huan-Ang and Li, Wenyi and Chi, Haohan and Liu, Chenyu and Du, Chenxi and Liu, Yiqian and Gao, Mingju and Zhang, Guiyu and Zhang, Zongzheng and Yi, Li and Yao, Yao and Zhao, Jingwei and Li, Hongyang and Wang, Yikai and Zhao, Hao},
  title     = {{FB-4D}: Spatial-Temporal Coherent Dynamic {3D} Content Generation with Feature Banks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5290--5301},
}
MEGA-PCC: A Mamba-based Efficient Approach for Joint Geometry and Attribute Point Cloud Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hsieh_2026_WACV,
  author    = {Hsieh, Kai-Hsiang and Yim, Monyneath and Peng, Wen-Hsiao and Chiang, Jui-Chiu},
  title     = {{MEGA-PCC}: A {Mamba}-based Efficient Approach for Joint Geometry and Attribute Point Cloud Compression},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1820--1830},
}
CalibBEV: LiDAR-Camera Calibration via BEV Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{D'Addeo_2026_WACV,
  author    = {D'Addeo, Filippo and Cipelli, Lorenzo and Cardace, Adriano and Ghelfi, Emanuele and Zinelli, Andrea and Bertozzi, Massimo},
  title     = {{CalibBEV}: {LiDAR}-Camera Calibration via {BEV} Alignment},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4345--4354},
}
Interaction-via-Actions: Cattle Interaction Detection with Joint Learning of Action-Interaction Latent Space-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakagawa_2026_WACV,
  author    = {Nakagawa, Ren and Yang, Yang and Shinoda, Risa and Santo, Hiroaki and Oyama, Kenji and Okura, Fumio and Ohkawa, Takenao},
  title     = {Interaction-via-Actions: Cattle Interaction Detection with Joint Learning of Action-Interaction Latent Space},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1979--1988},
}
RobustGait: Robustness Analysis for Appearance Based Gait Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sayera_2026_WACV,
  author    = {Sayera, Reeshoon and Kumar, Akash and Mitra, Sirshapan and Kamtam, Prudvi and Rawat, Yogesh S},
  title     = {{RobustGait}: Robustness Analysis for Appearance Based Gait Recognition},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2541--2552},
}
DualRes: Production-ready Dynamic Object Detection-
[pdf]
[bibtex]@InProceedings{El_Hassani_2026_WACV,
  author    = {El Hassani, Jibril and Verelst, Thomas},
  title     = {{DualRes}: Production-ready Dynamic Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7842--7851},
}
DMS2F-HAD: A Dual-branch Mamba-based Spatial-Spectral Fusion Network for Hyperspectral Anomaly Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pant_2026_WACV,
  author    = {Pant, Aayushma and Tamang, Lakpa and Lee, Tsz-Kwan and Aryal, Sunil},
  title     = {{DMS2F-HAD}: A Dual-branch {Mamba}-based Spatial-Spectral Fusion Network for Hyperspectral Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5623--5632},
}
FedSCAl: Leveraging Server and Client Alignment for Unsupervised Federated Source-Free Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yashwanth_2026_WACV,
  author    = {Yashwanth, M. and Koti, Sampath and Singh, Arunabh and Marjit, Shyam and Chakraborty, Anirban},
  title     = {{FedSCAl}: Leveraging Server and Client Alignment for Unsupervised Federated Source-Free Domain Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4108--4117},
}
Meta-YOLO: Metadata-Guided Real-Time Object Detector in Aerial Imagery-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2026_WACV,
  author    = {Yoon, Deukryeol and Kim, Seonghak and Sung, Young Hwa and Jung, Jinho},
  title     = {{Meta-YOLO}: Metadata-Guided Real-Time Object Detector in Aerial Imagery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7975--7984},
}
SAIL: Self-supervised Learning of Lighting-Invariant Representations from Real Images with Latent Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Djeghim_2026_WACV,
  author    = {Djeghim, Hala and Loscos, C{\'e}line and Sidib{\'e}, D{\'e}sir{\'e}},
  title     = {{SAIL}: Self-supervised Learning of Lighting-Invariant Representations from Real Images with Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3223--3232},
}
Zero-Shot Video Deraining with Video Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Varanka_2026_WACV,
  author    = {Varanka, Tuomas and Gonzalez, Juan Luis and Kim, Hyeongwoo and Garrido, Pablo and Yao, Xu},
  title     = {Zero-Shot Video Deraining with Video Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {677--687},
}
Generalized Category Discovery for LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Minseok and Boo, Jiyong and Yoon, Kuk-Jin},
  title     = {Generalized Category Discovery for {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8416--8426},
}
GrowTAS: Progressive Expansion from Small to Large Subnets for Efficient ViT Architecture Search-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV,
  author    = {Lee, Hyunju and Oh, Youngmin and Jeon, Jeimin and Baek, Donghyeon and Ham, Bumsub},
  title     = {{GrowTAS}: Progressive Expansion from Small to Large Subnets for Efficient {ViT} Architecture Search},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5047--5056},
}
NeuroBridge: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Wenwei and Liao, Mingwei and Cai, Lingyi and Li, Anan},
  title     = {{NeuroBridge}: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8670--8679},
}
IPTQ-ViT: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Gihwan and Lee, Jemin and Kim, Hyungshin},
  title     = {{IPTQ-ViT}: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7366--7375},
}
DynaGSLAM: Real-Time Gaussian-Splatting SLAM for Online Rendering, Tracking, Motion Predictions of Moving Objects in Dynamic Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Runfa Blark and Shaghaghi, Mahdi and Suzuki, Keito and Liu, Xinshuang and Moparthi, Varun and Du, Bang and Curtis, Walker and Renschler, Martin and Lee, Ki Myung Brian and Atanasov, Nikolay and Nguyen, Truong},
  title     = {{DynaGSLAM}: Real-Time {Gaussian}-Splatting {SLAM} for Online Rendering, Tracking, Motion Predictions of Moving Objects in Dynamic Scenes},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2434--2444},
}
Denoise, Divide, Distill, and Predict (D3P): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy-
[pdf]
[bibtex]@InProceedings{Merilleau_2026_WACV,
  author    = {M{\'e}rilleau, Quentin and Majhi, Snehashis and Dantcheva, Antitza and Kong, Quan and Garattoni, Lorenzo and Francesca, Gianpiero and Bremond, Francois},
  title     = {Denoise, Divide, Distill, and Predict ({D3P}): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6246--6255},
}
Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement-
[pdf]
[bibtex]@InProceedings{Qiao_2026_WACV,
  author    = {Qiao, Tingrui and Zhao, Di and Walker, Caroline and Cunningham, Chris and Koh, Yun Sing},
  title     = {Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6184--6193},
}
Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rai_2026_WACV,
  author    = {Rai, Arushi and Kovashka, Adriana},
  title     = {Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8136--8145},
}
ChameleonTuner: Automatic ISP Color Tuning in Subjective Scenarios-
[pdf]
[bibtex]@InProceedings{Tan_2026_WACV,
  author    = {Tan, Zijie and Yue, Yuxin and Rashidi, Bahador},
  title     = {{ChameleonTuner}: Automatic {ISP} Color Tuning in Subjective Scenarios},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {297--307},
}
ControlVP: Interactive Geometric Refinement of AI-Generated Images with Consistent Vanishing Points-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Okumura_2026_WACV,
  author    = {Okumura, Ryota and Shiohara, Kaede and Yamasaki, Toshihiko},
  title     = {{ControlVP}: Interactive Geometric Refinement of {AI}-Generated Images with Consistent Vanishing Points},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5744--5753},
}
UnderWater SLAM with Laser-light sectioning method using ST-GAT-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2026_WACV,
  author    = {Gao, Heyang and Ichimaru, Kazuto and Iwaguchi, Takafumi and Kawasaki, Hiroshi},
  title     = {{UnderWater} {SLAM} with Laser-light sectioning method using {ST-GAT}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {88--96},
}
Non-Contact Blood Pressure Estimation from Face Videos via Physiology-Aware Contrastive Learning-
[pdf]
[bibtex]@InProceedings{Son_2026_WACV,
  author    = {Son, JaeHyuk and Choi, Young-Seok},
  title     = {Non-Contact Blood Pressure Estimation from Face Videos via Physiology-Aware Contrastive Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2414--2423},
}
Shift-Equivariant Complex-Valued Convolutional Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gabot_2026_WACV,
  author    = {Gabot, Quentin and Lim, Teck-Yian and Fix, Jeremy and Frontera-Pons, Joana and Ren, Chengfang and Ovarlez, Jean-Philippe},
  title     = {Shift-Equivariant Complex-Valued Convolutional Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2575--2584},
}
HiGlassRM: Learning to Remove High-prescription Glasses via Synthetic Dataset Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV,
  author    = {Lee, Sebin and Kim, Heewon},
  title     = {{HiGlassRM}: Learning to Remove High-prescription Glasses via Synthetic Dataset Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4577--4586},
}
Neural Geometry Image-Based Representations with Optimal Transport (OT)-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gao_2026_WACV,
  author    = {Gao, Xiang and Liu, Yuanpeng and Li, Jiazhi and Wang, Xinmu and Guo, Minghao and Guo, Yu and Song, Xiyun and Yu, Heather and Lao, Zhiqiang and Gu, Xianfeng David},
  title     = {Neural Geometry Image-Based Representations with Optimal Transport ({OT})},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6676--6686},
}
Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships-
[pdf]
[supp]
[bibtex]@InProceedings{Waseda_2026_WACV,
  author    = {Waseda, Futa and Tejero-de-Pablos, Antonio and Echizen, Isao},
  title     = {Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6968--6977},
}
FujiView: Multimodal Late-Fusion for Predicting Scenic Visibility-
[pdf]
[bibtex]@InProceedings{Bible_2026_WACV, author = {Bible, Bryceton and Hasnaeen, Nehal and Qi, Hairong}, title = {FujiView: Multimodal Late-Fusion for Predicting Scenic Visibility}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5653-5661} }
Sketch3R: Rapid and Realistic 3D VR Sketch Creation to Shape Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Halder_2026_WACV, author = {Halder, Mritunjoy and Shukla, Shivam Ashok and Tiwari, Lokender and Mittal, Raghav and Bhowmick, Brojeshwar}, title = {Sketch3R: Rapid and Realistic 3D VR Sketch Creation to Shape Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8680-8689} }
MapleGrasp: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhat_2026_WACV, author = {Bhat, Vineet and Patel, Naman and Krishnamurthy, Prashanth and Karri, Ramesh and Khorrami, Farshad}, title = {MapleGrasp: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7554-7564} }
Explaining the Unseen: Multimodal Vision-Language Reasoning for Situational Awareness in Underground Mining Disasters-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jewel_2026_WACV, author = {Jewel, Mizanur Rahman and Elmahallawy, Mohamed and Madria, Sanjay and Frimpong, Samuel}, title = {Explaining the Unseen: Multimodal Vision-Language Reasoning for Situational Awareness in Underground Mining Disasters}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1324-1333} }
ReBrain: Brain MRI Reconstruction from Sparse CT Slice via Retrieval-Augmented Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Junming and Sun, Yifei and Cheng, Weihua and Kang, Yujin and Chen, Yirong and Wang, Ding and Zeng, Guosun}, title = {ReBrain: Brain MRI Reconstruction from Sparse CT Slice via Retrieval-Augmented Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4004-4014} }
QUOTA: Quantifying Objects with Text-to-Image Models for Any Domain-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2026_WACV, author = {Sun, Wenfang and Du, Yingjun and Liu, Gaowen and Zheng, Yefeng and Snoek, Cees G. M.}, title = {QUOTA: Quantifying Objects with Text-to-Image Models for Any Domain}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6381-6390} }
Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhyri_2026_WACV, author = {Bhyri, Rishikesh and Quaranto, Brian R and Yuan, Junsong and Kim, Peter C W and Xi, Nan}, title = {Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8521-8530} }
Towards Fine-Grained Adaptation of CLIP via a Self-Trained Alignment Score-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ali_2026_WACV, author = {Ali, Eman and Silva, Sathira and Arora, Chetan and Khan, Muhammad Haris}, title = {Towards Fine-Grained Adaptation of CLIP via a Self-Trained Alignment Score}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5875-5885} }
Zero-Shot Coreset Selection via Iterative Subspace Sampling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Griffin_2026_WACV, author = {Griffin, Brent A. and Marks, Jacob and Corso, Jason J.}, title = {Zero-Shot Coreset Selection via Iterative Subspace Sampling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2114-2124} }
Mobile-Oriented Video Diffusion: Enabling Text-to-Video Generation on Mobile Devices Without Retraining, Compression, or Pruning-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Bosung and Lee, Kyuhwan and Jeong, Isu and Cheon, Jungmin and Lee, Yeojin and Lee, Seulki}, title = {Mobile-Oriented Video Diffusion: Enabling Text-to-Video Generation on Mobile Devices Without Retraining, Compression, or Pruning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3961-3971} }
Efficient Vision Transformers via Token Merging with Head-wise Attention Correction-
[pdf]
[supp]
[bibtex]@InProceedings{Ichikawa_2026_WACV, author = {Ichikawa, Yuki and Motomura, Masato and Van Chu, Thiem and Fujiki, Daichi}, title = {Efficient Vision Transformers via Token Merging with Head-wise Attention Correction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3908-3917} }
GFT-GCN: Privacy-Preserving 3D Face Mesh Recognition with Spectral Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Felouat_2026_WACV, author = {Felouat, Hichem and Wang, Hanrui and Echizen, Isao}, title = {GFT-GCN: Privacy-Preserving 3D Face Mesh Recognition with Spectral Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6236-6245} }
Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Tasyurek_2026_WACV, author = {Ta{\c{s}}y{\"u}rek, S{\"u}meyye Meryem and K{\i}z{\i}ltepe, Tu{\u{g}}{\c{c}}e and Keles, Hacer Yalim}, title = {Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8458-8467} }
Test-Time Adaptation through Semantically-guided Feature Decomposition for Few-shot Chest X-ray Diagnosis-
[pdf]
[supp]
[bibtex]@InProceedings{Mahawar_2026_WACV, author = {Mahawar, Jayant and Paul, Angshuman}, title = {Test-Time Adaptation through Semantically-guided Feature Decomposition for Few-shot Chest X-ray Diagnosis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2445-2454} }
Self-Supervised Compression and Artifact Correction for Streaming Underwater Imaging Sonar-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qian_2026_WACV, author = {Qian, Rongsheng and Xu, Chi and Ma, Xiaoqiang and Fang, Hao and Jin, Yili and Atlas, William I. and Liu, Jiangchuan}, title = {Self-Supervised Compression and Artifact Correction for Streaming Underwater Imaging Sonar}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4201-4211} }
PointNet4D: A Lightweight 4D Point Cloud Video Backbone for Online and Offline Perception in Robotic Applications-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Yunze and Wang, Zifan and Wu, Peiran and Ao, Jiayang}, title = {PointNet4D: A Lightweight 4D Point Cloud Video Backbone for Online and Offline Perception in Robotic Applications}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3203-3212} }
MIST: Multilingual Incidental Dataset for Scene Text Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Mundra_2026_WACV, author = {Mundra, Saumya and Mondal, Ajoy and Jawahar, C. V.}, title = {MIST: Multilingual Incidental Dataset for Scene Text Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7658-7667} }
Unsupervised Memorability Modeling from Tip-of-the-Tongue Retrieval Queries-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhattacharyya_2026_WACV, author = {Bhattacharyya, Sree and Singla, Yaman K. and Yarram, Sudhir and Singh, Somesh and SI, Harini and Wang, James Z.}, title = {Unsupervised Memorability Modeling from Tip-of-the-Tongue Retrieval Queries}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4234-4241} }
VAST-ReID: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Khan_2026_WACV, author = {Khan, Hammad and Giri, Rakesh Kumar and Thakare, Kamalakar Vijay and Choi, Heeseung and Jung, Hyungjoo and Dogra, Debi Prosad and Kim, Ig-Jae}, title = {VAST-ReID: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5833-5841} }
Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Son Tung and Fontan, Alejandro and Milford, Michael and Fischer, Tobias}, title = {Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8209-8219} }
PointSt3R: Point Tracking through 3D Ground Correspondence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guerrier_2026_WACV, author = {Guerrier, Rhodri and Harley, Adam W. and Damen, Dima}, title = {PointSt3R: Point Tracking through 3D Ground Correspondence}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7430-7439} }
NoHumansRequired: Autonomous High-Quality Image Editing Triplet Mining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kuprashevich_2026_WACV, author = {Kuprashevich, Maksim and Alekseenko, Grigorii and Tolstykh, Irina and Fedorov, Georgii and Suleimanov, Bulat and Dokholyan, Vladimir and Gordeev, Aleksandr}, title = {NoHumansRequired: Autonomous High-Quality Image Editing Triplet Mining}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6059-6068} }
DuPLUS: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis-
[pdf]
[supp]
[bibtex]@InProceedings{Saeed_2026_WACV, author = {Saeed, Numan and Saleem, Tausifa Jan and Maani, Fadillah and Ridzuan, Muhammad and Wang, Hu and Yaqub, Mohammad}, title = {DuPLUS: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8386-8395} }
Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Jongha and Ko, Byungoh and Na, Jeehye and Yoon, Jinsung and Kim, Hyunwoo J.}, title = {Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8596-8605} }
GenHSI: Controllable Generation of Human-Scene Interaction Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Zekun and Zhou, Rui and Sajnani, Rahul and Cong, Xiaoyan and Ritchie, Daniel and Sridhar, Srinath}, title = {GenHSI: Controllable Generation of Human-Scene Interaction Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {138-149} }
Unified Video Anomaly Detection Model for Detecting Different Anomaly Types-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Kijung and Jo, Youngwan and Ahn, Sunghyun and Park, Sanghyun}, title = {Unified Video Anomaly Detection Model for Detecting Different Anomaly Types}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {784-794} }
Image-Guided Semantic Pseudo-LiDAR Point Generation for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Minseung and Moon, Seokha and Lee, Seung Joon and Mahjourian, Reza and Kim, Jinkyu}, title = {Image-Guided Semantic Pseudo-LiDAR Point Generation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7137-7147} }
PromptGAR: Flexible Promptive Group Activity Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2026_WACV, author = {Jin, Zhangyu and Feng, Andrew and Chemburkar, Ankur and De Melo, Celso M.}, title = {PromptGAR: Flexible Promptive Group Activity Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4461-4471} }
RPT-SR: Regional Prior attention Transformer for infrared image Super-Resolution-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jin_2026_WACV, author = {Jin, Youngwan and Park, Incheol and Nalcakan, Yagiz and Ju, Hyeongjin and Yeo, Sanghyeop and Kim, Shiho}, title = {RPT-SR: Regional Prior attention Transformer for infrared image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5184-5193} }
Intraoperative 2D/3D Registration via Spherical Similarity Learning and Differentiable Levenberg-Marquardt Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Minheng and Kong, Youyong}, title = {Intraoperative 2D/3D Registration via Spherical Similarity Learning and Differentiable Levenberg-Marquardt Optimization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7239-7249} }
M-ErasureBench: A Comprehensive Multimodal Evaluation Benchmark for Concept Erasure in Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Weng_2026_WACV, author = {Weng, Ju-Hsuan and Liao, Jia-Wei and Chou, Cheng-Fu and Chen, Jun-Cheng}, title = {M-ErasureBench: A Comprehensive Multimodal Evaluation Benchmark for Concept Erasure in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {527-536} }
Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective-
[pdf]
[supp]
[bibtex]@InProceedings{Dayal_2026_WACV, author = {Dayal, Aveen and Divya, Peketi and Tiwari, Nidhi and Cenkeramaddi, Linga Reddy and Mohan, C Krishna and Kumar, Abhinav}, title = {Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8262-8271} }
Leveraging Pretrained Representations for Cross-Modal Point Cloud Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Kale_2026_WACV, author = {Kale, Kshitij and U, Hrishikesh and sreenidhe, V and S, Shylaja S}, title = {Leveraging Pretrained Representations for Cross-Modal Point Cloud Completion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {97-105} }
Gated Temporal Fusion Transformers for Robust Multi-Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Jinho and Yoon, Kuk-Jin}, title = {Gated Temporal Fusion Transformers for Robust Multi-Object Tracking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4525-4534} }
Moire Zero: An Efficient and High-Performance Neural Architecture for Moire Removal-
[pdf]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Seungryong and Baek, Woojeong and Kim, Younghyun and Kim, Eunwoo and Moon, Haru and Yoo, Donggon and Park, Eunbyung}, title = {Moire Zero: An Efficient and High-Performance Neural Architecture for Moire Removal}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2520-2530} }
DermEVAL: A Dermatologist-Reviewed Benchmark for Multimodal Large Language Models-
[pdf]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Hongjin and Li, Weihao and Qin, Zhenyue and Ji, Ge-Peng and Liu, Yang and Gedeon, Tom and Barnes, Nick}, title = {DermEVAL: A Dermatologist-Reviewed Benchmark for Multimodal Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {927-937} }
GAITGen: Disentangled Motion-Pathology Impaired Gait Generative Model -- Bringing Motion Generation to the Clinical Domain-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adeli_2026_WACV, author = {Adeli, Vida and Mehraban, Soroush and Mirmehdi, Majid and Whone, Alan and Filtjens, Benjamin and Dadashzadeh, Amirhossein and Fasano, Alfonso and Iaboni, Andrea and Taati, Babak}, title = {GAITGen: Disentangled Motion-Pathology Impaired Gait Generative Model -- Bringing Motion Generation to the Clinical Domain}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3150-3161} }
Perceptually Guided 3DGS Streaming and Rendering for Mixed Reality-
[pdf]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Yunxiang and Mupparaju, Sai Harsha and Chen, Kenneth and Kang, Jenna and Zhang, Xinyu and Omori, Maito and Arimatsu, Kazuyuki and Sun, Qi}, title = {Perceptually Guided 3DGS Streaming and Rendering for Mixed Reality}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4212-4222} }
RAVU: Retrieval Augmented Video Understanding with Compositional Reasoning over Graph-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Malik_2026_WACV, author = {Malik, Sameer and Singh, Ayush and Yamada, Moyuru and Aggarwal, Dishank}, title = {RAVU: Retrieval Augmented Video Understanding with Compositional Reasoning over Graph}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2869-2878} }
Style-Friendly SNR Sampler for Style-Driven Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Jooyoung and Shin, Chaehun and Oh, Yeongtak and Kim, Heeseung and Lee, Jungbeom and Yoon, Sungroh}, title = {Style-Friendly SNR Sampler for Style-Driven Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5703-5713} }
Low-Rank Expert Merging for Multi-Source Domain Adaptation in Person Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nehdi_2026_WACV, author = {Nehdi, Taha Mustapha and Mrabah, Nairouz and Belal, Atif and Pedersoli, Marco and Granger, Eric}, title = {Low-Rank Expert Merging for Multi-Source Domain Adaptation in Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1809-1819} }
ChartQA-X: Generating Explanations for Visual Chart Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hegde_2026_WACV, author = {Hegde, Shamanthak and Fazli, Pooyan and Seifi, Hasti}, title = {ChartQA-X: Generating Explanations for Visual Chart Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6453-6463} }
BOP-Distrib: Revisiting 6D Pose Estimation Benchmarks for Better Evaluation under Visual Ambiguities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meden_2026_WACV, author = {Meden, Boris and Brazi, Asma and de Chamisso, Fabrice Mayran and Bourgeois, Steve and Lepetit, Vincent}, title = {BOP-Distrib: Revisiting 6D Pose Estimation Benchmarks for Better Evaluation under Visual Ambiguities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1575-1585} }
SPOC: Spatially-Progressing Object State Change Segmentation in Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mandikal_2026_WACV, author = {Mandikal, Priyanka and Nagarajan, Tushar and Stoken, Alex and Xue, Zihui and Grauman, Kristen}, title = {SPOC: Spatially-Progressing Object State Change Segmentation in Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3504-3513} }
RealDroneVision: Dataset and Architecture Advancements for Small-Object Drone Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Sivapuram_2026_WACV, author = {Sivapuram, Arun Kumar and Peddinti, Pranav R T and Puppala, Harish and Prashanth, Komuravelli and Harsha, Jaladi Sri and Gorthi, Rama Krishna Sai}, title = {RealDroneVision: Dataset and Architecture Advancements for Small-Object Drone Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6687-6695} }
brat: Aligned Multi-View Embeddings for Brain MRI Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kayser_2026_WACV, author = {Kayser, Maxime and Gridnev, Maksim and Wang, Wanting and Bain, Max and Rangnekar, Aneesh and Chatterjee, Avijit and Petrov, Aleksandr and Veeraraghavan, Harini and Swinburne, Nathaniel C.}, title = {brat: Aligned Multi-View Embeddings for Brain MRI Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5864-5874} }
TalkingPose: Efficient Face and Gesture Animation with Feedback-guided Diffusion Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Javanmardi_2026_WACV, author = {Javanmardi, Alireza and Jaiswal, Pragati and Habtegebrial, Tewodros Amberbir and Millerdurai, Christen and Wang, Shaoxiang and Pagani, Alain and Stricker, Didier}, title = {TalkingPose: Efficient Face and Gesture Animation with Feedback-guided Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3098-3108} }
Fast Vision Mamba: Pooling Spatial Dimensions for Accelerated Processing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kapse_2026_WACV, author = {Kapse, Saarthak and Betz, Robin and Sivanandan, Srinivasan}, title = {Fast Vision Mamba: Pooling Spatial Dimensions for Accelerated Processing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2923-2933} }
A Dataset and Framework for Learning State-invariant Object Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sarkar_2026_WACV, author = {Sarkar, Rohan and Kak, Avinash}, title = {A Dataset and Framework for Learning State-invariant Object Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4715-4723} }
SurfDist: Interpretable Three-Dimensional Instance Segmentation Using Curved Surface Patches-
[pdf]
[arXiv]
[bibtex]@InProceedings{Borchardt_2026_WACV, author = {Borchardt, Jackson and Kato, Saul}, title = {SurfDist: Interpretable Three-Dimensional Instance Segmentation Using Curved Surface Patches}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5541-5549} }
Histogram Assisted Quality Aware Generative Model for Resolution Invariant NIR Image Colorization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Attri_2026_WACV, author = {Attri, Abhinav and Dwivedi, Rajeev Ranjan and Das, Samiran and Kurmi, Vinod Kumar}, title = {Histogram Assisted Quality Aware Generative Model for Resolution Invariant NIR Image Colorization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6422-6431} }
DRWKV: Focusing on Object Edges for Low-Light Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2026_WACV, author = {Bai, Xuecheng and Wang, Yuxiang and Hu, Boyu and Jie, Qinyuan and Xu, Chuanzhi and Li, Kechen and Xiao, Hongru and Chung, Vera}, title = {DRWKV: Focusing on Object Edges for Low-Light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1554-1564} }
Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements-
[pdf]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Jiyang and Bae, Woori and Ji, U-Geun and Yang, Hanyeol and Lee, Jong-Min}, title = {Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7759-7768} }
Intra-Class Probabilistic Embeddings for Uncertainty Estimation in Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV, author = {Lin, Zhenxiang and Haghighat, Maryam and Browne, Will and Miller, Dimity}, title = {Intra-Class Probabilistic Embeddings for Uncertainty Estimation in Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2327-2337} }
ExDDV: A New Dataset for Explainable Deepfake Detection in Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hondru_2026_WACV, author = {Hondru, Vlad and Hogea, Eduard and Onchis, Darian and Ionescu, Radu Tudor}, title = {ExDDV: A New Dataset for Explainable Deepfake Detection in Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4273-4284} }
TriaGS: Differentiable Triangulation-Guided Geometric Consistency for 3D Gaussian Splatting-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Quan and Dang, Tuan}, title = {TriaGS: Differentiable Triangulation-Guided Geometric Consistency for 3D Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8396-8405} }
ART: Actor-Related Tubelet for Detecting Complex-shaped Action Tubes-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Jiaojiao}, title = {ART: Actor-Related Tubelet for Detecting Complex-shaped Action Tubes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {308-317} }
Line Art Colorization with Offset Prior-based Diffusion Model-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2026_WACV, author = {Zhu, Xuan and Cao, Miao and Zhang, Fang-Lue and Lai, Yu-Kun and Rosin, Paul L}, title = {Line Art Colorization with Offset Prior-based Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5570-5580} }
F-ViTA: Foundation Model Guided Visible to Infrared Translation-
[pdf]
[supp]
[bibtex]@InProceedings{Paranjape_2026_WACV, author = {Paranjape, Jay Nitin and De Melo, Celso M. and Patel, Vishal M.}, title = {F-ViTA: Foundation Model Guided Visible to Infrared Translation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5633-5642} }
DATTA: Domain-Adversarial Test-Time Adaptation for Cross-Domain WiFi-Based Human Activity Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Strohmayer_2026_WACV, author = {Strohmayer, Julian and Sterzinger, Rafael and W{\"o}dlinger, Matthias and Kampel, Martin}, title = {DATTA: Domain-Adversarial Test-Time Adaptation for Cross-Domain WiFi-Based Human Activity Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {3421-3430} }
PALMS+: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV, author = {Cheng, Yunqian and Princen, Benjamin and Manduchi, Roberto}, title = {PALMS+: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7084-7093} }
Ego-EXTRA: video-language Egocentric Dataset for EXpert-TRAinee assistance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ragusa_2026_WACV, author = {Ragusa, Francesco and Mazzamuto, Michele and Forte, Rosario and D'Ambra, Irene and Fort, James and Engel, Jakob and Furnari, Antonino and Farinella, Giovanni Maria}, title = {Ego-EXTRA: video-language Egocentric Dataset for EXpert-TRAinee assistance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {4438-4450} }
Cluster-Guided Adversarial Perturbations for Robust Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Seo_2026_WACV, author = {Seo, Seongyun and Han, Sungmin and Lee, Jeonghyun and Lee, Sangkyun}, title = {Cluster-Guided Adversarial Perturbations for Robust Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {350-359} }
FSP-DETR: Few-Shot Prototypical Parasitic Ova Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Trehan_2026_WACV, author = {Trehan, Shubham and Ramachandran, Udhav and Rao, Akash and Scimeca, Ruth and Aakur, Sathyanarayanan N.}, title = {FSP-DETR: Few-Shot Prototypical Parasitic Ova Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5342-5351} }
IDEAL-M3D: Instance Diversity-Enriched Active Learning for Monocular 3D Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Meier_2026_WACV, author = {Meier, Johannes and G{\"u}nther, Florian and Marin, Riccardo and Dhaouadi, Oussema and Kaiser, Jacques and Cremers, Daniel}, title = {IDEAL-M3D: Instance Diversity-Enriched Active Learning for Monocular 3D Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {181-191} }
RemEdit: Efficient Diffusion Editing with Riemannian Geometry-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adhikarla_2026_WACV,
  author    = {Adhikarla, Eashan and Davison, Brian D.},
  title     = {{RemEdit}: Efficient Diffusion Editing with {Riemannian} Geometry},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5037--5046},
}
VFace: A Training-Free Approach for Diffusion-Based Video Face Swapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Baliah_2026_WACV,
  author    = {Baliah, Sanoojan and Abeysinghe, Yohan and Thushara, Rusiru and Muhammad, Khan and Dhall, Abhinav and Nandakumar, Karthik and Khan, Muhammad Haris},
  title     = {{VFace}: A Training-Free Approach for Diffusion-Based Video Face Swapping},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4315--4324},
}
CaRS: A Causal Intervention Segmentation Framework and Benchmark Dataset for Autonomous Driving under Transitional Weather Conditions-
[pdf]
[supp]
[bibtex]@InProceedings{Madhavi_2026_WACV,
  author    = {Madhavi, Kondapally and Kumar, K Naveen and Mohan, C Krishna and Babu, Sobhan},
  title     = {{CaRS}: A Causal Intervention Segmentation Framework and Benchmark Dataset for Autonomous Driving under Transitional Weather Conditions},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4046--4056},
}
FreeCond: Free Lunch in the Input Conditions of Text-Guided Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hsiao_2026_WACV,
  author    = {Hsiao, Teng-Fang and Ruan, Bo-Kai and Tsai, Sung-Lin and Wu, Yi-Lun and Shuai, Hong-Han},
  title     = {{FreeCond}: Free Lunch in the Input Conditions of Text-Guided Inpainting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5498--5508},
}
Advancing Player Identification and Tracking with Global ID Fusion (GIF)-
[pdf]
[supp]
[bibtex]@InProceedings{Wojtulewicz_2026_WACV,
  author    = {Wojtulewicz, Karol and Liu, Minxing and Carlsson, Niklas},
  title     = {Advancing Player Identification and Tracking with Global {ID} Fusion ({GIF})},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7269--7280},
}
VRAgent: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Shah_2026_WACV,
  author    = {Shah, Ketul and Nathani, Pankaj and Chellappa, Rama and Heilbron, Fabian Caba},
  title     = {{VRAgent}: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8157--8167},
}
TaxonRL: Reinforcement Learning with Intermediate Rewards for Interpretable Fine-Grained Visual Reasoning-
[pdf]
[bibtex]@InProceedings{von_Klinski_2026_WACV,
  author    = {von Klinski, Maximilian and Schall, Maximilian},
  title     = {{TaxonRL}: Reinforcement Learning with Intermediate Rewards for Interpretable Fine-Grained Visual Reasoning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2485--2498},
}
Revisiting Retentive Networks for Fast Range-View 3D LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Mosco_2026_WACV,
  author    = {Mosco, Simone and Fusaro, Daniel and Li, Wanmeng and Pretto, Alberto},
  title     = {Revisiting Retentive Networks for Fast Range-View {3D} {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2499--2509},
}
Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition-
[pdf]
[bibtex]@InProceedings{Ji_2026_WACV,
  author    = {Ji, Hyeonbin and Lee, Juyeob and Park, Eunil},
  title     = {Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6913--6924},
}
GraspDiffusion: Synthesizing Realistic Whole-body Hand-Object Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kwon_2026_WACV,
  author    = {Kwon, Patrick and Chen, Chen and Joo, Hanbyul},
  title     = {{GraspDiffusion}: Synthesizing Realistic Whole-body Hand-Object Interaction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2392--2403},
}
Understanding Human-Like Biases in VLMs via Subjective Face Analytics-
[pdf]
[supp]
[bibtex]@InProceedings{Roygaga_2026_WACV,
  author    = {Roygaga, Chaitanya and Bharati, Aparna},
  title     = {Understanding Human-Like Biases in {VLMs} via Subjective Face Analytics},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {514--526},
}
Correcting and Quantifying Systematic Errors in 3D Box Annotations for Autonomous Driving-
[pdf]
[arXiv]
[bibtex]@InProceedings{Miro_2026_WACV,
  author    = {Miro, Alexandre Justo and af Klinteberg, Ludvig and Timus, Bogdan and Asefaw, Aron and Khoche, Ajinkya and Gustafsson, Thomas and Mansouri, Sina Sharif and Daneshtalab, Masoud},
  title     = {Correcting and Quantifying Systematic Errors in {3D} Box Annotations for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6724--6732},
}
CaFlow: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2026_WACV,
  author    = {Han, Ruisheng and Zhou, Kanglei and Chen, Shuang and Atapour-Abarghouei, Amir and Shum, Hubert P. H.},
  title     = {{CaFlow}: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8231--8241},
}
Learning Beyond Labels: Self-Supervised Handwritten Text Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Mitra_2026_WACV,
  author    = {Mitra, Shree and Mondal, Ajoy and Jawahar, C. V.},
  title     = {Learning Beyond Labels: Self-Supervised Handwritten Text Recognition},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6653--6663},
}
A Woman with a Knife or A Knife with a Woman? Measuring Directional Bias Amplification in Image Captions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nair_2026_WACV,
  author    = {Nair, Rahul and Tokas, Bhanu and Kerner, Hannah},
  title     = {A Woman with a Knife or A Knife with a Woman? Measuring Directional Bias Amplification in Image Captions},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {255--264},
}
Vision-informed Semantic Text Alignment for Open-set Recognition in Remote Sensing-
[pdf]
[supp]
[bibtex]@InProceedings{Gole_2026_WACV,
  author    = {Gole, Siddhant and Pal, Akash and Jha, Ankit and Chaudhuri, Subhasis and Banerjee, Biplab},
  title     = {Vision-informed Semantic Text Alignment for Open-set Recognition in Remote Sensing},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2828--2837},
}
Guided Model Merging for Hybrid Data Learning: Leveraging Centralized Data to Refine Decentralized Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2026_WACV,
  author    = {Zhu, Junyi and Yao, Ruicong and Ceritli, Taha and Ozkan, Savas and Blaschko, Matthew B. and Noh, Eunchung and Min, Jeongwon and Min, Cho Jung and Ozay, Mete},
  title     = {Guided Model Merging for Hybrid Data Learning: Leveraging Centralized Data to Refine Decentralized Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3182--3192},
}
EndoPBR: Photorealistic Synthetic Data for Surgical 3D Vision via Physically-based Rendering-
[pdf]
[bibtex]@InProceedings{Han_2026_WACV,
  author    = {Han, John J. and Wu, Jie Ying},
  title     = {{EndoPBR}: Photorealistic Synthetic Data for Surgical {3D} Vision via Physically-based Rendering},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5601--5611},
}
KMOPS: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV,
  author    = {Wu, Ying-Kun and Shen, Yi and Huang, Tzuhsuan and Fang, I-Sheng and Chen, Jun-Cheng},
  title     = {{KMOPS}: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7730--7739},
}
Referring Change Detection in Remote Sensing Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Korkmaz_2026_WACV,
  author    = {Korkmaz, Yilmaz and Paranjape, Jay N. and de Melo, Celso M. and Patel, Vishal M.},
  title     = {Referring Change Detection in Remote Sensing Imagery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {106--116},
}
Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{El-Jiz_2026_WACV,
  author    = {El-Jiz, Peter and Kuemmerer, Matthias and Tangemann, Matthias and Bethge, Matthias and Bartels, Andreas and Bannert, Michael Mario},
  title     = {Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5909--5918},
}
Data-Driven Loss Functions for Inference-Time Optimization in Text-to-Image-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yiflach_2026_WACV,
  author    = {Yiflach, Sapir Esther and Atzmon, Yuval and Chechik, Gal},
  title     = {Data-Driven Loss Functions for Inference-Time Optimization in Text-to-Image},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3525--3535},
}
ScoreNet: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models-
[pdf]
[supp]
[bibtex]@InProceedings{Rashidi_2026_WACV,
  author    = {Rashidi, Bahador and Aghakasiri, Kiarash and Zhang, Shupei and Sattarifard, Amirmohsen and Zhang, Yue and Gao, Chao},
  title     = {{ScoreNet}: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7008--7018},
}
Digital Forensic AI You Can Explain: A Case Study on Video Source Camera Identification-
[pdf]
[bibtex]@InProceedings{Veksler_2026_WACV,
  author    = {Veksler, Maryna and Akkaya, Kemal and Uluagac, Selcuk},
  title     = {Digital Forensic {AI} You Can Explain: A Case Study on Video Source Camera Identification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7030--7039},
}
CoreCaption: Core Caption based Text-to-Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Jang_2026_WACV,
  author    = {Jang, Junkyu},
  title     = {{CoreCaption}: Core Caption based Text-to-Video Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6600--6610},
}
M4U: Evaluating Multilingual Understanding and Reasoning for Large Multimodal Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV,
  author    = {Wang, Hongyu and Xu, Jiayu and Xie, Senwei and Wang, Ruiping and Li, Jialin and Xie, Zhaojie and Zhang, Bin and Xiong, Chuyan and Chen, Xilin},
  title     = {{M4U}: Evaluating Multilingual Understanding and Reasoning for Large Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {382--392},
}
Snapmoji: Instant Generation of Animatable Dual-Stylized Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV,
  author    = {Chen, Eric Ming and Liu, Di and Ma, Sizhuo and Vasilkovsky, Michael and Zhou, Bing and Gao, Qiang and Wang, Wenzhou and Luo, Jiahao and Metaxas, Dimitris N. and Sitzmann, Vincent and Wang, Jian},
  title     = {{Snapmoji}: Instant Generation of Animatable Dual-Stylized Avatars},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1948--1958},
}
BanglaProtha: Evaluating Vision Language Models in Underrepresented Long-tail Cultural Contexts-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV,
  author    = {Fahim, Md and Rahman, Md Sakib Ul and Rahman, Akm Moshiur and Ishmam, Md Farhan and Rahman, Md Tasmim and Shifat, Fariha Tanjim and Haider, Fabiha and Alam Bhuiyan, Md Farhad},
  title     = {{BanglaProtha}: Evaluating Vision Language Models in Underrepresented Long-tail Cultural Contexts},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1159--1169},
}
CineVerse: Consistent Keyframe Synthesis for Cinematic Scene Composition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Phung_2026_WACV,
  author    = {Phung, Quynh and Mai, Long and Heilbron, Fabian David Caba and Liu, Feng and Huang, Jia-Bin and Ham, Cusuh},
  title     = {{CineVerse}: Consistent Keyframe Synthesis for Cinematic Scene Composition},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2626--2636},
}
Language Integration in Fine-Tuning Multimodal Large Language Models for Image-Based Regression-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jennings_2026_WACV,
  author    = {Jennings, Roy H. and Paikin, Genady and Shaul, Roy and Soloveichik, Evgeny},
  title     = {Language Integration in Fine-Tuning Multimodal Large Language Models for Image-Based Regression},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3462--3471},
}
Towards Reliable Test-Time Adaptation: Style Invariance as a Correctness Likelihood-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nam_2026_WACV,
  author    = {Nam, Gilhyun and Kim, Taewon and Jeong, Joonhyun and Yang, Eunho},
  title     = {Towards Reliable Test-Time Adaptation: Style Invariance as a Correctness Likelihood},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {3088--3097},
}
MBTI: Metric-Based Textual Inversion for Fine-Grained Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Chae_2026_WACV,
  author    = {Chae, Byungkwan and Choi, Youngjae and Kim, Heewon},
  title     = {{MBTI}: Metric-Based Textual Inversion for Fine-Grained Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1106--1116},
}
PRISM-CAFO: Prior-conditioned Remote-sensing Infrastructure Segmentation and Mapping for CAFOs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hoque_2026_WACV,
  author    = {Hoque, Oishee Bintey and Mandal, Nibir Chandra and Luong, Kyle and Wilson, Amanda and Swarup, Samarth and Marathe, Madhav and Adiga, Abhijin},
  title     = {{PRISM-CAFO}: Prior-conditioned Remote-sensing Infrastructure Segmentation and Mapping for {CAFOs}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2083--2093},
}
Gaussian Representations for Video-
[pdf]
[supp]
[bibtex]@InProceedings{Shah_2026_WACV,
  author    = {Shah, Sachin and Choudhury, Anustup and Su, Guan-Ming and Pytlarz, Jaclyn and Metzler, Christopher A. and Mittal, Trisha},
  title     = {{Gaussian} Representations for Video},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {827--837},
}
Semantic Map Guided Bird's-Eye View Learning for Online HD Map Construction-
[pdf]
[bibtex]@InProceedings{Ren_2026_WACV,
  author    = {Ren, Huantao and Eraqi, Hesham M. and Musa, ABM and Moustafa, Mohamed},
  title     = {Semantic Map Guided Bird's-Eye View Learning for Online {HD} Map Construction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7852--7861},
}
X-JEPA: A Novel Joint Learning Cross-Modal Predictive Alignment Framework for Remote Sensing Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Choudhury_2026_WACV,
  author    = {Choudhury, Shabnam and Salunkhe, Yash and Rajan, Vaibhav and Chaudhuri, Subhasis and Banerjee, Biplab},
  title     = {{X-JEPA}: A Novel Joint Learning Cross-Modal Predictive Alignment Framework for Remote Sensing Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4355--4364},
}
VLMs Guided Interpretable Decision Making in Autonomous Driving-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hu_2026_WACV,
  author    = {Hu, Xin and Jing, Taotao and Tian, Renran and Ding, Zhengming},
  title     = {{VLMs} Guided Interpretable Decision Making in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4494--4503},
}
Confidence Through Parallel Attention for Depth and Uncertainty Estimation in Dynamic Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Susladkar_2026_WACV,
  author    = {Susladkar, Onkar and Pawar, Rohit and Sehgal, Chirag and Ujjawal, Samaksh and Mittal, Sparsh},
  title     = {Confidence Through Parallel Attention for Depth and Uncertainty Estimation in Dynamic Environments},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4396--4406},
}
Enhancing Monocular 3D Hand Reconstruction with Learned Texture Priors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Karvounas_2026_WACV,
  author    = {Karvounas, Giorgos and Kyriazis, Nikolaos and Oikonomidis, Iason and Pavlakos, Georgios and Argyros, Antonis A.},
  title     = {Enhancing Monocular {3D} Hand Reconstruction with Learned Texture Priors},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7073--7083},
}
ACuRE: Accurate Continuity-Regularized SpO2 Estimation Using Liquid Time-Constant Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Ahmad_2026_WACV,
  author    = {Ahmad, Shahzad and Mishra, Divya and Bano, Sania and Chanda, Sukalpa and Rawat, Yogesh Singh},
  title     = {{ACuRE}: Accurate Continuity-Regularized {SpO2} Estimation Using Liquid Time-Constant Networks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7250--7259},
}
SceneShine: Illumination-aware Human Scene Gaussian Re-Splatting from Mobile Device Video-
[pdf]
[supp]
[bibtex]@InProceedings{Ren_2026_WACV,
  author    = {Ren, Xuqian and Wang, Wenjia and Nguyen, Mai Ngoc and Kannala, Juho and Rahtu, Esa},
  title     = {{SceneShine}: Illumination-aware Human Scene {Gaussian} Re-Splatting from Mobile Device Video},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8302--8312},
}
Gene-DML: Dual-Pathway Multi-Level Discrimination for Gene Expression Prediction from Histopathology Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2026_WACV,
  author    = {Song, Yaxuan and Fan, Jianan and Chang, Hang and Cai, Weidong},
  title     = {{Gene-DML}: Dual-Pathway Multi-Level Discrimination for Gene Expression Prediction from Histopathology Images},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5090--5099},
}
PatchEAD: Unifying Industrial Visual Prompting Frameworks for Patch-Exclusive Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2026_WACV,
  author    = {Huang, Po-Han and Li, Jeng-Lin and Huang, Po-Hsuan and Chang, Ming-Ching and Chen, Wei-Chao},
  title     = {{PatchEAD}: Unifying Industrial Visual Prompting Frameworks for Patch-Exclusive Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5531--5540},
}
DODA: Adapting Object Detectors to Dynamic Agricultural Environments in Real-Time with Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xiang_2026_WACV,
  author    = {Xiang, Shuai and Blok, Pieter M. and Burridge, James and Wang, Haozhou and Guo, Wei},
  title     = {{DODA}: Adapting Object Detectors to Dynamic Agricultural Environments in Real-Time with Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4797--4807},
}
T2VWorldBench: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV,
  author    = {Chen, Yubin and Guo, Xuyang and Shi, Zhenmei and Song, Zhao and Zhang, Jiahao},
  title     = {{T2VWorldBench}: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6474--6485},
}
Unlocking Vision-Language Models for Video Anomaly Detection via Fine-Grained Prompting-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zou_2026_WACV,
  author    = {Zou, Shu and Tian, Xinyu and Wesemann, Lukas and Waschkowski, Fabian and Yang, Zhaoyuan and Zhang, Jing},
  title     = {Unlocking Vision-Language Models for Video Anomaly Detection via Fine-Grained Prompting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {4223--4233},
}
HyPCA-Net: Advancing Multimodal Fusion in Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhar_2026_WACV,
  author    = {Dhar, Joy and Pandey, Manish Kumar and Das Chakladar, Debashis and Haghighat, Maryam and Alavi, Azadeh and Mistry, Sajib and Zaidi, Nayyar},
  title     = {{HyPCA-Net}: Advancing Multimodal Fusion in Medical Image Analysis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1831--1840},
}
No MoCap Needed: Post-Training Motion Diffusion Models with Reinforcement Learning using Only Textual Prompts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Girolamo_2026_WACV,
  author    = {Girolamo, Macaluso and Lorenzo, Mandelli and Bicchierai, Mirko and Berretti, Stefano and Bagdanov, Andrew D.},
  title     = {No {MoCap} Needed: Post-Training Motion Diffusion Models with Reinforcement Learning using Only Textual Prompts},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {967--976},
}
Back
